program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "5.33.5"}, {"coremlc-version", "1877.40.3"}, {"coremltools-component-torch", "2.1.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.0"}})] { func main(tensor logmel_data) { tensor var_84_pad_type_0 = const()[name = tensor("op_84_pad_type_0"), val = tensor("custom")]; tensor var_84_pad_0 = const()[name = tensor("op_84_pad_0"), val = tensor([1, 1])]; tensor var_84_strides_0 = const()[name = tensor("op_84_strides_0"), val = tensor([1])]; tensor var_84_dilations_0 = const()[name = tensor("op_84_dilations_0"), val = tensor([1])]; tensor var_84_groups_0 = const()[name = tensor("op_84_groups_0"), val = tensor(1)]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(983168)))]; tensor logmel_data_to_fp16 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data)[name = tensor("cast_131")]; tensor var_84_cast_fp16 = conv(bias = bias_3_to_fp16, dilations = var_84_dilations_0, groups = var_84_groups_0, pad = var_84_pad_0, pad_type = var_84_pad_type_0, strides = var_84_strides_0, weight = weight_3_to_fp16, x = logmel_data_to_fp16)[name = tensor("op_84_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_84_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_102_pad_type_0 = const()[name = tensor("op_102_pad_type_0"), val = tensor("custom")]; tensor var_102_pad_0 = const()[name = tensor("op_102_pad_0"), val = tensor([1, 1])]; tensor var_102_strides_0 = const()[name = tensor("op_102_strides_0"), val = tensor([2])]; tensor var_102_dilations_0 = const()[name = tensor("op_102_dilations_0"), val = tensor([1])]; tensor var_102_groups_0 = const()[name = tensor("op_102_groups_0"), val = tensor(1)]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(985792)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10816256)))]; tensor var_102_cast_fp16 = conv(bias = bias_7_to_fp16, dilations = var_102_dilations_0, groups = var_102_groups_0, pad = var_102_pad_0, pad_type = var_102_pad_type_0, strides = var_102_strides_0, weight = weight_7_to_fp16, x = input_1_cast_fp16)[name = tensor("op_102_cast_fp16")]; tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_102_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_107_to_fp16 = const()[name = tensor("op_107_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10818880)))]; tensor var_109_cast_fp16 = add(x = x_3_cast_fp16, y = var_107_to_fp16)[name = tensor("op_109_cast_fp16")]; tensor inputs_1_axes_0 = const()[name = tensor("inputs_1_axes_0"), val = tensor([2])]; tensor inputs_1_cast_fp16 = expand_dims(axes = inputs_1_axes_0, x = var_109_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; tensor var_124 = const()[name = tensor("op_124"), val = tensor(1)]; tensor input_3_axes_0 = const()[name = tensor("input_3_axes_0"), val = tensor([1])]; tensor input_3_gamma_0_to_fp16 = const()[name = tensor("input_3_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14658944)))]; tensor input_3_beta_0_to_fp16 = const()[name = tensor("input_3_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14661568)))]; tensor var_140_to_fp16 = const()[name = tensor("op_140_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_3_cast_fp16 = layer_norm(axes = input_3_axes_0, beta = input_3_beta_0_to_fp16, epsilon = var_140_to_fp16, gamma = input_3_gamma_0_to_fp16, x = inputs_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor q_1_pad_type_0 = const()[name = tensor("q_1_pad_type_0"), val = tensor("valid")]; tensor q_1_strides_0 = const()[name = tensor("q_1_strides_0"), val = tensor([1, 1])]; tensor q_1_pad_0 = const()[name = tensor("q_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_1_dilations_0 = const()[name = tensor("q_1_dilations_0"), val = tensor([1, 1])]; tensor q_1_groups_0 = const()[name = tensor("q_1_groups_0"), val = tensor(1)]; tensor var_175_weight_0_to_fp16 = const()[name = tensor("op_175_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14664192)))]; tensor var_175_bias_0_to_fp16 = const()[name = tensor("op_175_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17941056)))]; tensor var_175_cast_fp16 = conv(bias = var_175_bias_0_to_fp16, dilations = q_1_dilations_0, groups = q_1_groups_0, pad = q_1_pad_0, pad_type = q_1_pad_type_0, strides = q_1_strides_0, weight = var_175_weight_0_to_fp16, x = input_3_cast_fp16)[name = tensor("op_175_cast_fp16")]; tensor k_1_pad_type_0 = const()[name = tensor("k_1_pad_type_0"), val = tensor("valid")]; tensor k_1_strides_0 = const()[name = tensor("k_1_strides_0"), val = tensor([1, 1])]; tensor k_1_pad_0 = const()[name = tensor("k_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_1_dilations_0 = const()[name = tensor("k_1_dilations_0"), val = tensor([1, 1])]; tensor k_1_groups_0 = const()[name = tensor("k_1_groups_0"), val = tensor(1)]; tensor blocks_0_attn_key_weight_to_fp16 = const()[name = tensor("blocks_0_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17943680)))]; tensor k_1_cast_fp16 = conv(dilations = k_1_dilations_0, groups = k_1_groups_0, pad = k_1_pad_0, pad_type = k_1_pad_type_0, strides = k_1_strides_0, weight = blocks_0_attn_key_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor var_173_pad_type_0 = const()[name = tensor("op_173_pad_type_0"), val = tensor("valid")]; tensor var_173_strides_0 = const()[name = tensor("op_173_strides_0"), val = tensor([1, 1])]; tensor var_173_pad_0 = const()[name = tensor("op_173_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_173_dilations_0 = const()[name = tensor("op_173_dilations_0"), val = tensor([1, 1])]; tensor var_173_groups_0 = const()[name = tensor("op_173_groups_0"), val = tensor(1)]; tensor blocks_0_attn_value_weight_to_fp16 = const()[name = tensor("blocks_0_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21220544)))]; tensor blocks_0_attn_value_bias_to_fp16 = const()[name = tensor("blocks_0_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24497408)))]; tensor var_173_cast_fp16 = conv(bias = blocks_0_attn_value_bias_to_fp16, dilations = var_173_dilations_0, groups = var_173_groups_0, pad = var_173_pad_0, pad_type = var_173_pad_type_0, strides = var_173_strides_0, weight = blocks_0_attn_value_weight_to_fp16, x = input_3_cast_fp16)[name = tensor("op_173_cast_fp16")]; tensor tile_0 = const()[name = tensor("tile_0"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_176_axis_0 = const()[name = tensor("op_176_axis_0"), val = tensor(1)]; tensor var_176_cast_fp16_0, tensor var_176_cast_fp16_1, tensor var_176_cast_fp16_2, tensor var_176_cast_fp16_3, tensor var_176_cast_fp16_4, tensor var_176_cast_fp16_5, tensor var_176_cast_fp16_6, tensor var_176_cast_fp16_7, tensor var_176_cast_fp16_8, tensor var_176_cast_fp16_9, tensor var_176_cast_fp16_10, tensor var_176_cast_fp16_11, tensor var_176_cast_fp16_12, tensor var_176_cast_fp16_13, tensor var_176_cast_fp16_14, tensor var_176_cast_fp16_15, tensor var_176_cast_fp16_16, tensor var_176_cast_fp16_17, tensor var_176_cast_fp16_18, tensor var_176_cast_fp16_19 = split(axis = var_176_axis_0, split_sizes = tile_0, x = var_175_cast_fp16)[name = tensor("op_176_cast_fp16")]; tensor var_197_perm_0 = const()[name = tensor("op_197_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_1 = const()[name = tensor("tile_1"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_198_axis_0 = const()[name = tensor("op_198_axis_0"), val = tensor(3)]; tensor var_197_cast_fp16 = transpose(perm = var_197_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_32")]; tensor var_198_cast_fp16_0, tensor var_198_cast_fp16_1, tensor var_198_cast_fp16_2, tensor var_198_cast_fp16_3, tensor var_198_cast_fp16_4, tensor var_198_cast_fp16_5, tensor var_198_cast_fp16_6, tensor var_198_cast_fp16_7, tensor var_198_cast_fp16_8, tensor var_198_cast_fp16_9, tensor var_198_cast_fp16_10, tensor var_198_cast_fp16_11, tensor var_198_cast_fp16_12, tensor var_198_cast_fp16_13, tensor var_198_cast_fp16_14, tensor var_198_cast_fp16_15, tensor var_198_cast_fp16_16, tensor var_198_cast_fp16_17, tensor var_198_cast_fp16_18, tensor var_198_cast_fp16_19 = split(axis = var_198_axis_0, split_sizes = tile_1, x = var_197_cast_fp16)[name = tensor("op_198_cast_fp16")]; tensor tile_2 = const()[name = tensor("tile_2"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_219_axis_0 = const()[name = tensor("op_219_axis_0"), val = tensor(1)]; tensor var_219_cast_fp16_0, tensor var_219_cast_fp16_1, tensor var_219_cast_fp16_2, tensor var_219_cast_fp16_3, tensor var_219_cast_fp16_4, tensor var_219_cast_fp16_5, tensor var_219_cast_fp16_6, tensor var_219_cast_fp16_7, tensor var_219_cast_fp16_8, tensor var_219_cast_fp16_9, tensor var_219_cast_fp16_10, tensor var_219_cast_fp16_11, tensor var_219_cast_fp16_12, tensor var_219_cast_fp16_13, tensor var_219_cast_fp16_14, tensor var_219_cast_fp16_15, tensor var_219_cast_fp16_16, tensor var_219_cast_fp16_17, tensor var_219_cast_fp16_18, tensor var_219_cast_fp16_19 = split(axis = var_219_axis_0, split_sizes = tile_2, x = var_173_cast_fp16)[name = tensor("op_219_cast_fp16")]; tensor aw_1_equation_0 = const()[name = tensor("aw_1_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1_cast_fp16 = einsum(equation = aw_1_equation_0, values = (var_198_cast_fp16_0, var_176_cast_fp16_0))[name = tensor("aw_1_cast_fp16")]; tensor aw_3_equation_0 = const()[name = tensor("aw_3_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_3_cast_fp16 = einsum(equation = aw_3_equation_0, values = (var_198_cast_fp16_1, var_176_cast_fp16_1))[name = tensor("aw_3_cast_fp16")]; tensor aw_5_equation_0 = const()[name = tensor("aw_5_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_5_cast_fp16 = einsum(equation = aw_5_equation_0, values = (var_198_cast_fp16_2, var_176_cast_fp16_2))[name = tensor("aw_5_cast_fp16")]; tensor aw_7_equation_0 = const()[name = tensor("aw_7_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_7_cast_fp16 = einsum(equation = aw_7_equation_0, values = (var_198_cast_fp16_3, var_176_cast_fp16_3))[name = tensor("aw_7_cast_fp16")]; tensor aw_9_equation_0 = const()[name = tensor("aw_9_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_9_cast_fp16 = einsum(equation = aw_9_equation_0, values = (var_198_cast_fp16_4, var_176_cast_fp16_4))[name = tensor("aw_9_cast_fp16")]; tensor aw_11_equation_0 = const()[name = tensor("aw_11_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_11_cast_fp16 = einsum(equation = aw_11_equation_0, values = (var_198_cast_fp16_5, var_176_cast_fp16_5))[name = tensor("aw_11_cast_fp16")]; tensor aw_13_equation_0 = const()[name = tensor("aw_13_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_13_cast_fp16 = einsum(equation = aw_13_equation_0, values = (var_198_cast_fp16_6, var_176_cast_fp16_6))[name = tensor("aw_13_cast_fp16")]; tensor aw_15_equation_0 = const()[name = tensor("aw_15_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_15_cast_fp16 = einsum(equation = aw_15_equation_0, values = (var_198_cast_fp16_7, var_176_cast_fp16_7))[name = tensor("aw_15_cast_fp16")]; tensor aw_17_equation_0 = const()[name = tensor("aw_17_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_17_cast_fp16 = einsum(equation = aw_17_equation_0, values = (var_198_cast_fp16_8, var_176_cast_fp16_8))[name = tensor("aw_17_cast_fp16")]; tensor aw_19_equation_0 = const()[name = tensor("aw_19_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_19_cast_fp16 = einsum(equation = aw_19_equation_0, values = (var_198_cast_fp16_9, var_176_cast_fp16_9))[name = tensor("aw_19_cast_fp16")]; tensor aw_21_equation_0 = const()[name = tensor("aw_21_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_21_cast_fp16 = einsum(equation = aw_21_equation_0, values = (var_198_cast_fp16_10, var_176_cast_fp16_10))[name = tensor("aw_21_cast_fp16")]; tensor aw_23_equation_0 = const()[name = tensor("aw_23_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_23_cast_fp16 = einsum(equation = aw_23_equation_0, values = (var_198_cast_fp16_11, var_176_cast_fp16_11))[name = tensor("aw_23_cast_fp16")]; tensor aw_25_equation_0 = const()[name = tensor("aw_25_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_25_cast_fp16 = einsum(equation = aw_25_equation_0, values = (var_198_cast_fp16_12, var_176_cast_fp16_12))[name = tensor("aw_25_cast_fp16")]; tensor aw_27_equation_0 = const()[name = tensor("aw_27_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_27_cast_fp16 = einsum(equation = aw_27_equation_0, values = (var_198_cast_fp16_13, var_176_cast_fp16_13))[name = tensor("aw_27_cast_fp16")]; tensor aw_29_equation_0 = const()[name = tensor("aw_29_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_29_cast_fp16 = einsum(equation = aw_29_equation_0, values = (var_198_cast_fp16_14, var_176_cast_fp16_14))[name = tensor("aw_29_cast_fp16")]; tensor aw_31_equation_0 = const()[name = tensor("aw_31_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_31_cast_fp16 = einsum(equation = aw_31_equation_0, values = (var_198_cast_fp16_15, var_176_cast_fp16_15))[name = tensor("aw_31_cast_fp16")]; tensor aw_33_equation_0 = const()[name = tensor("aw_33_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_33_cast_fp16 = einsum(equation = aw_33_equation_0, values = (var_198_cast_fp16_16, var_176_cast_fp16_16))[name = tensor("aw_33_cast_fp16")]; tensor aw_35_equation_0 = const()[name = tensor("aw_35_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_35_cast_fp16 = einsum(equation = aw_35_equation_0, values = (var_198_cast_fp16_17, var_176_cast_fp16_17))[name = tensor("aw_35_cast_fp16")]; tensor aw_37_equation_0 = const()[name = tensor("aw_37_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_37_cast_fp16 = einsum(equation = aw_37_equation_0, values = (var_198_cast_fp16_18, var_176_cast_fp16_18))[name = tensor("aw_37_cast_fp16")]; tensor aw_39_equation_0 = const()[name = tensor("aw_39_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_39_cast_fp16 = einsum(equation = aw_39_equation_0, values = (var_198_cast_fp16_19, var_176_cast_fp16_19))[name = tensor("aw_39_cast_fp16")]; tensor var_280_cast_fp16 = softmax(axis = var_124, x = aw_1_cast_fp16)[name = tensor("op_280_cast_fp16")]; tensor var_281_cast_fp16 = softmax(axis = var_124, x = aw_3_cast_fp16)[name = tensor("op_281_cast_fp16")]; tensor var_282_cast_fp16 = softmax(axis = var_124, x = aw_5_cast_fp16)[name = tensor("op_282_cast_fp16")]; tensor var_283_cast_fp16 = softmax(axis = var_124, x = aw_7_cast_fp16)[name = tensor("op_283_cast_fp16")]; tensor var_284_cast_fp16 = softmax(axis = var_124, x = aw_9_cast_fp16)[name = tensor("op_284_cast_fp16")]; tensor var_285_cast_fp16 = softmax(axis = var_124, x = aw_11_cast_fp16)[name = tensor("op_285_cast_fp16")]; tensor var_286_cast_fp16 = softmax(axis = var_124, x = aw_13_cast_fp16)[name = tensor("op_286_cast_fp16")]; tensor var_287_cast_fp16 = softmax(axis = var_124, x = aw_15_cast_fp16)[name = tensor("op_287_cast_fp16")]; tensor var_288_cast_fp16 = softmax(axis = var_124, x = aw_17_cast_fp16)[name = tensor("op_288_cast_fp16")]; tensor var_289_cast_fp16 = softmax(axis = var_124, x = aw_19_cast_fp16)[name = tensor("op_289_cast_fp16")]; tensor var_290_cast_fp16 = softmax(axis = var_124, x = aw_21_cast_fp16)[name = tensor("op_290_cast_fp16")]; tensor var_291_cast_fp16 = softmax(axis = var_124, x = aw_23_cast_fp16)[name = tensor("op_291_cast_fp16")]; tensor var_292_cast_fp16 = softmax(axis = var_124, x = aw_25_cast_fp16)[name = tensor("op_292_cast_fp16")]; tensor var_293_cast_fp16 = softmax(axis = var_124, x = aw_27_cast_fp16)[name = tensor("op_293_cast_fp16")]; tensor var_294_cast_fp16 = softmax(axis = var_124, x = aw_29_cast_fp16)[name = tensor("op_294_cast_fp16")]; tensor var_295_cast_fp16 = softmax(axis = var_124, x = aw_31_cast_fp16)[name = tensor("op_295_cast_fp16")]; tensor var_296_cast_fp16 = softmax(axis = var_124, x = aw_33_cast_fp16)[name = tensor("op_296_cast_fp16")]; tensor var_297_cast_fp16 = softmax(axis = var_124, x = aw_35_cast_fp16)[name = tensor("op_297_cast_fp16")]; tensor var_298_cast_fp16 = softmax(axis = var_124, x = aw_37_cast_fp16)[name = tensor("op_298_cast_fp16")]; tensor var_299_cast_fp16 = softmax(axis = var_124, x = aw_39_cast_fp16)[name = tensor("op_299_cast_fp16")]; tensor var_301_equation_0 = const()[name = tensor("op_301_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_301_cast_fp16 = einsum(equation = var_301_equation_0, values = (var_219_cast_fp16_0, var_280_cast_fp16))[name = tensor("op_301_cast_fp16")]; tensor var_303_equation_0 = const()[name = tensor("op_303_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_303_cast_fp16 = einsum(equation = var_303_equation_0, values = (var_219_cast_fp16_1, var_281_cast_fp16))[name = tensor("op_303_cast_fp16")]; tensor var_305_equation_0 = const()[name = tensor("op_305_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_305_cast_fp16 = einsum(equation = var_305_equation_0, values = (var_219_cast_fp16_2, var_282_cast_fp16))[name = tensor("op_305_cast_fp16")]; tensor var_307_equation_0 = const()[name = tensor("op_307_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_307_cast_fp16 = einsum(equation = var_307_equation_0, values = (var_219_cast_fp16_3, var_283_cast_fp16))[name = tensor("op_307_cast_fp16")]; tensor var_309_equation_0 = const()[name = tensor("op_309_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_309_cast_fp16 = einsum(equation = var_309_equation_0, values = (var_219_cast_fp16_4, var_284_cast_fp16))[name = tensor("op_309_cast_fp16")]; tensor var_311_equation_0 = const()[name = tensor("op_311_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_311_cast_fp16 = einsum(equation = var_311_equation_0, values = (var_219_cast_fp16_5, var_285_cast_fp16))[name = tensor("op_311_cast_fp16")]; tensor var_313_equation_0 = const()[name = tensor("op_313_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_313_cast_fp16 = einsum(equation = var_313_equation_0, values = (var_219_cast_fp16_6, var_286_cast_fp16))[name = tensor("op_313_cast_fp16")]; tensor var_315_equation_0 = const()[name = tensor("op_315_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_315_cast_fp16 = einsum(equation = var_315_equation_0, values = (var_219_cast_fp16_7, var_287_cast_fp16))[name = tensor("op_315_cast_fp16")]; tensor var_317_equation_0 = const()[name = tensor("op_317_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_317_cast_fp16 = einsum(equation = var_317_equation_0, values = (var_219_cast_fp16_8, var_288_cast_fp16))[name = tensor("op_317_cast_fp16")]; tensor var_319_equation_0 = const()[name = tensor("op_319_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_319_cast_fp16 = einsum(equation = var_319_equation_0, values = (var_219_cast_fp16_9, var_289_cast_fp16))[name = tensor("op_319_cast_fp16")]; tensor var_321_equation_0 = const()[name = tensor("op_321_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_321_cast_fp16 = einsum(equation = var_321_equation_0, values = (var_219_cast_fp16_10, var_290_cast_fp16))[name = tensor("op_321_cast_fp16")]; tensor var_323_equation_0 = const()[name = tensor("op_323_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_323_cast_fp16 = einsum(equation = var_323_equation_0, values = (var_219_cast_fp16_11, var_291_cast_fp16))[name = tensor("op_323_cast_fp16")]; tensor var_325_equation_0 = const()[name = tensor("op_325_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_325_cast_fp16 = einsum(equation = var_325_equation_0, values = (var_219_cast_fp16_12, var_292_cast_fp16))[name = tensor("op_325_cast_fp16")]; tensor var_327_equation_0 = const()[name = tensor("op_327_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_327_cast_fp16 = einsum(equation = var_327_equation_0, values = (var_219_cast_fp16_13, var_293_cast_fp16))[name = tensor("op_327_cast_fp16")]; tensor var_329_equation_0 = const()[name = tensor("op_329_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_329_cast_fp16 = einsum(equation = var_329_equation_0, values = (var_219_cast_fp16_14, var_294_cast_fp16))[name = tensor("op_329_cast_fp16")]; tensor var_331_equation_0 = const()[name = tensor("op_331_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_331_cast_fp16 = einsum(equation = var_331_equation_0, values = (var_219_cast_fp16_15, var_295_cast_fp16))[name = tensor("op_331_cast_fp16")]; tensor var_333_equation_0 = const()[name = tensor("op_333_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_333_cast_fp16 = einsum(equation = var_333_equation_0, values = (var_219_cast_fp16_16, var_296_cast_fp16))[name = tensor("op_333_cast_fp16")]; tensor var_335_equation_0 = const()[name = tensor("op_335_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_335_cast_fp16 = einsum(equation = var_335_equation_0, values = (var_219_cast_fp16_17, var_297_cast_fp16))[name = tensor("op_335_cast_fp16")]; tensor var_337_equation_0 = const()[name = tensor("op_337_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_337_cast_fp16 = einsum(equation = var_337_equation_0, values = (var_219_cast_fp16_18, var_298_cast_fp16))[name = tensor("op_337_cast_fp16")]; tensor var_339_equation_0 = const()[name = tensor("op_339_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_339_cast_fp16 = einsum(equation = var_339_equation_0, values = (var_219_cast_fp16_19, var_299_cast_fp16))[name = tensor("op_339_cast_fp16")]; tensor input_5_interleave_0 = const()[name = tensor("input_5_interleave_0"), val = tensor(false)]; tensor input_5_cast_fp16 = concat(axis = var_124, interleave = input_5_interleave_0, values = (var_301_cast_fp16, var_303_cast_fp16, var_305_cast_fp16, var_307_cast_fp16, var_309_cast_fp16, var_311_cast_fp16, var_313_cast_fp16, var_315_cast_fp16, var_317_cast_fp16, var_319_cast_fp16, var_321_cast_fp16, var_323_cast_fp16, var_325_cast_fp16, var_327_cast_fp16, var_329_cast_fp16, var_331_cast_fp16, var_333_cast_fp16, var_335_cast_fp16, var_337_cast_fp16, var_339_cast_fp16))[name = tensor("input_5_cast_fp16")]; tensor var_348_pad_type_0 = const()[name = tensor("op_348_pad_type_0"), val = tensor("valid")]; tensor var_348_strides_0 = const()[name = tensor("op_348_strides_0"), val = tensor([1, 1])]; tensor var_348_pad_0 = const()[name = tensor("op_348_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_348_dilations_0 = const()[name = tensor("op_348_dilations_0"), val = tensor([1, 1])]; tensor var_348_groups_0 = const()[name = tensor("op_348_groups_0"), val = tensor(1)]; tensor blocks_0_attn_out_weight_to_fp16 = const()[name = tensor("blocks_0_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24500032)))]; tensor blocks_0_attn_out_bias_to_fp16 = const()[name = tensor("blocks_0_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27776896)))]; tensor var_348_cast_fp16 = conv(bias = blocks_0_attn_out_bias_to_fp16, dilations = var_348_dilations_0, groups = var_348_groups_0, pad = var_348_pad_0, pad_type = var_348_pad_type_0, strides = var_348_strides_0, weight = blocks_0_attn_out_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("op_348_cast_fp16")]; tensor inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = var_348_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; tensor input_7_axes_0 = const()[name = tensor("input_7_axes_0"), val = tensor([1])]; tensor input_7_gamma_0_to_fp16 = const()[name = tensor("input_7_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27779520)))]; tensor input_7_beta_0_to_fp16 = const()[name = tensor("input_7_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27782144)))]; tensor var_358_to_fp16 = const()[name = tensor("op_358_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_7_cast_fp16 = layer_norm(axes = input_7_axes_0, beta = input_7_beta_0_to_fp16, epsilon = var_358_to_fp16, gamma = input_7_gamma_0_to_fp16, x = inputs_3_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor input_9_pad_type_0 = const()[name = tensor("input_9_pad_type_0"), val = tensor("valid")]; tensor input_9_strides_0 = const()[name = tensor("input_9_strides_0"), val = tensor([1, 1])]; tensor input_9_pad_0 = const()[name = tensor("input_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_9_dilations_0 = const()[name = tensor("input_9_dilations_0"), val = tensor([1, 1])]; tensor input_9_groups_0 = const()[name = tensor("input_9_groups_0"), val = tensor(1)]; tensor blocks_0_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27784768)))]; tensor blocks_0_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40892032)))]; tensor input_9_cast_fp16 = conv(bias = blocks_0_mlp_0_bias_to_fp16, dilations = input_9_dilations_0, groups = input_9_groups_0, pad = input_9_pad_0, pad_type = input_9_pad_type_0, strides = input_9_strides_0, weight = blocks_0_mlp_0_weight_to_fp16, x = input_7_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor input_11_mode_0 = const()[name = tensor("input_11_mode_0"), val = tensor("EXACT")]; tensor input_11_cast_fp16 = gelu(mode = input_11_mode_0, x = input_9_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor var_384_pad_type_0 = const()[name = tensor("op_384_pad_type_0"), val = tensor("valid")]; tensor var_384_strides_0 = const()[name = tensor("op_384_strides_0"), val = tensor([1, 1])]; tensor var_384_pad_0 = const()[name = tensor("op_384_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_384_dilations_0 = const()[name = tensor("op_384_dilations_0"), val = tensor([1, 1])]; tensor var_384_groups_0 = const()[name = tensor("op_384_groups_0"), val = tensor(1)]; tensor blocks_0_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40902336)))]; tensor blocks_0_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54009600)))]; tensor var_384_cast_fp16 = conv(bias = blocks_0_mlp_2_bias_to_fp16, dilations = var_384_dilations_0, groups = var_384_groups_0, pad = var_384_pad_0, pad_type = var_384_pad_type_0, strides = var_384_strides_0, weight = blocks_0_mlp_2_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("op_384_cast_fp16")]; tensor inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = var_384_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; tensor var_393 = const()[name = tensor("op_393"), val = tensor(1)]; tensor input_13_axes_0 = const()[name = tensor("input_13_axes_0"), val = tensor([1])]; tensor input_13_gamma_0_to_fp16 = const()[name = tensor("input_13_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54012224)))]; tensor input_13_beta_0_to_fp16 = const()[name = tensor("input_13_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54014848)))]; tensor var_409_to_fp16 = const()[name = tensor("op_409_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_13_cast_fp16 = layer_norm(axes = input_13_axes_0, beta = input_13_beta_0_to_fp16, epsilon = var_409_to_fp16, gamma = input_13_gamma_0_to_fp16, x = inputs_5_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor q_3_pad_type_0 = const()[name = tensor("q_3_pad_type_0"), val = tensor("valid")]; tensor q_3_strides_0 = const()[name = tensor("q_3_strides_0"), val = tensor([1, 1])]; tensor q_3_pad_0 = const()[name = tensor("q_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_3_dilations_0 = const()[name = tensor("q_3_dilations_0"), val = tensor([1, 1])]; tensor q_3_groups_0 = const()[name = tensor("q_3_groups_0"), val = tensor(1)]; tensor var_444_weight_0_to_fp16 = const()[name = tensor("op_444_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(54017472)))]; tensor var_444_bias_0_to_fp16 = const()[name = tensor("op_444_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57294336)))]; tensor var_444_cast_fp16 = conv(bias = var_444_bias_0_to_fp16, dilations = q_3_dilations_0, groups = q_3_groups_0, pad = q_3_pad_0, pad_type = q_3_pad_type_0, strides = q_3_strides_0, weight = var_444_weight_0_to_fp16, x = input_13_cast_fp16)[name = tensor("op_444_cast_fp16")]; tensor k_3_pad_type_0 = const()[name = tensor("k_3_pad_type_0"), val = tensor("valid")]; tensor k_3_strides_0 = const()[name = tensor("k_3_strides_0"), val = tensor([1, 1])]; tensor k_3_pad_0 = const()[name = tensor("k_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_3_dilations_0 = const()[name = tensor("k_3_dilations_0"), val = tensor([1, 1])]; tensor k_3_groups_0 = const()[name = tensor("k_3_groups_0"), val = tensor(1)]; tensor blocks_1_attn_key_weight_to_fp16 = const()[name = tensor("blocks_1_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57296960)))]; tensor k_3_cast_fp16 = conv(dilations = k_3_dilations_0, groups = k_3_groups_0, pad = k_3_pad_0, pad_type = k_3_pad_type_0, strides = k_3_strides_0, weight = blocks_1_attn_key_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("k_3_cast_fp16")]; tensor var_442_pad_type_0 = const()[name = tensor("op_442_pad_type_0"), val = tensor("valid")]; tensor var_442_strides_0 = const()[name = tensor("op_442_strides_0"), val = tensor([1, 1])]; tensor var_442_pad_0 = const()[name = tensor("op_442_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_442_dilations_0 = const()[name = tensor("op_442_dilations_0"), val = tensor([1, 1])]; tensor var_442_groups_0 = const()[name = tensor("op_442_groups_0"), val = tensor(1)]; tensor blocks_1_attn_value_weight_to_fp16 = const()[name = tensor("blocks_1_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60573824)))]; tensor blocks_1_attn_value_bias_to_fp16 = const()[name = tensor("blocks_1_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63850688)))]; tensor var_442_cast_fp16 = conv(bias = blocks_1_attn_value_bias_to_fp16, dilations = var_442_dilations_0, groups = var_442_groups_0, pad = var_442_pad_0, pad_type = var_442_pad_type_0, strides = var_442_strides_0, weight = blocks_1_attn_value_weight_to_fp16, x = input_13_cast_fp16)[name = tensor("op_442_cast_fp16")]; tensor tile_3 = const()[name = tensor("tile_3"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_445_axis_0 = const()[name = tensor("op_445_axis_0"), val = tensor(1)]; tensor var_445_cast_fp16_0, tensor var_445_cast_fp16_1, tensor var_445_cast_fp16_2, tensor var_445_cast_fp16_3, tensor var_445_cast_fp16_4, tensor var_445_cast_fp16_5, tensor var_445_cast_fp16_6, tensor var_445_cast_fp16_7, tensor var_445_cast_fp16_8, tensor var_445_cast_fp16_9, tensor var_445_cast_fp16_10, tensor var_445_cast_fp16_11, tensor var_445_cast_fp16_12, tensor var_445_cast_fp16_13, tensor var_445_cast_fp16_14, tensor var_445_cast_fp16_15, tensor var_445_cast_fp16_16, tensor var_445_cast_fp16_17, tensor var_445_cast_fp16_18, tensor var_445_cast_fp16_19 = split(axis = var_445_axis_0, split_sizes = tile_3, x = var_444_cast_fp16)[name = tensor("op_445_cast_fp16")]; tensor var_466_perm_0 = const()[name = tensor("op_466_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_4 = const()[name = tensor("tile_4"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_467_axis_0 = const()[name = tensor("op_467_axis_0"), val = tensor(3)]; tensor var_466_cast_fp16 = transpose(perm = var_466_perm_0, x = k_3_cast_fp16)[name = tensor("transpose_31")]; tensor var_467_cast_fp16_0, tensor var_467_cast_fp16_1, tensor var_467_cast_fp16_2, tensor var_467_cast_fp16_3, tensor var_467_cast_fp16_4, tensor var_467_cast_fp16_5, tensor var_467_cast_fp16_6, tensor var_467_cast_fp16_7, tensor var_467_cast_fp16_8, tensor var_467_cast_fp16_9, tensor var_467_cast_fp16_10, tensor var_467_cast_fp16_11, tensor var_467_cast_fp16_12, tensor var_467_cast_fp16_13, tensor var_467_cast_fp16_14, tensor var_467_cast_fp16_15, tensor var_467_cast_fp16_16, tensor var_467_cast_fp16_17, tensor var_467_cast_fp16_18, tensor var_467_cast_fp16_19 = split(axis = var_467_axis_0, split_sizes = tile_4, x = var_466_cast_fp16)[name = tensor("op_467_cast_fp16")]; tensor tile_5 = const()[name = tensor("tile_5"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_488_axis_0 = const()[name = tensor("op_488_axis_0"), val = tensor(1)]; tensor var_488_cast_fp16_0, tensor var_488_cast_fp16_1, tensor var_488_cast_fp16_2, tensor var_488_cast_fp16_3, tensor var_488_cast_fp16_4, tensor var_488_cast_fp16_5, tensor var_488_cast_fp16_6, tensor var_488_cast_fp16_7, tensor var_488_cast_fp16_8, tensor var_488_cast_fp16_9, tensor var_488_cast_fp16_10, tensor var_488_cast_fp16_11, tensor var_488_cast_fp16_12, tensor var_488_cast_fp16_13, tensor var_488_cast_fp16_14, tensor var_488_cast_fp16_15, tensor var_488_cast_fp16_16, tensor var_488_cast_fp16_17, tensor var_488_cast_fp16_18, tensor var_488_cast_fp16_19 = split(axis = var_488_axis_0, split_sizes = tile_5, x = var_442_cast_fp16)[name = tensor("op_488_cast_fp16")]; tensor aw_41_equation_0 = const()[name = tensor("aw_41_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_41_cast_fp16 = einsum(equation = aw_41_equation_0, values = (var_467_cast_fp16_0, var_445_cast_fp16_0))[name = tensor("aw_41_cast_fp16")]; tensor aw_43_equation_0 = const()[name = tensor("aw_43_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_43_cast_fp16 = einsum(equation = aw_43_equation_0, values = (var_467_cast_fp16_1, var_445_cast_fp16_1))[name = tensor("aw_43_cast_fp16")]; tensor aw_45_equation_0 = const()[name = tensor("aw_45_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_45_cast_fp16 = einsum(equation = aw_45_equation_0, values = (var_467_cast_fp16_2, var_445_cast_fp16_2))[name = tensor("aw_45_cast_fp16")]; tensor aw_47_equation_0 = const()[name = tensor("aw_47_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_47_cast_fp16 = einsum(equation = aw_47_equation_0, values = (var_467_cast_fp16_3, var_445_cast_fp16_3))[name = tensor("aw_47_cast_fp16")]; tensor aw_49_equation_0 = const()[name = tensor("aw_49_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_49_cast_fp16 = einsum(equation = aw_49_equation_0, values = (var_467_cast_fp16_4, var_445_cast_fp16_4))[name = tensor("aw_49_cast_fp16")]; tensor aw_51_equation_0 = const()[name = tensor("aw_51_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_51_cast_fp16 = einsum(equation = aw_51_equation_0, values = (var_467_cast_fp16_5, var_445_cast_fp16_5))[name = tensor("aw_51_cast_fp16")]; tensor aw_53_equation_0 = const()[name = tensor("aw_53_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_53_cast_fp16 = einsum(equation = aw_53_equation_0, values = (var_467_cast_fp16_6, var_445_cast_fp16_6))[name = tensor("aw_53_cast_fp16")]; tensor aw_55_equation_0 = const()[name = tensor("aw_55_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_55_cast_fp16 = einsum(equation = aw_55_equation_0, values = (var_467_cast_fp16_7, var_445_cast_fp16_7))[name = tensor("aw_55_cast_fp16")]; tensor aw_57_equation_0 = const()[name = tensor("aw_57_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_57_cast_fp16 = einsum(equation = aw_57_equation_0, values = (var_467_cast_fp16_8, var_445_cast_fp16_8))[name = tensor("aw_57_cast_fp16")]; tensor aw_59_equation_0 = const()[name = tensor("aw_59_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_59_cast_fp16 = einsum(equation = aw_59_equation_0, values = (var_467_cast_fp16_9, var_445_cast_fp16_9))[name = tensor("aw_59_cast_fp16")]; tensor aw_61_equation_0 = const()[name = tensor("aw_61_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_61_cast_fp16 = einsum(equation = aw_61_equation_0, values = (var_467_cast_fp16_10, var_445_cast_fp16_10))[name = tensor("aw_61_cast_fp16")]; tensor aw_63_equation_0 = const()[name = tensor("aw_63_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_63_cast_fp16 = einsum(equation = aw_63_equation_0, values = (var_467_cast_fp16_11, var_445_cast_fp16_11))[name = tensor("aw_63_cast_fp16")]; tensor aw_65_equation_0 = const()[name = tensor("aw_65_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_65_cast_fp16 = einsum(equation = aw_65_equation_0, values = (var_467_cast_fp16_12, var_445_cast_fp16_12))[name = tensor("aw_65_cast_fp16")]; tensor aw_67_equation_0 = const()[name = tensor("aw_67_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_67_cast_fp16 = einsum(equation = aw_67_equation_0, values = (var_467_cast_fp16_13, var_445_cast_fp16_13))[name = tensor("aw_67_cast_fp16")]; tensor aw_69_equation_0 = const()[name = tensor("aw_69_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_69_cast_fp16 = einsum(equation = aw_69_equation_0, values = (var_467_cast_fp16_14, var_445_cast_fp16_14))[name = tensor("aw_69_cast_fp16")]; tensor aw_71_equation_0 = const()[name = tensor("aw_71_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_71_cast_fp16 = einsum(equation = aw_71_equation_0, values = (var_467_cast_fp16_15, var_445_cast_fp16_15))[name = tensor("aw_71_cast_fp16")]; tensor aw_73_equation_0 = const()[name = tensor("aw_73_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_73_cast_fp16 = einsum(equation = aw_73_equation_0, values = (var_467_cast_fp16_16, var_445_cast_fp16_16))[name = tensor("aw_73_cast_fp16")]; tensor aw_75_equation_0 = const()[name = tensor("aw_75_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_75_cast_fp16 = einsum(equation = aw_75_equation_0, values = (var_467_cast_fp16_17, var_445_cast_fp16_17))[name = tensor("aw_75_cast_fp16")]; tensor aw_77_equation_0 = const()[name = tensor("aw_77_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_77_cast_fp16 = einsum(equation = aw_77_equation_0, values = (var_467_cast_fp16_18, var_445_cast_fp16_18))[name = tensor("aw_77_cast_fp16")]; tensor aw_79_equation_0 = const()[name = tensor("aw_79_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_79_cast_fp16 = einsum(equation = aw_79_equation_0, values = (var_467_cast_fp16_19, var_445_cast_fp16_19))[name = tensor("aw_79_cast_fp16")]; tensor var_549_cast_fp16 = softmax(axis = var_393, x = aw_41_cast_fp16)[name = tensor("op_549_cast_fp16")]; tensor var_550_cast_fp16 = softmax(axis = var_393, x = aw_43_cast_fp16)[name = tensor("op_550_cast_fp16")]; tensor var_551_cast_fp16 = softmax(axis = var_393, x = aw_45_cast_fp16)[name = tensor("op_551_cast_fp16")]; tensor var_552_cast_fp16 = softmax(axis = var_393, x = aw_47_cast_fp16)[name = tensor("op_552_cast_fp16")]; tensor var_553_cast_fp16 = softmax(axis = var_393, x = aw_49_cast_fp16)[name = tensor("op_553_cast_fp16")]; tensor var_554_cast_fp16 = softmax(axis = var_393, x = aw_51_cast_fp16)[name = tensor("op_554_cast_fp16")]; tensor var_555_cast_fp16 = softmax(axis = var_393, x = aw_53_cast_fp16)[name = tensor("op_555_cast_fp16")]; tensor var_556_cast_fp16 = softmax(axis = var_393, x = aw_55_cast_fp16)[name = tensor("op_556_cast_fp16")]; tensor var_557_cast_fp16 = softmax(axis = var_393, x = aw_57_cast_fp16)[name = tensor("op_557_cast_fp16")]; tensor var_558_cast_fp16 = softmax(axis = var_393, x = aw_59_cast_fp16)[name = tensor("op_558_cast_fp16")]; tensor var_559_cast_fp16 = softmax(axis = var_393, x = aw_61_cast_fp16)[name = tensor("op_559_cast_fp16")]; tensor var_560_cast_fp16 = softmax(axis = var_393, x = aw_63_cast_fp16)[name = tensor("op_560_cast_fp16")]; tensor var_561_cast_fp16 = softmax(axis = var_393, x = aw_65_cast_fp16)[name = tensor("op_561_cast_fp16")]; tensor var_562_cast_fp16 = softmax(axis = var_393, x = aw_67_cast_fp16)[name = tensor("op_562_cast_fp16")]; tensor var_563_cast_fp16 = softmax(axis = var_393, x = aw_69_cast_fp16)[name = tensor("op_563_cast_fp16")]; tensor var_564_cast_fp16 = softmax(axis = var_393, x = aw_71_cast_fp16)[name = tensor("op_564_cast_fp16")]; tensor var_565_cast_fp16 = softmax(axis = var_393, x = aw_73_cast_fp16)[name = tensor("op_565_cast_fp16")]; tensor var_566_cast_fp16 = softmax(axis = var_393, x = aw_75_cast_fp16)[name = tensor("op_566_cast_fp16")]; tensor var_567_cast_fp16 = softmax(axis = var_393, x = aw_77_cast_fp16)[name = tensor("op_567_cast_fp16")]; tensor var_568_cast_fp16 = softmax(axis = var_393, x = aw_79_cast_fp16)[name = tensor("op_568_cast_fp16")]; tensor var_570_equation_0 = const()[name = tensor("op_570_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_570_cast_fp16 = einsum(equation = var_570_equation_0, values = (var_488_cast_fp16_0, var_549_cast_fp16))[name = tensor("op_570_cast_fp16")]; tensor var_572_equation_0 = const()[name = tensor("op_572_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_572_cast_fp16 = einsum(equation = var_572_equation_0, values = (var_488_cast_fp16_1, var_550_cast_fp16))[name = tensor("op_572_cast_fp16")]; tensor var_574_equation_0 = const()[name = tensor("op_574_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_574_cast_fp16 = einsum(equation = var_574_equation_0, values = (var_488_cast_fp16_2, var_551_cast_fp16))[name = tensor("op_574_cast_fp16")]; tensor var_576_equation_0 = const()[name = tensor("op_576_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_576_cast_fp16 = einsum(equation = var_576_equation_0, values = (var_488_cast_fp16_3, var_552_cast_fp16))[name = tensor("op_576_cast_fp16")]; tensor var_578_equation_0 = const()[name = tensor("op_578_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_578_cast_fp16 = einsum(equation = var_578_equation_0, values = (var_488_cast_fp16_4, var_553_cast_fp16))[name = tensor("op_578_cast_fp16")]; tensor var_580_equation_0 = const()[name = tensor("op_580_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_580_cast_fp16 = einsum(equation = var_580_equation_0, values = (var_488_cast_fp16_5, var_554_cast_fp16))[name = tensor("op_580_cast_fp16")]; tensor var_582_equation_0 = const()[name = tensor("op_582_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_582_cast_fp16 = einsum(equation = var_582_equation_0, values = (var_488_cast_fp16_6, var_555_cast_fp16))[name = tensor("op_582_cast_fp16")]; tensor var_584_equation_0 = const()[name = tensor("op_584_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_584_cast_fp16 = einsum(equation = var_584_equation_0, values = (var_488_cast_fp16_7, var_556_cast_fp16))[name = tensor("op_584_cast_fp16")]; tensor var_586_equation_0 = const()[name = tensor("op_586_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_586_cast_fp16 = einsum(equation = var_586_equation_0, values = (var_488_cast_fp16_8, var_557_cast_fp16))[name = tensor("op_586_cast_fp16")]; tensor var_588_equation_0 = const()[name = tensor("op_588_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_588_cast_fp16 = einsum(equation = var_588_equation_0, values = (var_488_cast_fp16_9, var_558_cast_fp16))[name = tensor("op_588_cast_fp16")]; tensor var_590_equation_0 = const()[name = tensor("op_590_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_590_cast_fp16 = einsum(equation = var_590_equation_0, values = (var_488_cast_fp16_10, var_559_cast_fp16))[name = tensor("op_590_cast_fp16")]; tensor var_592_equation_0 = const()[name = tensor("op_592_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_592_cast_fp16 = einsum(equation = var_592_equation_0, values = (var_488_cast_fp16_11, var_560_cast_fp16))[name = tensor("op_592_cast_fp16")]; tensor var_594_equation_0 = const()[name = tensor("op_594_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_594_cast_fp16 = einsum(equation = var_594_equation_0, values = (var_488_cast_fp16_12, var_561_cast_fp16))[name = tensor("op_594_cast_fp16")]; tensor var_596_equation_0 = const()[name = tensor("op_596_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_596_cast_fp16 = einsum(equation = var_596_equation_0, values = (var_488_cast_fp16_13, var_562_cast_fp16))[name = tensor("op_596_cast_fp16")]; tensor var_598_equation_0 = const()[name = tensor("op_598_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_598_cast_fp16 = einsum(equation = var_598_equation_0, values = (var_488_cast_fp16_14, var_563_cast_fp16))[name = tensor("op_598_cast_fp16")]; tensor var_600_equation_0 = const()[name = tensor("op_600_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_600_cast_fp16 = einsum(equation = var_600_equation_0, values = (var_488_cast_fp16_15, var_564_cast_fp16))[name = tensor("op_600_cast_fp16")]; tensor var_602_equation_0 = const()[name = tensor("op_602_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_602_cast_fp16 = einsum(equation = var_602_equation_0, values = (var_488_cast_fp16_16, var_565_cast_fp16))[name = tensor("op_602_cast_fp16")]; tensor var_604_equation_0 = const()[name = tensor("op_604_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_604_cast_fp16 = einsum(equation = var_604_equation_0, values = (var_488_cast_fp16_17, var_566_cast_fp16))[name = tensor("op_604_cast_fp16")]; tensor var_606_equation_0 = const()[name = tensor("op_606_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_606_cast_fp16 = einsum(equation = var_606_equation_0, values = (var_488_cast_fp16_18, var_567_cast_fp16))[name = tensor("op_606_cast_fp16")]; tensor var_608_equation_0 = const()[name = tensor("op_608_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_608_cast_fp16 = einsum(equation = var_608_equation_0, values = (var_488_cast_fp16_19, var_568_cast_fp16))[name = tensor("op_608_cast_fp16")]; tensor input_15_interleave_0 = const()[name = tensor("input_15_interleave_0"), val = tensor(false)]; tensor input_15_cast_fp16 = concat(axis = var_393, interleave = input_15_interleave_0, values = (var_570_cast_fp16, var_572_cast_fp16, var_574_cast_fp16, var_576_cast_fp16, var_578_cast_fp16, var_580_cast_fp16, var_582_cast_fp16, var_584_cast_fp16, var_586_cast_fp16, var_588_cast_fp16, var_590_cast_fp16, var_592_cast_fp16, var_594_cast_fp16, var_596_cast_fp16, var_598_cast_fp16, var_600_cast_fp16, var_602_cast_fp16, var_604_cast_fp16, var_606_cast_fp16, var_608_cast_fp16))[name = tensor("input_15_cast_fp16")]; tensor var_617_pad_type_0 = const()[name = tensor("op_617_pad_type_0"), val = tensor("valid")]; tensor var_617_strides_0 = const()[name = tensor("op_617_strides_0"), val = tensor([1, 1])]; tensor var_617_pad_0 = const()[name = tensor("op_617_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_617_dilations_0 = const()[name = tensor("op_617_dilations_0"), val = tensor([1, 1])]; tensor var_617_groups_0 = const()[name = tensor("op_617_groups_0"), val = tensor(1)]; tensor blocks_1_attn_out_weight_to_fp16 = const()[name = tensor("blocks_1_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63853312)))]; tensor blocks_1_attn_out_bias_to_fp16 = const()[name = tensor("blocks_1_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67130176)))]; tensor var_617_cast_fp16 = conv(bias = blocks_1_attn_out_bias_to_fp16, dilations = var_617_dilations_0, groups = var_617_groups_0, pad = var_617_pad_0, pad_type = var_617_pad_type_0, strides = var_617_strides_0, weight = blocks_1_attn_out_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("op_617_cast_fp16")]; tensor inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = var_617_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; tensor input_17_axes_0 = const()[name = tensor("input_17_axes_0"), val = tensor([1])]; tensor input_17_gamma_0_to_fp16 = const()[name = tensor("input_17_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67132800)))]; tensor input_17_beta_0_to_fp16 = const()[name = tensor("input_17_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67135424)))]; tensor var_627_to_fp16 = const()[name = tensor("op_627_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_17_cast_fp16 = layer_norm(axes = input_17_axes_0, beta = input_17_beta_0_to_fp16, epsilon = var_627_to_fp16, gamma = input_17_gamma_0_to_fp16, x = inputs_7_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input_19_pad_type_0 = const()[name = tensor("input_19_pad_type_0"), val = tensor("valid")]; tensor input_19_strides_0 = const()[name = tensor("input_19_strides_0"), val = tensor([1, 1])]; tensor input_19_pad_0 = const()[name = tensor("input_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_19_dilations_0 = const()[name = tensor("input_19_dilations_0"), val = tensor([1, 1])]; tensor input_19_groups_0 = const()[name = tensor("input_19_groups_0"), val = tensor(1)]; tensor blocks_1_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67138048)))]; tensor blocks_1_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80245312)))]; tensor input_19_cast_fp16 = conv(bias = blocks_1_mlp_0_bias_to_fp16, dilations = input_19_dilations_0, groups = input_19_groups_0, pad = input_19_pad_0, pad_type = input_19_pad_type_0, strides = input_19_strides_0, weight = blocks_1_mlp_0_weight_to_fp16, x = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor input_21_mode_0 = const()[name = tensor("input_21_mode_0"), val = tensor("EXACT")]; tensor input_21_cast_fp16 = gelu(mode = input_21_mode_0, x = input_19_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor var_653_pad_type_0 = const()[name = tensor("op_653_pad_type_0"), val = tensor("valid")]; tensor var_653_strides_0 = const()[name = tensor("op_653_strides_0"), val = tensor([1, 1])]; tensor var_653_pad_0 = const()[name = tensor("op_653_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_653_dilations_0 = const()[name = tensor("op_653_dilations_0"), val = tensor([1, 1])]; tensor var_653_groups_0 = const()[name = tensor("op_653_groups_0"), val = tensor(1)]; tensor blocks_1_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80255616)))]; tensor blocks_1_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93362880)))]; tensor var_653_cast_fp16 = conv(bias = blocks_1_mlp_2_bias_to_fp16, dilations = var_653_dilations_0, groups = var_653_groups_0, pad = var_653_pad_0, pad_type = var_653_pad_type_0, strides = var_653_strides_0, weight = blocks_1_mlp_2_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("op_653_cast_fp16")]; tensor inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = var_653_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; tensor var_662 = const()[name = tensor("op_662"), val = tensor(1)]; tensor input_23_axes_0 = const()[name = tensor("input_23_axes_0"), val = tensor([1])]; tensor input_23_gamma_0_to_fp16 = const()[name = tensor("input_23_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93365504)))]; tensor input_23_beta_0_to_fp16 = const()[name = tensor("input_23_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93368128)))]; tensor var_678_to_fp16 = const()[name = tensor("op_678_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_23_cast_fp16 = layer_norm(axes = input_23_axes_0, beta = input_23_beta_0_to_fp16, epsilon = var_678_to_fp16, gamma = input_23_gamma_0_to_fp16, x = inputs_9_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor q_5_pad_type_0 = const()[name = tensor("q_5_pad_type_0"), val = tensor("valid")]; tensor q_5_strides_0 = const()[name = tensor("q_5_strides_0"), val = tensor([1, 1])]; tensor q_5_pad_0 = const()[name = tensor("q_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_5_dilations_0 = const()[name = tensor("q_5_dilations_0"), val = tensor([1, 1])]; tensor q_5_groups_0 = const()[name = tensor("q_5_groups_0"), val = tensor(1)]; tensor var_713_weight_0_to_fp16 = const()[name = tensor("op_713_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93370752)))]; tensor var_713_bias_0_to_fp16 = const()[name = tensor("op_713_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96647616)))]; tensor var_713_cast_fp16 = conv(bias = var_713_bias_0_to_fp16, dilations = q_5_dilations_0, groups = q_5_groups_0, pad = q_5_pad_0, pad_type = q_5_pad_type_0, strides = q_5_strides_0, weight = var_713_weight_0_to_fp16, x = input_23_cast_fp16)[name = tensor("op_713_cast_fp16")]; tensor k_5_pad_type_0 = const()[name = tensor("k_5_pad_type_0"), val = tensor("valid")]; tensor k_5_strides_0 = const()[name = tensor("k_5_strides_0"), val = tensor([1, 1])]; tensor k_5_pad_0 = const()[name = tensor("k_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_5_dilations_0 = const()[name = tensor("k_5_dilations_0"), val = tensor([1, 1])]; tensor k_5_groups_0 = const()[name = tensor("k_5_groups_0"), val = tensor(1)]; tensor blocks_2_attn_key_weight_to_fp16 = const()[name = tensor("blocks_2_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(96650240)))]; tensor k_5_cast_fp16 = conv(dilations = k_5_dilations_0, groups = k_5_groups_0, pad = k_5_pad_0, pad_type = k_5_pad_type_0, strides = k_5_strides_0, weight = blocks_2_attn_key_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("k_5_cast_fp16")]; tensor var_711_pad_type_0 = const()[name = tensor("op_711_pad_type_0"), val = tensor("valid")]; tensor var_711_strides_0 = const()[name = tensor("op_711_strides_0"), val = tensor([1, 1])]; tensor var_711_pad_0 = const()[name = tensor("op_711_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_711_dilations_0 = const()[name = tensor("op_711_dilations_0"), val = tensor([1, 1])]; tensor var_711_groups_0 = const()[name = tensor("op_711_groups_0"), val = tensor(1)]; tensor blocks_2_attn_value_weight_to_fp16 = const()[name = tensor("blocks_2_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(99927104)))]; tensor blocks_2_attn_value_bias_to_fp16 = const()[name = tensor("blocks_2_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103203968)))]; tensor var_711_cast_fp16 = conv(bias = blocks_2_attn_value_bias_to_fp16, dilations = var_711_dilations_0, groups = var_711_groups_0, pad = var_711_pad_0, pad_type = var_711_pad_type_0, strides = var_711_strides_0, weight = blocks_2_attn_value_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("op_711_cast_fp16")]; tensor tile_6 = const()[name = tensor("tile_6"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_714_axis_0 = const()[name = tensor("op_714_axis_0"), val = tensor(1)]; tensor var_714_cast_fp16_0, tensor var_714_cast_fp16_1, tensor var_714_cast_fp16_2, tensor var_714_cast_fp16_3, tensor var_714_cast_fp16_4, tensor var_714_cast_fp16_5, tensor var_714_cast_fp16_6, tensor var_714_cast_fp16_7, tensor var_714_cast_fp16_8, tensor var_714_cast_fp16_9, tensor var_714_cast_fp16_10, tensor var_714_cast_fp16_11, tensor var_714_cast_fp16_12, tensor var_714_cast_fp16_13, tensor var_714_cast_fp16_14, tensor var_714_cast_fp16_15, tensor var_714_cast_fp16_16, tensor var_714_cast_fp16_17, tensor var_714_cast_fp16_18, tensor var_714_cast_fp16_19 = split(axis = var_714_axis_0, split_sizes = tile_6, x = var_713_cast_fp16)[name = tensor("op_714_cast_fp16")]; tensor var_735_perm_0 = const()[name = tensor("op_735_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_7 = const()[name = tensor("tile_7"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_736_axis_0 = const()[name = tensor("op_736_axis_0"), val = tensor(3)]; tensor var_735_cast_fp16 = transpose(perm = var_735_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_30")]; tensor var_736_cast_fp16_0, tensor var_736_cast_fp16_1, tensor var_736_cast_fp16_2, tensor var_736_cast_fp16_3, tensor var_736_cast_fp16_4, tensor var_736_cast_fp16_5, tensor var_736_cast_fp16_6, tensor var_736_cast_fp16_7, tensor var_736_cast_fp16_8, tensor var_736_cast_fp16_9, tensor var_736_cast_fp16_10, tensor var_736_cast_fp16_11, tensor var_736_cast_fp16_12, tensor var_736_cast_fp16_13, tensor var_736_cast_fp16_14, tensor var_736_cast_fp16_15, tensor var_736_cast_fp16_16, tensor var_736_cast_fp16_17, tensor var_736_cast_fp16_18, tensor var_736_cast_fp16_19 = split(axis = var_736_axis_0, split_sizes = tile_7, x = var_735_cast_fp16)[name = tensor("op_736_cast_fp16")]; tensor tile_8 = const()[name = tensor("tile_8"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_757_axis_0 = const()[name = tensor("op_757_axis_0"), val = tensor(1)]; tensor var_757_cast_fp16_0, tensor var_757_cast_fp16_1, tensor var_757_cast_fp16_2, tensor var_757_cast_fp16_3, tensor var_757_cast_fp16_4, tensor var_757_cast_fp16_5, tensor var_757_cast_fp16_6, tensor var_757_cast_fp16_7, tensor var_757_cast_fp16_8, tensor var_757_cast_fp16_9, tensor var_757_cast_fp16_10, tensor var_757_cast_fp16_11, tensor var_757_cast_fp16_12, tensor var_757_cast_fp16_13, tensor var_757_cast_fp16_14, tensor var_757_cast_fp16_15, tensor var_757_cast_fp16_16, tensor var_757_cast_fp16_17, tensor var_757_cast_fp16_18, tensor var_757_cast_fp16_19 = split(axis = var_757_axis_0, split_sizes = tile_8, x = var_711_cast_fp16)[name = tensor("op_757_cast_fp16")]; tensor aw_81_equation_0 = const()[name = tensor("aw_81_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_81_cast_fp16 = einsum(equation = aw_81_equation_0, values = (var_736_cast_fp16_0, var_714_cast_fp16_0))[name = tensor("aw_81_cast_fp16")]; tensor aw_83_equation_0 = const()[name = tensor("aw_83_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_83_cast_fp16 = einsum(equation = aw_83_equation_0, values = (var_736_cast_fp16_1, var_714_cast_fp16_1))[name = tensor("aw_83_cast_fp16")]; tensor aw_85_equation_0 = const()[name = tensor("aw_85_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_85_cast_fp16 = einsum(equation = aw_85_equation_0, values = (var_736_cast_fp16_2, var_714_cast_fp16_2))[name = tensor("aw_85_cast_fp16")]; tensor aw_87_equation_0 = const()[name = tensor("aw_87_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_87_cast_fp16 = einsum(equation = aw_87_equation_0, values = (var_736_cast_fp16_3, var_714_cast_fp16_3))[name = tensor("aw_87_cast_fp16")]; tensor aw_89_equation_0 = const()[name = tensor("aw_89_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_89_cast_fp16 = einsum(equation = aw_89_equation_0, values = (var_736_cast_fp16_4, var_714_cast_fp16_4))[name = tensor("aw_89_cast_fp16")]; tensor aw_91_equation_0 = const()[name = tensor("aw_91_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_91_cast_fp16 = einsum(equation = aw_91_equation_0, values = (var_736_cast_fp16_5, var_714_cast_fp16_5))[name = tensor("aw_91_cast_fp16")]; tensor aw_93_equation_0 = const()[name = tensor("aw_93_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_93_cast_fp16 = einsum(equation = aw_93_equation_0, values = (var_736_cast_fp16_6, var_714_cast_fp16_6))[name = tensor("aw_93_cast_fp16")]; tensor aw_95_equation_0 = const()[name = tensor("aw_95_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_95_cast_fp16 = einsum(equation = aw_95_equation_0, values = (var_736_cast_fp16_7, var_714_cast_fp16_7))[name = tensor("aw_95_cast_fp16")]; tensor aw_97_equation_0 = const()[name = tensor("aw_97_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_97_cast_fp16 = einsum(equation = aw_97_equation_0, values = (var_736_cast_fp16_8, var_714_cast_fp16_8))[name = tensor("aw_97_cast_fp16")]; tensor aw_99_equation_0 = const()[name = tensor("aw_99_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_99_cast_fp16 = einsum(equation = aw_99_equation_0, values = (var_736_cast_fp16_9, var_714_cast_fp16_9))[name = tensor("aw_99_cast_fp16")]; tensor aw_101_equation_0 = const()[name = tensor("aw_101_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_101_cast_fp16 = einsum(equation = aw_101_equation_0, values = (var_736_cast_fp16_10, var_714_cast_fp16_10))[name = tensor("aw_101_cast_fp16")]; tensor aw_103_equation_0 = const()[name = tensor("aw_103_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_103_cast_fp16 = einsum(equation = aw_103_equation_0, values = (var_736_cast_fp16_11, var_714_cast_fp16_11))[name = tensor("aw_103_cast_fp16")]; tensor aw_105_equation_0 = const()[name = tensor("aw_105_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_105_cast_fp16 = einsum(equation = aw_105_equation_0, values = (var_736_cast_fp16_12, var_714_cast_fp16_12))[name = tensor("aw_105_cast_fp16")]; tensor aw_107_equation_0 = const()[name = tensor("aw_107_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_107_cast_fp16 = einsum(equation = aw_107_equation_0, values = (var_736_cast_fp16_13, var_714_cast_fp16_13))[name = tensor("aw_107_cast_fp16")]; tensor aw_109_equation_0 = const()[name = tensor("aw_109_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_109_cast_fp16 = einsum(equation = aw_109_equation_0, values = (var_736_cast_fp16_14, var_714_cast_fp16_14))[name = tensor("aw_109_cast_fp16")]; tensor aw_111_equation_0 = const()[name = tensor("aw_111_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_111_cast_fp16 = einsum(equation = aw_111_equation_0, values = (var_736_cast_fp16_15, var_714_cast_fp16_15))[name = tensor("aw_111_cast_fp16")]; tensor aw_113_equation_0 = const()[name = tensor("aw_113_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_113_cast_fp16 = einsum(equation = aw_113_equation_0, values = (var_736_cast_fp16_16, var_714_cast_fp16_16))[name = tensor("aw_113_cast_fp16")]; tensor aw_115_equation_0 = const()[name = tensor("aw_115_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_115_cast_fp16 = einsum(equation = aw_115_equation_0, values = (var_736_cast_fp16_17, var_714_cast_fp16_17))[name = tensor("aw_115_cast_fp16")]; tensor aw_117_equation_0 = const()[name = tensor("aw_117_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_117_cast_fp16 = einsum(equation = aw_117_equation_0, values = (var_736_cast_fp16_18, var_714_cast_fp16_18))[name = tensor("aw_117_cast_fp16")]; tensor aw_119_equation_0 = const()[name = tensor("aw_119_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_119_cast_fp16 = einsum(equation = aw_119_equation_0, values = (var_736_cast_fp16_19, var_714_cast_fp16_19))[name = tensor("aw_119_cast_fp16")]; tensor var_818_cast_fp16 = softmax(axis = var_662, x = aw_81_cast_fp16)[name = tensor("op_818_cast_fp16")]; tensor var_819_cast_fp16 = softmax(axis = var_662, x = aw_83_cast_fp16)[name = tensor("op_819_cast_fp16")]; tensor var_820_cast_fp16 = softmax(axis = var_662, x = aw_85_cast_fp16)[name = tensor("op_820_cast_fp16")]; tensor var_821_cast_fp16 = softmax(axis = var_662, x = aw_87_cast_fp16)[name = tensor("op_821_cast_fp16")]; tensor var_822_cast_fp16 = softmax(axis = var_662, x = aw_89_cast_fp16)[name = tensor("op_822_cast_fp16")]; tensor var_823_cast_fp16 = softmax(axis = var_662, x = aw_91_cast_fp16)[name = tensor("op_823_cast_fp16")]; tensor var_824_cast_fp16 = softmax(axis = var_662, x = aw_93_cast_fp16)[name = tensor("op_824_cast_fp16")]; tensor var_825_cast_fp16 = softmax(axis = var_662, x = aw_95_cast_fp16)[name = tensor("op_825_cast_fp16")]; tensor var_826_cast_fp16 = softmax(axis = var_662, x = aw_97_cast_fp16)[name = tensor("op_826_cast_fp16")]; tensor var_827_cast_fp16 = softmax(axis = var_662, x = aw_99_cast_fp16)[name = tensor("op_827_cast_fp16")]; tensor var_828_cast_fp16 = softmax(axis = var_662, x = aw_101_cast_fp16)[name = tensor("op_828_cast_fp16")]; tensor var_829_cast_fp16 = softmax(axis = var_662, x = aw_103_cast_fp16)[name = tensor("op_829_cast_fp16")]; tensor var_830_cast_fp16 = softmax(axis = var_662, x = aw_105_cast_fp16)[name = tensor("op_830_cast_fp16")]; tensor var_831_cast_fp16 = softmax(axis = var_662, x = aw_107_cast_fp16)[name = tensor("op_831_cast_fp16")]; tensor var_832_cast_fp16 = softmax(axis = var_662, x = aw_109_cast_fp16)[name = tensor("op_832_cast_fp16")]; tensor var_833_cast_fp16 = softmax(axis = var_662, x = aw_111_cast_fp16)[name = tensor("op_833_cast_fp16")]; tensor var_834_cast_fp16 = softmax(axis = var_662, x = aw_113_cast_fp16)[name = tensor("op_834_cast_fp16")]; tensor var_835_cast_fp16 = softmax(axis = var_662, x = aw_115_cast_fp16)[name = tensor("op_835_cast_fp16")]; tensor var_836_cast_fp16 = softmax(axis = var_662, x = aw_117_cast_fp16)[name = tensor("op_836_cast_fp16")]; tensor var_837_cast_fp16 = softmax(axis = var_662, x = aw_119_cast_fp16)[name = tensor("op_837_cast_fp16")]; tensor var_839_equation_0 = const()[name = tensor("op_839_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_839_cast_fp16 = einsum(equation = var_839_equation_0, values = (var_757_cast_fp16_0, var_818_cast_fp16))[name = tensor("op_839_cast_fp16")]; tensor var_841_equation_0 = const()[name = tensor("op_841_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_841_cast_fp16 = einsum(equation = var_841_equation_0, values = (var_757_cast_fp16_1, var_819_cast_fp16))[name = tensor("op_841_cast_fp16")]; tensor var_843_equation_0 = const()[name = tensor("op_843_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_843_cast_fp16 = einsum(equation = var_843_equation_0, values = (var_757_cast_fp16_2, var_820_cast_fp16))[name = tensor("op_843_cast_fp16")]; tensor var_845_equation_0 = const()[name = tensor("op_845_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_845_cast_fp16 = einsum(equation = var_845_equation_0, values = (var_757_cast_fp16_3, var_821_cast_fp16))[name = tensor("op_845_cast_fp16")]; tensor var_847_equation_0 = const()[name = tensor("op_847_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_847_cast_fp16 = einsum(equation = var_847_equation_0, values = (var_757_cast_fp16_4, var_822_cast_fp16))[name = tensor("op_847_cast_fp16")]; tensor var_849_equation_0 = const()[name = tensor("op_849_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_849_cast_fp16 = einsum(equation = var_849_equation_0, values = (var_757_cast_fp16_5, var_823_cast_fp16))[name = tensor("op_849_cast_fp16")]; tensor var_851_equation_0 = const()[name = tensor("op_851_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_851_cast_fp16 = einsum(equation = var_851_equation_0, values = (var_757_cast_fp16_6, var_824_cast_fp16))[name = tensor("op_851_cast_fp16")]; tensor var_853_equation_0 = const()[name = tensor("op_853_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_853_cast_fp16 = einsum(equation = var_853_equation_0, values = (var_757_cast_fp16_7, var_825_cast_fp16))[name = tensor("op_853_cast_fp16")]; tensor var_855_equation_0 = const()[name = tensor("op_855_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_855_cast_fp16 = einsum(equation = var_855_equation_0, values = (var_757_cast_fp16_8, var_826_cast_fp16))[name = tensor("op_855_cast_fp16")]; tensor var_857_equation_0 = const()[name = tensor("op_857_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_857_cast_fp16 = einsum(equation = var_857_equation_0, values = (var_757_cast_fp16_9, var_827_cast_fp16))[name = tensor("op_857_cast_fp16")]; tensor var_859_equation_0 = const()[name = tensor("op_859_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_859_cast_fp16 = einsum(equation = var_859_equation_0, values = (var_757_cast_fp16_10, var_828_cast_fp16))[name = tensor("op_859_cast_fp16")]; tensor var_861_equation_0 = const()[name = tensor("op_861_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_861_cast_fp16 = einsum(equation = var_861_equation_0, values = (var_757_cast_fp16_11, var_829_cast_fp16))[name = tensor("op_861_cast_fp16")]; tensor var_863_equation_0 = const()[name = tensor("op_863_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_863_cast_fp16 = einsum(equation = var_863_equation_0, values = (var_757_cast_fp16_12, var_830_cast_fp16))[name = tensor("op_863_cast_fp16")]; tensor var_865_equation_0 = const()[name = tensor("op_865_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_865_cast_fp16 = einsum(equation = var_865_equation_0, values = (var_757_cast_fp16_13, var_831_cast_fp16))[name = tensor("op_865_cast_fp16")]; tensor var_867_equation_0 = const()[name = tensor("op_867_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_867_cast_fp16 = einsum(equation = var_867_equation_0, values = (var_757_cast_fp16_14, var_832_cast_fp16))[name = tensor("op_867_cast_fp16")]; tensor var_869_equation_0 = const()[name = tensor("op_869_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_869_cast_fp16 = einsum(equation = var_869_equation_0, values = (var_757_cast_fp16_15, var_833_cast_fp16))[name = tensor("op_869_cast_fp16")]; tensor var_871_equation_0 = const()[name = tensor("op_871_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_871_cast_fp16 = einsum(equation = var_871_equation_0, values = (var_757_cast_fp16_16, var_834_cast_fp16))[name = tensor("op_871_cast_fp16")]; tensor var_873_equation_0 = const()[name = tensor("op_873_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_873_cast_fp16 = einsum(equation = var_873_equation_0, values = (var_757_cast_fp16_17, var_835_cast_fp16))[name = tensor("op_873_cast_fp16")]; tensor var_875_equation_0 = const()[name = tensor("op_875_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_875_cast_fp16 = einsum(equation = var_875_equation_0, values = (var_757_cast_fp16_18, var_836_cast_fp16))[name = tensor("op_875_cast_fp16")]; tensor var_877_equation_0 = const()[name = tensor("op_877_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_877_cast_fp16 = einsum(equation = var_877_equation_0, values = (var_757_cast_fp16_19, var_837_cast_fp16))[name = tensor("op_877_cast_fp16")]; tensor input_25_interleave_0 = const()[name = tensor("input_25_interleave_0"), val = tensor(false)]; tensor input_25_cast_fp16 = concat(axis = var_662, interleave = input_25_interleave_0, values = (var_839_cast_fp16, var_841_cast_fp16, var_843_cast_fp16, var_845_cast_fp16, var_847_cast_fp16, var_849_cast_fp16, var_851_cast_fp16, var_853_cast_fp16, var_855_cast_fp16, var_857_cast_fp16, var_859_cast_fp16, var_861_cast_fp16, var_863_cast_fp16, var_865_cast_fp16, var_867_cast_fp16, var_869_cast_fp16, var_871_cast_fp16, var_873_cast_fp16, var_875_cast_fp16, var_877_cast_fp16))[name = tensor("input_25_cast_fp16")]; tensor var_886_pad_type_0 = const()[name = tensor("op_886_pad_type_0"), val = tensor("valid")]; tensor var_886_strides_0 = const()[name = tensor("op_886_strides_0"), val = tensor([1, 1])]; tensor var_886_pad_0 = const()[name = tensor("op_886_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_886_dilations_0 = const()[name = tensor("op_886_dilations_0"), val = tensor([1, 1])]; tensor var_886_groups_0 = const()[name = tensor("op_886_groups_0"), val = tensor(1)]; tensor blocks_2_attn_out_weight_to_fp16 = const()[name = tensor("blocks_2_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(103206592)))]; tensor blocks_2_attn_out_bias_to_fp16 = const()[name = tensor("blocks_2_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106483456)))]; tensor var_886_cast_fp16 = conv(bias = blocks_2_attn_out_bias_to_fp16, dilations = var_886_dilations_0, groups = var_886_groups_0, pad = var_886_pad_0, pad_type = var_886_pad_type_0, strides = var_886_strides_0, weight = blocks_2_attn_out_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("op_886_cast_fp16")]; tensor inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = var_886_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; tensor input_27_axes_0 = const()[name = tensor("input_27_axes_0"), val = tensor([1])]; tensor input_27_gamma_0_to_fp16 = const()[name = tensor("input_27_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106486080)))]; tensor input_27_beta_0_to_fp16 = const()[name = tensor("input_27_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106488704)))]; tensor var_896_to_fp16 = const()[name = tensor("op_896_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_27_cast_fp16 = layer_norm(axes = input_27_axes_0, beta = input_27_beta_0_to_fp16, epsilon = var_896_to_fp16, gamma = input_27_gamma_0_to_fp16, x = inputs_11_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor input_29_pad_type_0 = const()[name = tensor("input_29_pad_type_0"), val = tensor("valid")]; tensor input_29_strides_0 = const()[name = tensor("input_29_strides_0"), val = tensor([1, 1])]; tensor input_29_pad_0 = const()[name = tensor("input_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_29_dilations_0 = const()[name = tensor("input_29_dilations_0"), val = tensor([1, 1])]; tensor input_29_groups_0 = const()[name = tensor("input_29_groups_0"), val = tensor(1)]; tensor blocks_2_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106491328)))]; tensor blocks_2_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119598592)))]; tensor input_29_cast_fp16 = conv(bias = blocks_2_mlp_0_bias_to_fp16, dilations = input_29_dilations_0, groups = input_29_groups_0, pad = input_29_pad_0, pad_type = input_29_pad_type_0, strides = input_29_strides_0, weight = blocks_2_mlp_0_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor input_31_mode_0 = const()[name = tensor("input_31_mode_0"), val = tensor("EXACT")]; tensor input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = input_29_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor var_922_pad_type_0 = const()[name = tensor("op_922_pad_type_0"), val = tensor("valid")]; tensor var_922_strides_0 = const()[name = tensor("op_922_strides_0"), val = tensor([1, 1])]; tensor var_922_pad_0 = const()[name = tensor("op_922_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_922_dilations_0 = const()[name = tensor("op_922_dilations_0"), val = tensor([1, 1])]; tensor var_922_groups_0 = const()[name = tensor("op_922_groups_0"), val = tensor(1)]; tensor blocks_2_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119608896)))]; tensor blocks_2_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132716160)))]; tensor var_922_cast_fp16 = conv(bias = blocks_2_mlp_2_bias_to_fp16, dilations = var_922_dilations_0, groups = var_922_groups_0, pad = var_922_pad_0, pad_type = var_922_pad_type_0, strides = var_922_strides_0, weight = blocks_2_mlp_2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("op_922_cast_fp16")]; tensor inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = var_922_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; tensor var_931 = const()[name = tensor("op_931"), val = tensor(1)]; tensor input_33_axes_0 = const()[name = tensor("input_33_axes_0"), val = tensor([1])]; tensor input_33_gamma_0_to_fp16 = const()[name = tensor("input_33_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132718784)))]; tensor input_33_beta_0_to_fp16 = const()[name = tensor("input_33_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132721408)))]; tensor var_947_to_fp16 = const()[name = tensor("op_947_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_33_cast_fp16 = layer_norm(axes = input_33_axes_0, beta = input_33_beta_0_to_fp16, epsilon = var_947_to_fp16, gamma = input_33_gamma_0_to_fp16, x = inputs_13_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor q_7_pad_type_0 = const()[name = tensor("q_7_pad_type_0"), val = tensor("valid")]; tensor q_7_strides_0 = const()[name = tensor("q_7_strides_0"), val = tensor([1, 1])]; tensor q_7_pad_0 = const()[name = tensor("q_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_7_dilations_0 = const()[name = tensor("q_7_dilations_0"), val = tensor([1, 1])]; tensor q_7_groups_0 = const()[name = tensor("q_7_groups_0"), val = tensor(1)]; tensor var_982_weight_0_to_fp16 = const()[name = tensor("op_982_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132724032)))]; tensor var_982_bias_0_to_fp16 = const()[name = tensor("op_982_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(136000896)))]; tensor var_982_cast_fp16 = conv(bias = var_982_bias_0_to_fp16, dilations = q_7_dilations_0, groups = q_7_groups_0, pad = q_7_pad_0, pad_type = q_7_pad_type_0, strides = q_7_strides_0, weight = var_982_weight_0_to_fp16, x = input_33_cast_fp16)[name = tensor("op_982_cast_fp16")]; tensor k_7_pad_type_0 = const()[name = tensor("k_7_pad_type_0"), val = tensor("valid")]; tensor k_7_strides_0 = const()[name = tensor("k_7_strides_0"), val = tensor([1, 1])]; tensor k_7_pad_0 = const()[name = tensor("k_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_7_dilations_0 = const()[name = tensor("k_7_dilations_0"), val = tensor([1, 1])]; tensor k_7_groups_0 = const()[name = tensor("k_7_groups_0"), val = tensor(1)]; tensor blocks_3_attn_key_weight_to_fp16 = const()[name = tensor("blocks_3_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(136003520)))]; tensor k_7_cast_fp16 = conv(dilations = k_7_dilations_0, groups = k_7_groups_0, pad = k_7_pad_0, pad_type = k_7_pad_type_0, strides = k_7_strides_0, weight = blocks_3_attn_key_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("k_7_cast_fp16")]; tensor var_980_pad_type_0 = const()[name = tensor("op_980_pad_type_0"), val = tensor("valid")]; tensor var_980_strides_0 = const()[name = tensor("op_980_strides_0"), val = tensor([1, 1])]; tensor var_980_pad_0 = const()[name = tensor("op_980_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_980_dilations_0 = const()[name = tensor("op_980_dilations_0"), val = tensor([1, 1])]; tensor var_980_groups_0 = const()[name = tensor("op_980_groups_0"), val = tensor(1)]; tensor blocks_3_attn_value_weight_to_fp16 = const()[name = tensor("blocks_3_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139280384)))]; tensor blocks_3_attn_value_bias_to_fp16 = const()[name = tensor("blocks_3_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142557248)))]; tensor var_980_cast_fp16 = conv(bias = blocks_3_attn_value_bias_to_fp16, dilations = var_980_dilations_0, groups = var_980_groups_0, pad = var_980_pad_0, pad_type = var_980_pad_type_0, strides = var_980_strides_0, weight = blocks_3_attn_value_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("op_980_cast_fp16")]; tensor tile_9 = const()[name = tensor("tile_9"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_983_axis_0 = const()[name = tensor("op_983_axis_0"), val = tensor(1)]; tensor var_983_cast_fp16_0, tensor var_983_cast_fp16_1, tensor var_983_cast_fp16_2, tensor var_983_cast_fp16_3, tensor var_983_cast_fp16_4, tensor var_983_cast_fp16_5, tensor var_983_cast_fp16_6, tensor var_983_cast_fp16_7, tensor var_983_cast_fp16_8, tensor var_983_cast_fp16_9, tensor var_983_cast_fp16_10, tensor var_983_cast_fp16_11, tensor var_983_cast_fp16_12, tensor var_983_cast_fp16_13, tensor var_983_cast_fp16_14, tensor var_983_cast_fp16_15, tensor var_983_cast_fp16_16, tensor var_983_cast_fp16_17, tensor var_983_cast_fp16_18, tensor var_983_cast_fp16_19 = split(axis = var_983_axis_0, split_sizes = tile_9, x = var_982_cast_fp16)[name = tensor("op_983_cast_fp16")]; tensor var_1004_perm_0 = const()[name = tensor("op_1004_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_10 = const()[name = tensor("tile_10"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1005_axis_0 = const()[name = tensor("op_1005_axis_0"), val = tensor(3)]; tensor var_1004_cast_fp16 = transpose(perm = var_1004_perm_0, x = k_7_cast_fp16)[name = tensor("transpose_29")]; tensor var_1005_cast_fp16_0, tensor var_1005_cast_fp16_1, tensor var_1005_cast_fp16_2, tensor var_1005_cast_fp16_3, tensor var_1005_cast_fp16_4, tensor var_1005_cast_fp16_5, tensor var_1005_cast_fp16_6, tensor var_1005_cast_fp16_7, tensor var_1005_cast_fp16_8, tensor var_1005_cast_fp16_9, tensor var_1005_cast_fp16_10, tensor var_1005_cast_fp16_11, tensor var_1005_cast_fp16_12, tensor var_1005_cast_fp16_13, tensor var_1005_cast_fp16_14, tensor var_1005_cast_fp16_15, tensor var_1005_cast_fp16_16, tensor var_1005_cast_fp16_17, tensor var_1005_cast_fp16_18, tensor var_1005_cast_fp16_19 = split(axis = var_1005_axis_0, split_sizes = tile_10, x = var_1004_cast_fp16)[name = tensor("op_1005_cast_fp16")]; tensor tile_11 = const()[name = tensor("tile_11"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1026_axis_0 = const()[name = tensor("op_1026_axis_0"), val = tensor(1)]; tensor var_1026_cast_fp16_0, tensor var_1026_cast_fp16_1, tensor var_1026_cast_fp16_2, tensor var_1026_cast_fp16_3, tensor var_1026_cast_fp16_4, tensor var_1026_cast_fp16_5, tensor var_1026_cast_fp16_6, tensor var_1026_cast_fp16_7, tensor var_1026_cast_fp16_8, tensor var_1026_cast_fp16_9, tensor var_1026_cast_fp16_10, tensor var_1026_cast_fp16_11, tensor var_1026_cast_fp16_12, tensor var_1026_cast_fp16_13, tensor var_1026_cast_fp16_14, tensor var_1026_cast_fp16_15, tensor var_1026_cast_fp16_16, tensor var_1026_cast_fp16_17, tensor var_1026_cast_fp16_18, tensor var_1026_cast_fp16_19 = split(axis = var_1026_axis_0, split_sizes = tile_11, x = var_980_cast_fp16)[name = tensor("op_1026_cast_fp16")]; tensor aw_121_equation_0 = const()[name = tensor("aw_121_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_121_cast_fp16 = einsum(equation = aw_121_equation_0, values = (var_1005_cast_fp16_0, var_983_cast_fp16_0))[name = tensor("aw_121_cast_fp16")]; tensor aw_123_equation_0 = const()[name = tensor("aw_123_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_123_cast_fp16 = einsum(equation = aw_123_equation_0, values = (var_1005_cast_fp16_1, var_983_cast_fp16_1))[name = tensor("aw_123_cast_fp16")]; tensor aw_125_equation_0 = const()[name = tensor("aw_125_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_125_cast_fp16 = einsum(equation = aw_125_equation_0, values = (var_1005_cast_fp16_2, var_983_cast_fp16_2))[name = tensor("aw_125_cast_fp16")]; tensor aw_127_equation_0 = const()[name = tensor("aw_127_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_127_cast_fp16 = einsum(equation = aw_127_equation_0, values = (var_1005_cast_fp16_3, var_983_cast_fp16_3))[name = tensor("aw_127_cast_fp16")]; tensor aw_129_equation_0 = const()[name = tensor("aw_129_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_129_cast_fp16 = einsum(equation = aw_129_equation_0, values = (var_1005_cast_fp16_4, var_983_cast_fp16_4))[name = tensor("aw_129_cast_fp16")]; tensor aw_131_equation_0 = const()[name = tensor("aw_131_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_131_cast_fp16 = einsum(equation = aw_131_equation_0, values = (var_1005_cast_fp16_5, var_983_cast_fp16_5))[name = tensor("aw_131_cast_fp16")]; tensor aw_133_equation_0 = const()[name = tensor("aw_133_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_133_cast_fp16 = einsum(equation = aw_133_equation_0, values = (var_1005_cast_fp16_6, var_983_cast_fp16_6))[name = tensor("aw_133_cast_fp16")]; tensor aw_135_equation_0 = const()[name = tensor("aw_135_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_135_cast_fp16 = einsum(equation = aw_135_equation_0, values = (var_1005_cast_fp16_7, var_983_cast_fp16_7))[name = tensor("aw_135_cast_fp16")]; tensor aw_137_equation_0 = const()[name = tensor("aw_137_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_137_cast_fp16 = einsum(equation = aw_137_equation_0, values = (var_1005_cast_fp16_8, var_983_cast_fp16_8))[name = tensor("aw_137_cast_fp16")]; tensor aw_139_equation_0 = const()[name = tensor("aw_139_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_139_cast_fp16 = einsum(equation = aw_139_equation_0, values = (var_1005_cast_fp16_9, var_983_cast_fp16_9))[name = tensor("aw_139_cast_fp16")]; tensor aw_141_equation_0 = const()[name = tensor("aw_141_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_141_cast_fp16 = einsum(equation = aw_141_equation_0, values = (var_1005_cast_fp16_10, var_983_cast_fp16_10))[name = tensor("aw_141_cast_fp16")]; tensor aw_143_equation_0 = const()[name = tensor("aw_143_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_143_cast_fp16 = einsum(equation = aw_143_equation_0, values = (var_1005_cast_fp16_11, var_983_cast_fp16_11))[name = tensor("aw_143_cast_fp16")]; tensor aw_145_equation_0 = const()[name = tensor("aw_145_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_145_cast_fp16 = einsum(equation = aw_145_equation_0, values = (var_1005_cast_fp16_12, var_983_cast_fp16_12))[name = tensor("aw_145_cast_fp16")]; tensor aw_147_equation_0 = const()[name = tensor("aw_147_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_147_cast_fp16 = einsum(equation = aw_147_equation_0, values = (var_1005_cast_fp16_13, var_983_cast_fp16_13))[name = tensor("aw_147_cast_fp16")]; tensor aw_149_equation_0 = const()[name = tensor("aw_149_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_149_cast_fp16 = einsum(equation = aw_149_equation_0, values = (var_1005_cast_fp16_14, var_983_cast_fp16_14))[name = tensor("aw_149_cast_fp16")]; tensor aw_151_equation_0 = const()[name = tensor("aw_151_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_151_cast_fp16 = einsum(equation = aw_151_equation_0, values = (var_1005_cast_fp16_15, var_983_cast_fp16_15))[name = tensor("aw_151_cast_fp16")]; tensor aw_153_equation_0 = const()[name = tensor("aw_153_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_153_cast_fp16 = einsum(equation = aw_153_equation_0, values = (var_1005_cast_fp16_16, var_983_cast_fp16_16))[name = tensor("aw_153_cast_fp16")]; tensor aw_155_equation_0 = const()[name = tensor("aw_155_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_155_cast_fp16 = einsum(equation = aw_155_equation_0, values = (var_1005_cast_fp16_17, var_983_cast_fp16_17))[name = tensor("aw_155_cast_fp16")]; tensor aw_157_equation_0 = const()[name = tensor("aw_157_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_157_cast_fp16 = einsum(equation = aw_157_equation_0, values = (var_1005_cast_fp16_18, var_983_cast_fp16_18))[name = tensor("aw_157_cast_fp16")]; tensor aw_159_equation_0 = const()[name = tensor("aw_159_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_159_cast_fp16 = einsum(equation = aw_159_equation_0, values = (var_1005_cast_fp16_19, var_983_cast_fp16_19))[name = tensor("aw_159_cast_fp16")]; tensor var_1087_cast_fp16 = softmax(axis = var_931, x = aw_121_cast_fp16)[name = tensor("op_1087_cast_fp16")]; tensor var_1088_cast_fp16 = softmax(axis = var_931, x = aw_123_cast_fp16)[name = tensor("op_1088_cast_fp16")]; tensor var_1089_cast_fp16 = softmax(axis = var_931, x = aw_125_cast_fp16)[name = tensor("op_1089_cast_fp16")]; tensor var_1090_cast_fp16 = softmax(axis = var_931, x = aw_127_cast_fp16)[name = tensor("op_1090_cast_fp16")]; tensor var_1091_cast_fp16 = softmax(axis = var_931, x = aw_129_cast_fp16)[name = tensor("op_1091_cast_fp16")]; tensor var_1092_cast_fp16 = softmax(axis = var_931, x = aw_131_cast_fp16)[name = tensor("op_1092_cast_fp16")]; tensor var_1093_cast_fp16 = softmax(axis = var_931, x = aw_133_cast_fp16)[name = tensor("op_1093_cast_fp16")]; tensor var_1094_cast_fp16 = softmax(axis = var_931, x = aw_135_cast_fp16)[name = tensor("op_1094_cast_fp16")]; tensor var_1095_cast_fp16 = softmax(axis = var_931, x = aw_137_cast_fp16)[name = tensor("op_1095_cast_fp16")]; tensor var_1096_cast_fp16 = softmax(axis = var_931, x = aw_139_cast_fp16)[name = tensor("op_1096_cast_fp16")]; tensor var_1097_cast_fp16 = softmax(axis = var_931, x = aw_141_cast_fp16)[name = tensor("op_1097_cast_fp16")]; tensor var_1098_cast_fp16 = softmax(axis = var_931, x = aw_143_cast_fp16)[name = tensor("op_1098_cast_fp16")]; tensor var_1099_cast_fp16 = softmax(axis = var_931, x = aw_145_cast_fp16)[name = tensor("op_1099_cast_fp16")]; tensor var_1100_cast_fp16 = softmax(axis = var_931, x = aw_147_cast_fp16)[name = tensor("op_1100_cast_fp16")]; tensor var_1101_cast_fp16 = softmax(axis = var_931, x = aw_149_cast_fp16)[name = tensor("op_1101_cast_fp16")]; tensor var_1102_cast_fp16 = softmax(axis = var_931, x = aw_151_cast_fp16)[name = tensor("op_1102_cast_fp16")]; tensor var_1103_cast_fp16 = softmax(axis = var_931, x = aw_153_cast_fp16)[name = tensor("op_1103_cast_fp16")]; tensor var_1104_cast_fp16 = softmax(axis = var_931, x = aw_155_cast_fp16)[name = tensor("op_1104_cast_fp16")]; tensor var_1105_cast_fp16 = softmax(axis = var_931, x = aw_157_cast_fp16)[name = tensor("op_1105_cast_fp16")]; tensor var_1106_cast_fp16 = softmax(axis = var_931, x = aw_159_cast_fp16)[name = tensor("op_1106_cast_fp16")]; tensor var_1108_equation_0 = const()[name = tensor("op_1108_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1108_cast_fp16 = einsum(equation = var_1108_equation_0, values = (var_1026_cast_fp16_0, var_1087_cast_fp16))[name = tensor("op_1108_cast_fp16")]; tensor var_1110_equation_0 = const()[name = tensor("op_1110_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1110_cast_fp16 = einsum(equation = var_1110_equation_0, values = (var_1026_cast_fp16_1, var_1088_cast_fp16))[name = tensor("op_1110_cast_fp16")]; tensor var_1112_equation_0 = const()[name = tensor("op_1112_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1112_cast_fp16 = einsum(equation = var_1112_equation_0, values = (var_1026_cast_fp16_2, var_1089_cast_fp16))[name = tensor("op_1112_cast_fp16")]; tensor var_1114_equation_0 = const()[name = tensor("op_1114_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1114_cast_fp16 = einsum(equation = var_1114_equation_0, values = (var_1026_cast_fp16_3, var_1090_cast_fp16))[name = tensor("op_1114_cast_fp16")]; tensor var_1116_equation_0 = const()[name = tensor("op_1116_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1116_cast_fp16 = einsum(equation = var_1116_equation_0, values = (var_1026_cast_fp16_4, var_1091_cast_fp16))[name = tensor("op_1116_cast_fp16")]; tensor var_1118_equation_0 = const()[name = tensor("op_1118_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1118_cast_fp16 = einsum(equation = var_1118_equation_0, values = (var_1026_cast_fp16_5, var_1092_cast_fp16))[name = tensor("op_1118_cast_fp16")]; tensor var_1120_equation_0 = const()[name = tensor("op_1120_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1120_cast_fp16 = einsum(equation = var_1120_equation_0, values = (var_1026_cast_fp16_6, var_1093_cast_fp16))[name = tensor("op_1120_cast_fp16")]; tensor var_1122_equation_0 = const()[name = tensor("op_1122_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1122_cast_fp16 = einsum(equation = var_1122_equation_0, values = (var_1026_cast_fp16_7, var_1094_cast_fp16))[name = tensor("op_1122_cast_fp16")]; tensor var_1124_equation_0 = const()[name = tensor("op_1124_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1124_cast_fp16 = einsum(equation = var_1124_equation_0, values = (var_1026_cast_fp16_8, var_1095_cast_fp16))[name = tensor("op_1124_cast_fp16")]; tensor var_1126_equation_0 = const()[name = tensor("op_1126_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1126_cast_fp16 = einsum(equation = var_1126_equation_0, values = (var_1026_cast_fp16_9, var_1096_cast_fp16))[name = tensor("op_1126_cast_fp16")]; tensor var_1128_equation_0 = const()[name = tensor("op_1128_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1128_cast_fp16 = einsum(equation = var_1128_equation_0, values = (var_1026_cast_fp16_10, var_1097_cast_fp16))[name = tensor("op_1128_cast_fp16")]; tensor var_1130_equation_0 = const()[name = tensor("op_1130_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1130_cast_fp16 = einsum(equation = var_1130_equation_0, values = (var_1026_cast_fp16_11, var_1098_cast_fp16))[name = tensor("op_1130_cast_fp16")]; tensor var_1132_equation_0 = const()[name = tensor("op_1132_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1132_cast_fp16 = einsum(equation = var_1132_equation_0, values = (var_1026_cast_fp16_12, var_1099_cast_fp16))[name = tensor("op_1132_cast_fp16")]; tensor var_1134_equation_0 = const()[name = tensor("op_1134_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1134_cast_fp16 = einsum(equation = var_1134_equation_0, values = (var_1026_cast_fp16_13, var_1100_cast_fp16))[name = tensor("op_1134_cast_fp16")]; tensor var_1136_equation_0 = const()[name = tensor("op_1136_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1136_cast_fp16 = einsum(equation = var_1136_equation_0, values = (var_1026_cast_fp16_14, var_1101_cast_fp16))[name = tensor("op_1136_cast_fp16")]; tensor var_1138_equation_0 = const()[name = tensor("op_1138_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1138_cast_fp16 = einsum(equation = var_1138_equation_0, values = (var_1026_cast_fp16_15, var_1102_cast_fp16))[name = tensor("op_1138_cast_fp16")]; tensor var_1140_equation_0 = const()[name = tensor("op_1140_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1140_cast_fp16 = einsum(equation = var_1140_equation_0, values = (var_1026_cast_fp16_16, var_1103_cast_fp16))[name = tensor("op_1140_cast_fp16")]; tensor var_1142_equation_0 = const()[name = tensor("op_1142_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1142_cast_fp16 = einsum(equation = var_1142_equation_0, values = (var_1026_cast_fp16_17, var_1104_cast_fp16))[name = tensor("op_1142_cast_fp16")]; tensor var_1144_equation_0 = const()[name = tensor("op_1144_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1144_cast_fp16 = einsum(equation = var_1144_equation_0, values = (var_1026_cast_fp16_18, var_1105_cast_fp16))[name = tensor("op_1144_cast_fp16")]; tensor var_1146_equation_0 = const()[name = tensor("op_1146_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1146_cast_fp16 = einsum(equation = var_1146_equation_0, values = (var_1026_cast_fp16_19, var_1106_cast_fp16))[name = tensor("op_1146_cast_fp16")]; tensor input_35_interleave_0 = const()[name = tensor("input_35_interleave_0"), val = tensor(false)]; tensor input_35_cast_fp16 = concat(axis = var_931, interleave = input_35_interleave_0, values = (var_1108_cast_fp16, var_1110_cast_fp16, var_1112_cast_fp16, var_1114_cast_fp16, var_1116_cast_fp16, var_1118_cast_fp16, var_1120_cast_fp16, var_1122_cast_fp16, var_1124_cast_fp16, var_1126_cast_fp16, var_1128_cast_fp16, var_1130_cast_fp16, var_1132_cast_fp16, var_1134_cast_fp16, var_1136_cast_fp16, var_1138_cast_fp16, var_1140_cast_fp16, var_1142_cast_fp16, var_1144_cast_fp16, var_1146_cast_fp16))[name = tensor("input_35_cast_fp16")]; tensor var_1155_pad_type_0 = const()[name = tensor("op_1155_pad_type_0"), val = tensor("valid")]; tensor var_1155_strides_0 = const()[name = tensor("op_1155_strides_0"), val = tensor([1, 1])]; tensor var_1155_pad_0 = const()[name = tensor("op_1155_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1155_dilations_0 = const()[name = tensor("op_1155_dilations_0"), val = tensor([1, 1])]; tensor var_1155_groups_0 = const()[name = tensor("op_1155_groups_0"), val = tensor(1)]; tensor blocks_3_attn_out_weight_to_fp16 = const()[name = tensor("blocks_3_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142559872)))]; tensor blocks_3_attn_out_bias_to_fp16 = const()[name = tensor("blocks_3_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145836736)))]; tensor var_1155_cast_fp16 = conv(bias = blocks_3_attn_out_bias_to_fp16, dilations = var_1155_dilations_0, groups = var_1155_groups_0, pad = var_1155_pad_0, pad_type = var_1155_pad_type_0, strides = var_1155_strides_0, weight = blocks_3_attn_out_weight_to_fp16, x = input_35_cast_fp16)[name = tensor("op_1155_cast_fp16")]; tensor inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = var_1155_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; tensor input_37_axes_0 = const()[name = tensor("input_37_axes_0"), val = tensor([1])]; tensor input_37_gamma_0_to_fp16 = const()[name = tensor("input_37_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145839360)))]; tensor input_37_beta_0_to_fp16 = const()[name = tensor("input_37_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145841984)))]; tensor var_1165_to_fp16 = const()[name = tensor("op_1165_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_37_cast_fp16 = layer_norm(axes = input_37_axes_0, beta = input_37_beta_0_to_fp16, epsilon = var_1165_to_fp16, gamma = input_37_gamma_0_to_fp16, x = inputs_15_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor input_39_pad_type_0 = const()[name = tensor("input_39_pad_type_0"), val = tensor("valid")]; tensor input_39_strides_0 = const()[name = tensor("input_39_strides_0"), val = tensor([1, 1])]; tensor input_39_pad_0 = const()[name = tensor("input_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_39_dilations_0 = const()[name = tensor("input_39_dilations_0"), val = tensor([1, 1])]; tensor input_39_groups_0 = const()[name = tensor("input_39_groups_0"), val = tensor(1)]; tensor blocks_3_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145844608)))]; tensor blocks_3_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158951872)))]; tensor input_39_cast_fp16 = conv(bias = blocks_3_mlp_0_bias_to_fp16, dilations = input_39_dilations_0, groups = input_39_groups_0, pad = input_39_pad_0, pad_type = input_39_pad_type_0, strides = input_39_strides_0, weight = blocks_3_mlp_0_weight_to_fp16, x = input_37_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor input_41_mode_0 = const()[name = tensor("input_41_mode_0"), val = tensor("EXACT")]; tensor input_41_cast_fp16 = gelu(mode = input_41_mode_0, x = input_39_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor var_1191_pad_type_0 = const()[name = tensor("op_1191_pad_type_0"), val = tensor("valid")]; tensor var_1191_strides_0 = const()[name = tensor("op_1191_strides_0"), val = tensor([1, 1])]; tensor var_1191_pad_0 = const()[name = tensor("op_1191_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1191_dilations_0 = const()[name = tensor("op_1191_dilations_0"), val = tensor([1, 1])]; tensor var_1191_groups_0 = const()[name = tensor("op_1191_groups_0"), val = tensor(1)]; tensor blocks_3_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158962176)))]; tensor blocks_3_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172069440)))]; tensor var_1191_cast_fp16 = conv(bias = blocks_3_mlp_2_bias_to_fp16, dilations = var_1191_dilations_0, groups = var_1191_groups_0, pad = var_1191_pad_0, pad_type = var_1191_pad_type_0, strides = var_1191_strides_0, weight = blocks_3_mlp_2_weight_to_fp16, x = input_41_cast_fp16)[name = tensor("op_1191_cast_fp16")]; tensor inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = var_1191_cast_fp16)[name = tensor("inputs_17_cast_fp16")]; tensor var_1200 = const()[name = tensor("op_1200"), val = tensor(1)]; tensor input_43_axes_0 = const()[name = tensor("input_43_axes_0"), val = tensor([1])]; tensor input_43_gamma_0_to_fp16 = const()[name = tensor("input_43_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172072064)))]; tensor input_43_beta_0_to_fp16 = const()[name = tensor("input_43_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172074688)))]; tensor var_1216_to_fp16 = const()[name = tensor("op_1216_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_43_cast_fp16 = layer_norm(axes = input_43_axes_0, beta = input_43_beta_0_to_fp16, epsilon = var_1216_to_fp16, gamma = input_43_gamma_0_to_fp16, x = inputs_17_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor q_9_pad_type_0 = const()[name = tensor("q_9_pad_type_0"), val = tensor("valid")]; tensor q_9_strides_0 = const()[name = tensor("q_9_strides_0"), val = tensor([1, 1])]; tensor q_9_pad_0 = const()[name = tensor("q_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_9_dilations_0 = const()[name = tensor("q_9_dilations_0"), val = tensor([1, 1])]; tensor q_9_groups_0 = const()[name = tensor("q_9_groups_0"), val = tensor(1)]; tensor var_1251_weight_0_to_fp16 = const()[name = tensor("op_1251_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172077312)))]; tensor var_1251_bias_0_to_fp16 = const()[name = tensor("op_1251_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175354176)))]; tensor var_1251_cast_fp16 = conv(bias = var_1251_bias_0_to_fp16, dilations = q_9_dilations_0, groups = q_9_groups_0, pad = q_9_pad_0, pad_type = q_9_pad_type_0, strides = q_9_strides_0, weight = var_1251_weight_0_to_fp16, x = input_43_cast_fp16)[name = tensor("op_1251_cast_fp16")]; tensor k_9_pad_type_0 = const()[name = tensor("k_9_pad_type_0"), val = tensor("valid")]; tensor k_9_strides_0 = const()[name = tensor("k_9_strides_0"), val = tensor([1, 1])]; tensor k_9_pad_0 = const()[name = tensor("k_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_9_dilations_0 = const()[name = tensor("k_9_dilations_0"), val = tensor([1, 1])]; tensor k_9_groups_0 = const()[name = tensor("k_9_groups_0"), val = tensor(1)]; tensor blocks_4_attn_key_weight_to_fp16 = const()[name = tensor("blocks_4_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(175356800)))]; tensor k_9_cast_fp16 = conv(dilations = k_9_dilations_0, groups = k_9_groups_0, pad = k_9_pad_0, pad_type = k_9_pad_type_0, strides = k_9_strides_0, weight = blocks_4_attn_key_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("k_9_cast_fp16")]; tensor var_1249_pad_type_0 = const()[name = tensor("op_1249_pad_type_0"), val = tensor("valid")]; tensor var_1249_strides_0 = const()[name = tensor("op_1249_strides_0"), val = tensor([1, 1])]; tensor var_1249_pad_0 = const()[name = tensor("op_1249_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1249_dilations_0 = const()[name = tensor("op_1249_dilations_0"), val = tensor([1, 1])]; tensor var_1249_groups_0 = const()[name = tensor("op_1249_groups_0"), val = tensor(1)]; tensor blocks_4_attn_value_weight_to_fp16 = const()[name = tensor("blocks_4_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178633664)))]; tensor blocks_4_attn_value_bias_to_fp16 = const()[name = tensor("blocks_4_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181910528)))]; tensor var_1249_cast_fp16 = conv(bias = blocks_4_attn_value_bias_to_fp16, dilations = var_1249_dilations_0, groups = var_1249_groups_0, pad = var_1249_pad_0, pad_type = var_1249_pad_type_0, strides = var_1249_strides_0, weight = blocks_4_attn_value_weight_to_fp16, x = input_43_cast_fp16)[name = tensor("op_1249_cast_fp16")]; tensor tile_12 = const()[name = tensor("tile_12"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1252_axis_0 = const()[name = tensor("op_1252_axis_0"), val = tensor(1)]; tensor var_1252_cast_fp16_0, tensor var_1252_cast_fp16_1, tensor var_1252_cast_fp16_2, tensor var_1252_cast_fp16_3, tensor var_1252_cast_fp16_4, tensor var_1252_cast_fp16_5, tensor var_1252_cast_fp16_6, tensor var_1252_cast_fp16_7, tensor var_1252_cast_fp16_8, tensor var_1252_cast_fp16_9, tensor var_1252_cast_fp16_10, tensor var_1252_cast_fp16_11, tensor var_1252_cast_fp16_12, tensor var_1252_cast_fp16_13, tensor var_1252_cast_fp16_14, tensor var_1252_cast_fp16_15, tensor var_1252_cast_fp16_16, tensor var_1252_cast_fp16_17, tensor var_1252_cast_fp16_18, tensor var_1252_cast_fp16_19 = split(axis = var_1252_axis_0, split_sizes = tile_12, x = var_1251_cast_fp16)[name = tensor("op_1252_cast_fp16")]; tensor var_1273_perm_0 = const()[name = tensor("op_1273_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_13 = const()[name = tensor("tile_13"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1274_axis_0 = const()[name = tensor("op_1274_axis_0"), val = tensor(3)]; tensor var_1273_cast_fp16 = transpose(perm = var_1273_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_28")]; tensor var_1274_cast_fp16_0, tensor var_1274_cast_fp16_1, tensor var_1274_cast_fp16_2, tensor var_1274_cast_fp16_3, tensor var_1274_cast_fp16_4, tensor var_1274_cast_fp16_5, tensor var_1274_cast_fp16_6, tensor var_1274_cast_fp16_7, tensor var_1274_cast_fp16_8, tensor var_1274_cast_fp16_9, tensor var_1274_cast_fp16_10, tensor var_1274_cast_fp16_11, tensor var_1274_cast_fp16_12, tensor var_1274_cast_fp16_13, tensor var_1274_cast_fp16_14, tensor var_1274_cast_fp16_15, tensor var_1274_cast_fp16_16, tensor var_1274_cast_fp16_17, tensor var_1274_cast_fp16_18, tensor var_1274_cast_fp16_19 = split(axis = var_1274_axis_0, split_sizes = tile_13, x = var_1273_cast_fp16)[name = tensor("op_1274_cast_fp16")]; tensor tile_14 = const()[name = tensor("tile_14"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1295_axis_0 = const()[name = tensor("op_1295_axis_0"), val = tensor(1)]; tensor var_1295_cast_fp16_0, tensor var_1295_cast_fp16_1, tensor var_1295_cast_fp16_2, tensor var_1295_cast_fp16_3, tensor var_1295_cast_fp16_4, tensor var_1295_cast_fp16_5, tensor var_1295_cast_fp16_6, tensor var_1295_cast_fp16_7, tensor var_1295_cast_fp16_8, tensor var_1295_cast_fp16_9, tensor var_1295_cast_fp16_10, tensor var_1295_cast_fp16_11, tensor var_1295_cast_fp16_12, tensor var_1295_cast_fp16_13, tensor var_1295_cast_fp16_14, tensor var_1295_cast_fp16_15, tensor var_1295_cast_fp16_16, tensor var_1295_cast_fp16_17, tensor var_1295_cast_fp16_18, tensor var_1295_cast_fp16_19 = split(axis = var_1295_axis_0, split_sizes = tile_14, x = var_1249_cast_fp16)[name = tensor("op_1295_cast_fp16")]; tensor aw_161_equation_0 = const()[name = tensor("aw_161_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_161_cast_fp16 = einsum(equation = aw_161_equation_0, values = (var_1274_cast_fp16_0, var_1252_cast_fp16_0))[name = tensor("aw_161_cast_fp16")]; tensor aw_163_equation_0 = const()[name = tensor("aw_163_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_163_cast_fp16 = einsum(equation = aw_163_equation_0, values = (var_1274_cast_fp16_1, var_1252_cast_fp16_1))[name = tensor("aw_163_cast_fp16")]; tensor aw_165_equation_0 = const()[name = tensor("aw_165_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_165_cast_fp16 = einsum(equation = aw_165_equation_0, values = (var_1274_cast_fp16_2, var_1252_cast_fp16_2))[name = tensor("aw_165_cast_fp16")]; tensor aw_167_equation_0 = const()[name = tensor("aw_167_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_167_cast_fp16 = einsum(equation = aw_167_equation_0, values = (var_1274_cast_fp16_3, var_1252_cast_fp16_3))[name = tensor("aw_167_cast_fp16")]; tensor aw_169_equation_0 = const()[name = tensor("aw_169_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_169_cast_fp16 = einsum(equation = aw_169_equation_0, values = (var_1274_cast_fp16_4, var_1252_cast_fp16_4))[name = tensor("aw_169_cast_fp16")]; tensor aw_171_equation_0 = const()[name = tensor("aw_171_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_171_cast_fp16 = einsum(equation = aw_171_equation_0, values = (var_1274_cast_fp16_5, var_1252_cast_fp16_5))[name = tensor("aw_171_cast_fp16")]; tensor aw_173_equation_0 = const()[name = tensor("aw_173_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_173_cast_fp16 = einsum(equation = aw_173_equation_0, values = (var_1274_cast_fp16_6, var_1252_cast_fp16_6))[name = tensor("aw_173_cast_fp16")]; tensor aw_175_equation_0 = const()[name = tensor("aw_175_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_175_cast_fp16 = einsum(equation = aw_175_equation_0, values = (var_1274_cast_fp16_7, var_1252_cast_fp16_7))[name = tensor("aw_175_cast_fp16")]; tensor aw_177_equation_0 = const()[name = tensor("aw_177_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_177_cast_fp16 = einsum(equation = aw_177_equation_0, values = (var_1274_cast_fp16_8, var_1252_cast_fp16_8))[name = tensor("aw_177_cast_fp16")]; tensor aw_179_equation_0 = const()[name = tensor("aw_179_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_179_cast_fp16 = einsum(equation = aw_179_equation_0, values = (var_1274_cast_fp16_9, var_1252_cast_fp16_9))[name = tensor("aw_179_cast_fp16")]; tensor aw_181_equation_0 = const()[name = tensor("aw_181_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_181_cast_fp16 = einsum(equation = aw_181_equation_0, values = (var_1274_cast_fp16_10, var_1252_cast_fp16_10))[name = tensor("aw_181_cast_fp16")]; tensor aw_183_equation_0 = const()[name = tensor("aw_183_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_183_cast_fp16 = einsum(equation = aw_183_equation_0, values = (var_1274_cast_fp16_11, var_1252_cast_fp16_11))[name = tensor("aw_183_cast_fp16")]; tensor aw_185_equation_0 = const()[name = tensor("aw_185_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_185_cast_fp16 = einsum(equation = aw_185_equation_0, values = (var_1274_cast_fp16_12, var_1252_cast_fp16_12))[name = tensor("aw_185_cast_fp16")]; tensor aw_187_equation_0 = const()[name = tensor("aw_187_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_187_cast_fp16 = einsum(equation = aw_187_equation_0, values = (var_1274_cast_fp16_13, var_1252_cast_fp16_13))[name = tensor("aw_187_cast_fp16")]; tensor aw_189_equation_0 = const()[name = tensor("aw_189_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_189_cast_fp16 = einsum(equation = aw_189_equation_0, values = (var_1274_cast_fp16_14, var_1252_cast_fp16_14))[name = tensor("aw_189_cast_fp16")]; tensor aw_191_equation_0 = const()[name = tensor("aw_191_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_191_cast_fp16 = einsum(equation = aw_191_equation_0, values = (var_1274_cast_fp16_15, var_1252_cast_fp16_15))[name = tensor("aw_191_cast_fp16")]; tensor aw_193_equation_0 = const()[name = tensor("aw_193_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_193_cast_fp16 = einsum(equation = aw_193_equation_0, values = (var_1274_cast_fp16_16, var_1252_cast_fp16_16))[name = tensor("aw_193_cast_fp16")]; tensor aw_195_equation_0 = const()[name = tensor("aw_195_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_195_cast_fp16 = einsum(equation = aw_195_equation_0, values = (var_1274_cast_fp16_17, var_1252_cast_fp16_17))[name = tensor("aw_195_cast_fp16")]; tensor aw_197_equation_0 = const()[name = tensor("aw_197_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_197_cast_fp16 = einsum(equation = aw_197_equation_0, values = (var_1274_cast_fp16_18, var_1252_cast_fp16_18))[name = tensor("aw_197_cast_fp16")]; tensor aw_199_equation_0 = const()[name = tensor("aw_199_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_199_cast_fp16 = einsum(equation = aw_199_equation_0, values = (var_1274_cast_fp16_19, var_1252_cast_fp16_19))[name = tensor("aw_199_cast_fp16")]; tensor var_1356_cast_fp16 = softmax(axis = var_1200, x = aw_161_cast_fp16)[name = tensor("op_1356_cast_fp16")]; tensor var_1357_cast_fp16 = softmax(axis = var_1200, x = aw_163_cast_fp16)[name = tensor("op_1357_cast_fp16")]; tensor var_1358_cast_fp16 = softmax(axis = var_1200, x = aw_165_cast_fp16)[name = tensor("op_1358_cast_fp16")]; tensor var_1359_cast_fp16 = softmax(axis = var_1200, x = aw_167_cast_fp16)[name = tensor("op_1359_cast_fp16")]; tensor var_1360_cast_fp16 = softmax(axis = var_1200, x = aw_169_cast_fp16)[name = tensor("op_1360_cast_fp16")]; tensor var_1361_cast_fp16 = softmax(axis = var_1200, x = aw_171_cast_fp16)[name = tensor("op_1361_cast_fp16")]; tensor var_1362_cast_fp16 = softmax(axis = var_1200, x = aw_173_cast_fp16)[name = tensor("op_1362_cast_fp16")]; tensor var_1363_cast_fp16 = softmax(axis = var_1200, x = aw_175_cast_fp16)[name = tensor("op_1363_cast_fp16")]; tensor var_1364_cast_fp16 = softmax(axis = var_1200, x = aw_177_cast_fp16)[name = tensor("op_1364_cast_fp16")]; tensor var_1365_cast_fp16 = softmax(axis = var_1200, x = aw_179_cast_fp16)[name = tensor("op_1365_cast_fp16")]; tensor var_1366_cast_fp16 = softmax(axis = var_1200, x = aw_181_cast_fp16)[name = tensor("op_1366_cast_fp16")]; tensor var_1367_cast_fp16 = softmax(axis = var_1200, x = aw_183_cast_fp16)[name = tensor("op_1367_cast_fp16")]; tensor var_1368_cast_fp16 = softmax(axis = var_1200, x = aw_185_cast_fp16)[name = tensor("op_1368_cast_fp16")]; tensor var_1369_cast_fp16 = softmax(axis = var_1200, x = aw_187_cast_fp16)[name = tensor("op_1369_cast_fp16")]; tensor var_1370_cast_fp16 = softmax(axis = var_1200, x = aw_189_cast_fp16)[name = tensor("op_1370_cast_fp16")]; tensor var_1371_cast_fp16 = softmax(axis = var_1200, x = aw_191_cast_fp16)[name = tensor("op_1371_cast_fp16")]; tensor var_1372_cast_fp16 = softmax(axis = var_1200, x = aw_193_cast_fp16)[name = tensor("op_1372_cast_fp16")]; tensor var_1373_cast_fp16 = softmax(axis = var_1200, x = aw_195_cast_fp16)[name = tensor("op_1373_cast_fp16")]; tensor var_1374_cast_fp16 = softmax(axis = var_1200, x = aw_197_cast_fp16)[name = tensor("op_1374_cast_fp16")]; tensor var_1375_cast_fp16 = softmax(axis = var_1200, x = aw_199_cast_fp16)[name = tensor("op_1375_cast_fp16")]; tensor var_1377_equation_0 = const()[name = tensor("op_1377_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1377_cast_fp16 = einsum(equation = var_1377_equation_0, values = (var_1295_cast_fp16_0, var_1356_cast_fp16))[name = tensor("op_1377_cast_fp16")]; tensor var_1379_equation_0 = const()[name = tensor("op_1379_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1379_cast_fp16 = einsum(equation = var_1379_equation_0, values = (var_1295_cast_fp16_1, var_1357_cast_fp16))[name = tensor("op_1379_cast_fp16")]; tensor var_1381_equation_0 = const()[name = tensor("op_1381_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1381_cast_fp16 = einsum(equation = var_1381_equation_0, values = (var_1295_cast_fp16_2, var_1358_cast_fp16))[name = tensor("op_1381_cast_fp16")]; tensor var_1383_equation_0 = const()[name = tensor("op_1383_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1383_cast_fp16 = einsum(equation = var_1383_equation_0, values = (var_1295_cast_fp16_3, var_1359_cast_fp16))[name = tensor("op_1383_cast_fp16")]; tensor var_1385_equation_0 = const()[name = tensor("op_1385_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1385_cast_fp16 = einsum(equation = var_1385_equation_0, values = (var_1295_cast_fp16_4, var_1360_cast_fp16))[name = tensor("op_1385_cast_fp16")]; tensor var_1387_equation_0 = const()[name = tensor("op_1387_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1387_cast_fp16 = einsum(equation = var_1387_equation_0, values = (var_1295_cast_fp16_5, var_1361_cast_fp16))[name = tensor("op_1387_cast_fp16")]; tensor var_1389_equation_0 = const()[name = tensor("op_1389_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1389_cast_fp16 = einsum(equation = var_1389_equation_0, values = (var_1295_cast_fp16_6, var_1362_cast_fp16))[name = tensor("op_1389_cast_fp16")]; tensor var_1391_equation_0 = const()[name = tensor("op_1391_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1391_cast_fp16 = einsum(equation = var_1391_equation_0, values = (var_1295_cast_fp16_7, var_1363_cast_fp16))[name = tensor("op_1391_cast_fp16")]; tensor var_1393_equation_0 = const()[name = tensor("op_1393_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1393_cast_fp16 = einsum(equation = var_1393_equation_0, values = (var_1295_cast_fp16_8, var_1364_cast_fp16))[name = tensor("op_1393_cast_fp16")]; tensor var_1395_equation_0 = const()[name = tensor("op_1395_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1395_cast_fp16 = einsum(equation = var_1395_equation_0, values = (var_1295_cast_fp16_9, var_1365_cast_fp16))[name = tensor("op_1395_cast_fp16")]; tensor var_1397_equation_0 = const()[name = tensor("op_1397_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1397_cast_fp16 = einsum(equation = var_1397_equation_0, values = (var_1295_cast_fp16_10, var_1366_cast_fp16))[name = tensor("op_1397_cast_fp16")]; tensor var_1399_equation_0 = const()[name = tensor("op_1399_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1399_cast_fp16 = einsum(equation = var_1399_equation_0, values = (var_1295_cast_fp16_11, var_1367_cast_fp16))[name = tensor("op_1399_cast_fp16")]; tensor var_1401_equation_0 = const()[name = tensor("op_1401_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1401_cast_fp16 = einsum(equation = var_1401_equation_0, values = (var_1295_cast_fp16_12, var_1368_cast_fp16))[name = tensor("op_1401_cast_fp16")]; tensor var_1403_equation_0 = const()[name = tensor("op_1403_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1403_cast_fp16 = einsum(equation = var_1403_equation_0, values = (var_1295_cast_fp16_13, var_1369_cast_fp16))[name = tensor("op_1403_cast_fp16")]; tensor var_1405_equation_0 = const()[name = tensor("op_1405_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1405_cast_fp16 = einsum(equation = var_1405_equation_0, values = (var_1295_cast_fp16_14, var_1370_cast_fp16))[name = tensor("op_1405_cast_fp16")]; tensor var_1407_equation_0 = const()[name = tensor("op_1407_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1407_cast_fp16 = einsum(equation = var_1407_equation_0, values = (var_1295_cast_fp16_15, var_1371_cast_fp16))[name = tensor("op_1407_cast_fp16")]; tensor var_1409_equation_0 = const()[name = tensor("op_1409_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1409_cast_fp16 = einsum(equation = var_1409_equation_0, values = (var_1295_cast_fp16_16, var_1372_cast_fp16))[name = tensor("op_1409_cast_fp16")]; tensor var_1411_equation_0 = const()[name = tensor("op_1411_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1411_cast_fp16 = einsum(equation = var_1411_equation_0, values = (var_1295_cast_fp16_17, var_1373_cast_fp16))[name = tensor("op_1411_cast_fp16")]; tensor var_1413_equation_0 = const()[name = tensor("op_1413_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1413_cast_fp16 = einsum(equation = var_1413_equation_0, values = (var_1295_cast_fp16_18, var_1374_cast_fp16))[name = tensor("op_1413_cast_fp16")]; tensor var_1415_equation_0 = const()[name = tensor("op_1415_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1415_cast_fp16 = einsum(equation = var_1415_equation_0, values = (var_1295_cast_fp16_19, var_1375_cast_fp16))[name = tensor("op_1415_cast_fp16")]; tensor input_45_interleave_0 = const()[name = tensor("input_45_interleave_0"), val = tensor(false)]; tensor input_45_cast_fp16 = concat(axis = var_1200, interleave = input_45_interleave_0, values = (var_1377_cast_fp16, var_1379_cast_fp16, var_1381_cast_fp16, var_1383_cast_fp16, var_1385_cast_fp16, var_1387_cast_fp16, var_1389_cast_fp16, var_1391_cast_fp16, var_1393_cast_fp16, var_1395_cast_fp16, var_1397_cast_fp16, var_1399_cast_fp16, var_1401_cast_fp16, var_1403_cast_fp16, var_1405_cast_fp16, var_1407_cast_fp16, var_1409_cast_fp16, var_1411_cast_fp16, var_1413_cast_fp16, var_1415_cast_fp16))[name = tensor("input_45_cast_fp16")]; tensor var_1424_pad_type_0 = const()[name = tensor("op_1424_pad_type_0"), val = tensor("valid")]; tensor var_1424_strides_0 = const()[name = tensor("op_1424_strides_0"), val = tensor([1, 1])]; tensor var_1424_pad_0 = const()[name = tensor("op_1424_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1424_dilations_0 = const()[name = tensor("op_1424_dilations_0"), val = tensor([1, 1])]; tensor var_1424_groups_0 = const()[name = tensor("op_1424_groups_0"), val = tensor(1)]; tensor blocks_4_attn_out_weight_to_fp16 = const()[name = tensor("blocks_4_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181913152)))]; tensor blocks_4_attn_out_bias_to_fp16 = const()[name = tensor("blocks_4_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185190016)))]; tensor var_1424_cast_fp16 = conv(bias = blocks_4_attn_out_bias_to_fp16, dilations = var_1424_dilations_0, groups = var_1424_groups_0, pad = var_1424_pad_0, pad_type = var_1424_pad_type_0, strides = var_1424_strides_0, weight = blocks_4_attn_out_weight_to_fp16, x = input_45_cast_fp16)[name = tensor("op_1424_cast_fp16")]; tensor inputs_19_cast_fp16 = add(x = inputs_17_cast_fp16, y = var_1424_cast_fp16)[name = tensor("inputs_19_cast_fp16")]; tensor input_47_axes_0 = const()[name = tensor("input_47_axes_0"), val = tensor([1])]; tensor input_47_gamma_0_to_fp16 = const()[name = tensor("input_47_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185192640)))]; tensor input_47_beta_0_to_fp16 = const()[name = tensor("input_47_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185195264)))]; tensor var_1434_to_fp16 = const()[name = tensor("op_1434_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_47_cast_fp16 = layer_norm(axes = input_47_axes_0, beta = input_47_beta_0_to_fp16, epsilon = var_1434_to_fp16, gamma = input_47_gamma_0_to_fp16, x = inputs_19_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor input_49_pad_type_0 = const()[name = tensor("input_49_pad_type_0"), val = tensor("valid")]; tensor input_49_strides_0 = const()[name = tensor("input_49_strides_0"), val = tensor([1, 1])]; tensor input_49_pad_0 = const()[name = tensor("input_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_49_dilations_0 = const()[name = tensor("input_49_dilations_0"), val = tensor([1, 1])]; tensor input_49_groups_0 = const()[name = tensor("input_49_groups_0"), val = tensor(1)]; tensor blocks_4_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185197888)))]; tensor blocks_4_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198305152)))]; tensor input_49_cast_fp16 = conv(bias = blocks_4_mlp_0_bias_to_fp16, dilations = input_49_dilations_0, groups = input_49_groups_0, pad = input_49_pad_0, pad_type = input_49_pad_type_0, strides = input_49_strides_0, weight = blocks_4_mlp_0_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor input_51_mode_0 = const()[name = tensor("input_51_mode_0"), val = tensor("EXACT")]; tensor input_51_cast_fp16 = gelu(mode = input_51_mode_0, x = input_49_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor var_1460_pad_type_0 = const()[name = tensor("op_1460_pad_type_0"), val = tensor("valid")]; tensor var_1460_strides_0 = const()[name = tensor("op_1460_strides_0"), val = tensor([1, 1])]; tensor var_1460_pad_0 = const()[name = tensor("op_1460_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1460_dilations_0 = const()[name = tensor("op_1460_dilations_0"), val = tensor([1, 1])]; tensor var_1460_groups_0 = const()[name = tensor("op_1460_groups_0"), val = tensor(1)]; tensor blocks_4_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198315456)))]; tensor blocks_4_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211422720)))]; tensor var_1460_cast_fp16 = conv(bias = blocks_4_mlp_2_bias_to_fp16, dilations = var_1460_dilations_0, groups = var_1460_groups_0, pad = var_1460_pad_0, pad_type = var_1460_pad_type_0, strides = var_1460_strides_0, weight = blocks_4_mlp_2_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("op_1460_cast_fp16")]; tensor inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = var_1460_cast_fp16)[name = tensor("inputs_21_cast_fp16")]; tensor var_1469 = const()[name = tensor("op_1469"), val = tensor(1)]; tensor input_53_axes_0 = const()[name = tensor("input_53_axes_0"), val = tensor([1])]; tensor input_53_gamma_0_to_fp16 = const()[name = tensor("input_53_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211425344)))]; tensor input_53_beta_0_to_fp16 = const()[name = tensor("input_53_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211427968)))]; tensor var_1485_to_fp16 = const()[name = tensor("op_1485_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_53_cast_fp16 = layer_norm(axes = input_53_axes_0, beta = input_53_beta_0_to_fp16, epsilon = var_1485_to_fp16, gamma = input_53_gamma_0_to_fp16, x = inputs_21_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor q_11_pad_type_0 = const()[name = tensor("q_11_pad_type_0"), val = tensor("valid")]; tensor q_11_strides_0 = const()[name = tensor("q_11_strides_0"), val = tensor([1, 1])]; tensor q_11_pad_0 = const()[name = tensor("q_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_11_dilations_0 = const()[name = tensor("q_11_dilations_0"), val = tensor([1, 1])]; tensor q_11_groups_0 = const()[name = tensor("q_11_groups_0"), val = tensor(1)]; tensor var_1520_weight_0_to_fp16 = const()[name = tensor("op_1520_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211430592)))]; tensor var_1520_bias_0_to_fp16 = const()[name = tensor("op_1520_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214707456)))]; tensor var_1520_cast_fp16 = conv(bias = var_1520_bias_0_to_fp16, dilations = q_11_dilations_0, groups = q_11_groups_0, pad = q_11_pad_0, pad_type = q_11_pad_type_0, strides = q_11_strides_0, weight = var_1520_weight_0_to_fp16, x = input_53_cast_fp16)[name = tensor("op_1520_cast_fp16")]; tensor k_11_pad_type_0 = const()[name = tensor("k_11_pad_type_0"), val = tensor("valid")]; tensor k_11_strides_0 = const()[name = tensor("k_11_strides_0"), val = tensor([1, 1])]; tensor k_11_pad_0 = const()[name = tensor("k_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_11_dilations_0 = const()[name = tensor("k_11_dilations_0"), val = tensor([1, 1])]; tensor k_11_groups_0 = const()[name = tensor("k_11_groups_0"), val = tensor(1)]; tensor blocks_5_attn_key_weight_to_fp16 = const()[name = tensor("blocks_5_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214710080)))]; tensor k_11_cast_fp16 = conv(dilations = k_11_dilations_0, groups = k_11_groups_0, pad = k_11_pad_0, pad_type = k_11_pad_type_0, strides = k_11_strides_0, weight = blocks_5_attn_key_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("k_11_cast_fp16")]; tensor var_1518_pad_type_0 = const()[name = tensor("op_1518_pad_type_0"), val = tensor("valid")]; tensor var_1518_strides_0 = const()[name = tensor("op_1518_strides_0"), val = tensor([1, 1])]; tensor var_1518_pad_0 = const()[name = tensor("op_1518_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1518_dilations_0 = const()[name = tensor("op_1518_dilations_0"), val = tensor([1, 1])]; tensor var_1518_groups_0 = const()[name = tensor("op_1518_groups_0"), val = tensor(1)]; tensor blocks_5_attn_value_weight_to_fp16 = const()[name = tensor("blocks_5_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217986944)))]; tensor blocks_5_attn_value_bias_to_fp16 = const()[name = tensor("blocks_5_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221263808)))]; tensor var_1518_cast_fp16 = conv(bias = blocks_5_attn_value_bias_to_fp16, dilations = var_1518_dilations_0, groups = var_1518_groups_0, pad = var_1518_pad_0, pad_type = var_1518_pad_type_0, strides = var_1518_strides_0, weight = blocks_5_attn_value_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("op_1518_cast_fp16")]; tensor tile_15 = const()[name = tensor("tile_15"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1521_axis_0 = const()[name = tensor("op_1521_axis_0"), val = tensor(1)]; tensor var_1521_cast_fp16_0, tensor var_1521_cast_fp16_1, tensor var_1521_cast_fp16_2, tensor var_1521_cast_fp16_3, tensor var_1521_cast_fp16_4, tensor var_1521_cast_fp16_5, tensor var_1521_cast_fp16_6, tensor var_1521_cast_fp16_7, tensor var_1521_cast_fp16_8, tensor var_1521_cast_fp16_9, tensor var_1521_cast_fp16_10, tensor var_1521_cast_fp16_11, tensor var_1521_cast_fp16_12, tensor var_1521_cast_fp16_13, tensor var_1521_cast_fp16_14, tensor var_1521_cast_fp16_15, tensor var_1521_cast_fp16_16, tensor var_1521_cast_fp16_17, tensor var_1521_cast_fp16_18, tensor var_1521_cast_fp16_19 = split(axis = var_1521_axis_0, split_sizes = tile_15, x = var_1520_cast_fp16)[name = tensor("op_1521_cast_fp16")]; tensor var_1542_perm_0 = const()[name = tensor("op_1542_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_16 = const()[name = tensor("tile_16"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1543_axis_0 = const()[name = tensor("op_1543_axis_0"), val = tensor(3)]; tensor var_1542_cast_fp16 = transpose(perm = var_1542_perm_0, x = k_11_cast_fp16)[name = tensor("transpose_27")]; tensor var_1543_cast_fp16_0, tensor var_1543_cast_fp16_1, tensor var_1543_cast_fp16_2, tensor var_1543_cast_fp16_3, tensor var_1543_cast_fp16_4, tensor var_1543_cast_fp16_5, tensor var_1543_cast_fp16_6, tensor var_1543_cast_fp16_7, tensor var_1543_cast_fp16_8, tensor var_1543_cast_fp16_9, tensor var_1543_cast_fp16_10, tensor var_1543_cast_fp16_11, tensor var_1543_cast_fp16_12, tensor var_1543_cast_fp16_13, tensor var_1543_cast_fp16_14, tensor var_1543_cast_fp16_15, tensor var_1543_cast_fp16_16, tensor var_1543_cast_fp16_17, tensor var_1543_cast_fp16_18, tensor var_1543_cast_fp16_19 = split(axis = var_1543_axis_0, split_sizes = tile_16, x = var_1542_cast_fp16)[name = tensor("op_1543_cast_fp16")]; tensor tile_17 = const()[name = tensor("tile_17"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1564_axis_0 = const()[name = tensor("op_1564_axis_0"), val = tensor(1)]; tensor var_1564_cast_fp16_0, tensor var_1564_cast_fp16_1, tensor var_1564_cast_fp16_2, tensor var_1564_cast_fp16_3, tensor var_1564_cast_fp16_4, tensor var_1564_cast_fp16_5, tensor var_1564_cast_fp16_6, tensor var_1564_cast_fp16_7, tensor var_1564_cast_fp16_8, tensor var_1564_cast_fp16_9, tensor var_1564_cast_fp16_10, tensor var_1564_cast_fp16_11, tensor var_1564_cast_fp16_12, tensor var_1564_cast_fp16_13, tensor var_1564_cast_fp16_14, tensor var_1564_cast_fp16_15, tensor var_1564_cast_fp16_16, tensor var_1564_cast_fp16_17, tensor var_1564_cast_fp16_18, tensor var_1564_cast_fp16_19 = split(axis = var_1564_axis_0, split_sizes = tile_17, x = var_1518_cast_fp16)[name = tensor("op_1564_cast_fp16")]; tensor aw_201_equation_0 = const()[name = tensor("aw_201_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_201_cast_fp16 = einsum(equation = aw_201_equation_0, values = (var_1543_cast_fp16_0, var_1521_cast_fp16_0))[name = tensor("aw_201_cast_fp16")]; tensor aw_203_equation_0 = const()[name = tensor("aw_203_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_203_cast_fp16 = einsum(equation = aw_203_equation_0, values = (var_1543_cast_fp16_1, var_1521_cast_fp16_1))[name = tensor("aw_203_cast_fp16")]; tensor aw_205_equation_0 = const()[name = tensor("aw_205_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_205_cast_fp16 = einsum(equation = aw_205_equation_0, values = (var_1543_cast_fp16_2, var_1521_cast_fp16_2))[name = tensor("aw_205_cast_fp16")]; tensor aw_207_equation_0 = const()[name = tensor("aw_207_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_207_cast_fp16 = einsum(equation = aw_207_equation_0, values = (var_1543_cast_fp16_3, var_1521_cast_fp16_3))[name = tensor("aw_207_cast_fp16")]; tensor aw_209_equation_0 = const()[name = tensor("aw_209_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_209_cast_fp16 = einsum(equation = aw_209_equation_0, values = (var_1543_cast_fp16_4, var_1521_cast_fp16_4))[name = tensor("aw_209_cast_fp16")]; tensor aw_211_equation_0 = const()[name = tensor("aw_211_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_211_cast_fp16 = einsum(equation = aw_211_equation_0, values = (var_1543_cast_fp16_5, var_1521_cast_fp16_5))[name = tensor("aw_211_cast_fp16")]; tensor aw_213_equation_0 = const()[name = tensor("aw_213_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_213_cast_fp16 = einsum(equation = aw_213_equation_0, values = (var_1543_cast_fp16_6, var_1521_cast_fp16_6))[name = tensor("aw_213_cast_fp16")]; tensor aw_215_equation_0 = const()[name = tensor("aw_215_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_215_cast_fp16 = einsum(equation = aw_215_equation_0, values = (var_1543_cast_fp16_7, var_1521_cast_fp16_7))[name = tensor("aw_215_cast_fp16")]; tensor aw_217_equation_0 = const()[name = tensor("aw_217_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_217_cast_fp16 = einsum(equation = aw_217_equation_0, values = (var_1543_cast_fp16_8, var_1521_cast_fp16_8))[name = tensor("aw_217_cast_fp16")]; tensor aw_219_equation_0 = const()[name = tensor("aw_219_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_219_cast_fp16 = einsum(equation = aw_219_equation_0, values = (var_1543_cast_fp16_9, var_1521_cast_fp16_9))[name = tensor("aw_219_cast_fp16")]; tensor aw_221_equation_0 = const()[name = tensor("aw_221_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_221_cast_fp16 = einsum(equation = aw_221_equation_0, values = (var_1543_cast_fp16_10, var_1521_cast_fp16_10))[name = tensor("aw_221_cast_fp16")]; tensor aw_223_equation_0 = const()[name = tensor("aw_223_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_223_cast_fp16 = einsum(equation = aw_223_equation_0, values = (var_1543_cast_fp16_11, var_1521_cast_fp16_11))[name = tensor("aw_223_cast_fp16")]; tensor aw_225_equation_0 = const()[name = tensor("aw_225_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_225_cast_fp16 = einsum(equation = aw_225_equation_0, values = (var_1543_cast_fp16_12, var_1521_cast_fp16_12))[name = tensor("aw_225_cast_fp16")]; tensor aw_227_equation_0 = const()[name = tensor("aw_227_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_227_cast_fp16 = einsum(equation = aw_227_equation_0, values = (var_1543_cast_fp16_13, var_1521_cast_fp16_13))[name = tensor("aw_227_cast_fp16")]; tensor aw_229_equation_0 = const()[name = tensor("aw_229_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_229_cast_fp16 = einsum(equation = aw_229_equation_0, values = (var_1543_cast_fp16_14, var_1521_cast_fp16_14))[name = tensor("aw_229_cast_fp16")]; tensor aw_231_equation_0 = const()[name = tensor("aw_231_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_231_cast_fp16 = einsum(equation = aw_231_equation_0, values = (var_1543_cast_fp16_15, var_1521_cast_fp16_15))[name = tensor("aw_231_cast_fp16")]; tensor aw_233_equation_0 = const()[name = tensor("aw_233_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_233_cast_fp16 = einsum(equation = aw_233_equation_0, values = (var_1543_cast_fp16_16, var_1521_cast_fp16_16))[name = tensor("aw_233_cast_fp16")]; tensor aw_235_equation_0 = const()[name = tensor("aw_235_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_235_cast_fp16 = einsum(equation = aw_235_equation_0, values = (var_1543_cast_fp16_17, var_1521_cast_fp16_17))[name = tensor("aw_235_cast_fp16")]; tensor aw_237_equation_0 = const()[name = tensor("aw_237_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_237_cast_fp16 = einsum(equation = aw_237_equation_0, values = (var_1543_cast_fp16_18, var_1521_cast_fp16_18))[name = tensor("aw_237_cast_fp16")]; tensor aw_239_equation_0 = const()[name = tensor("aw_239_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_239_cast_fp16 = einsum(equation = aw_239_equation_0, values = (var_1543_cast_fp16_19, var_1521_cast_fp16_19))[name = tensor("aw_239_cast_fp16")]; tensor var_1625_cast_fp16 = softmax(axis = var_1469, x = aw_201_cast_fp16)[name = tensor("op_1625_cast_fp16")]; tensor var_1626_cast_fp16 = softmax(axis = var_1469, x = aw_203_cast_fp16)[name = tensor("op_1626_cast_fp16")]; tensor var_1627_cast_fp16 = softmax(axis = var_1469, x = aw_205_cast_fp16)[name = tensor("op_1627_cast_fp16")]; tensor var_1628_cast_fp16 = softmax(axis = var_1469, x = aw_207_cast_fp16)[name = tensor("op_1628_cast_fp16")]; tensor var_1629_cast_fp16 = softmax(axis = var_1469, x = aw_209_cast_fp16)[name = tensor("op_1629_cast_fp16")]; tensor var_1630_cast_fp16 = softmax(axis = var_1469, x = aw_211_cast_fp16)[name = tensor("op_1630_cast_fp16")]; tensor var_1631_cast_fp16 = softmax(axis = var_1469, x = aw_213_cast_fp16)[name = tensor("op_1631_cast_fp16")]; tensor var_1632_cast_fp16 = softmax(axis = var_1469, x = aw_215_cast_fp16)[name = tensor("op_1632_cast_fp16")]; tensor var_1633_cast_fp16 = softmax(axis = var_1469, x = aw_217_cast_fp16)[name = tensor("op_1633_cast_fp16")]; tensor var_1634_cast_fp16 = softmax(axis = var_1469, x = aw_219_cast_fp16)[name = tensor("op_1634_cast_fp16")]; tensor var_1635_cast_fp16 = softmax(axis = var_1469, x = aw_221_cast_fp16)[name = tensor("op_1635_cast_fp16")]; tensor var_1636_cast_fp16 = softmax(axis = var_1469, x = aw_223_cast_fp16)[name = tensor("op_1636_cast_fp16")]; tensor var_1637_cast_fp16 = softmax(axis = var_1469, x = aw_225_cast_fp16)[name = tensor("op_1637_cast_fp16")]; tensor var_1638_cast_fp16 = softmax(axis = var_1469, x = aw_227_cast_fp16)[name = tensor("op_1638_cast_fp16")]; tensor var_1639_cast_fp16 = softmax(axis = var_1469, x = aw_229_cast_fp16)[name = tensor("op_1639_cast_fp16")]; tensor var_1640_cast_fp16 = softmax(axis = var_1469, x = aw_231_cast_fp16)[name = tensor("op_1640_cast_fp16")]; tensor var_1641_cast_fp16 = softmax(axis = var_1469, x = aw_233_cast_fp16)[name = tensor("op_1641_cast_fp16")]; tensor var_1642_cast_fp16 = softmax(axis = var_1469, x = aw_235_cast_fp16)[name = tensor("op_1642_cast_fp16")]; tensor var_1643_cast_fp16 = softmax(axis = var_1469, x = aw_237_cast_fp16)[name = tensor("op_1643_cast_fp16")]; tensor var_1644_cast_fp16 = softmax(axis = var_1469, x = aw_239_cast_fp16)[name = tensor("op_1644_cast_fp16")]; tensor var_1646_equation_0 = const()[name = tensor("op_1646_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1646_cast_fp16 = einsum(equation = var_1646_equation_0, values = (var_1564_cast_fp16_0, var_1625_cast_fp16))[name = tensor("op_1646_cast_fp16")]; tensor var_1648_equation_0 = const()[name = tensor("op_1648_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1648_cast_fp16 = einsum(equation = var_1648_equation_0, values = (var_1564_cast_fp16_1, var_1626_cast_fp16))[name = tensor("op_1648_cast_fp16")]; tensor var_1650_equation_0 = const()[name = tensor("op_1650_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1650_cast_fp16 = einsum(equation = var_1650_equation_0, values = (var_1564_cast_fp16_2, var_1627_cast_fp16))[name = tensor("op_1650_cast_fp16")]; tensor var_1652_equation_0 = const()[name = tensor("op_1652_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1652_cast_fp16 = einsum(equation = var_1652_equation_0, values = (var_1564_cast_fp16_3, var_1628_cast_fp16))[name = tensor("op_1652_cast_fp16")]; tensor var_1654_equation_0 = const()[name = tensor("op_1654_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1654_cast_fp16 = einsum(equation = var_1654_equation_0, values = (var_1564_cast_fp16_4, var_1629_cast_fp16))[name = tensor("op_1654_cast_fp16")]; tensor var_1656_equation_0 = const()[name = tensor("op_1656_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1656_cast_fp16 = einsum(equation = var_1656_equation_0, values = (var_1564_cast_fp16_5, var_1630_cast_fp16))[name = tensor("op_1656_cast_fp16")]; tensor var_1658_equation_0 = const()[name = tensor("op_1658_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1658_cast_fp16 = einsum(equation = var_1658_equation_0, values = (var_1564_cast_fp16_6, var_1631_cast_fp16))[name = tensor("op_1658_cast_fp16")]; tensor var_1660_equation_0 = const()[name = tensor("op_1660_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1660_cast_fp16 = einsum(equation = var_1660_equation_0, values = (var_1564_cast_fp16_7, var_1632_cast_fp16))[name = tensor("op_1660_cast_fp16")]; tensor var_1662_equation_0 = const()[name = tensor("op_1662_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1662_cast_fp16 = einsum(equation = var_1662_equation_0, values = (var_1564_cast_fp16_8, var_1633_cast_fp16))[name = tensor("op_1662_cast_fp16")]; tensor var_1664_equation_0 = const()[name = tensor("op_1664_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1664_cast_fp16 = einsum(equation = var_1664_equation_0, values = (var_1564_cast_fp16_9, var_1634_cast_fp16))[name = tensor("op_1664_cast_fp16")]; tensor var_1666_equation_0 = const()[name = tensor("op_1666_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1666_cast_fp16 = einsum(equation = var_1666_equation_0, values = (var_1564_cast_fp16_10, var_1635_cast_fp16))[name = tensor("op_1666_cast_fp16")]; tensor var_1668_equation_0 = const()[name = tensor("op_1668_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1668_cast_fp16 = einsum(equation = var_1668_equation_0, values = (var_1564_cast_fp16_11, var_1636_cast_fp16))[name = tensor("op_1668_cast_fp16")]; tensor var_1670_equation_0 = const()[name = tensor("op_1670_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1670_cast_fp16 = einsum(equation = var_1670_equation_0, values = (var_1564_cast_fp16_12, var_1637_cast_fp16))[name = tensor("op_1670_cast_fp16")]; tensor var_1672_equation_0 = const()[name = tensor("op_1672_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1672_cast_fp16 = einsum(equation = var_1672_equation_0, values = (var_1564_cast_fp16_13, var_1638_cast_fp16))[name = tensor("op_1672_cast_fp16")]; tensor var_1674_equation_0 = const()[name = tensor("op_1674_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1674_cast_fp16 = einsum(equation = var_1674_equation_0, values = (var_1564_cast_fp16_14, var_1639_cast_fp16))[name = tensor("op_1674_cast_fp16")]; tensor var_1676_equation_0 = const()[name = tensor("op_1676_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1676_cast_fp16 = einsum(equation = var_1676_equation_0, values = (var_1564_cast_fp16_15, var_1640_cast_fp16))[name = tensor("op_1676_cast_fp16")]; tensor var_1678_equation_0 = const()[name = tensor("op_1678_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1678_cast_fp16 = einsum(equation = var_1678_equation_0, values = (var_1564_cast_fp16_16, var_1641_cast_fp16))[name = tensor("op_1678_cast_fp16")]; tensor var_1680_equation_0 = const()[name = tensor("op_1680_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1680_cast_fp16 = einsum(equation = var_1680_equation_0, values = (var_1564_cast_fp16_17, var_1642_cast_fp16))[name = tensor("op_1680_cast_fp16")]; tensor var_1682_equation_0 = const()[name = tensor("op_1682_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1682_cast_fp16 = einsum(equation = var_1682_equation_0, values = (var_1564_cast_fp16_18, var_1643_cast_fp16))[name = tensor("op_1682_cast_fp16")]; tensor var_1684_equation_0 = const()[name = tensor("op_1684_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1684_cast_fp16 = einsum(equation = var_1684_equation_0, values = (var_1564_cast_fp16_19, var_1644_cast_fp16))[name = tensor("op_1684_cast_fp16")]; tensor input_55_interleave_0 = const()[name = tensor("input_55_interleave_0"), val = tensor(false)]; tensor input_55_cast_fp16 = concat(axis = var_1469, interleave = input_55_interleave_0, values = (var_1646_cast_fp16, var_1648_cast_fp16, var_1650_cast_fp16, var_1652_cast_fp16, var_1654_cast_fp16, var_1656_cast_fp16, var_1658_cast_fp16, var_1660_cast_fp16, var_1662_cast_fp16, var_1664_cast_fp16, var_1666_cast_fp16, var_1668_cast_fp16, var_1670_cast_fp16, var_1672_cast_fp16, var_1674_cast_fp16, var_1676_cast_fp16, var_1678_cast_fp16, var_1680_cast_fp16, var_1682_cast_fp16, var_1684_cast_fp16))[name = tensor("input_55_cast_fp16")]; tensor var_1693_pad_type_0 = const()[name = tensor("op_1693_pad_type_0"), val = tensor("valid")]; tensor var_1693_strides_0 = const()[name = tensor("op_1693_strides_0"), val = tensor([1, 1])]; tensor var_1693_pad_0 = const()[name = tensor("op_1693_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1693_dilations_0 = const()[name = tensor("op_1693_dilations_0"), val = tensor([1, 1])]; tensor var_1693_groups_0 = const()[name = tensor("op_1693_groups_0"), val = tensor(1)]; tensor blocks_5_attn_out_weight_to_fp16 = const()[name = tensor("blocks_5_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(221266432)))]; tensor blocks_5_attn_out_bias_to_fp16 = const()[name = tensor("blocks_5_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224543296)))]; tensor var_1693_cast_fp16 = conv(bias = blocks_5_attn_out_bias_to_fp16, dilations = var_1693_dilations_0, groups = var_1693_groups_0, pad = var_1693_pad_0, pad_type = var_1693_pad_type_0, strides = var_1693_strides_0, weight = blocks_5_attn_out_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("op_1693_cast_fp16")]; tensor inputs_23_cast_fp16 = add(x = inputs_21_cast_fp16, y = var_1693_cast_fp16)[name = tensor("inputs_23_cast_fp16")]; tensor input_57_axes_0 = const()[name = tensor("input_57_axes_0"), val = tensor([1])]; tensor input_57_gamma_0_to_fp16 = const()[name = tensor("input_57_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224545920)))]; tensor input_57_beta_0_to_fp16 = const()[name = tensor("input_57_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224548544)))]; tensor var_1703_to_fp16 = const()[name = tensor("op_1703_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_57_cast_fp16 = layer_norm(axes = input_57_axes_0, beta = input_57_beta_0_to_fp16, epsilon = var_1703_to_fp16, gamma = input_57_gamma_0_to_fp16, x = inputs_23_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor input_59_pad_type_0 = const()[name = tensor("input_59_pad_type_0"), val = tensor("valid")]; tensor input_59_strides_0 = const()[name = tensor("input_59_strides_0"), val = tensor([1, 1])]; tensor input_59_pad_0 = const()[name = tensor("input_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_59_dilations_0 = const()[name = tensor("input_59_dilations_0"), val = tensor([1, 1])]; tensor input_59_groups_0 = const()[name = tensor("input_59_groups_0"), val = tensor(1)]; tensor blocks_5_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(224551168)))]; tensor blocks_5_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237658432)))]; tensor input_59_cast_fp16 = conv(bias = blocks_5_mlp_0_bias_to_fp16, dilations = input_59_dilations_0, groups = input_59_groups_0, pad = input_59_pad_0, pad_type = input_59_pad_type_0, strides = input_59_strides_0, weight = blocks_5_mlp_0_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor input_61_mode_0 = const()[name = tensor("input_61_mode_0"), val = tensor("EXACT")]; tensor input_61_cast_fp16 = gelu(mode = input_61_mode_0, x = input_59_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor var_1729_pad_type_0 = const()[name = tensor("op_1729_pad_type_0"), val = tensor("valid")]; tensor var_1729_strides_0 = const()[name = tensor("op_1729_strides_0"), val = tensor([1, 1])]; tensor var_1729_pad_0 = const()[name = tensor("op_1729_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1729_dilations_0 = const()[name = tensor("op_1729_dilations_0"), val = tensor([1, 1])]; tensor var_1729_groups_0 = const()[name = tensor("op_1729_groups_0"), val = tensor(1)]; tensor blocks_5_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237668736)))]; tensor blocks_5_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250776000)))]; tensor var_1729_cast_fp16 = conv(bias = blocks_5_mlp_2_bias_to_fp16, dilations = var_1729_dilations_0, groups = var_1729_groups_0, pad = var_1729_pad_0, pad_type = var_1729_pad_type_0, strides = var_1729_strides_0, weight = blocks_5_mlp_2_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("op_1729_cast_fp16")]; tensor inputs_25_cast_fp16 = add(x = inputs_23_cast_fp16, y = var_1729_cast_fp16)[name = tensor("inputs_25_cast_fp16")]; tensor var_1738 = const()[name = tensor("op_1738"), val = tensor(1)]; tensor input_63_axes_0 = const()[name = tensor("input_63_axes_0"), val = tensor([1])]; tensor input_63_gamma_0_to_fp16 = const()[name = tensor("input_63_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250778624)))]; tensor input_63_beta_0_to_fp16 = const()[name = tensor("input_63_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250781248)))]; tensor var_1754_to_fp16 = const()[name = tensor("op_1754_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_63_cast_fp16 = layer_norm(axes = input_63_axes_0, beta = input_63_beta_0_to_fp16, epsilon = var_1754_to_fp16, gamma = input_63_gamma_0_to_fp16, x = inputs_25_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor q_13_pad_type_0 = const()[name = tensor("q_13_pad_type_0"), val = tensor("valid")]; tensor q_13_strides_0 = const()[name = tensor("q_13_strides_0"), val = tensor([1, 1])]; tensor q_13_pad_0 = const()[name = tensor("q_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_13_dilations_0 = const()[name = tensor("q_13_dilations_0"), val = tensor([1, 1])]; tensor q_13_groups_0 = const()[name = tensor("q_13_groups_0"), val = tensor(1)]; tensor var_1789_weight_0_to_fp16 = const()[name = tensor("op_1789_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250783872)))]; tensor var_1789_bias_0_to_fp16 = const()[name = tensor("op_1789_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254060736)))]; tensor var_1789_cast_fp16 = conv(bias = var_1789_bias_0_to_fp16, dilations = q_13_dilations_0, groups = q_13_groups_0, pad = q_13_pad_0, pad_type = q_13_pad_type_0, strides = q_13_strides_0, weight = var_1789_weight_0_to_fp16, x = input_63_cast_fp16)[name = tensor("op_1789_cast_fp16")]; tensor k_13_pad_type_0 = const()[name = tensor("k_13_pad_type_0"), val = tensor("valid")]; tensor k_13_strides_0 = const()[name = tensor("k_13_strides_0"), val = tensor([1, 1])]; tensor k_13_pad_0 = const()[name = tensor("k_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_13_dilations_0 = const()[name = tensor("k_13_dilations_0"), val = tensor([1, 1])]; tensor k_13_groups_0 = const()[name = tensor("k_13_groups_0"), val = tensor(1)]; tensor blocks_6_attn_key_weight_to_fp16 = const()[name = tensor("blocks_6_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254063360)))]; tensor k_13_cast_fp16 = conv(dilations = k_13_dilations_0, groups = k_13_groups_0, pad = k_13_pad_0, pad_type = k_13_pad_type_0, strides = k_13_strides_0, weight = blocks_6_attn_key_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("k_13_cast_fp16")]; tensor var_1787_pad_type_0 = const()[name = tensor("op_1787_pad_type_0"), val = tensor("valid")]; tensor var_1787_strides_0 = const()[name = tensor("op_1787_strides_0"), val = tensor([1, 1])]; tensor var_1787_pad_0 = const()[name = tensor("op_1787_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1787_dilations_0 = const()[name = tensor("op_1787_dilations_0"), val = tensor([1, 1])]; tensor var_1787_groups_0 = const()[name = tensor("op_1787_groups_0"), val = tensor(1)]; tensor blocks_6_attn_value_weight_to_fp16 = const()[name = tensor("blocks_6_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257340224)))]; tensor blocks_6_attn_value_bias_to_fp16 = const()[name = tensor("blocks_6_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(260617088)))]; tensor var_1787_cast_fp16 = conv(bias = blocks_6_attn_value_bias_to_fp16, dilations = var_1787_dilations_0, groups = var_1787_groups_0, pad = var_1787_pad_0, pad_type = var_1787_pad_type_0, strides = var_1787_strides_0, weight = blocks_6_attn_value_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("op_1787_cast_fp16")]; tensor tile_18 = const()[name = tensor("tile_18"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1790_axis_0 = const()[name = tensor("op_1790_axis_0"), val = tensor(1)]; tensor var_1790_cast_fp16_0, tensor var_1790_cast_fp16_1, tensor var_1790_cast_fp16_2, tensor var_1790_cast_fp16_3, tensor var_1790_cast_fp16_4, tensor var_1790_cast_fp16_5, tensor var_1790_cast_fp16_6, tensor var_1790_cast_fp16_7, tensor var_1790_cast_fp16_8, tensor var_1790_cast_fp16_9, tensor var_1790_cast_fp16_10, tensor var_1790_cast_fp16_11, tensor var_1790_cast_fp16_12, tensor var_1790_cast_fp16_13, tensor var_1790_cast_fp16_14, tensor var_1790_cast_fp16_15, tensor var_1790_cast_fp16_16, tensor var_1790_cast_fp16_17, tensor var_1790_cast_fp16_18, tensor var_1790_cast_fp16_19 = split(axis = var_1790_axis_0, split_sizes = tile_18, x = var_1789_cast_fp16)[name = tensor("op_1790_cast_fp16")]; tensor var_1811_perm_0 = const()[name = tensor("op_1811_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_19 = const()[name = tensor("tile_19"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1812_axis_0 = const()[name = tensor("op_1812_axis_0"), val = tensor(3)]; tensor var_1811_cast_fp16 = transpose(perm = var_1811_perm_0, x = k_13_cast_fp16)[name = tensor("transpose_26")]; tensor var_1812_cast_fp16_0, tensor var_1812_cast_fp16_1, tensor var_1812_cast_fp16_2, tensor var_1812_cast_fp16_3, tensor var_1812_cast_fp16_4, tensor var_1812_cast_fp16_5, tensor var_1812_cast_fp16_6, tensor var_1812_cast_fp16_7, tensor var_1812_cast_fp16_8, tensor var_1812_cast_fp16_9, tensor var_1812_cast_fp16_10, tensor var_1812_cast_fp16_11, tensor var_1812_cast_fp16_12, tensor var_1812_cast_fp16_13, tensor var_1812_cast_fp16_14, tensor var_1812_cast_fp16_15, tensor var_1812_cast_fp16_16, tensor var_1812_cast_fp16_17, tensor var_1812_cast_fp16_18, tensor var_1812_cast_fp16_19 = split(axis = var_1812_axis_0, split_sizes = tile_19, x = var_1811_cast_fp16)[name = tensor("op_1812_cast_fp16")]; tensor tile_20 = const()[name = tensor("tile_20"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_1833_axis_0 = const()[name = tensor("op_1833_axis_0"), val = tensor(1)]; tensor var_1833_cast_fp16_0, tensor var_1833_cast_fp16_1, tensor var_1833_cast_fp16_2, tensor var_1833_cast_fp16_3, tensor var_1833_cast_fp16_4, tensor var_1833_cast_fp16_5, tensor var_1833_cast_fp16_6, tensor var_1833_cast_fp16_7, tensor var_1833_cast_fp16_8, tensor var_1833_cast_fp16_9, tensor var_1833_cast_fp16_10, tensor var_1833_cast_fp16_11, tensor var_1833_cast_fp16_12, tensor var_1833_cast_fp16_13, tensor var_1833_cast_fp16_14, tensor var_1833_cast_fp16_15, tensor var_1833_cast_fp16_16, tensor var_1833_cast_fp16_17, tensor var_1833_cast_fp16_18, tensor var_1833_cast_fp16_19 = split(axis = var_1833_axis_0, split_sizes = tile_20, x = var_1787_cast_fp16)[name = tensor("op_1833_cast_fp16")]; tensor aw_241_equation_0 = const()[name = tensor("aw_241_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_241_cast_fp16 = einsum(equation = aw_241_equation_0, values = (var_1812_cast_fp16_0, var_1790_cast_fp16_0))[name = tensor("aw_241_cast_fp16")]; tensor aw_243_equation_0 = const()[name = tensor("aw_243_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_243_cast_fp16 = einsum(equation = aw_243_equation_0, values = (var_1812_cast_fp16_1, var_1790_cast_fp16_1))[name = tensor("aw_243_cast_fp16")]; tensor aw_245_equation_0 = const()[name = tensor("aw_245_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_245_cast_fp16 = einsum(equation = aw_245_equation_0, values = (var_1812_cast_fp16_2, var_1790_cast_fp16_2))[name = tensor("aw_245_cast_fp16")]; tensor aw_247_equation_0 = const()[name = tensor("aw_247_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_247_cast_fp16 = einsum(equation = aw_247_equation_0, values = (var_1812_cast_fp16_3, var_1790_cast_fp16_3))[name = tensor("aw_247_cast_fp16")]; tensor aw_249_equation_0 = const()[name = tensor("aw_249_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_249_cast_fp16 = einsum(equation = aw_249_equation_0, values = (var_1812_cast_fp16_4, var_1790_cast_fp16_4))[name = tensor("aw_249_cast_fp16")]; tensor aw_251_equation_0 = const()[name = tensor("aw_251_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_251_cast_fp16 = einsum(equation = aw_251_equation_0, values = (var_1812_cast_fp16_5, var_1790_cast_fp16_5))[name = tensor("aw_251_cast_fp16")]; tensor aw_253_equation_0 = const()[name = tensor("aw_253_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_253_cast_fp16 = einsum(equation = aw_253_equation_0, values = (var_1812_cast_fp16_6, var_1790_cast_fp16_6))[name = tensor("aw_253_cast_fp16")]; tensor aw_255_equation_0 = const()[name = tensor("aw_255_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_255_cast_fp16 = einsum(equation = aw_255_equation_0, values = (var_1812_cast_fp16_7, var_1790_cast_fp16_7))[name = tensor("aw_255_cast_fp16")]; tensor aw_257_equation_0 = const()[name = tensor("aw_257_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_257_cast_fp16 = einsum(equation = aw_257_equation_0, values = (var_1812_cast_fp16_8, var_1790_cast_fp16_8))[name = tensor("aw_257_cast_fp16")]; tensor aw_259_equation_0 = const()[name = tensor("aw_259_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_259_cast_fp16 = einsum(equation = aw_259_equation_0, values = (var_1812_cast_fp16_9, var_1790_cast_fp16_9))[name = tensor("aw_259_cast_fp16")]; tensor aw_261_equation_0 = const()[name = tensor("aw_261_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_261_cast_fp16 = einsum(equation = aw_261_equation_0, values = (var_1812_cast_fp16_10, var_1790_cast_fp16_10))[name = tensor("aw_261_cast_fp16")]; tensor aw_263_equation_0 = const()[name = tensor("aw_263_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_263_cast_fp16 = einsum(equation = aw_263_equation_0, values = (var_1812_cast_fp16_11, var_1790_cast_fp16_11))[name = tensor("aw_263_cast_fp16")]; tensor aw_265_equation_0 = const()[name = tensor("aw_265_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_265_cast_fp16 = einsum(equation = aw_265_equation_0, values = (var_1812_cast_fp16_12, var_1790_cast_fp16_12))[name = tensor("aw_265_cast_fp16")]; tensor aw_267_equation_0 = const()[name = tensor("aw_267_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_267_cast_fp16 = einsum(equation = aw_267_equation_0, values = (var_1812_cast_fp16_13, var_1790_cast_fp16_13))[name = tensor("aw_267_cast_fp16")]; tensor aw_269_equation_0 = const()[name = tensor("aw_269_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_269_cast_fp16 = einsum(equation = aw_269_equation_0, values = (var_1812_cast_fp16_14, var_1790_cast_fp16_14))[name = tensor("aw_269_cast_fp16")]; tensor aw_271_equation_0 = const()[name = tensor("aw_271_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_271_cast_fp16 = einsum(equation = aw_271_equation_0, values = (var_1812_cast_fp16_15, var_1790_cast_fp16_15))[name = tensor("aw_271_cast_fp16")]; tensor aw_273_equation_0 = const()[name = tensor("aw_273_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_273_cast_fp16 = einsum(equation = aw_273_equation_0, values = (var_1812_cast_fp16_16, var_1790_cast_fp16_16))[name = tensor("aw_273_cast_fp16")]; tensor aw_275_equation_0 = const()[name = tensor("aw_275_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_275_cast_fp16 = einsum(equation = aw_275_equation_0, values = (var_1812_cast_fp16_17, var_1790_cast_fp16_17))[name = tensor("aw_275_cast_fp16")]; tensor aw_277_equation_0 = const()[name = tensor("aw_277_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_277_cast_fp16 = einsum(equation = aw_277_equation_0, values = (var_1812_cast_fp16_18, var_1790_cast_fp16_18))[name = tensor("aw_277_cast_fp16")]; tensor aw_279_equation_0 = const()[name = tensor("aw_279_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_279_cast_fp16 = einsum(equation = aw_279_equation_0, values = (var_1812_cast_fp16_19, var_1790_cast_fp16_19))[name = tensor("aw_279_cast_fp16")]; tensor var_1894_cast_fp16 = softmax(axis = var_1738, x = aw_241_cast_fp16)[name = tensor("op_1894_cast_fp16")]; tensor var_1895_cast_fp16 = softmax(axis = var_1738, x = aw_243_cast_fp16)[name = tensor("op_1895_cast_fp16")]; tensor var_1896_cast_fp16 = softmax(axis = var_1738, x = aw_245_cast_fp16)[name = tensor("op_1896_cast_fp16")]; tensor var_1897_cast_fp16 = softmax(axis = var_1738, x = aw_247_cast_fp16)[name = tensor("op_1897_cast_fp16")]; tensor var_1898_cast_fp16 = softmax(axis = var_1738, x = aw_249_cast_fp16)[name = tensor("op_1898_cast_fp16")]; tensor var_1899_cast_fp16 = softmax(axis = var_1738, x = aw_251_cast_fp16)[name = tensor("op_1899_cast_fp16")]; tensor var_1900_cast_fp16 = softmax(axis = var_1738, x = aw_253_cast_fp16)[name = tensor("op_1900_cast_fp16")]; tensor var_1901_cast_fp16 = softmax(axis = var_1738, x = aw_255_cast_fp16)[name = tensor("op_1901_cast_fp16")]; tensor var_1902_cast_fp16 = softmax(axis = var_1738, x = aw_257_cast_fp16)[name = tensor("op_1902_cast_fp16")]; tensor var_1903_cast_fp16 = softmax(axis = var_1738, x = aw_259_cast_fp16)[name = tensor("op_1903_cast_fp16")]; tensor var_1904_cast_fp16 = softmax(axis = var_1738, x = aw_261_cast_fp16)[name = tensor("op_1904_cast_fp16")]; tensor var_1905_cast_fp16 = softmax(axis = var_1738, x = aw_263_cast_fp16)[name = tensor("op_1905_cast_fp16")]; tensor var_1906_cast_fp16 = softmax(axis = var_1738, x = aw_265_cast_fp16)[name = tensor("op_1906_cast_fp16")]; tensor var_1907_cast_fp16 = softmax(axis = var_1738, x = aw_267_cast_fp16)[name = tensor("op_1907_cast_fp16")]; tensor var_1908_cast_fp16 = softmax(axis = var_1738, x = aw_269_cast_fp16)[name = tensor("op_1908_cast_fp16")]; tensor var_1909_cast_fp16 = softmax(axis = var_1738, x = aw_271_cast_fp16)[name = tensor("op_1909_cast_fp16")]; tensor var_1910_cast_fp16 = softmax(axis = var_1738, x = aw_273_cast_fp16)[name = tensor("op_1910_cast_fp16")]; tensor var_1911_cast_fp16 = softmax(axis = var_1738, x = aw_275_cast_fp16)[name = tensor("op_1911_cast_fp16")]; tensor var_1912_cast_fp16 = softmax(axis = var_1738, x = aw_277_cast_fp16)[name = tensor("op_1912_cast_fp16")]; tensor var_1913_cast_fp16 = softmax(axis = var_1738, x = aw_279_cast_fp16)[name = tensor("op_1913_cast_fp16")]; tensor var_1915_equation_0 = const()[name = tensor("op_1915_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1915_cast_fp16 = einsum(equation = var_1915_equation_0, values = (var_1833_cast_fp16_0, var_1894_cast_fp16))[name = tensor("op_1915_cast_fp16")]; tensor var_1917_equation_0 = const()[name = tensor("op_1917_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1917_cast_fp16 = einsum(equation = var_1917_equation_0, values = (var_1833_cast_fp16_1, var_1895_cast_fp16))[name = tensor("op_1917_cast_fp16")]; tensor var_1919_equation_0 = const()[name = tensor("op_1919_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1919_cast_fp16 = einsum(equation = var_1919_equation_0, values = (var_1833_cast_fp16_2, var_1896_cast_fp16))[name = tensor("op_1919_cast_fp16")]; tensor var_1921_equation_0 = const()[name = tensor("op_1921_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1921_cast_fp16 = einsum(equation = var_1921_equation_0, values = (var_1833_cast_fp16_3, var_1897_cast_fp16))[name = tensor("op_1921_cast_fp16")]; tensor var_1923_equation_0 = const()[name = tensor("op_1923_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1923_cast_fp16 = einsum(equation = var_1923_equation_0, values = (var_1833_cast_fp16_4, var_1898_cast_fp16))[name = tensor("op_1923_cast_fp16")]; tensor var_1925_equation_0 = const()[name = tensor("op_1925_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1925_cast_fp16 = einsum(equation = var_1925_equation_0, values = (var_1833_cast_fp16_5, var_1899_cast_fp16))[name = tensor("op_1925_cast_fp16")]; tensor var_1927_equation_0 = const()[name = tensor("op_1927_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1927_cast_fp16 = einsum(equation = var_1927_equation_0, values = (var_1833_cast_fp16_6, var_1900_cast_fp16))[name = tensor("op_1927_cast_fp16")]; tensor var_1929_equation_0 = const()[name = tensor("op_1929_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1929_cast_fp16 = einsum(equation = var_1929_equation_0, values = (var_1833_cast_fp16_7, var_1901_cast_fp16))[name = tensor("op_1929_cast_fp16")]; tensor var_1931_equation_0 = const()[name = tensor("op_1931_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1931_cast_fp16 = einsum(equation = var_1931_equation_0, values = (var_1833_cast_fp16_8, var_1902_cast_fp16))[name = tensor("op_1931_cast_fp16")]; tensor var_1933_equation_0 = const()[name = tensor("op_1933_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1933_cast_fp16 = einsum(equation = var_1933_equation_0, values = (var_1833_cast_fp16_9, var_1903_cast_fp16))[name = tensor("op_1933_cast_fp16")]; tensor var_1935_equation_0 = const()[name = tensor("op_1935_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1935_cast_fp16 = einsum(equation = var_1935_equation_0, values = (var_1833_cast_fp16_10, var_1904_cast_fp16))[name = tensor("op_1935_cast_fp16")]; tensor var_1937_equation_0 = const()[name = tensor("op_1937_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1937_cast_fp16 = einsum(equation = var_1937_equation_0, values = (var_1833_cast_fp16_11, var_1905_cast_fp16))[name = tensor("op_1937_cast_fp16")]; tensor var_1939_equation_0 = const()[name = tensor("op_1939_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1939_cast_fp16 = einsum(equation = var_1939_equation_0, values = (var_1833_cast_fp16_12, var_1906_cast_fp16))[name = tensor("op_1939_cast_fp16")]; tensor var_1941_equation_0 = const()[name = tensor("op_1941_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1941_cast_fp16 = einsum(equation = var_1941_equation_0, values = (var_1833_cast_fp16_13, var_1907_cast_fp16))[name = tensor("op_1941_cast_fp16")]; tensor var_1943_equation_0 = const()[name = tensor("op_1943_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1943_cast_fp16 = einsum(equation = var_1943_equation_0, values = (var_1833_cast_fp16_14, var_1908_cast_fp16))[name = tensor("op_1943_cast_fp16")]; tensor var_1945_equation_0 = const()[name = tensor("op_1945_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1945_cast_fp16 = einsum(equation = var_1945_equation_0, values = (var_1833_cast_fp16_15, var_1909_cast_fp16))[name = tensor("op_1945_cast_fp16")]; tensor var_1947_equation_0 = const()[name = tensor("op_1947_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1947_cast_fp16 = einsum(equation = var_1947_equation_0, values = (var_1833_cast_fp16_16, var_1910_cast_fp16))[name = tensor("op_1947_cast_fp16")]; tensor var_1949_equation_0 = const()[name = tensor("op_1949_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1949_cast_fp16 = einsum(equation = var_1949_equation_0, values = (var_1833_cast_fp16_17, var_1911_cast_fp16))[name = tensor("op_1949_cast_fp16")]; tensor var_1951_equation_0 = const()[name = tensor("op_1951_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1951_cast_fp16 = einsum(equation = var_1951_equation_0, values = (var_1833_cast_fp16_18, var_1912_cast_fp16))[name = tensor("op_1951_cast_fp16")]; tensor var_1953_equation_0 = const()[name = tensor("op_1953_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1953_cast_fp16 = einsum(equation = var_1953_equation_0, values = (var_1833_cast_fp16_19, var_1913_cast_fp16))[name = tensor("op_1953_cast_fp16")]; tensor input_65_interleave_0 = const()[name = tensor("input_65_interleave_0"), val = tensor(false)]; tensor input_65_cast_fp16 = concat(axis = var_1738, interleave = input_65_interleave_0, values = (var_1915_cast_fp16, var_1917_cast_fp16, var_1919_cast_fp16, var_1921_cast_fp16, var_1923_cast_fp16, var_1925_cast_fp16, var_1927_cast_fp16, var_1929_cast_fp16, var_1931_cast_fp16, var_1933_cast_fp16, var_1935_cast_fp16, var_1937_cast_fp16, var_1939_cast_fp16, var_1941_cast_fp16, var_1943_cast_fp16, var_1945_cast_fp16, var_1947_cast_fp16, var_1949_cast_fp16, var_1951_cast_fp16, var_1953_cast_fp16))[name = tensor("input_65_cast_fp16")]; tensor var_1962_pad_type_0 = const()[name = tensor("op_1962_pad_type_0"), val = tensor("valid")]; tensor var_1962_strides_0 = const()[name = tensor("op_1962_strides_0"), val = tensor([1, 1])]; tensor var_1962_pad_0 = const()[name = tensor("op_1962_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1962_dilations_0 = const()[name = tensor("op_1962_dilations_0"), val = tensor([1, 1])]; tensor var_1962_groups_0 = const()[name = tensor("op_1962_groups_0"), val = tensor(1)]; tensor blocks_6_attn_out_weight_to_fp16 = const()[name = tensor("blocks_6_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(260619712)))]; tensor blocks_6_attn_out_bias_to_fp16 = const()[name = tensor("blocks_6_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263896576)))]; tensor var_1962_cast_fp16 = conv(bias = blocks_6_attn_out_bias_to_fp16, dilations = var_1962_dilations_0, groups = var_1962_groups_0, pad = var_1962_pad_0, pad_type = var_1962_pad_type_0, strides = var_1962_strides_0, weight = blocks_6_attn_out_weight_to_fp16, x = input_65_cast_fp16)[name = tensor("op_1962_cast_fp16")]; tensor inputs_27_cast_fp16 = add(x = inputs_25_cast_fp16, y = var_1962_cast_fp16)[name = tensor("inputs_27_cast_fp16")]; tensor input_67_axes_0 = const()[name = tensor("input_67_axes_0"), val = tensor([1])]; tensor input_67_gamma_0_to_fp16 = const()[name = tensor("input_67_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263899200)))]; tensor input_67_beta_0_to_fp16 = const()[name = tensor("input_67_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263901824)))]; tensor var_1972_to_fp16 = const()[name = tensor("op_1972_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_67_cast_fp16 = layer_norm(axes = input_67_axes_0, beta = input_67_beta_0_to_fp16, epsilon = var_1972_to_fp16, gamma = input_67_gamma_0_to_fp16, x = inputs_27_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor input_69_pad_type_0 = const()[name = tensor("input_69_pad_type_0"), val = tensor("valid")]; tensor input_69_strides_0 = const()[name = tensor("input_69_strides_0"), val = tensor([1, 1])]; tensor input_69_pad_0 = const()[name = tensor("input_69_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_69_dilations_0 = const()[name = tensor("input_69_dilations_0"), val = tensor([1, 1])]; tensor input_69_groups_0 = const()[name = tensor("input_69_groups_0"), val = tensor(1)]; tensor blocks_6_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_6_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263904448)))]; tensor blocks_6_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_6_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277011712)))]; tensor input_69_cast_fp16 = conv(bias = blocks_6_mlp_0_bias_to_fp16, dilations = input_69_dilations_0, groups = input_69_groups_0, pad = input_69_pad_0, pad_type = input_69_pad_type_0, strides = input_69_strides_0, weight = blocks_6_mlp_0_weight_to_fp16, x = input_67_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor input_71_mode_0 = const()[name = tensor("input_71_mode_0"), val = tensor("EXACT")]; tensor input_71_cast_fp16 = gelu(mode = input_71_mode_0, x = input_69_cast_fp16)[name = tensor("input_71_cast_fp16")]; tensor var_1998_pad_type_0 = const()[name = tensor("op_1998_pad_type_0"), val = tensor("valid")]; tensor var_1998_strides_0 = const()[name = tensor("op_1998_strides_0"), val = tensor([1, 1])]; tensor var_1998_pad_0 = const()[name = tensor("op_1998_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_1998_dilations_0 = const()[name = tensor("op_1998_dilations_0"), val = tensor([1, 1])]; tensor var_1998_groups_0 = const()[name = tensor("op_1998_groups_0"), val = tensor(1)]; tensor blocks_6_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_6_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277022016)))]; tensor blocks_6_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_6_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290129280)))]; tensor var_1998_cast_fp16 = conv(bias = blocks_6_mlp_2_bias_to_fp16, dilations = var_1998_dilations_0, groups = var_1998_groups_0, pad = var_1998_pad_0, pad_type = var_1998_pad_type_0, strides = var_1998_strides_0, weight = blocks_6_mlp_2_weight_to_fp16, x = input_71_cast_fp16)[name = tensor("op_1998_cast_fp16")]; tensor inputs_29_cast_fp16 = add(x = inputs_27_cast_fp16, y = var_1998_cast_fp16)[name = tensor("inputs_29_cast_fp16")]; tensor var_2007 = const()[name = tensor("op_2007"), val = tensor(1)]; tensor input_73_axes_0 = const()[name = tensor("input_73_axes_0"), val = tensor([1])]; tensor input_73_gamma_0_to_fp16 = const()[name = tensor("input_73_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290131904)))]; tensor input_73_beta_0_to_fp16 = const()[name = tensor("input_73_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290134528)))]; tensor var_2023_to_fp16 = const()[name = tensor("op_2023_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_73_cast_fp16 = layer_norm(axes = input_73_axes_0, beta = input_73_beta_0_to_fp16, epsilon = var_2023_to_fp16, gamma = input_73_gamma_0_to_fp16, x = inputs_29_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor q_15_pad_type_0 = const()[name = tensor("q_15_pad_type_0"), val = tensor("valid")]; tensor q_15_strides_0 = const()[name = tensor("q_15_strides_0"), val = tensor([1, 1])]; tensor q_15_pad_0 = const()[name = tensor("q_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_15_dilations_0 = const()[name = tensor("q_15_dilations_0"), val = tensor([1, 1])]; tensor q_15_groups_0 = const()[name = tensor("q_15_groups_0"), val = tensor(1)]; tensor var_2058_weight_0_to_fp16 = const()[name = tensor("op_2058_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290137152)))]; tensor var_2058_bias_0_to_fp16 = const()[name = tensor("op_2058_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293414016)))]; tensor var_2058_cast_fp16 = conv(bias = var_2058_bias_0_to_fp16, dilations = q_15_dilations_0, groups = q_15_groups_0, pad = q_15_pad_0, pad_type = q_15_pad_type_0, strides = q_15_strides_0, weight = var_2058_weight_0_to_fp16, x = input_73_cast_fp16)[name = tensor("op_2058_cast_fp16")]; tensor k_15_pad_type_0 = const()[name = tensor("k_15_pad_type_0"), val = tensor("valid")]; tensor k_15_strides_0 = const()[name = tensor("k_15_strides_0"), val = tensor([1, 1])]; tensor k_15_pad_0 = const()[name = tensor("k_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_15_dilations_0 = const()[name = tensor("k_15_dilations_0"), val = tensor([1, 1])]; tensor k_15_groups_0 = const()[name = tensor("k_15_groups_0"), val = tensor(1)]; tensor blocks_7_attn_key_weight_to_fp16 = const()[name = tensor("blocks_7_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293416640)))]; tensor k_15_cast_fp16 = conv(dilations = k_15_dilations_0, groups = k_15_groups_0, pad = k_15_pad_0, pad_type = k_15_pad_type_0, strides = k_15_strides_0, weight = blocks_7_attn_key_weight_to_fp16, x = input_73_cast_fp16)[name = tensor("k_15_cast_fp16")]; tensor var_2056_pad_type_0 = const()[name = tensor("op_2056_pad_type_0"), val = tensor("valid")]; tensor var_2056_strides_0 = const()[name = tensor("op_2056_strides_0"), val = tensor([1, 1])]; tensor var_2056_pad_0 = const()[name = tensor("op_2056_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2056_dilations_0 = const()[name = tensor("op_2056_dilations_0"), val = tensor([1, 1])]; tensor var_2056_groups_0 = const()[name = tensor("op_2056_groups_0"), val = tensor(1)]; tensor blocks_7_attn_value_weight_to_fp16 = const()[name = tensor("blocks_7_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296693504)))]; tensor blocks_7_attn_value_bias_to_fp16 = const()[name = tensor("blocks_7_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299970368)))]; tensor var_2056_cast_fp16 = conv(bias = blocks_7_attn_value_bias_to_fp16, dilations = var_2056_dilations_0, groups = var_2056_groups_0, pad = var_2056_pad_0, pad_type = var_2056_pad_type_0, strides = var_2056_strides_0, weight = blocks_7_attn_value_weight_to_fp16, x = input_73_cast_fp16)[name = tensor("op_2056_cast_fp16")]; tensor tile_21 = const()[name = tensor("tile_21"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2059_axis_0 = const()[name = tensor("op_2059_axis_0"), val = tensor(1)]; tensor var_2059_cast_fp16_0, tensor var_2059_cast_fp16_1, tensor var_2059_cast_fp16_2, tensor var_2059_cast_fp16_3, tensor var_2059_cast_fp16_4, tensor var_2059_cast_fp16_5, tensor var_2059_cast_fp16_6, tensor var_2059_cast_fp16_7, tensor var_2059_cast_fp16_8, tensor var_2059_cast_fp16_9, tensor var_2059_cast_fp16_10, tensor var_2059_cast_fp16_11, tensor var_2059_cast_fp16_12, tensor var_2059_cast_fp16_13, tensor var_2059_cast_fp16_14, tensor var_2059_cast_fp16_15, tensor var_2059_cast_fp16_16, tensor var_2059_cast_fp16_17, tensor var_2059_cast_fp16_18, tensor var_2059_cast_fp16_19 = split(axis = var_2059_axis_0, split_sizes = tile_21, x = var_2058_cast_fp16)[name = tensor("op_2059_cast_fp16")]; tensor var_2080_perm_0 = const()[name = tensor("op_2080_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_22 = const()[name = tensor("tile_22"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2081_axis_0 = const()[name = tensor("op_2081_axis_0"), val = tensor(3)]; tensor var_2080_cast_fp16 = transpose(perm = var_2080_perm_0, x = k_15_cast_fp16)[name = tensor("transpose_25")]; tensor var_2081_cast_fp16_0, tensor var_2081_cast_fp16_1, tensor var_2081_cast_fp16_2, tensor var_2081_cast_fp16_3, tensor var_2081_cast_fp16_4, tensor var_2081_cast_fp16_5, tensor var_2081_cast_fp16_6, tensor var_2081_cast_fp16_7, tensor var_2081_cast_fp16_8, tensor var_2081_cast_fp16_9, tensor var_2081_cast_fp16_10, tensor var_2081_cast_fp16_11, tensor var_2081_cast_fp16_12, tensor var_2081_cast_fp16_13, tensor var_2081_cast_fp16_14, tensor var_2081_cast_fp16_15, tensor var_2081_cast_fp16_16, tensor var_2081_cast_fp16_17, tensor var_2081_cast_fp16_18, tensor var_2081_cast_fp16_19 = split(axis = var_2081_axis_0, split_sizes = tile_22, x = var_2080_cast_fp16)[name = tensor("op_2081_cast_fp16")]; tensor tile_23 = const()[name = tensor("tile_23"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2102_axis_0 = const()[name = tensor("op_2102_axis_0"), val = tensor(1)]; tensor var_2102_cast_fp16_0, tensor var_2102_cast_fp16_1, tensor var_2102_cast_fp16_2, tensor var_2102_cast_fp16_3, tensor var_2102_cast_fp16_4, tensor var_2102_cast_fp16_5, tensor var_2102_cast_fp16_6, tensor var_2102_cast_fp16_7, tensor var_2102_cast_fp16_8, tensor var_2102_cast_fp16_9, tensor var_2102_cast_fp16_10, tensor var_2102_cast_fp16_11, tensor var_2102_cast_fp16_12, tensor var_2102_cast_fp16_13, tensor var_2102_cast_fp16_14, tensor var_2102_cast_fp16_15, tensor var_2102_cast_fp16_16, tensor var_2102_cast_fp16_17, tensor var_2102_cast_fp16_18, tensor var_2102_cast_fp16_19 = split(axis = var_2102_axis_0, split_sizes = tile_23, x = var_2056_cast_fp16)[name = tensor("op_2102_cast_fp16")]; tensor aw_281_equation_0 = const()[name = tensor("aw_281_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_281_cast_fp16 = einsum(equation = aw_281_equation_0, values = (var_2081_cast_fp16_0, var_2059_cast_fp16_0))[name = tensor("aw_281_cast_fp16")]; tensor aw_283_equation_0 = const()[name = tensor("aw_283_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_283_cast_fp16 = einsum(equation = aw_283_equation_0, values = (var_2081_cast_fp16_1, var_2059_cast_fp16_1))[name = tensor("aw_283_cast_fp16")]; tensor aw_285_equation_0 = const()[name = tensor("aw_285_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_285_cast_fp16 = einsum(equation = aw_285_equation_0, values = (var_2081_cast_fp16_2, var_2059_cast_fp16_2))[name = tensor("aw_285_cast_fp16")]; tensor aw_287_equation_0 = const()[name = tensor("aw_287_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_287_cast_fp16 = einsum(equation = aw_287_equation_0, values = (var_2081_cast_fp16_3, var_2059_cast_fp16_3))[name = tensor("aw_287_cast_fp16")]; tensor aw_289_equation_0 = const()[name = tensor("aw_289_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_289_cast_fp16 = einsum(equation = aw_289_equation_0, values = (var_2081_cast_fp16_4, var_2059_cast_fp16_4))[name = tensor("aw_289_cast_fp16")]; tensor aw_291_equation_0 = const()[name = tensor("aw_291_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_291_cast_fp16 = einsum(equation = aw_291_equation_0, values = (var_2081_cast_fp16_5, var_2059_cast_fp16_5))[name = tensor("aw_291_cast_fp16")]; tensor aw_293_equation_0 = const()[name = tensor("aw_293_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_293_cast_fp16 = einsum(equation = aw_293_equation_0, values = (var_2081_cast_fp16_6, var_2059_cast_fp16_6))[name = tensor("aw_293_cast_fp16")]; tensor aw_295_equation_0 = const()[name = tensor("aw_295_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_295_cast_fp16 = einsum(equation = aw_295_equation_0, values = (var_2081_cast_fp16_7, var_2059_cast_fp16_7))[name = tensor("aw_295_cast_fp16")]; tensor aw_297_equation_0 = const()[name = tensor("aw_297_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_297_cast_fp16 = einsum(equation = aw_297_equation_0, values = (var_2081_cast_fp16_8, var_2059_cast_fp16_8))[name = tensor("aw_297_cast_fp16")]; tensor aw_299_equation_0 = const()[name = tensor("aw_299_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_299_cast_fp16 = einsum(equation = aw_299_equation_0, values = (var_2081_cast_fp16_9, var_2059_cast_fp16_9))[name = tensor("aw_299_cast_fp16")]; tensor aw_301_equation_0 = const()[name = tensor("aw_301_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_301_cast_fp16 = einsum(equation = aw_301_equation_0, values = (var_2081_cast_fp16_10, var_2059_cast_fp16_10))[name = tensor("aw_301_cast_fp16")]; tensor aw_303_equation_0 = const()[name = tensor("aw_303_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_303_cast_fp16 = einsum(equation = aw_303_equation_0, values = (var_2081_cast_fp16_11, var_2059_cast_fp16_11))[name = tensor("aw_303_cast_fp16")]; tensor aw_305_equation_0 = const()[name = tensor("aw_305_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_305_cast_fp16 = einsum(equation = aw_305_equation_0, values = (var_2081_cast_fp16_12, var_2059_cast_fp16_12))[name = tensor("aw_305_cast_fp16")]; tensor aw_307_equation_0 = const()[name = tensor("aw_307_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_307_cast_fp16 = einsum(equation = aw_307_equation_0, values = (var_2081_cast_fp16_13, var_2059_cast_fp16_13))[name = tensor("aw_307_cast_fp16")]; tensor aw_309_equation_0 = const()[name = tensor("aw_309_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_309_cast_fp16 = einsum(equation = aw_309_equation_0, values = (var_2081_cast_fp16_14, var_2059_cast_fp16_14))[name = tensor("aw_309_cast_fp16")]; tensor aw_311_equation_0 = const()[name = tensor("aw_311_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_311_cast_fp16 = einsum(equation = aw_311_equation_0, values = (var_2081_cast_fp16_15, var_2059_cast_fp16_15))[name = tensor("aw_311_cast_fp16")]; tensor aw_313_equation_0 = const()[name = tensor("aw_313_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_313_cast_fp16 = einsum(equation = aw_313_equation_0, values = (var_2081_cast_fp16_16, var_2059_cast_fp16_16))[name = tensor("aw_313_cast_fp16")]; tensor aw_315_equation_0 = const()[name = tensor("aw_315_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_315_cast_fp16 = einsum(equation = aw_315_equation_0, values = (var_2081_cast_fp16_17, var_2059_cast_fp16_17))[name = tensor("aw_315_cast_fp16")]; tensor aw_317_equation_0 = const()[name = tensor("aw_317_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_317_cast_fp16 = einsum(equation = aw_317_equation_0, values = (var_2081_cast_fp16_18, var_2059_cast_fp16_18))[name = tensor("aw_317_cast_fp16")]; tensor aw_319_equation_0 = const()[name = tensor("aw_319_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_319_cast_fp16 = einsum(equation = aw_319_equation_0, values = (var_2081_cast_fp16_19, var_2059_cast_fp16_19))[name = tensor("aw_319_cast_fp16")]; tensor var_2163_cast_fp16 = softmax(axis = var_2007, x = aw_281_cast_fp16)[name = tensor("op_2163_cast_fp16")]; tensor var_2164_cast_fp16 = softmax(axis = var_2007, x = aw_283_cast_fp16)[name = tensor("op_2164_cast_fp16")]; tensor var_2165_cast_fp16 = softmax(axis = var_2007, x = aw_285_cast_fp16)[name = tensor("op_2165_cast_fp16")]; tensor var_2166_cast_fp16 = softmax(axis = var_2007, x = aw_287_cast_fp16)[name = tensor("op_2166_cast_fp16")]; tensor var_2167_cast_fp16 = softmax(axis = var_2007, x = aw_289_cast_fp16)[name = tensor("op_2167_cast_fp16")]; tensor var_2168_cast_fp16 = softmax(axis = var_2007, x = aw_291_cast_fp16)[name = tensor("op_2168_cast_fp16")]; tensor var_2169_cast_fp16 = softmax(axis = var_2007, x = aw_293_cast_fp16)[name = tensor("op_2169_cast_fp16")]; tensor var_2170_cast_fp16 = softmax(axis = var_2007, x = aw_295_cast_fp16)[name = tensor("op_2170_cast_fp16")]; tensor var_2171_cast_fp16 = softmax(axis = var_2007, x = aw_297_cast_fp16)[name = tensor("op_2171_cast_fp16")]; tensor var_2172_cast_fp16 = softmax(axis = var_2007, x = aw_299_cast_fp16)[name = tensor("op_2172_cast_fp16")]; tensor var_2173_cast_fp16 = softmax(axis = var_2007, x = aw_301_cast_fp16)[name = tensor("op_2173_cast_fp16")]; tensor var_2174_cast_fp16 = softmax(axis = var_2007, x = aw_303_cast_fp16)[name = tensor("op_2174_cast_fp16")]; tensor var_2175_cast_fp16 = softmax(axis = var_2007, x = aw_305_cast_fp16)[name = tensor("op_2175_cast_fp16")]; tensor var_2176_cast_fp16 = softmax(axis = var_2007, x = aw_307_cast_fp16)[name = tensor("op_2176_cast_fp16")]; tensor var_2177_cast_fp16 = softmax(axis = var_2007, x = aw_309_cast_fp16)[name = tensor("op_2177_cast_fp16")]; tensor var_2178_cast_fp16 = softmax(axis = var_2007, x = aw_311_cast_fp16)[name = tensor("op_2178_cast_fp16")]; tensor var_2179_cast_fp16 = softmax(axis = var_2007, x = aw_313_cast_fp16)[name = tensor("op_2179_cast_fp16")]; tensor var_2180_cast_fp16 = softmax(axis = var_2007, x = aw_315_cast_fp16)[name = tensor("op_2180_cast_fp16")]; tensor var_2181_cast_fp16 = softmax(axis = var_2007, x = aw_317_cast_fp16)[name = tensor("op_2181_cast_fp16")]; tensor var_2182_cast_fp16 = softmax(axis = var_2007, x = aw_319_cast_fp16)[name = tensor("op_2182_cast_fp16")]; tensor var_2184_equation_0 = const()[name = tensor("op_2184_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2184_cast_fp16 = einsum(equation = var_2184_equation_0, values = (var_2102_cast_fp16_0, var_2163_cast_fp16))[name = tensor("op_2184_cast_fp16")]; tensor var_2186_equation_0 = const()[name = tensor("op_2186_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2186_cast_fp16 = einsum(equation = var_2186_equation_0, values = (var_2102_cast_fp16_1, var_2164_cast_fp16))[name = tensor("op_2186_cast_fp16")]; tensor var_2188_equation_0 = const()[name = tensor("op_2188_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2188_cast_fp16 = einsum(equation = var_2188_equation_0, values = (var_2102_cast_fp16_2, var_2165_cast_fp16))[name = tensor("op_2188_cast_fp16")]; tensor var_2190_equation_0 = const()[name = tensor("op_2190_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2190_cast_fp16 = einsum(equation = var_2190_equation_0, values = (var_2102_cast_fp16_3, var_2166_cast_fp16))[name = tensor("op_2190_cast_fp16")]; tensor var_2192_equation_0 = const()[name = tensor("op_2192_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2192_cast_fp16 = einsum(equation = var_2192_equation_0, values = (var_2102_cast_fp16_4, var_2167_cast_fp16))[name = tensor("op_2192_cast_fp16")]; tensor var_2194_equation_0 = const()[name = tensor("op_2194_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2194_cast_fp16 = einsum(equation = var_2194_equation_0, values = (var_2102_cast_fp16_5, var_2168_cast_fp16))[name = tensor("op_2194_cast_fp16")]; tensor var_2196_equation_0 = const()[name = tensor("op_2196_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2196_cast_fp16 = einsum(equation = var_2196_equation_0, values = (var_2102_cast_fp16_6, var_2169_cast_fp16))[name = tensor("op_2196_cast_fp16")]; tensor var_2198_equation_0 = const()[name = tensor("op_2198_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2198_cast_fp16 = einsum(equation = var_2198_equation_0, values = (var_2102_cast_fp16_7, var_2170_cast_fp16))[name = tensor("op_2198_cast_fp16")]; tensor var_2200_equation_0 = const()[name = tensor("op_2200_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2200_cast_fp16 = einsum(equation = var_2200_equation_0, values = (var_2102_cast_fp16_8, var_2171_cast_fp16))[name = tensor("op_2200_cast_fp16")]; tensor var_2202_equation_0 = const()[name = tensor("op_2202_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2202_cast_fp16 = einsum(equation = var_2202_equation_0, values = (var_2102_cast_fp16_9, var_2172_cast_fp16))[name = tensor("op_2202_cast_fp16")]; tensor var_2204_equation_0 = const()[name = tensor("op_2204_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2204_cast_fp16 = einsum(equation = var_2204_equation_0, values = (var_2102_cast_fp16_10, var_2173_cast_fp16))[name = tensor("op_2204_cast_fp16")]; tensor var_2206_equation_0 = const()[name = tensor("op_2206_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2206_cast_fp16 = einsum(equation = var_2206_equation_0, values = (var_2102_cast_fp16_11, var_2174_cast_fp16))[name = tensor("op_2206_cast_fp16")]; tensor var_2208_equation_0 = const()[name = tensor("op_2208_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2208_cast_fp16 = einsum(equation = var_2208_equation_0, values = (var_2102_cast_fp16_12, var_2175_cast_fp16))[name = tensor("op_2208_cast_fp16")]; tensor var_2210_equation_0 = const()[name = tensor("op_2210_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2210_cast_fp16 = einsum(equation = var_2210_equation_0, values = (var_2102_cast_fp16_13, var_2176_cast_fp16))[name = tensor("op_2210_cast_fp16")]; tensor var_2212_equation_0 = const()[name = tensor("op_2212_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2212_cast_fp16 = einsum(equation = var_2212_equation_0, values = (var_2102_cast_fp16_14, var_2177_cast_fp16))[name = tensor("op_2212_cast_fp16")]; tensor var_2214_equation_0 = const()[name = tensor("op_2214_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2214_cast_fp16 = einsum(equation = var_2214_equation_0, values = (var_2102_cast_fp16_15, var_2178_cast_fp16))[name = tensor("op_2214_cast_fp16")]; tensor var_2216_equation_0 = const()[name = tensor("op_2216_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2216_cast_fp16 = einsum(equation = var_2216_equation_0, values = (var_2102_cast_fp16_16, var_2179_cast_fp16))[name = tensor("op_2216_cast_fp16")]; tensor var_2218_equation_0 = const()[name = tensor("op_2218_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2218_cast_fp16 = einsum(equation = var_2218_equation_0, values = (var_2102_cast_fp16_17, var_2180_cast_fp16))[name = tensor("op_2218_cast_fp16")]; tensor var_2220_equation_0 = const()[name = tensor("op_2220_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2220_cast_fp16 = einsum(equation = var_2220_equation_0, values = (var_2102_cast_fp16_18, var_2181_cast_fp16))[name = tensor("op_2220_cast_fp16")]; tensor var_2222_equation_0 = const()[name = tensor("op_2222_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2222_cast_fp16 = einsum(equation = var_2222_equation_0, values = (var_2102_cast_fp16_19, var_2182_cast_fp16))[name = tensor("op_2222_cast_fp16")]; tensor input_75_interleave_0 = const()[name = tensor("input_75_interleave_0"), val = tensor(false)]; tensor input_75_cast_fp16 = concat(axis = var_2007, interleave = input_75_interleave_0, values = (var_2184_cast_fp16, var_2186_cast_fp16, var_2188_cast_fp16, var_2190_cast_fp16, var_2192_cast_fp16, var_2194_cast_fp16, var_2196_cast_fp16, var_2198_cast_fp16, var_2200_cast_fp16, var_2202_cast_fp16, var_2204_cast_fp16, var_2206_cast_fp16, var_2208_cast_fp16, var_2210_cast_fp16, var_2212_cast_fp16, var_2214_cast_fp16, var_2216_cast_fp16, var_2218_cast_fp16, var_2220_cast_fp16, var_2222_cast_fp16))[name = tensor("input_75_cast_fp16")]; tensor var_2231_pad_type_0 = const()[name = tensor("op_2231_pad_type_0"), val = tensor("valid")]; tensor var_2231_strides_0 = const()[name = tensor("op_2231_strides_0"), val = tensor([1, 1])]; tensor var_2231_pad_0 = const()[name = tensor("op_2231_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2231_dilations_0 = const()[name = tensor("op_2231_dilations_0"), val = tensor([1, 1])]; tensor var_2231_groups_0 = const()[name = tensor("op_2231_groups_0"), val = tensor(1)]; tensor blocks_7_attn_out_weight_to_fp16 = const()[name = tensor("blocks_7_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299972992)))]; tensor blocks_7_attn_out_bias_to_fp16 = const()[name = tensor("blocks_7_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303249856)))]; tensor var_2231_cast_fp16 = conv(bias = blocks_7_attn_out_bias_to_fp16, dilations = var_2231_dilations_0, groups = var_2231_groups_0, pad = var_2231_pad_0, pad_type = var_2231_pad_type_0, strides = var_2231_strides_0, weight = blocks_7_attn_out_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("op_2231_cast_fp16")]; tensor inputs_31_cast_fp16 = add(x = inputs_29_cast_fp16, y = var_2231_cast_fp16)[name = tensor("inputs_31_cast_fp16")]; tensor input_77_axes_0 = const()[name = tensor("input_77_axes_0"), val = tensor([1])]; tensor input_77_gamma_0_to_fp16 = const()[name = tensor("input_77_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303252480)))]; tensor input_77_beta_0_to_fp16 = const()[name = tensor("input_77_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303255104)))]; tensor var_2241_to_fp16 = const()[name = tensor("op_2241_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_77_cast_fp16 = layer_norm(axes = input_77_axes_0, beta = input_77_beta_0_to_fp16, epsilon = var_2241_to_fp16, gamma = input_77_gamma_0_to_fp16, x = inputs_31_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor input_79_pad_type_0 = const()[name = tensor("input_79_pad_type_0"), val = tensor("valid")]; tensor input_79_strides_0 = const()[name = tensor("input_79_strides_0"), val = tensor([1, 1])]; tensor input_79_pad_0 = const()[name = tensor("input_79_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_79_dilations_0 = const()[name = tensor("input_79_dilations_0"), val = tensor([1, 1])]; tensor input_79_groups_0 = const()[name = tensor("input_79_groups_0"), val = tensor(1)]; tensor blocks_7_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_7_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303257728)))]; tensor blocks_7_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_7_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316364992)))]; tensor input_79_cast_fp16 = conv(bias = blocks_7_mlp_0_bias_to_fp16, dilations = input_79_dilations_0, groups = input_79_groups_0, pad = input_79_pad_0, pad_type = input_79_pad_type_0, strides = input_79_strides_0, weight = blocks_7_mlp_0_weight_to_fp16, x = input_77_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor input_81_mode_0 = const()[name = tensor("input_81_mode_0"), val = tensor("EXACT")]; tensor input_81_cast_fp16 = gelu(mode = input_81_mode_0, x = input_79_cast_fp16)[name = tensor("input_81_cast_fp16")]; tensor var_2267_pad_type_0 = const()[name = tensor("op_2267_pad_type_0"), val = tensor("valid")]; tensor var_2267_strides_0 = const()[name = tensor("op_2267_strides_0"), val = tensor([1, 1])]; tensor var_2267_pad_0 = const()[name = tensor("op_2267_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2267_dilations_0 = const()[name = tensor("op_2267_dilations_0"), val = tensor([1, 1])]; tensor var_2267_groups_0 = const()[name = tensor("op_2267_groups_0"), val = tensor(1)]; tensor blocks_7_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_7_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316375296)))]; tensor blocks_7_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_7_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329482560)))]; tensor var_2267_cast_fp16 = conv(bias = blocks_7_mlp_2_bias_to_fp16, dilations = var_2267_dilations_0, groups = var_2267_groups_0, pad = var_2267_pad_0, pad_type = var_2267_pad_type_0, strides = var_2267_strides_0, weight = blocks_7_mlp_2_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("op_2267_cast_fp16")]; tensor inputs_33_cast_fp16 = add(x = inputs_31_cast_fp16, y = var_2267_cast_fp16)[name = tensor("inputs_33_cast_fp16")]; tensor var_2276 = const()[name = tensor("op_2276"), val = tensor(1)]; tensor input_83_axes_0 = const()[name = tensor("input_83_axes_0"), val = tensor([1])]; tensor input_83_gamma_0_to_fp16 = const()[name = tensor("input_83_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329485184)))]; tensor input_83_beta_0_to_fp16 = const()[name = tensor("input_83_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329487808)))]; tensor var_2292_to_fp16 = const()[name = tensor("op_2292_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_83_cast_fp16 = layer_norm(axes = input_83_axes_0, beta = input_83_beta_0_to_fp16, epsilon = var_2292_to_fp16, gamma = input_83_gamma_0_to_fp16, x = inputs_33_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor q_17_pad_type_0 = const()[name = tensor("q_17_pad_type_0"), val = tensor("valid")]; tensor q_17_strides_0 = const()[name = tensor("q_17_strides_0"), val = tensor([1, 1])]; tensor q_17_pad_0 = const()[name = tensor("q_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_17_dilations_0 = const()[name = tensor("q_17_dilations_0"), val = tensor([1, 1])]; tensor q_17_groups_0 = const()[name = tensor("q_17_groups_0"), val = tensor(1)]; tensor var_2327_weight_0_to_fp16 = const()[name = tensor("op_2327_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329490432)))]; tensor var_2327_bias_0_to_fp16 = const()[name = tensor("op_2327_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332767296)))]; tensor var_2327_cast_fp16 = conv(bias = var_2327_bias_0_to_fp16, dilations = q_17_dilations_0, groups = q_17_groups_0, pad = q_17_pad_0, pad_type = q_17_pad_type_0, strides = q_17_strides_0, weight = var_2327_weight_0_to_fp16, x = input_83_cast_fp16)[name = tensor("op_2327_cast_fp16")]; tensor k_17_pad_type_0 = const()[name = tensor("k_17_pad_type_0"), val = tensor("valid")]; tensor k_17_strides_0 = const()[name = tensor("k_17_strides_0"), val = tensor([1, 1])]; tensor k_17_pad_0 = const()[name = tensor("k_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_17_dilations_0 = const()[name = tensor("k_17_dilations_0"), val = tensor([1, 1])]; tensor k_17_groups_0 = const()[name = tensor("k_17_groups_0"), val = tensor(1)]; tensor blocks_8_attn_key_weight_to_fp16 = const()[name = tensor("blocks_8_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(332769920)))]; tensor k_17_cast_fp16 = conv(dilations = k_17_dilations_0, groups = k_17_groups_0, pad = k_17_pad_0, pad_type = k_17_pad_type_0, strides = k_17_strides_0, weight = blocks_8_attn_key_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("k_17_cast_fp16")]; tensor var_2325_pad_type_0 = const()[name = tensor("op_2325_pad_type_0"), val = tensor("valid")]; tensor var_2325_strides_0 = const()[name = tensor("op_2325_strides_0"), val = tensor([1, 1])]; tensor var_2325_pad_0 = const()[name = tensor("op_2325_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2325_dilations_0 = const()[name = tensor("op_2325_dilations_0"), val = tensor([1, 1])]; tensor var_2325_groups_0 = const()[name = tensor("op_2325_groups_0"), val = tensor(1)]; tensor blocks_8_attn_value_weight_to_fp16 = const()[name = tensor("blocks_8_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336046784)))]; tensor blocks_8_attn_value_bias_to_fp16 = const()[name = tensor("blocks_8_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339323648)))]; tensor var_2325_cast_fp16 = conv(bias = blocks_8_attn_value_bias_to_fp16, dilations = var_2325_dilations_0, groups = var_2325_groups_0, pad = var_2325_pad_0, pad_type = var_2325_pad_type_0, strides = var_2325_strides_0, weight = blocks_8_attn_value_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("op_2325_cast_fp16")]; tensor tile_24 = const()[name = tensor("tile_24"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2328_axis_0 = const()[name = tensor("op_2328_axis_0"), val = tensor(1)]; tensor var_2328_cast_fp16_0, tensor var_2328_cast_fp16_1, tensor var_2328_cast_fp16_2, tensor var_2328_cast_fp16_3, tensor var_2328_cast_fp16_4, tensor var_2328_cast_fp16_5, tensor var_2328_cast_fp16_6, tensor var_2328_cast_fp16_7, tensor var_2328_cast_fp16_8, tensor var_2328_cast_fp16_9, tensor var_2328_cast_fp16_10, tensor var_2328_cast_fp16_11, tensor var_2328_cast_fp16_12, tensor var_2328_cast_fp16_13, tensor var_2328_cast_fp16_14, tensor var_2328_cast_fp16_15, tensor var_2328_cast_fp16_16, tensor var_2328_cast_fp16_17, tensor var_2328_cast_fp16_18, tensor var_2328_cast_fp16_19 = split(axis = var_2328_axis_0, split_sizes = tile_24, x = var_2327_cast_fp16)[name = tensor("op_2328_cast_fp16")]; tensor var_2349_perm_0 = const()[name = tensor("op_2349_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_25 = const()[name = tensor("tile_25"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2350_axis_0 = const()[name = tensor("op_2350_axis_0"), val = tensor(3)]; tensor var_2349_cast_fp16 = transpose(perm = var_2349_perm_0, x = k_17_cast_fp16)[name = tensor("transpose_24")]; tensor var_2350_cast_fp16_0, tensor var_2350_cast_fp16_1, tensor var_2350_cast_fp16_2, tensor var_2350_cast_fp16_3, tensor var_2350_cast_fp16_4, tensor var_2350_cast_fp16_5, tensor var_2350_cast_fp16_6, tensor var_2350_cast_fp16_7, tensor var_2350_cast_fp16_8, tensor var_2350_cast_fp16_9, tensor var_2350_cast_fp16_10, tensor var_2350_cast_fp16_11, tensor var_2350_cast_fp16_12, tensor var_2350_cast_fp16_13, tensor var_2350_cast_fp16_14, tensor var_2350_cast_fp16_15, tensor var_2350_cast_fp16_16, tensor var_2350_cast_fp16_17, tensor var_2350_cast_fp16_18, tensor var_2350_cast_fp16_19 = split(axis = var_2350_axis_0, split_sizes = tile_25, x = var_2349_cast_fp16)[name = tensor("op_2350_cast_fp16")]; tensor tile_26 = const()[name = tensor("tile_26"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2371_axis_0 = const()[name = tensor("op_2371_axis_0"), val = tensor(1)]; tensor var_2371_cast_fp16_0, tensor var_2371_cast_fp16_1, tensor var_2371_cast_fp16_2, tensor var_2371_cast_fp16_3, tensor var_2371_cast_fp16_4, tensor var_2371_cast_fp16_5, tensor var_2371_cast_fp16_6, tensor var_2371_cast_fp16_7, tensor var_2371_cast_fp16_8, tensor var_2371_cast_fp16_9, tensor var_2371_cast_fp16_10, tensor var_2371_cast_fp16_11, tensor var_2371_cast_fp16_12, tensor var_2371_cast_fp16_13, tensor var_2371_cast_fp16_14, tensor var_2371_cast_fp16_15, tensor var_2371_cast_fp16_16, tensor var_2371_cast_fp16_17, tensor var_2371_cast_fp16_18, tensor var_2371_cast_fp16_19 = split(axis = var_2371_axis_0, split_sizes = tile_26, x = var_2325_cast_fp16)[name = tensor("op_2371_cast_fp16")]; tensor aw_321_equation_0 = const()[name = tensor("aw_321_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_321_cast_fp16 = einsum(equation = aw_321_equation_0, values = (var_2350_cast_fp16_0, var_2328_cast_fp16_0))[name = tensor("aw_321_cast_fp16")]; tensor aw_323_equation_0 = const()[name = tensor("aw_323_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_323_cast_fp16 = einsum(equation = aw_323_equation_0, values = (var_2350_cast_fp16_1, var_2328_cast_fp16_1))[name = tensor("aw_323_cast_fp16")]; tensor aw_325_equation_0 = const()[name = tensor("aw_325_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_325_cast_fp16 = einsum(equation = aw_325_equation_0, values = (var_2350_cast_fp16_2, var_2328_cast_fp16_2))[name = tensor("aw_325_cast_fp16")]; tensor aw_327_equation_0 = const()[name = tensor("aw_327_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_327_cast_fp16 = einsum(equation = aw_327_equation_0, values = (var_2350_cast_fp16_3, var_2328_cast_fp16_3))[name = tensor("aw_327_cast_fp16")]; tensor aw_329_equation_0 = const()[name = tensor("aw_329_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_329_cast_fp16 = einsum(equation = aw_329_equation_0, values = (var_2350_cast_fp16_4, var_2328_cast_fp16_4))[name = tensor("aw_329_cast_fp16")]; tensor aw_331_equation_0 = const()[name = tensor("aw_331_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_331_cast_fp16 = einsum(equation = aw_331_equation_0, values = (var_2350_cast_fp16_5, var_2328_cast_fp16_5))[name = tensor("aw_331_cast_fp16")]; tensor aw_333_equation_0 = const()[name = tensor("aw_333_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_333_cast_fp16 = einsum(equation = aw_333_equation_0, values = (var_2350_cast_fp16_6, var_2328_cast_fp16_6))[name = tensor("aw_333_cast_fp16")]; tensor aw_335_equation_0 = const()[name = tensor("aw_335_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_335_cast_fp16 = einsum(equation = aw_335_equation_0, values = (var_2350_cast_fp16_7, var_2328_cast_fp16_7))[name = tensor("aw_335_cast_fp16")]; tensor aw_337_equation_0 = const()[name = tensor("aw_337_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_337_cast_fp16 = einsum(equation = aw_337_equation_0, values = (var_2350_cast_fp16_8, var_2328_cast_fp16_8))[name = tensor("aw_337_cast_fp16")]; tensor aw_339_equation_0 = const()[name = tensor("aw_339_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_339_cast_fp16 = einsum(equation = aw_339_equation_0, values = (var_2350_cast_fp16_9, var_2328_cast_fp16_9))[name = tensor("aw_339_cast_fp16")]; tensor aw_341_equation_0 = const()[name = tensor("aw_341_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_341_cast_fp16 = einsum(equation = aw_341_equation_0, values = (var_2350_cast_fp16_10, var_2328_cast_fp16_10))[name = tensor("aw_341_cast_fp16")]; tensor aw_343_equation_0 = const()[name = tensor("aw_343_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_343_cast_fp16 = einsum(equation = aw_343_equation_0, values = (var_2350_cast_fp16_11, var_2328_cast_fp16_11))[name = tensor("aw_343_cast_fp16")]; tensor aw_345_equation_0 = const()[name = tensor("aw_345_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_345_cast_fp16 = einsum(equation = aw_345_equation_0, values = (var_2350_cast_fp16_12, var_2328_cast_fp16_12))[name = tensor("aw_345_cast_fp16")]; tensor aw_347_equation_0 = const()[name = tensor("aw_347_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_347_cast_fp16 = einsum(equation = aw_347_equation_0, values = (var_2350_cast_fp16_13, var_2328_cast_fp16_13))[name = tensor("aw_347_cast_fp16")]; tensor aw_349_equation_0 = const()[name = tensor("aw_349_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_349_cast_fp16 = einsum(equation = aw_349_equation_0, values = (var_2350_cast_fp16_14, var_2328_cast_fp16_14))[name = tensor("aw_349_cast_fp16")]; tensor aw_351_equation_0 = const()[name = tensor("aw_351_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_351_cast_fp16 = einsum(equation = aw_351_equation_0, values = (var_2350_cast_fp16_15, var_2328_cast_fp16_15))[name = tensor("aw_351_cast_fp16")]; tensor aw_353_equation_0 = const()[name = tensor("aw_353_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_353_cast_fp16 = einsum(equation = aw_353_equation_0, values = (var_2350_cast_fp16_16, var_2328_cast_fp16_16))[name = tensor("aw_353_cast_fp16")]; tensor aw_355_equation_0 = const()[name = tensor("aw_355_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_355_cast_fp16 = einsum(equation = aw_355_equation_0, values = (var_2350_cast_fp16_17, var_2328_cast_fp16_17))[name = tensor("aw_355_cast_fp16")]; tensor aw_357_equation_0 = const()[name = tensor("aw_357_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_357_cast_fp16 = einsum(equation = aw_357_equation_0, values = (var_2350_cast_fp16_18, var_2328_cast_fp16_18))[name = tensor("aw_357_cast_fp16")]; tensor aw_359_equation_0 = const()[name = tensor("aw_359_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_359_cast_fp16 = einsum(equation = aw_359_equation_0, values = (var_2350_cast_fp16_19, var_2328_cast_fp16_19))[name = tensor("aw_359_cast_fp16")]; tensor var_2432_cast_fp16 = softmax(axis = var_2276, x = aw_321_cast_fp16)[name = tensor("op_2432_cast_fp16")]; tensor var_2433_cast_fp16 = softmax(axis = var_2276, x = aw_323_cast_fp16)[name = tensor("op_2433_cast_fp16")]; tensor var_2434_cast_fp16 = softmax(axis = var_2276, x = aw_325_cast_fp16)[name = tensor("op_2434_cast_fp16")]; tensor var_2435_cast_fp16 = softmax(axis = var_2276, x = aw_327_cast_fp16)[name = tensor("op_2435_cast_fp16")]; tensor var_2436_cast_fp16 = softmax(axis = var_2276, x = aw_329_cast_fp16)[name = tensor("op_2436_cast_fp16")]; tensor var_2437_cast_fp16 = softmax(axis = var_2276, x = aw_331_cast_fp16)[name = tensor("op_2437_cast_fp16")]; tensor var_2438_cast_fp16 = softmax(axis = var_2276, x = aw_333_cast_fp16)[name = tensor("op_2438_cast_fp16")]; tensor var_2439_cast_fp16 = softmax(axis = var_2276, x = aw_335_cast_fp16)[name = tensor("op_2439_cast_fp16")]; tensor var_2440_cast_fp16 = softmax(axis = var_2276, x = aw_337_cast_fp16)[name = tensor("op_2440_cast_fp16")]; tensor var_2441_cast_fp16 = softmax(axis = var_2276, x = aw_339_cast_fp16)[name = tensor("op_2441_cast_fp16")]; tensor var_2442_cast_fp16 = softmax(axis = var_2276, x = aw_341_cast_fp16)[name = tensor("op_2442_cast_fp16")]; tensor var_2443_cast_fp16 = softmax(axis = var_2276, x = aw_343_cast_fp16)[name = tensor("op_2443_cast_fp16")]; tensor var_2444_cast_fp16 = softmax(axis = var_2276, x = aw_345_cast_fp16)[name = tensor("op_2444_cast_fp16")]; tensor var_2445_cast_fp16 = softmax(axis = var_2276, x = aw_347_cast_fp16)[name = tensor("op_2445_cast_fp16")]; tensor var_2446_cast_fp16 = softmax(axis = var_2276, x = aw_349_cast_fp16)[name = tensor("op_2446_cast_fp16")]; tensor var_2447_cast_fp16 = softmax(axis = var_2276, x = aw_351_cast_fp16)[name = tensor("op_2447_cast_fp16")]; tensor var_2448_cast_fp16 = softmax(axis = var_2276, x = aw_353_cast_fp16)[name = tensor("op_2448_cast_fp16")]; tensor var_2449_cast_fp16 = softmax(axis = var_2276, x = aw_355_cast_fp16)[name = tensor("op_2449_cast_fp16")]; tensor var_2450_cast_fp16 = softmax(axis = var_2276, x = aw_357_cast_fp16)[name = tensor("op_2450_cast_fp16")]; tensor var_2451_cast_fp16 = softmax(axis = var_2276, x = aw_359_cast_fp16)[name = tensor("op_2451_cast_fp16")]; tensor var_2453_equation_0 = const()[name = tensor("op_2453_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2453_cast_fp16 = einsum(equation = var_2453_equation_0, values = (var_2371_cast_fp16_0, var_2432_cast_fp16))[name = tensor("op_2453_cast_fp16")]; tensor var_2455_equation_0 = const()[name = tensor("op_2455_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2455_cast_fp16 = einsum(equation = var_2455_equation_0, values = (var_2371_cast_fp16_1, var_2433_cast_fp16))[name = tensor("op_2455_cast_fp16")]; tensor var_2457_equation_0 = const()[name = tensor("op_2457_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2457_cast_fp16 = einsum(equation = var_2457_equation_0, values = (var_2371_cast_fp16_2, var_2434_cast_fp16))[name = tensor("op_2457_cast_fp16")]; tensor var_2459_equation_0 = const()[name = tensor("op_2459_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2459_cast_fp16 = einsum(equation = var_2459_equation_0, values = (var_2371_cast_fp16_3, var_2435_cast_fp16))[name = tensor("op_2459_cast_fp16")]; tensor var_2461_equation_0 = const()[name = tensor("op_2461_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2461_cast_fp16 = einsum(equation = var_2461_equation_0, values = (var_2371_cast_fp16_4, var_2436_cast_fp16))[name = tensor("op_2461_cast_fp16")]; tensor var_2463_equation_0 = const()[name = tensor("op_2463_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2463_cast_fp16 = einsum(equation = var_2463_equation_0, values = (var_2371_cast_fp16_5, var_2437_cast_fp16))[name = tensor("op_2463_cast_fp16")]; tensor var_2465_equation_0 = const()[name = tensor("op_2465_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2465_cast_fp16 = einsum(equation = var_2465_equation_0, values = (var_2371_cast_fp16_6, var_2438_cast_fp16))[name = tensor("op_2465_cast_fp16")]; tensor var_2467_equation_0 = const()[name = tensor("op_2467_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2467_cast_fp16 = einsum(equation = var_2467_equation_0, values = (var_2371_cast_fp16_7, var_2439_cast_fp16))[name = tensor("op_2467_cast_fp16")]; tensor var_2469_equation_0 = const()[name = tensor("op_2469_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2469_cast_fp16 = einsum(equation = var_2469_equation_0, values = (var_2371_cast_fp16_8, var_2440_cast_fp16))[name = tensor("op_2469_cast_fp16")]; tensor var_2471_equation_0 = const()[name = tensor("op_2471_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2471_cast_fp16 = einsum(equation = var_2471_equation_0, values = (var_2371_cast_fp16_9, var_2441_cast_fp16))[name = tensor("op_2471_cast_fp16")]; tensor var_2473_equation_0 = const()[name = tensor("op_2473_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2473_cast_fp16 = einsum(equation = var_2473_equation_0, values = (var_2371_cast_fp16_10, var_2442_cast_fp16))[name = tensor("op_2473_cast_fp16")]; tensor var_2475_equation_0 = const()[name = tensor("op_2475_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2475_cast_fp16 = einsum(equation = var_2475_equation_0, values = (var_2371_cast_fp16_11, var_2443_cast_fp16))[name = tensor("op_2475_cast_fp16")]; tensor var_2477_equation_0 = const()[name = tensor("op_2477_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2477_cast_fp16 = einsum(equation = var_2477_equation_0, values = (var_2371_cast_fp16_12, var_2444_cast_fp16))[name = tensor("op_2477_cast_fp16")]; tensor var_2479_equation_0 = const()[name = tensor("op_2479_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2479_cast_fp16 = einsum(equation = var_2479_equation_0, values = (var_2371_cast_fp16_13, var_2445_cast_fp16))[name = tensor("op_2479_cast_fp16")]; tensor var_2481_equation_0 = const()[name = tensor("op_2481_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2481_cast_fp16 = einsum(equation = var_2481_equation_0, values = (var_2371_cast_fp16_14, var_2446_cast_fp16))[name = tensor("op_2481_cast_fp16")]; tensor var_2483_equation_0 = const()[name = tensor("op_2483_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2483_cast_fp16 = einsum(equation = var_2483_equation_0, values = (var_2371_cast_fp16_15, var_2447_cast_fp16))[name = tensor("op_2483_cast_fp16")]; tensor var_2485_equation_0 = const()[name = tensor("op_2485_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2485_cast_fp16 = einsum(equation = var_2485_equation_0, values = (var_2371_cast_fp16_16, var_2448_cast_fp16))[name = tensor("op_2485_cast_fp16")]; tensor var_2487_equation_0 = const()[name = tensor("op_2487_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2487_cast_fp16 = einsum(equation = var_2487_equation_0, values = (var_2371_cast_fp16_17, var_2449_cast_fp16))[name = tensor("op_2487_cast_fp16")]; tensor var_2489_equation_0 = const()[name = tensor("op_2489_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2489_cast_fp16 = einsum(equation = var_2489_equation_0, values = (var_2371_cast_fp16_18, var_2450_cast_fp16))[name = tensor("op_2489_cast_fp16")]; tensor var_2491_equation_0 = const()[name = tensor("op_2491_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2491_cast_fp16 = einsum(equation = var_2491_equation_0, values = (var_2371_cast_fp16_19, var_2451_cast_fp16))[name = tensor("op_2491_cast_fp16")]; tensor input_85_interleave_0 = const()[name = tensor("input_85_interleave_0"), val = tensor(false)]; tensor input_85_cast_fp16 = concat(axis = var_2276, interleave = input_85_interleave_0, values = (var_2453_cast_fp16, var_2455_cast_fp16, var_2457_cast_fp16, var_2459_cast_fp16, var_2461_cast_fp16, var_2463_cast_fp16, var_2465_cast_fp16, var_2467_cast_fp16, var_2469_cast_fp16, var_2471_cast_fp16, var_2473_cast_fp16, var_2475_cast_fp16, var_2477_cast_fp16, var_2479_cast_fp16, var_2481_cast_fp16, var_2483_cast_fp16, var_2485_cast_fp16, var_2487_cast_fp16, var_2489_cast_fp16, var_2491_cast_fp16))[name = tensor("input_85_cast_fp16")]; tensor var_2500_pad_type_0 = const()[name = tensor("op_2500_pad_type_0"), val = tensor("valid")]; tensor var_2500_strides_0 = const()[name = tensor("op_2500_strides_0"), val = tensor([1, 1])]; tensor var_2500_pad_0 = const()[name = tensor("op_2500_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2500_dilations_0 = const()[name = tensor("op_2500_dilations_0"), val = tensor([1, 1])]; tensor var_2500_groups_0 = const()[name = tensor("op_2500_groups_0"), val = tensor(1)]; tensor blocks_8_attn_out_weight_to_fp16 = const()[name = tensor("blocks_8_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339326272)))]; tensor blocks_8_attn_out_bias_to_fp16 = const()[name = tensor("blocks_8_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342603136)))]; tensor var_2500_cast_fp16 = conv(bias = blocks_8_attn_out_bias_to_fp16, dilations = var_2500_dilations_0, groups = var_2500_groups_0, pad = var_2500_pad_0, pad_type = var_2500_pad_type_0, strides = var_2500_strides_0, weight = blocks_8_attn_out_weight_to_fp16, x = input_85_cast_fp16)[name = tensor("op_2500_cast_fp16")]; tensor inputs_35_cast_fp16 = add(x = inputs_33_cast_fp16, y = var_2500_cast_fp16)[name = tensor("inputs_35_cast_fp16")]; tensor input_87_axes_0 = const()[name = tensor("input_87_axes_0"), val = tensor([1])]; tensor input_87_gamma_0_to_fp16 = const()[name = tensor("input_87_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342605760)))]; tensor input_87_beta_0_to_fp16 = const()[name = tensor("input_87_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342608384)))]; tensor var_2510_to_fp16 = const()[name = tensor("op_2510_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_87_cast_fp16 = layer_norm(axes = input_87_axes_0, beta = input_87_beta_0_to_fp16, epsilon = var_2510_to_fp16, gamma = input_87_gamma_0_to_fp16, x = inputs_35_cast_fp16)[name = tensor("input_87_cast_fp16")]; tensor input_89_pad_type_0 = const()[name = tensor("input_89_pad_type_0"), val = tensor("valid")]; tensor input_89_strides_0 = const()[name = tensor("input_89_strides_0"), val = tensor([1, 1])]; tensor input_89_pad_0 = const()[name = tensor("input_89_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_89_dilations_0 = const()[name = tensor("input_89_dilations_0"), val = tensor([1, 1])]; tensor input_89_groups_0 = const()[name = tensor("input_89_groups_0"), val = tensor(1)]; tensor blocks_8_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_8_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342611008)))]; tensor blocks_8_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_8_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355718272)))]; tensor input_89_cast_fp16 = conv(bias = blocks_8_mlp_0_bias_to_fp16, dilations = input_89_dilations_0, groups = input_89_groups_0, pad = input_89_pad_0, pad_type = input_89_pad_type_0, strides = input_89_strides_0, weight = blocks_8_mlp_0_weight_to_fp16, x = input_87_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor input_91_mode_0 = const()[name = tensor("input_91_mode_0"), val = tensor("EXACT")]; tensor input_91_cast_fp16 = gelu(mode = input_91_mode_0, x = input_89_cast_fp16)[name = tensor("input_91_cast_fp16")]; tensor var_2536_pad_type_0 = const()[name = tensor("op_2536_pad_type_0"), val = tensor("valid")]; tensor var_2536_strides_0 = const()[name = tensor("op_2536_strides_0"), val = tensor([1, 1])]; tensor var_2536_pad_0 = const()[name = tensor("op_2536_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2536_dilations_0 = const()[name = tensor("op_2536_dilations_0"), val = tensor([1, 1])]; tensor var_2536_groups_0 = const()[name = tensor("op_2536_groups_0"), val = tensor(1)]; tensor blocks_8_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_8_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355728576)))]; tensor blocks_8_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_8_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368835840)))]; tensor var_2536_cast_fp16 = conv(bias = blocks_8_mlp_2_bias_to_fp16, dilations = var_2536_dilations_0, groups = var_2536_groups_0, pad = var_2536_pad_0, pad_type = var_2536_pad_type_0, strides = var_2536_strides_0, weight = blocks_8_mlp_2_weight_to_fp16, x = input_91_cast_fp16)[name = tensor("op_2536_cast_fp16")]; tensor inputs_37_cast_fp16 = add(x = inputs_35_cast_fp16, y = var_2536_cast_fp16)[name = tensor("inputs_37_cast_fp16")]; tensor var_2545 = const()[name = tensor("op_2545"), val = tensor(1)]; tensor input_93_axes_0 = const()[name = tensor("input_93_axes_0"), val = tensor([1])]; tensor input_93_gamma_0_to_fp16 = const()[name = tensor("input_93_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368838464)))]; tensor input_93_beta_0_to_fp16 = const()[name = tensor("input_93_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368841088)))]; tensor var_2561_to_fp16 = const()[name = tensor("op_2561_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_93_cast_fp16 = layer_norm(axes = input_93_axes_0, beta = input_93_beta_0_to_fp16, epsilon = var_2561_to_fp16, gamma = input_93_gamma_0_to_fp16, x = inputs_37_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor q_19_pad_type_0 = const()[name = tensor("q_19_pad_type_0"), val = tensor("valid")]; tensor q_19_strides_0 = const()[name = tensor("q_19_strides_0"), val = tensor([1, 1])]; tensor q_19_pad_0 = const()[name = tensor("q_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_19_dilations_0 = const()[name = tensor("q_19_dilations_0"), val = tensor([1, 1])]; tensor q_19_groups_0 = const()[name = tensor("q_19_groups_0"), val = tensor(1)]; tensor var_2596_weight_0_to_fp16 = const()[name = tensor("op_2596_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368843712)))]; tensor var_2596_bias_0_to_fp16 = const()[name = tensor("op_2596_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372120576)))]; tensor var_2596_cast_fp16 = conv(bias = var_2596_bias_0_to_fp16, dilations = q_19_dilations_0, groups = q_19_groups_0, pad = q_19_pad_0, pad_type = q_19_pad_type_0, strides = q_19_strides_0, weight = var_2596_weight_0_to_fp16, x = input_93_cast_fp16)[name = tensor("op_2596_cast_fp16")]; tensor k_19_pad_type_0 = const()[name = tensor("k_19_pad_type_0"), val = tensor("valid")]; tensor k_19_strides_0 = const()[name = tensor("k_19_strides_0"), val = tensor([1, 1])]; tensor k_19_pad_0 = const()[name = tensor("k_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_19_dilations_0 = const()[name = tensor("k_19_dilations_0"), val = tensor([1, 1])]; tensor k_19_groups_0 = const()[name = tensor("k_19_groups_0"), val = tensor(1)]; tensor blocks_9_attn_key_weight_to_fp16 = const()[name = tensor("blocks_9_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(372123200)))]; tensor k_19_cast_fp16 = conv(dilations = k_19_dilations_0, groups = k_19_groups_0, pad = k_19_pad_0, pad_type = k_19_pad_type_0, strides = k_19_strides_0, weight = blocks_9_attn_key_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("k_19_cast_fp16")]; tensor var_2594_pad_type_0 = const()[name = tensor("op_2594_pad_type_0"), val = tensor("valid")]; tensor var_2594_strides_0 = const()[name = tensor("op_2594_strides_0"), val = tensor([1, 1])]; tensor var_2594_pad_0 = const()[name = tensor("op_2594_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2594_dilations_0 = const()[name = tensor("op_2594_dilations_0"), val = tensor([1, 1])]; tensor var_2594_groups_0 = const()[name = tensor("op_2594_groups_0"), val = tensor(1)]; tensor blocks_9_attn_value_weight_to_fp16 = const()[name = tensor("blocks_9_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(375400064)))]; tensor blocks_9_attn_value_bias_to_fp16 = const()[name = tensor("blocks_9_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378676928)))]; tensor var_2594_cast_fp16 = conv(bias = blocks_9_attn_value_bias_to_fp16, dilations = var_2594_dilations_0, groups = var_2594_groups_0, pad = var_2594_pad_0, pad_type = var_2594_pad_type_0, strides = var_2594_strides_0, weight = blocks_9_attn_value_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("op_2594_cast_fp16")]; tensor tile_27 = const()[name = tensor("tile_27"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2597_axis_0 = const()[name = tensor("op_2597_axis_0"), val = tensor(1)]; tensor var_2597_cast_fp16_0, tensor var_2597_cast_fp16_1, tensor var_2597_cast_fp16_2, tensor var_2597_cast_fp16_3, tensor var_2597_cast_fp16_4, tensor var_2597_cast_fp16_5, tensor var_2597_cast_fp16_6, tensor var_2597_cast_fp16_7, tensor var_2597_cast_fp16_8, tensor var_2597_cast_fp16_9, tensor var_2597_cast_fp16_10, tensor var_2597_cast_fp16_11, tensor var_2597_cast_fp16_12, tensor var_2597_cast_fp16_13, tensor var_2597_cast_fp16_14, tensor var_2597_cast_fp16_15, tensor var_2597_cast_fp16_16, tensor var_2597_cast_fp16_17, tensor var_2597_cast_fp16_18, tensor var_2597_cast_fp16_19 = split(axis = var_2597_axis_0, split_sizes = tile_27, x = var_2596_cast_fp16)[name = tensor("op_2597_cast_fp16")]; tensor var_2618_perm_0 = const()[name = tensor("op_2618_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_28 = const()[name = tensor("tile_28"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2619_axis_0 = const()[name = tensor("op_2619_axis_0"), val = tensor(3)]; tensor var_2618_cast_fp16 = transpose(perm = var_2618_perm_0, x = k_19_cast_fp16)[name = tensor("transpose_23")]; tensor var_2619_cast_fp16_0, tensor var_2619_cast_fp16_1, tensor var_2619_cast_fp16_2, tensor var_2619_cast_fp16_3, tensor var_2619_cast_fp16_4, tensor var_2619_cast_fp16_5, tensor var_2619_cast_fp16_6, tensor var_2619_cast_fp16_7, tensor var_2619_cast_fp16_8, tensor var_2619_cast_fp16_9, tensor var_2619_cast_fp16_10, tensor var_2619_cast_fp16_11, tensor var_2619_cast_fp16_12, tensor var_2619_cast_fp16_13, tensor var_2619_cast_fp16_14, tensor var_2619_cast_fp16_15, tensor var_2619_cast_fp16_16, tensor var_2619_cast_fp16_17, tensor var_2619_cast_fp16_18, tensor var_2619_cast_fp16_19 = split(axis = var_2619_axis_0, split_sizes = tile_28, x = var_2618_cast_fp16)[name = tensor("op_2619_cast_fp16")]; tensor tile_29 = const()[name = tensor("tile_29"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2640_axis_0 = const()[name = tensor("op_2640_axis_0"), val = tensor(1)]; tensor var_2640_cast_fp16_0, tensor var_2640_cast_fp16_1, tensor var_2640_cast_fp16_2, tensor var_2640_cast_fp16_3, tensor var_2640_cast_fp16_4, tensor var_2640_cast_fp16_5, tensor var_2640_cast_fp16_6, tensor var_2640_cast_fp16_7, tensor var_2640_cast_fp16_8, tensor var_2640_cast_fp16_9, tensor var_2640_cast_fp16_10, tensor var_2640_cast_fp16_11, tensor var_2640_cast_fp16_12, tensor var_2640_cast_fp16_13, tensor var_2640_cast_fp16_14, tensor var_2640_cast_fp16_15, tensor var_2640_cast_fp16_16, tensor var_2640_cast_fp16_17, tensor var_2640_cast_fp16_18, tensor var_2640_cast_fp16_19 = split(axis = var_2640_axis_0, split_sizes = tile_29, x = var_2594_cast_fp16)[name = tensor("op_2640_cast_fp16")]; tensor aw_361_equation_0 = const()[name = tensor("aw_361_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_361_cast_fp16 = einsum(equation = aw_361_equation_0, values = (var_2619_cast_fp16_0, var_2597_cast_fp16_0))[name = tensor("aw_361_cast_fp16")]; tensor aw_363_equation_0 = const()[name = tensor("aw_363_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_363_cast_fp16 = einsum(equation = aw_363_equation_0, values = (var_2619_cast_fp16_1, var_2597_cast_fp16_1))[name = tensor("aw_363_cast_fp16")]; tensor aw_365_equation_0 = const()[name = tensor("aw_365_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_365_cast_fp16 = einsum(equation = aw_365_equation_0, values = (var_2619_cast_fp16_2, var_2597_cast_fp16_2))[name = tensor("aw_365_cast_fp16")]; tensor aw_367_equation_0 = const()[name = tensor("aw_367_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_367_cast_fp16 = einsum(equation = aw_367_equation_0, values = (var_2619_cast_fp16_3, var_2597_cast_fp16_3))[name = tensor("aw_367_cast_fp16")]; tensor aw_369_equation_0 = const()[name = tensor("aw_369_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_369_cast_fp16 = einsum(equation = aw_369_equation_0, values = (var_2619_cast_fp16_4, var_2597_cast_fp16_4))[name = tensor("aw_369_cast_fp16")]; tensor aw_371_equation_0 = const()[name = tensor("aw_371_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_371_cast_fp16 = einsum(equation = aw_371_equation_0, values = (var_2619_cast_fp16_5, var_2597_cast_fp16_5))[name = tensor("aw_371_cast_fp16")]; tensor aw_373_equation_0 = const()[name = tensor("aw_373_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_373_cast_fp16 = einsum(equation = aw_373_equation_0, values = (var_2619_cast_fp16_6, var_2597_cast_fp16_6))[name = tensor("aw_373_cast_fp16")]; tensor aw_375_equation_0 = const()[name = tensor("aw_375_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_375_cast_fp16 = einsum(equation = aw_375_equation_0, values = (var_2619_cast_fp16_7, var_2597_cast_fp16_7))[name = tensor("aw_375_cast_fp16")]; tensor aw_377_equation_0 = const()[name = tensor("aw_377_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_377_cast_fp16 = einsum(equation = aw_377_equation_0, values = (var_2619_cast_fp16_8, var_2597_cast_fp16_8))[name = tensor("aw_377_cast_fp16")]; tensor aw_379_equation_0 = const()[name = tensor("aw_379_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_379_cast_fp16 = einsum(equation = aw_379_equation_0, values = (var_2619_cast_fp16_9, var_2597_cast_fp16_9))[name = tensor("aw_379_cast_fp16")]; tensor aw_381_equation_0 = const()[name = tensor("aw_381_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_381_cast_fp16 = einsum(equation = aw_381_equation_0, values = (var_2619_cast_fp16_10, var_2597_cast_fp16_10))[name = tensor("aw_381_cast_fp16")]; tensor aw_383_equation_0 = const()[name = tensor("aw_383_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_383_cast_fp16 = einsum(equation = aw_383_equation_0, values = (var_2619_cast_fp16_11, var_2597_cast_fp16_11))[name = tensor("aw_383_cast_fp16")]; tensor aw_385_equation_0 = const()[name = tensor("aw_385_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_385_cast_fp16 = einsum(equation = aw_385_equation_0, values = (var_2619_cast_fp16_12, var_2597_cast_fp16_12))[name = tensor("aw_385_cast_fp16")]; tensor aw_387_equation_0 = const()[name = tensor("aw_387_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_387_cast_fp16 = einsum(equation = aw_387_equation_0, values = (var_2619_cast_fp16_13, var_2597_cast_fp16_13))[name = tensor("aw_387_cast_fp16")]; tensor aw_389_equation_0 = const()[name = tensor("aw_389_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_389_cast_fp16 = einsum(equation = aw_389_equation_0, values = (var_2619_cast_fp16_14, var_2597_cast_fp16_14))[name = tensor("aw_389_cast_fp16")]; tensor aw_391_equation_0 = const()[name = tensor("aw_391_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_391_cast_fp16 = einsum(equation = aw_391_equation_0, values = (var_2619_cast_fp16_15, var_2597_cast_fp16_15))[name = tensor("aw_391_cast_fp16")]; tensor aw_393_equation_0 = const()[name = tensor("aw_393_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_393_cast_fp16 = einsum(equation = aw_393_equation_0, values = (var_2619_cast_fp16_16, var_2597_cast_fp16_16))[name = tensor("aw_393_cast_fp16")]; tensor aw_395_equation_0 = const()[name = tensor("aw_395_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_395_cast_fp16 = einsum(equation = aw_395_equation_0, values = (var_2619_cast_fp16_17, var_2597_cast_fp16_17))[name = tensor("aw_395_cast_fp16")]; tensor aw_397_equation_0 = const()[name = tensor("aw_397_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_397_cast_fp16 = einsum(equation = aw_397_equation_0, values = (var_2619_cast_fp16_18, var_2597_cast_fp16_18))[name = tensor("aw_397_cast_fp16")]; tensor aw_399_equation_0 = const()[name = tensor("aw_399_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_399_cast_fp16 = einsum(equation = aw_399_equation_0, values = (var_2619_cast_fp16_19, var_2597_cast_fp16_19))[name = tensor("aw_399_cast_fp16")]; tensor var_2701_cast_fp16 = softmax(axis = var_2545, x = aw_361_cast_fp16)[name = tensor("op_2701_cast_fp16")]; tensor var_2702_cast_fp16 = softmax(axis = var_2545, x = aw_363_cast_fp16)[name = tensor("op_2702_cast_fp16")]; tensor var_2703_cast_fp16 = softmax(axis = var_2545, x = aw_365_cast_fp16)[name = tensor("op_2703_cast_fp16")]; tensor var_2704_cast_fp16 = softmax(axis = var_2545, x = aw_367_cast_fp16)[name = tensor("op_2704_cast_fp16")]; tensor var_2705_cast_fp16 = softmax(axis = var_2545, x = aw_369_cast_fp16)[name = tensor("op_2705_cast_fp16")]; tensor var_2706_cast_fp16 = softmax(axis = var_2545, x = aw_371_cast_fp16)[name = tensor("op_2706_cast_fp16")]; tensor var_2707_cast_fp16 = softmax(axis = var_2545, x = aw_373_cast_fp16)[name = tensor("op_2707_cast_fp16")]; tensor var_2708_cast_fp16 = softmax(axis = var_2545, x = aw_375_cast_fp16)[name = tensor("op_2708_cast_fp16")]; tensor var_2709_cast_fp16 = softmax(axis = var_2545, x = aw_377_cast_fp16)[name = tensor("op_2709_cast_fp16")]; tensor var_2710_cast_fp16 = softmax(axis = var_2545, x = aw_379_cast_fp16)[name = tensor("op_2710_cast_fp16")]; tensor var_2711_cast_fp16 = softmax(axis = var_2545, x = aw_381_cast_fp16)[name = tensor("op_2711_cast_fp16")]; tensor var_2712_cast_fp16 = softmax(axis = var_2545, x = aw_383_cast_fp16)[name = tensor("op_2712_cast_fp16")]; tensor var_2713_cast_fp16 = softmax(axis = var_2545, x = aw_385_cast_fp16)[name = tensor("op_2713_cast_fp16")]; tensor var_2714_cast_fp16 = softmax(axis = var_2545, x = aw_387_cast_fp16)[name = tensor("op_2714_cast_fp16")]; tensor var_2715_cast_fp16 = softmax(axis = var_2545, x = aw_389_cast_fp16)[name = tensor("op_2715_cast_fp16")]; tensor var_2716_cast_fp16 = softmax(axis = var_2545, x = aw_391_cast_fp16)[name = tensor("op_2716_cast_fp16")]; tensor var_2717_cast_fp16 = softmax(axis = var_2545, x = aw_393_cast_fp16)[name = tensor("op_2717_cast_fp16")]; tensor var_2718_cast_fp16 = softmax(axis = var_2545, x = aw_395_cast_fp16)[name = tensor("op_2718_cast_fp16")]; tensor var_2719_cast_fp16 = softmax(axis = var_2545, x = aw_397_cast_fp16)[name = tensor("op_2719_cast_fp16")]; tensor var_2720_cast_fp16 = softmax(axis = var_2545, x = aw_399_cast_fp16)[name = tensor("op_2720_cast_fp16")]; tensor var_2722_equation_0 = const()[name = tensor("op_2722_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2722_cast_fp16 = einsum(equation = var_2722_equation_0, values = (var_2640_cast_fp16_0, var_2701_cast_fp16))[name = tensor("op_2722_cast_fp16")]; tensor var_2724_equation_0 = const()[name = tensor("op_2724_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2724_cast_fp16 = einsum(equation = var_2724_equation_0, values = (var_2640_cast_fp16_1, var_2702_cast_fp16))[name = tensor("op_2724_cast_fp16")]; tensor var_2726_equation_0 = const()[name = tensor("op_2726_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2726_cast_fp16 = einsum(equation = var_2726_equation_0, values = (var_2640_cast_fp16_2, var_2703_cast_fp16))[name = tensor("op_2726_cast_fp16")]; tensor var_2728_equation_0 = const()[name = tensor("op_2728_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2728_cast_fp16 = einsum(equation = var_2728_equation_0, values = (var_2640_cast_fp16_3, var_2704_cast_fp16))[name = tensor("op_2728_cast_fp16")]; tensor var_2730_equation_0 = const()[name = tensor("op_2730_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2730_cast_fp16 = einsum(equation = var_2730_equation_0, values = (var_2640_cast_fp16_4, var_2705_cast_fp16))[name = tensor("op_2730_cast_fp16")]; tensor var_2732_equation_0 = const()[name = tensor("op_2732_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2732_cast_fp16 = einsum(equation = var_2732_equation_0, values = (var_2640_cast_fp16_5, var_2706_cast_fp16))[name = tensor("op_2732_cast_fp16")]; tensor var_2734_equation_0 = const()[name = tensor("op_2734_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2734_cast_fp16 = einsum(equation = var_2734_equation_0, values = (var_2640_cast_fp16_6, var_2707_cast_fp16))[name = tensor("op_2734_cast_fp16")]; tensor var_2736_equation_0 = const()[name = tensor("op_2736_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2736_cast_fp16 = einsum(equation = var_2736_equation_0, values = (var_2640_cast_fp16_7, var_2708_cast_fp16))[name = tensor("op_2736_cast_fp16")]; tensor var_2738_equation_0 = const()[name = tensor("op_2738_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2738_cast_fp16 = einsum(equation = var_2738_equation_0, values = (var_2640_cast_fp16_8, var_2709_cast_fp16))[name = tensor("op_2738_cast_fp16")]; tensor var_2740_equation_0 = const()[name = tensor("op_2740_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2740_cast_fp16 = einsum(equation = var_2740_equation_0, values = (var_2640_cast_fp16_9, var_2710_cast_fp16))[name = tensor("op_2740_cast_fp16")]; tensor var_2742_equation_0 = const()[name = tensor("op_2742_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2742_cast_fp16 = einsum(equation = var_2742_equation_0, values = (var_2640_cast_fp16_10, var_2711_cast_fp16))[name = tensor("op_2742_cast_fp16")]; tensor var_2744_equation_0 = const()[name = tensor("op_2744_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2744_cast_fp16 = einsum(equation = var_2744_equation_0, values = (var_2640_cast_fp16_11, var_2712_cast_fp16))[name = tensor("op_2744_cast_fp16")]; tensor var_2746_equation_0 = const()[name = tensor("op_2746_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2746_cast_fp16 = einsum(equation = var_2746_equation_0, values = (var_2640_cast_fp16_12, var_2713_cast_fp16))[name = tensor("op_2746_cast_fp16")]; tensor var_2748_equation_0 = const()[name = tensor("op_2748_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2748_cast_fp16 = einsum(equation = var_2748_equation_0, values = (var_2640_cast_fp16_13, var_2714_cast_fp16))[name = tensor("op_2748_cast_fp16")]; tensor var_2750_equation_0 = const()[name = tensor("op_2750_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2750_cast_fp16 = einsum(equation = var_2750_equation_0, values = (var_2640_cast_fp16_14, var_2715_cast_fp16))[name = tensor("op_2750_cast_fp16")]; tensor var_2752_equation_0 = const()[name = tensor("op_2752_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2752_cast_fp16 = einsum(equation = var_2752_equation_0, values = (var_2640_cast_fp16_15, var_2716_cast_fp16))[name = tensor("op_2752_cast_fp16")]; tensor var_2754_equation_0 = const()[name = tensor("op_2754_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2754_cast_fp16 = einsum(equation = var_2754_equation_0, values = (var_2640_cast_fp16_16, var_2717_cast_fp16))[name = tensor("op_2754_cast_fp16")]; tensor var_2756_equation_0 = const()[name = tensor("op_2756_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2756_cast_fp16 = einsum(equation = var_2756_equation_0, values = (var_2640_cast_fp16_17, var_2718_cast_fp16))[name = tensor("op_2756_cast_fp16")]; tensor var_2758_equation_0 = const()[name = tensor("op_2758_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2758_cast_fp16 = einsum(equation = var_2758_equation_0, values = (var_2640_cast_fp16_18, var_2719_cast_fp16))[name = tensor("op_2758_cast_fp16")]; tensor var_2760_equation_0 = const()[name = tensor("op_2760_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2760_cast_fp16 = einsum(equation = var_2760_equation_0, values = (var_2640_cast_fp16_19, var_2720_cast_fp16))[name = tensor("op_2760_cast_fp16")]; tensor input_95_interleave_0 = const()[name = tensor("input_95_interleave_0"), val = tensor(false)]; tensor input_95_cast_fp16 = concat(axis = var_2545, interleave = input_95_interleave_0, values = (var_2722_cast_fp16, var_2724_cast_fp16, var_2726_cast_fp16, var_2728_cast_fp16, var_2730_cast_fp16, var_2732_cast_fp16, var_2734_cast_fp16, var_2736_cast_fp16, var_2738_cast_fp16, var_2740_cast_fp16, var_2742_cast_fp16, var_2744_cast_fp16, var_2746_cast_fp16, var_2748_cast_fp16, var_2750_cast_fp16, var_2752_cast_fp16, var_2754_cast_fp16, var_2756_cast_fp16, var_2758_cast_fp16, var_2760_cast_fp16))[name = tensor("input_95_cast_fp16")]; tensor var_2769_pad_type_0 = const()[name = tensor("op_2769_pad_type_0"), val = tensor("valid")]; tensor var_2769_strides_0 = const()[name = tensor("op_2769_strides_0"), val = tensor([1, 1])]; tensor var_2769_pad_0 = const()[name = tensor("op_2769_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2769_dilations_0 = const()[name = tensor("op_2769_dilations_0"), val = tensor([1, 1])]; tensor var_2769_groups_0 = const()[name = tensor("op_2769_groups_0"), val = tensor(1)]; tensor blocks_9_attn_out_weight_to_fp16 = const()[name = tensor("blocks_9_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(378679552)))]; tensor blocks_9_attn_out_bias_to_fp16 = const()[name = tensor("blocks_9_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381956416)))]; tensor var_2769_cast_fp16 = conv(bias = blocks_9_attn_out_bias_to_fp16, dilations = var_2769_dilations_0, groups = var_2769_groups_0, pad = var_2769_pad_0, pad_type = var_2769_pad_type_0, strides = var_2769_strides_0, weight = blocks_9_attn_out_weight_to_fp16, x = input_95_cast_fp16)[name = tensor("op_2769_cast_fp16")]; tensor inputs_39_cast_fp16 = add(x = inputs_37_cast_fp16, y = var_2769_cast_fp16)[name = tensor("inputs_39_cast_fp16")]; tensor input_97_axes_0 = const()[name = tensor("input_97_axes_0"), val = tensor([1])]; tensor input_97_gamma_0_to_fp16 = const()[name = tensor("input_97_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381959040)))]; tensor input_97_beta_0_to_fp16 = const()[name = tensor("input_97_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381961664)))]; tensor var_2779_to_fp16 = const()[name = tensor("op_2779_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_97_cast_fp16 = layer_norm(axes = input_97_axes_0, beta = input_97_beta_0_to_fp16, epsilon = var_2779_to_fp16, gamma = input_97_gamma_0_to_fp16, x = inputs_39_cast_fp16)[name = tensor("input_97_cast_fp16")]; tensor input_99_pad_type_0 = const()[name = tensor("input_99_pad_type_0"), val = tensor("valid")]; tensor input_99_strides_0 = const()[name = tensor("input_99_strides_0"), val = tensor([1, 1])]; tensor input_99_pad_0 = const()[name = tensor("input_99_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_99_dilations_0 = const()[name = tensor("input_99_dilations_0"), val = tensor([1, 1])]; tensor input_99_groups_0 = const()[name = tensor("input_99_groups_0"), val = tensor(1)]; tensor blocks_9_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_9_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381964288)))]; tensor blocks_9_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_9_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395071552)))]; tensor input_99_cast_fp16 = conv(bias = blocks_9_mlp_0_bias_to_fp16, dilations = input_99_dilations_0, groups = input_99_groups_0, pad = input_99_pad_0, pad_type = input_99_pad_type_0, strides = input_99_strides_0, weight = blocks_9_mlp_0_weight_to_fp16, x = input_97_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor input_101_mode_0 = const()[name = tensor("input_101_mode_0"), val = tensor("EXACT")]; tensor input_101_cast_fp16 = gelu(mode = input_101_mode_0, x = input_99_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor var_2805_pad_type_0 = const()[name = tensor("op_2805_pad_type_0"), val = tensor("valid")]; tensor var_2805_strides_0 = const()[name = tensor("op_2805_strides_0"), val = tensor([1, 1])]; tensor var_2805_pad_0 = const()[name = tensor("op_2805_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2805_dilations_0 = const()[name = tensor("op_2805_dilations_0"), val = tensor([1, 1])]; tensor var_2805_groups_0 = const()[name = tensor("op_2805_groups_0"), val = tensor(1)]; tensor blocks_9_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_9_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(395081856)))]; tensor blocks_9_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_9_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408189120)))]; tensor var_2805_cast_fp16 = conv(bias = blocks_9_mlp_2_bias_to_fp16, dilations = var_2805_dilations_0, groups = var_2805_groups_0, pad = var_2805_pad_0, pad_type = var_2805_pad_type_0, strides = var_2805_strides_0, weight = blocks_9_mlp_2_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("op_2805_cast_fp16")]; tensor inputs_41_cast_fp16 = add(x = inputs_39_cast_fp16, y = var_2805_cast_fp16)[name = tensor("inputs_41_cast_fp16")]; tensor var_2814 = const()[name = tensor("op_2814"), val = tensor(1)]; tensor input_103_axes_0 = const()[name = tensor("input_103_axes_0"), val = tensor([1])]; tensor input_103_gamma_0_to_fp16 = const()[name = tensor("input_103_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408191744)))]; tensor input_103_beta_0_to_fp16 = const()[name = tensor("input_103_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408194368)))]; tensor var_2830_to_fp16 = const()[name = tensor("op_2830_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_103_cast_fp16 = layer_norm(axes = input_103_axes_0, beta = input_103_beta_0_to_fp16, epsilon = var_2830_to_fp16, gamma = input_103_gamma_0_to_fp16, x = inputs_41_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor q_21_pad_type_0 = const()[name = tensor("q_21_pad_type_0"), val = tensor("valid")]; tensor q_21_strides_0 = const()[name = tensor("q_21_strides_0"), val = tensor([1, 1])]; tensor q_21_pad_0 = const()[name = tensor("q_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_21_dilations_0 = const()[name = tensor("q_21_dilations_0"), val = tensor([1, 1])]; tensor q_21_groups_0 = const()[name = tensor("q_21_groups_0"), val = tensor(1)]; tensor var_2865_weight_0_to_fp16 = const()[name = tensor("op_2865_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408196992)))]; tensor var_2865_bias_0_to_fp16 = const()[name = tensor("op_2865_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411473856)))]; tensor var_2865_cast_fp16 = conv(bias = var_2865_bias_0_to_fp16, dilations = q_21_dilations_0, groups = q_21_groups_0, pad = q_21_pad_0, pad_type = q_21_pad_type_0, strides = q_21_strides_0, weight = var_2865_weight_0_to_fp16, x = input_103_cast_fp16)[name = tensor("op_2865_cast_fp16")]; tensor k_21_pad_type_0 = const()[name = tensor("k_21_pad_type_0"), val = tensor("valid")]; tensor k_21_strides_0 = const()[name = tensor("k_21_strides_0"), val = tensor([1, 1])]; tensor k_21_pad_0 = const()[name = tensor("k_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_21_dilations_0 = const()[name = tensor("k_21_dilations_0"), val = tensor([1, 1])]; tensor k_21_groups_0 = const()[name = tensor("k_21_groups_0"), val = tensor(1)]; tensor blocks_10_attn_key_weight_to_fp16 = const()[name = tensor("blocks_10_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(411476480)))]; tensor k_21_cast_fp16 = conv(dilations = k_21_dilations_0, groups = k_21_groups_0, pad = k_21_pad_0, pad_type = k_21_pad_type_0, strides = k_21_strides_0, weight = blocks_10_attn_key_weight_to_fp16, x = input_103_cast_fp16)[name = tensor("k_21_cast_fp16")]; tensor var_2863_pad_type_0 = const()[name = tensor("op_2863_pad_type_0"), val = tensor("valid")]; tensor var_2863_strides_0 = const()[name = tensor("op_2863_strides_0"), val = tensor([1, 1])]; tensor var_2863_pad_0 = const()[name = tensor("op_2863_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_2863_dilations_0 = const()[name = tensor("op_2863_dilations_0"), val = tensor([1, 1])]; tensor var_2863_groups_0 = const()[name = tensor("op_2863_groups_0"), val = tensor(1)]; tensor blocks_10_attn_value_weight_to_fp16 = const()[name = tensor("blocks_10_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(414753344)))]; tensor blocks_10_attn_value_bias_to_fp16 = const()[name = tensor("blocks_10_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418030208)))]; tensor var_2863_cast_fp16 = conv(bias = blocks_10_attn_value_bias_to_fp16, dilations = var_2863_dilations_0, groups = var_2863_groups_0, pad = var_2863_pad_0, pad_type = var_2863_pad_type_0, strides = var_2863_strides_0, weight = blocks_10_attn_value_weight_to_fp16, x = input_103_cast_fp16)[name = tensor("op_2863_cast_fp16")]; tensor tile_30 = const()[name = tensor("tile_30"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2866_axis_0 = const()[name = tensor("op_2866_axis_0"), val = tensor(1)]; tensor var_2866_cast_fp16_0, tensor var_2866_cast_fp16_1, tensor var_2866_cast_fp16_2, tensor var_2866_cast_fp16_3, tensor var_2866_cast_fp16_4, tensor var_2866_cast_fp16_5, tensor var_2866_cast_fp16_6, tensor var_2866_cast_fp16_7, tensor var_2866_cast_fp16_8, tensor var_2866_cast_fp16_9, tensor var_2866_cast_fp16_10, tensor var_2866_cast_fp16_11, tensor var_2866_cast_fp16_12, tensor var_2866_cast_fp16_13, tensor var_2866_cast_fp16_14, tensor var_2866_cast_fp16_15, tensor var_2866_cast_fp16_16, tensor var_2866_cast_fp16_17, tensor var_2866_cast_fp16_18, tensor var_2866_cast_fp16_19 = split(axis = var_2866_axis_0, split_sizes = tile_30, x = var_2865_cast_fp16)[name = tensor("op_2866_cast_fp16")]; tensor var_2887_perm_0 = const()[name = tensor("op_2887_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_31 = const()[name = tensor("tile_31"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2888_axis_0 = const()[name = tensor("op_2888_axis_0"), val = tensor(3)]; tensor var_2887_cast_fp16 = transpose(perm = var_2887_perm_0, x = k_21_cast_fp16)[name = tensor("transpose_22")]; tensor var_2888_cast_fp16_0, tensor var_2888_cast_fp16_1, tensor var_2888_cast_fp16_2, tensor var_2888_cast_fp16_3, tensor var_2888_cast_fp16_4, tensor var_2888_cast_fp16_5, tensor var_2888_cast_fp16_6, tensor var_2888_cast_fp16_7, tensor var_2888_cast_fp16_8, tensor var_2888_cast_fp16_9, tensor var_2888_cast_fp16_10, tensor var_2888_cast_fp16_11, tensor var_2888_cast_fp16_12, tensor var_2888_cast_fp16_13, tensor var_2888_cast_fp16_14, tensor var_2888_cast_fp16_15, tensor var_2888_cast_fp16_16, tensor var_2888_cast_fp16_17, tensor var_2888_cast_fp16_18, tensor var_2888_cast_fp16_19 = split(axis = var_2888_axis_0, split_sizes = tile_31, x = var_2887_cast_fp16)[name = tensor("op_2888_cast_fp16")]; tensor tile_32 = const()[name = tensor("tile_32"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_2909_axis_0 = const()[name = tensor("op_2909_axis_0"), val = tensor(1)]; tensor var_2909_cast_fp16_0, tensor var_2909_cast_fp16_1, tensor var_2909_cast_fp16_2, tensor var_2909_cast_fp16_3, tensor var_2909_cast_fp16_4, tensor var_2909_cast_fp16_5, tensor var_2909_cast_fp16_6, tensor var_2909_cast_fp16_7, tensor var_2909_cast_fp16_8, tensor var_2909_cast_fp16_9, tensor var_2909_cast_fp16_10, tensor var_2909_cast_fp16_11, tensor var_2909_cast_fp16_12, tensor var_2909_cast_fp16_13, tensor var_2909_cast_fp16_14, tensor var_2909_cast_fp16_15, tensor var_2909_cast_fp16_16, tensor var_2909_cast_fp16_17, tensor var_2909_cast_fp16_18, tensor var_2909_cast_fp16_19 = split(axis = var_2909_axis_0, split_sizes = tile_32, x = var_2863_cast_fp16)[name = tensor("op_2909_cast_fp16")]; tensor aw_401_equation_0 = const()[name = tensor("aw_401_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_401_cast_fp16 = einsum(equation = aw_401_equation_0, values = (var_2888_cast_fp16_0, var_2866_cast_fp16_0))[name = tensor("aw_401_cast_fp16")]; tensor aw_403_equation_0 = const()[name = tensor("aw_403_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_403_cast_fp16 = einsum(equation = aw_403_equation_0, values = (var_2888_cast_fp16_1, var_2866_cast_fp16_1))[name = tensor("aw_403_cast_fp16")]; tensor aw_405_equation_0 = const()[name = tensor("aw_405_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_405_cast_fp16 = einsum(equation = aw_405_equation_0, values = (var_2888_cast_fp16_2, var_2866_cast_fp16_2))[name = tensor("aw_405_cast_fp16")]; tensor aw_407_equation_0 = const()[name = tensor("aw_407_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_407_cast_fp16 = einsum(equation = aw_407_equation_0, values = (var_2888_cast_fp16_3, var_2866_cast_fp16_3))[name = tensor("aw_407_cast_fp16")]; tensor aw_409_equation_0 = const()[name = tensor("aw_409_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_409_cast_fp16 = einsum(equation = aw_409_equation_0, values = (var_2888_cast_fp16_4, var_2866_cast_fp16_4))[name = tensor("aw_409_cast_fp16")]; tensor aw_411_equation_0 = const()[name = tensor("aw_411_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_411_cast_fp16 = einsum(equation = aw_411_equation_0, values = (var_2888_cast_fp16_5, var_2866_cast_fp16_5))[name = tensor("aw_411_cast_fp16")]; tensor aw_413_equation_0 = const()[name = tensor("aw_413_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_413_cast_fp16 = einsum(equation = aw_413_equation_0, values = (var_2888_cast_fp16_6, var_2866_cast_fp16_6))[name = tensor("aw_413_cast_fp16")]; tensor aw_415_equation_0 = const()[name = tensor("aw_415_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_415_cast_fp16 = einsum(equation = aw_415_equation_0, values = (var_2888_cast_fp16_7, var_2866_cast_fp16_7))[name = tensor("aw_415_cast_fp16")]; tensor aw_417_equation_0 = const()[name = tensor("aw_417_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_417_cast_fp16 = einsum(equation = aw_417_equation_0, values = (var_2888_cast_fp16_8, var_2866_cast_fp16_8))[name = tensor("aw_417_cast_fp16")]; tensor aw_419_equation_0 = const()[name = tensor("aw_419_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_419_cast_fp16 = einsum(equation = aw_419_equation_0, values = (var_2888_cast_fp16_9, var_2866_cast_fp16_9))[name = tensor("aw_419_cast_fp16")]; tensor aw_421_equation_0 = const()[name = tensor("aw_421_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_421_cast_fp16 = einsum(equation = aw_421_equation_0, values = (var_2888_cast_fp16_10, var_2866_cast_fp16_10))[name = tensor("aw_421_cast_fp16")]; tensor aw_423_equation_0 = const()[name = tensor("aw_423_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_423_cast_fp16 = einsum(equation = aw_423_equation_0, values = (var_2888_cast_fp16_11, var_2866_cast_fp16_11))[name = tensor("aw_423_cast_fp16")]; tensor aw_425_equation_0 = const()[name = tensor("aw_425_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_425_cast_fp16 = einsum(equation = aw_425_equation_0, values = (var_2888_cast_fp16_12, var_2866_cast_fp16_12))[name = tensor("aw_425_cast_fp16")]; tensor aw_427_equation_0 = const()[name = tensor("aw_427_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_427_cast_fp16 = einsum(equation = aw_427_equation_0, values = (var_2888_cast_fp16_13, var_2866_cast_fp16_13))[name = tensor("aw_427_cast_fp16")]; tensor aw_429_equation_0 = const()[name = tensor("aw_429_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_429_cast_fp16 = einsum(equation = aw_429_equation_0, values = (var_2888_cast_fp16_14, var_2866_cast_fp16_14))[name = tensor("aw_429_cast_fp16")]; tensor aw_431_equation_0 = const()[name = tensor("aw_431_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_431_cast_fp16 = einsum(equation = aw_431_equation_0, values = (var_2888_cast_fp16_15, var_2866_cast_fp16_15))[name = tensor("aw_431_cast_fp16")]; tensor aw_433_equation_0 = const()[name = tensor("aw_433_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_433_cast_fp16 = einsum(equation = aw_433_equation_0, values = (var_2888_cast_fp16_16, var_2866_cast_fp16_16))[name = tensor("aw_433_cast_fp16")]; tensor aw_435_equation_0 = const()[name = tensor("aw_435_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_435_cast_fp16 = einsum(equation = aw_435_equation_0, values = (var_2888_cast_fp16_17, var_2866_cast_fp16_17))[name = tensor("aw_435_cast_fp16")]; tensor aw_437_equation_0 = const()[name = tensor("aw_437_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_437_cast_fp16 = einsum(equation = aw_437_equation_0, values = (var_2888_cast_fp16_18, var_2866_cast_fp16_18))[name = tensor("aw_437_cast_fp16")]; tensor aw_439_equation_0 = const()[name = tensor("aw_439_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_439_cast_fp16 = einsum(equation = aw_439_equation_0, values = (var_2888_cast_fp16_19, var_2866_cast_fp16_19))[name = tensor("aw_439_cast_fp16")]; tensor var_2970_cast_fp16 = softmax(axis = var_2814, x = aw_401_cast_fp16)[name = tensor("op_2970_cast_fp16")]; tensor var_2971_cast_fp16 = softmax(axis = var_2814, x = aw_403_cast_fp16)[name = tensor("op_2971_cast_fp16")]; tensor var_2972_cast_fp16 = softmax(axis = var_2814, x = aw_405_cast_fp16)[name = tensor("op_2972_cast_fp16")]; tensor var_2973_cast_fp16 = softmax(axis = var_2814, x = aw_407_cast_fp16)[name = tensor("op_2973_cast_fp16")]; tensor var_2974_cast_fp16 = softmax(axis = var_2814, x = aw_409_cast_fp16)[name = tensor("op_2974_cast_fp16")]; tensor var_2975_cast_fp16 = softmax(axis = var_2814, x = aw_411_cast_fp16)[name = tensor("op_2975_cast_fp16")]; tensor var_2976_cast_fp16 = softmax(axis = var_2814, x = aw_413_cast_fp16)[name = tensor("op_2976_cast_fp16")]; tensor var_2977_cast_fp16 = softmax(axis = var_2814, x = aw_415_cast_fp16)[name = tensor("op_2977_cast_fp16")]; tensor var_2978_cast_fp16 = softmax(axis = var_2814, x = aw_417_cast_fp16)[name = tensor("op_2978_cast_fp16")]; tensor var_2979_cast_fp16 = softmax(axis = var_2814, x = aw_419_cast_fp16)[name = tensor("op_2979_cast_fp16")]; tensor var_2980_cast_fp16 = softmax(axis = var_2814, x = aw_421_cast_fp16)[name = tensor("op_2980_cast_fp16")]; tensor var_2981_cast_fp16 = softmax(axis = var_2814, x = aw_423_cast_fp16)[name = tensor("op_2981_cast_fp16")]; tensor var_2982_cast_fp16 = softmax(axis = var_2814, x = aw_425_cast_fp16)[name = tensor("op_2982_cast_fp16")]; tensor var_2983_cast_fp16 = softmax(axis = var_2814, x = aw_427_cast_fp16)[name = tensor("op_2983_cast_fp16")]; tensor var_2984_cast_fp16 = softmax(axis = var_2814, x = aw_429_cast_fp16)[name = tensor("op_2984_cast_fp16")]; tensor var_2985_cast_fp16 = softmax(axis = var_2814, x = aw_431_cast_fp16)[name = tensor("op_2985_cast_fp16")]; tensor var_2986_cast_fp16 = softmax(axis = var_2814, x = aw_433_cast_fp16)[name = tensor("op_2986_cast_fp16")]; tensor var_2987_cast_fp16 = softmax(axis = var_2814, x = aw_435_cast_fp16)[name = tensor("op_2987_cast_fp16")]; tensor var_2988_cast_fp16 = softmax(axis = var_2814, x = aw_437_cast_fp16)[name = tensor("op_2988_cast_fp16")]; tensor var_2989_cast_fp16 = softmax(axis = var_2814, x = aw_439_cast_fp16)[name = tensor("op_2989_cast_fp16")]; tensor var_2991_equation_0 = const()[name = tensor("op_2991_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2991_cast_fp16 = einsum(equation = var_2991_equation_0, values = (var_2909_cast_fp16_0, var_2970_cast_fp16))[name = tensor("op_2991_cast_fp16")]; tensor var_2993_equation_0 = const()[name = tensor("op_2993_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2993_cast_fp16 = einsum(equation = var_2993_equation_0, values = (var_2909_cast_fp16_1, var_2971_cast_fp16))[name = tensor("op_2993_cast_fp16")]; tensor var_2995_equation_0 = const()[name = tensor("op_2995_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2995_cast_fp16 = einsum(equation = var_2995_equation_0, values = (var_2909_cast_fp16_2, var_2972_cast_fp16))[name = tensor("op_2995_cast_fp16")]; tensor var_2997_equation_0 = const()[name = tensor("op_2997_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2997_cast_fp16 = einsum(equation = var_2997_equation_0, values = (var_2909_cast_fp16_3, var_2973_cast_fp16))[name = tensor("op_2997_cast_fp16")]; tensor var_2999_equation_0 = const()[name = tensor("op_2999_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2999_cast_fp16 = einsum(equation = var_2999_equation_0, values = (var_2909_cast_fp16_4, var_2974_cast_fp16))[name = tensor("op_2999_cast_fp16")]; tensor var_3001_equation_0 = const()[name = tensor("op_3001_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3001_cast_fp16 = einsum(equation = var_3001_equation_0, values = (var_2909_cast_fp16_5, var_2975_cast_fp16))[name = tensor("op_3001_cast_fp16")]; tensor var_3003_equation_0 = const()[name = tensor("op_3003_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3003_cast_fp16 = einsum(equation = var_3003_equation_0, values = (var_2909_cast_fp16_6, var_2976_cast_fp16))[name = tensor("op_3003_cast_fp16")]; tensor var_3005_equation_0 = const()[name = tensor("op_3005_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3005_cast_fp16 = einsum(equation = var_3005_equation_0, values = (var_2909_cast_fp16_7, var_2977_cast_fp16))[name = tensor("op_3005_cast_fp16")]; tensor var_3007_equation_0 = const()[name = tensor("op_3007_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3007_cast_fp16 = einsum(equation = var_3007_equation_0, values = (var_2909_cast_fp16_8, var_2978_cast_fp16))[name = tensor("op_3007_cast_fp16")]; tensor var_3009_equation_0 = const()[name = tensor("op_3009_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3009_cast_fp16 = einsum(equation = var_3009_equation_0, values = (var_2909_cast_fp16_9, var_2979_cast_fp16))[name = tensor("op_3009_cast_fp16")]; tensor var_3011_equation_0 = const()[name = tensor("op_3011_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3011_cast_fp16 = einsum(equation = var_3011_equation_0, values = (var_2909_cast_fp16_10, var_2980_cast_fp16))[name = tensor("op_3011_cast_fp16")]; tensor var_3013_equation_0 = const()[name = tensor("op_3013_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3013_cast_fp16 = einsum(equation = var_3013_equation_0, values = (var_2909_cast_fp16_11, var_2981_cast_fp16))[name = tensor("op_3013_cast_fp16")]; tensor var_3015_equation_0 = const()[name = tensor("op_3015_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3015_cast_fp16 = einsum(equation = var_3015_equation_0, values = (var_2909_cast_fp16_12, var_2982_cast_fp16))[name = tensor("op_3015_cast_fp16")]; tensor var_3017_equation_0 = const()[name = tensor("op_3017_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3017_cast_fp16 = einsum(equation = var_3017_equation_0, values = (var_2909_cast_fp16_13, var_2983_cast_fp16))[name = tensor("op_3017_cast_fp16")]; tensor var_3019_equation_0 = const()[name = tensor("op_3019_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3019_cast_fp16 = einsum(equation = var_3019_equation_0, values = (var_2909_cast_fp16_14, var_2984_cast_fp16))[name = tensor("op_3019_cast_fp16")]; tensor var_3021_equation_0 = const()[name = tensor("op_3021_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3021_cast_fp16 = einsum(equation = var_3021_equation_0, values = (var_2909_cast_fp16_15, var_2985_cast_fp16))[name = tensor("op_3021_cast_fp16")]; tensor var_3023_equation_0 = const()[name = tensor("op_3023_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3023_cast_fp16 = einsum(equation = var_3023_equation_0, values = (var_2909_cast_fp16_16, var_2986_cast_fp16))[name = tensor("op_3023_cast_fp16")]; tensor var_3025_equation_0 = const()[name = tensor("op_3025_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3025_cast_fp16 = einsum(equation = var_3025_equation_0, values = (var_2909_cast_fp16_17, var_2987_cast_fp16))[name = tensor("op_3025_cast_fp16")]; tensor var_3027_equation_0 = const()[name = tensor("op_3027_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3027_cast_fp16 = einsum(equation = var_3027_equation_0, values = (var_2909_cast_fp16_18, var_2988_cast_fp16))[name = tensor("op_3027_cast_fp16")]; tensor var_3029_equation_0 = const()[name = tensor("op_3029_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3029_cast_fp16 = einsum(equation = var_3029_equation_0, values = (var_2909_cast_fp16_19, var_2989_cast_fp16))[name = tensor("op_3029_cast_fp16")]; tensor input_105_interleave_0 = const()[name = tensor("input_105_interleave_0"), val = tensor(false)]; tensor input_105_cast_fp16 = concat(axis = var_2814, interleave = input_105_interleave_0, values = (var_2991_cast_fp16, var_2993_cast_fp16, var_2995_cast_fp16, var_2997_cast_fp16, var_2999_cast_fp16, var_3001_cast_fp16, var_3003_cast_fp16, var_3005_cast_fp16, var_3007_cast_fp16, var_3009_cast_fp16, var_3011_cast_fp16, var_3013_cast_fp16, var_3015_cast_fp16, var_3017_cast_fp16, var_3019_cast_fp16, var_3021_cast_fp16, var_3023_cast_fp16, var_3025_cast_fp16, var_3027_cast_fp16, var_3029_cast_fp16))[name = tensor("input_105_cast_fp16")]; tensor var_3038_pad_type_0 = const()[name = tensor("op_3038_pad_type_0"), val = tensor("valid")]; tensor var_3038_strides_0 = const()[name = tensor("op_3038_strides_0"), val = tensor([1, 1])]; tensor var_3038_pad_0 = const()[name = tensor("op_3038_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3038_dilations_0 = const()[name = tensor("op_3038_dilations_0"), val = tensor([1, 1])]; tensor var_3038_groups_0 = const()[name = tensor("op_3038_groups_0"), val = tensor(1)]; tensor blocks_10_attn_out_weight_to_fp16 = const()[name = tensor("blocks_10_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(418032832)))]; tensor blocks_10_attn_out_bias_to_fp16 = const()[name = tensor("blocks_10_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421309696)))]; tensor var_3038_cast_fp16 = conv(bias = blocks_10_attn_out_bias_to_fp16, dilations = var_3038_dilations_0, groups = var_3038_groups_0, pad = var_3038_pad_0, pad_type = var_3038_pad_type_0, strides = var_3038_strides_0, weight = blocks_10_attn_out_weight_to_fp16, x = input_105_cast_fp16)[name = tensor("op_3038_cast_fp16")]; tensor inputs_43_cast_fp16 = add(x = inputs_41_cast_fp16, y = var_3038_cast_fp16)[name = tensor("inputs_43_cast_fp16")]; tensor input_107_axes_0 = const()[name = tensor("input_107_axes_0"), val = tensor([1])]; tensor input_107_gamma_0_to_fp16 = const()[name = tensor("input_107_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421312320)))]; tensor input_107_beta_0_to_fp16 = const()[name = tensor("input_107_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421314944)))]; tensor var_3048_to_fp16 = const()[name = tensor("op_3048_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_107_cast_fp16 = layer_norm(axes = input_107_axes_0, beta = input_107_beta_0_to_fp16, epsilon = var_3048_to_fp16, gamma = input_107_gamma_0_to_fp16, x = inputs_43_cast_fp16)[name = tensor("input_107_cast_fp16")]; tensor input_109_pad_type_0 = const()[name = tensor("input_109_pad_type_0"), val = tensor("valid")]; tensor input_109_strides_0 = const()[name = tensor("input_109_strides_0"), val = tensor([1, 1])]; tensor input_109_pad_0 = const()[name = tensor("input_109_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_109_dilations_0 = const()[name = tensor("input_109_dilations_0"), val = tensor([1, 1])]; tensor input_109_groups_0 = const()[name = tensor("input_109_groups_0"), val = tensor(1)]; tensor blocks_10_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_10_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421317568)))]; tensor blocks_10_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_10_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(434424832)))]; tensor input_109_cast_fp16 = conv(bias = blocks_10_mlp_0_bias_to_fp16, dilations = input_109_dilations_0, groups = input_109_groups_0, pad = input_109_pad_0, pad_type = input_109_pad_type_0, strides = input_109_strides_0, weight = blocks_10_mlp_0_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("input_109_cast_fp16")]; tensor input_111_mode_0 = const()[name = tensor("input_111_mode_0"), val = tensor("EXACT")]; tensor input_111_cast_fp16 = gelu(mode = input_111_mode_0, x = input_109_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor var_3074_pad_type_0 = const()[name = tensor("op_3074_pad_type_0"), val = tensor("valid")]; tensor var_3074_strides_0 = const()[name = tensor("op_3074_strides_0"), val = tensor([1, 1])]; tensor var_3074_pad_0 = const()[name = tensor("op_3074_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3074_dilations_0 = const()[name = tensor("op_3074_dilations_0"), val = tensor([1, 1])]; tensor var_3074_groups_0 = const()[name = tensor("op_3074_groups_0"), val = tensor(1)]; tensor blocks_10_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_10_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(434435136)))]; tensor blocks_10_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_10_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447542400)))]; tensor var_3074_cast_fp16 = conv(bias = blocks_10_mlp_2_bias_to_fp16, dilations = var_3074_dilations_0, groups = var_3074_groups_0, pad = var_3074_pad_0, pad_type = var_3074_pad_type_0, strides = var_3074_strides_0, weight = blocks_10_mlp_2_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("op_3074_cast_fp16")]; tensor inputs_45_cast_fp16 = add(x = inputs_43_cast_fp16, y = var_3074_cast_fp16)[name = tensor("inputs_45_cast_fp16")]; tensor var_3083 = const()[name = tensor("op_3083"), val = tensor(1)]; tensor input_113_axes_0 = const()[name = tensor("input_113_axes_0"), val = tensor([1])]; tensor input_113_gamma_0_to_fp16 = const()[name = tensor("input_113_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447545024)))]; tensor input_113_beta_0_to_fp16 = const()[name = tensor("input_113_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447547648)))]; tensor var_3099_to_fp16 = const()[name = tensor("op_3099_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_113_cast_fp16 = layer_norm(axes = input_113_axes_0, beta = input_113_beta_0_to_fp16, epsilon = var_3099_to_fp16, gamma = input_113_gamma_0_to_fp16, x = inputs_45_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor q_23_pad_type_0 = const()[name = tensor("q_23_pad_type_0"), val = tensor("valid")]; tensor q_23_strides_0 = const()[name = tensor("q_23_strides_0"), val = tensor([1, 1])]; tensor q_23_pad_0 = const()[name = tensor("q_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_23_dilations_0 = const()[name = tensor("q_23_dilations_0"), val = tensor([1, 1])]; tensor q_23_groups_0 = const()[name = tensor("q_23_groups_0"), val = tensor(1)]; tensor var_3134_weight_0_to_fp16 = const()[name = tensor("op_3134_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447550272)))]; tensor var_3134_bias_0_to_fp16 = const()[name = tensor("op_3134_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(450827136)))]; tensor var_3134_cast_fp16 = conv(bias = var_3134_bias_0_to_fp16, dilations = q_23_dilations_0, groups = q_23_groups_0, pad = q_23_pad_0, pad_type = q_23_pad_type_0, strides = q_23_strides_0, weight = var_3134_weight_0_to_fp16, x = input_113_cast_fp16)[name = tensor("op_3134_cast_fp16")]; tensor k_23_pad_type_0 = const()[name = tensor("k_23_pad_type_0"), val = tensor("valid")]; tensor k_23_strides_0 = const()[name = tensor("k_23_strides_0"), val = tensor([1, 1])]; tensor k_23_pad_0 = const()[name = tensor("k_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_23_dilations_0 = const()[name = tensor("k_23_dilations_0"), val = tensor([1, 1])]; tensor k_23_groups_0 = const()[name = tensor("k_23_groups_0"), val = tensor(1)]; tensor blocks_11_attn_key_weight_to_fp16 = const()[name = tensor("blocks_11_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(450829760)))]; tensor k_23_cast_fp16 = conv(dilations = k_23_dilations_0, groups = k_23_groups_0, pad = k_23_pad_0, pad_type = k_23_pad_type_0, strides = k_23_strides_0, weight = blocks_11_attn_key_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("k_23_cast_fp16")]; tensor var_3132_pad_type_0 = const()[name = tensor("op_3132_pad_type_0"), val = tensor("valid")]; tensor var_3132_strides_0 = const()[name = tensor("op_3132_strides_0"), val = tensor([1, 1])]; tensor var_3132_pad_0 = const()[name = tensor("op_3132_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3132_dilations_0 = const()[name = tensor("op_3132_dilations_0"), val = tensor([1, 1])]; tensor var_3132_groups_0 = const()[name = tensor("op_3132_groups_0"), val = tensor(1)]; tensor blocks_11_attn_value_weight_to_fp16 = const()[name = tensor("blocks_11_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454106624)))]; tensor blocks_11_attn_value_bias_to_fp16 = const()[name = tensor("blocks_11_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(457383488)))]; tensor var_3132_cast_fp16 = conv(bias = blocks_11_attn_value_bias_to_fp16, dilations = var_3132_dilations_0, groups = var_3132_groups_0, pad = var_3132_pad_0, pad_type = var_3132_pad_type_0, strides = var_3132_strides_0, weight = blocks_11_attn_value_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("op_3132_cast_fp16")]; tensor tile_33 = const()[name = tensor("tile_33"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3135_axis_0 = const()[name = tensor("op_3135_axis_0"), val = tensor(1)]; tensor var_3135_cast_fp16_0, tensor var_3135_cast_fp16_1, tensor var_3135_cast_fp16_2, tensor var_3135_cast_fp16_3, tensor var_3135_cast_fp16_4, tensor var_3135_cast_fp16_5, tensor var_3135_cast_fp16_6, tensor var_3135_cast_fp16_7, tensor var_3135_cast_fp16_8, tensor var_3135_cast_fp16_9, tensor var_3135_cast_fp16_10, tensor var_3135_cast_fp16_11, tensor var_3135_cast_fp16_12, tensor var_3135_cast_fp16_13, tensor var_3135_cast_fp16_14, tensor var_3135_cast_fp16_15, tensor var_3135_cast_fp16_16, tensor var_3135_cast_fp16_17, tensor var_3135_cast_fp16_18, tensor var_3135_cast_fp16_19 = split(axis = var_3135_axis_0, split_sizes = tile_33, x = var_3134_cast_fp16)[name = tensor("op_3135_cast_fp16")]; tensor var_3156_perm_0 = const()[name = tensor("op_3156_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_34 = const()[name = tensor("tile_34"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3157_axis_0 = const()[name = tensor("op_3157_axis_0"), val = tensor(3)]; tensor var_3156_cast_fp16 = transpose(perm = var_3156_perm_0, x = k_23_cast_fp16)[name = tensor("transpose_21")]; tensor var_3157_cast_fp16_0, tensor var_3157_cast_fp16_1, tensor var_3157_cast_fp16_2, tensor var_3157_cast_fp16_3, tensor var_3157_cast_fp16_4, tensor var_3157_cast_fp16_5, tensor var_3157_cast_fp16_6, tensor var_3157_cast_fp16_7, tensor var_3157_cast_fp16_8, tensor var_3157_cast_fp16_9, tensor var_3157_cast_fp16_10, tensor var_3157_cast_fp16_11, tensor var_3157_cast_fp16_12, tensor var_3157_cast_fp16_13, tensor var_3157_cast_fp16_14, tensor var_3157_cast_fp16_15, tensor var_3157_cast_fp16_16, tensor var_3157_cast_fp16_17, tensor var_3157_cast_fp16_18, tensor var_3157_cast_fp16_19 = split(axis = var_3157_axis_0, split_sizes = tile_34, x = var_3156_cast_fp16)[name = tensor("op_3157_cast_fp16")]; tensor tile_35 = const()[name = tensor("tile_35"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3178_axis_0 = const()[name = tensor("op_3178_axis_0"), val = tensor(1)]; tensor var_3178_cast_fp16_0, tensor var_3178_cast_fp16_1, tensor var_3178_cast_fp16_2, tensor var_3178_cast_fp16_3, tensor var_3178_cast_fp16_4, tensor var_3178_cast_fp16_5, tensor var_3178_cast_fp16_6, tensor var_3178_cast_fp16_7, tensor var_3178_cast_fp16_8, tensor var_3178_cast_fp16_9, tensor var_3178_cast_fp16_10, tensor var_3178_cast_fp16_11, tensor var_3178_cast_fp16_12, tensor var_3178_cast_fp16_13, tensor var_3178_cast_fp16_14, tensor var_3178_cast_fp16_15, tensor var_3178_cast_fp16_16, tensor var_3178_cast_fp16_17, tensor var_3178_cast_fp16_18, tensor var_3178_cast_fp16_19 = split(axis = var_3178_axis_0, split_sizes = tile_35, x = var_3132_cast_fp16)[name = tensor("op_3178_cast_fp16")]; tensor aw_441_equation_0 = const()[name = tensor("aw_441_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_441_cast_fp16 = einsum(equation = aw_441_equation_0, values = (var_3157_cast_fp16_0, var_3135_cast_fp16_0))[name = tensor("aw_441_cast_fp16")]; tensor aw_443_equation_0 = const()[name = tensor("aw_443_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_443_cast_fp16 = einsum(equation = aw_443_equation_0, values = (var_3157_cast_fp16_1, var_3135_cast_fp16_1))[name = tensor("aw_443_cast_fp16")]; tensor aw_445_equation_0 = const()[name = tensor("aw_445_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_445_cast_fp16 = einsum(equation = aw_445_equation_0, values = (var_3157_cast_fp16_2, var_3135_cast_fp16_2))[name = tensor("aw_445_cast_fp16")]; tensor aw_447_equation_0 = const()[name = tensor("aw_447_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_447_cast_fp16 = einsum(equation = aw_447_equation_0, values = (var_3157_cast_fp16_3, var_3135_cast_fp16_3))[name = tensor("aw_447_cast_fp16")]; tensor aw_449_equation_0 = const()[name = tensor("aw_449_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_449_cast_fp16 = einsum(equation = aw_449_equation_0, values = (var_3157_cast_fp16_4, var_3135_cast_fp16_4))[name = tensor("aw_449_cast_fp16")]; tensor aw_451_equation_0 = const()[name = tensor("aw_451_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_451_cast_fp16 = einsum(equation = aw_451_equation_0, values = (var_3157_cast_fp16_5, var_3135_cast_fp16_5))[name = tensor("aw_451_cast_fp16")]; tensor aw_453_equation_0 = const()[name = tensor("aw_453_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_453_cast_fp16 = einsum(equation = aw_453_equation_0, values = (var_3157_cast_fp16_6, var_3135_cast_fp16_6))[name = tensor("aw_453_cast_fp16")]; tensor aw_455_equation_0 = const()[name = tensor("aw_455_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_455_cast_fp16 = einsum(equation = aw_455_equation_0, values = (var_3157_cast_fp16_7, var_3135_cast_fp16_7))[name = tensor("aw_455_cast_fp16")]; tensor aw_457_equation_0 = const()[name = tensor("aw_457_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_457_cast_fp16 = einsum(equation = aw_457_equation_0, values = (var_3157_cast_fp16_8, var_3135_cast_fp16_8))[name = tensor("aw_457_cast_fp16")]; tensor aw_459_equation_0 = const()[name = tensor("aw_459_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_459_cast_fp16 = einsum(equation = aw_459_equation_0, values = (var_3157_cast_fp16_9, var_3135_cast_fp16_9))[name = tensor("aw_459_cast_fp16")]; tensor aw_461_equation_0 = const()[name = tensor("aw_461_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_461_cast_fp16 = einsum(equation = aw_461_equation_0, values = (var_3157_cast_fp16_10, var_3135_cast_fp16_10))[name = tensor("aw_461_cast_fp16")]; tensor aw_463_equation_0 = const()[name = tensor("aw_463_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_463_cast_fp16 = einsum(equation = aw_463_equation_0, values = (var_3157_cast_fp16_11, var_3135_cast_fp16_11))[name = tensor("aw_463_cast_fp16")]; tensor aw_465_equation_0 = const()[name = tensor("aw_465_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_465_cast_fp16 = einsum(equation = aw_465_equation_0, values = (var_3157_cast_fp16_12, var_3135_cast_fp16_12))[name = tensor("aw_465_cast_fp16")]; tensor aw_467_equation_0 = const()[name = tensor("aw_467_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_467_cast_fp16 = einsum(equation = aw_467_equation_0, values = (var_3157_cast_fp16_13, var_3135_cast_fp16_13))[name = tensor("aw_467_cast_fp16")]; tensor aw_469_equation_0 = const()[name = tensor("aw_469_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_469_cast_fp16 = einsum(equation = aw_469_equation_0, values = (var_3157_cast_fp16_14, var_3135_cast_fp16_14))[name = tensor("aw_469_cast_fp16")]; tensor aw_471_equation_0 = const()[name = tensor("aw_471_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_471_cast_fp16 = einsum(equation = aw_471_equation_0, values = (var_3157_cast_fp16_15, var_3135_cast_fp16_15))[name = tensor("aw_471_cast_fp16")]; tensor aw_473_equation_0 = const()[name = tensor("aw_473_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_473_cast_fp16 = einsum(equation = aw_473_equation_0, values = (var_3157_cast_fp16_16, var_3135_cast_fp16_16))[name = tensor("aw_473_cast_fp16")]; tensor aw_475_equation_0 = const()[name = tensor("aw_475_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_475_cast_fp16 = einsum(equation = aw_475_equation_0, values = (var_3157_cast_fp16_17, var_3135_cast_fp16_17))[name = tensor("aw_475_cast_fp16")]; tensor aw_477_equation_0 = const()[name = tensor("aw_477_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_477_cast_fp16 = einsum(equation = aw_477_equation_0, values = (var_3157_cast_fp16_18, var_3135_cast_fp16_18))[name = tensor("aw_477_cast_fp16")]; tensor aw_479_equation_0 = const()[name = tensor("aw_479_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_479_cast_fp16 = einsum(equation = aw_479_equation_0, values = (var_3157_cast_fp16_19, var_3135_cast_fp16_19))[name = tensor("aw_479_cast_fp16")]; tensor var_3239_cast_fp16 = softmax(axis = var_3083, x = aw_441_cast_fp16)[name = tensor("op_3239_cast_fp16")]; tensor var_3240_cast_fp16 = softmax(axis = var_3083, x = aw_443_cast_fp16)[name = tensor("op_3240_cast_fp16")]; tensor var_3241_cast_fp16 = softmax(axis = var_3083, x = aw_445_cast_fp16)[name = tensor("op_3241_cast_fp16")]; tensor var_3242_cast_fp16 = softmax(axis = var_3083, x = aw_447_cast_fp16)[name = tensor("op_3242_cast_fp16")]; tensor var_3243_cast_fp16 = softmax(axis = var_3083, x = aw_449_cast_fp16)[name = tensor("op_3243_cast_fp16")]; tensor var_3244_cast_fp16 = softmax(axis = var_3083, x = aw_451_cast_fp16)[name = tensor("op_3244_cast_fp16")]; tensor var_3245_cast_fp16 = softmax(axis = var_3083, x = aw_453_cast_fp16)[name = tensor("op_3245_cast_fp16")]; tensor var_3246_cast_fp16 = softmax(axis = var_3083, x = aw_455_cast_fp16)[name = tensor("op_3246_cast_fp16")]; tensor var_3247_cast_fp16 = softmax(axis = var_3083, x = aw_457_cast_fp16)[name = tensor("op_3247_cast_fp16")]; tensor var_3248_cast_fp16 = softmax(axis = var_3083, x = aw_459_cast_fp16)[name = tensor("op_3248_cast_fp16")]; tensor var_3249_cast_fp16 = softmax(axis = var_3083, x = aw_461_cast_fp16)[name = tensor("op_3249_cast_fp16")]; tensor var_3250_cast_fp16 = softmax(axis = var_3083, x = aw_463_cast_fp16)[name = tensor("op_3250_cast_fp16")]; tensor var_3251_cast_fp16 = softmax(axis = var_3083, x = aw_465_cast_fp16)[name = tensor("op_3251_cast_fp16")]; tensor var_3252_cast_fp16 = softmax(axis = var_3083, x = aw_467_cast_fp16)[name = tensor("op_3252_cast_fp16")]; tensor var_3253_cast_fp16 = softmax(axis = var_3083, x = aw_469_cast_fp16)[name = tensor("op_3253_cast_fp16")]; tensor var_3254_cast_fp16 = softmax(axis = var_3083, x = aw_471_cast_fp16)[name = tensor("op_3254_cast_fp16")]; tensor var_3255_cast_fp16 = softmax(axis = var_3083, x = aw_473_cast_fp16)[name = tensor("op_3255_cast_fp16")]; tensor var_3256_cast_fp16 = softmax(axis = var_3083, x = aw_475_cast_fp16)[name = tensor("op_3256_cast_fp16")]; tensor var_3257_cast_fp16 = softmax(axis = var_3083, x = aw_477_cast_fp16)[name = tensor("op_3257_cast_fp16")]; tensor var_3258_cast_fp16 = softmax(axis = var_3083, x = aw_479_cast_fp16)[name = tensor("op_3258_cast_fp16")]; tensor var_3260_equation_0 = const()[name = tensor("op_3260_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3260_cast_fp16 = einsum(equation = var_3260_equation_0, values = (var_3178_cast_fp16_0, var_3239_cast_fp16))[name = tensor("op_3260_cast_fp16")]; tensor var_3262_equation_0 = const()[name = tensor("op_3262_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3262_cast_fp16 = einsum(equation = var_3262_equation_0, values = (var_3178_cast_fp16_1, var_3240_cast_fp16))[name = tensor("op_3262_cast_fp16")]; tensor var_3264_equation_0 = const()[name = tensor("op_3264_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3264_cast_fp16 = einsum(equation = var_3264_equation_0, values = (var_3178_cast_fp16_2, var_3241_cast_fp16))[name = tensor("op_3264_cast_fp16")]; tensor var_3266_equation_0 = const()[name = tensor("op_3266_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3266_cast_fp16 = einsum(equation = var_3266_equation_0, values = (var_3178_cast_fp16_3, var_3242_cast_fp16))[name = tensor("op_3266_cast_fp16")]; tensor var_3268_equation_0 = const()[name = tensor("op_3268_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3268_cast_fp16 = einsum(equation = var_3268_equation_0, values = (var_3178_cast_fp16_4, var_3243_cast_fp16))[name = tensor("op_3268_cast_fp16")]; tensor var_3270_equation_0 = const()[name = tensor("op_3270_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3270_cast_fp16 = einsum(equation = var_3270_equation_0, values = (var_3178_cast_fp16_5, var_3244_cast_fp16))[name = tensor("op_3270_cast_fp16")]; tensor var_3272_equation_0 = const()[name = tensor("op_3272_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3272_cast_fp16 = einsum(equation = var_3272_equation_0, values = (var_3178_cast_fp16_6, var_3245_cast_fp16))[name = tensor("op_3272_cast_fp16")]; tensor var_3274_equation_0 = const()[name = tensor("op_3274_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3274_cast_fp16 = einsum(equation = var_3274_equation_0, values = (var_3178_cast_fp16_7, var_3246_cast_fp16))[name = tensor("op_3274_cast_fp16")]; tensor var_3276_equation_0 = const()[name = tensor("op_3276_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3276_cast_fp16 = einsum(equation = var_3276_equation_0, values = (var_3178_cast_fp16_8, var_3247_cast_fp16))[name = tensor("op_3276_cast_fp16")]; tensor var_3278_equation_0 = const()[name = tensor("op_3278_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3278_cast_fp16 = einsum(equation = var_3278_equation_0, values = (var_3178_cast_fp16_9, var_3248_cast_fp16))[name = tensor("op_3278_cast_fp16")]; tensor var_3280_equation_0 = const()[name = tensor("op_3280_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3280_cast_fp16 = einsum(equation = var_3280_equation_0, values = (var_3178_cast_fp16_10, var_3249_cast_fp16))[name = tensor("op_3280_cast_fp16")]; tensor var_3282_equation_0 = const()[name = tensor("op_3282_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3282_cast_fp16 = einsum(equation = var_3282_equation_0, values = (var_3178_cast_fp16_11, var_3250_cast_fp16))[name = tensor("op_3282_cast_fp16")]; tensor var_3284_equation_0 = const()[name = tensor("op_3284_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3284_cast_fp16 = einsum(equation = var_3284_equation_0, values = (var_3178_cast_fp16_12, var_3251_cast_fp16))[name = tensor("op_3284_cast_fp16")]; tensor var_3286_equation_0 = const()[name = tensor("op_3286_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3286_cast_fp16 = einsum(equation = var_3286_equation_0, values = (var_3178_cast_fp16_13, var_3252_cast_fp16))[name = tensor("op_3286_cast_fp16")]; tensor var_3288_equation_0 = const()[name = tensor("op_3288_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3288_cast_fp16 = einsum(equation = var_3288_equation_0, values = (var_3178_cast_fp16_14, var_3253_cast_fp16))[name = tensor("op_3288_cast_fp16")]; tensor var_3290_equation_0 = const()[name = tensor("op_3290_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3290_cast_fp16 = einsum(equation = var_3290_equation_0, values = (var_3178_cast_fp16_15, var_3254_cast_fp16))[name = tensor("op_3290_cast_fp16")]; tensor var_3292_equation_0 = const()[name = tensor("op_3292_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3292_cast_fp16 = einsum(equation = var_3292_equation_0, values = (var_3178_cast_fp16_16, var_3255_cast_fp16))[name = tensor("op_3292_cast_fp16")]; tensor var_3294_equation_0 = const()[name = tensor("op_3294_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3294_cast_fp16 = einsum(equation = var_3294_equation_0, values = (var_3178_cast_fp16_17, var_3256_cast_fp16))[name = tensor("op_3294_cast_fp16")]; tensor var_3296_equation_0 = const()[name = tensor("op_3296_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3296_cast_fp16 = einsum(equation = var_3296_equation_0, values = (var_3178_cast_fp16_18, var_3257_cast_fp16))[name = tensor("op_3296_cast_fp16")]; tensor var_3298_equation_0 = const()[name = tensor("op_3298_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3298_cast_fp16 = einsum(equation = var_3298_equation_0, values = (var_3178_cast_fp16_19, var_3258_cast_fp16))[name = tensor("op_3298_cast_fp16")]; tensor input_115_interleave_0 = const()[name = tensor("input_115_interleave_0"), val = tensor(false)]; tensor input_115_cast_fp16 = concat(axis = var_3083, interleave = input_115_interleave_0, values = (var_3260_cast_fp16, var_3262_cast_fp16, var_3264_cast_fp16, var_3266_cast_fp16, var_3268_cast_fp16, var_3270_cast_fp16, var_3272_cast_fp16, var_3274_cast_fp16, var_3276_cast_fp16, var_3278_cast_fp16, var_3280_cast_fp16, var_3282_cast_fp16, var_3284_cast_fp16, var_3286_cast_fp16, var_3288_cast_fp16, var_3290_cast_fp16, var_3292_cast_fp16, var_3294_cast_fp16, var_3296_cast_fp16, var_3298_cast_fp16))[name = tensor("input_115_cast_fp16")]; tensor var_3307_pad_type_0 = const()[name = tensor("op_3307_pad_type_0"), val = tensor("valid")]; tensor var_3307_strides_0 = const()[name = tensor("op_3307_strides_0"), val = tensor([1, 1])]; tensor var_3307_pad_0 = const()[name = tensor("op_3307_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3307_dilations_0 = const()[name = tensor("op_3307_dilations_0"), val = tensor([1, 1])]; tensor var_3307_groups_0 = const()[name = tensor("op_3307_groups_0"), val = tensor(1)]; tensor blocks_11_attn_out_weight_to_fp16 = const()[name = tensor("blocks_11_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(457386112)))]; tensor blocks_11_attn_out_bias_to_fp16 = const()[name = tensor("blocks_11_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460662976)))]; tensor var_3307_cast_fp16 = conv(bias = blocks_11_attn_out_bias_to_fp16, dilations = var_3307_dilations_0, groups = var_3307_groups_0, pad = var_3307_pad_0, pad_type = var_3307_pad_type_0, strides = var_3307_strides_0, weight = blocks_11_attn_out_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("op_3307_cast_fp16")]; tensor inputs_47_cast_fp16 = add(x = inputs_45_cast_fp16, y = var_3307_cast_fp16)[name = tensor("inputs_47_cast_fp16")]; tensor input_117_axes_0 = const()[name = tensor("input_117_axes_0"), val = tensor([1])]; tensor input_117_gamma_0_to_fp16 = const()[name = tensor("input_117_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460665600)))]; tensor input_117_beta_0_to_fp16 = const()[name = tensor("input_117_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460668224)))]; tensor var_3317_to_fp16 = const()[name = tensor("op_3317_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_117_cast_fp16 = layer_norm(axes = input_117_axes_0, beta = input_117_beta_0_to_fp16, epsilon = var_3317_to_fp16, gamma = input_117_gamma_0_to_fp16, x = inputs_47_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor input_119_pad_type_0 = const()[name = tensor("input_119_pad_type_0"), val = tensor("valid")]; tensor input_119_strides_0 = const()[name = tensor("input_119_strides_0"), val = tensor([1, 1])]; tensor input_119_pad_0 = const()[name = tensor("input_119_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_119_dilations_0 = const()[name = tensor("input_119_dilations_0"), val = tensor([1, 1])]; tensor input_119_groups_0 = const()[name = tensor("input_119_groups_0"), val = tensor(1)]; tensor blocks_11_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_11_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(460670848)))]; tensor blocks_11_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_11_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(473778112)))]; tensor input_119_cast_fp16 = conv(bias = blocks_11_mlp_0_bias_to_fp16, dilations = input_119_dilations_0, groups = input_119_groups_0, pad = input_119_pad_0, pad_type = input_119_pad_type_0, strides = input_119_strides_0, weight = blocks_11_mlp_0_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("input_119_cast_fp16")]; tensor input_121_mode_0 = const()[name = tensor("input_121_mode_0"), val = tensor("EXACT")]; tensor input_121_cast_fp16 = gelu(mode = input_121_mode_0, x = input_119_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor var_3343_pad_type_0 = const()[name = tensor("op_3343_pad_type_0"), val = tensor("valid")]; tensor var_3343_strides_0 = const()[name = tensor("op_3343_strides_0"), val = tensor([1, 1])]; tensor var_3343_pad_0 = const()[name = tensor("op_3343_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3343_dilations_0 = const()[name = tensor("op_3343_dilations_0"), val = tensor([1, 1])]; tensor var_3343_groups_0 = const()[name = tensor("op_3343_groups_0"), val = tensor(1)]; tensor blocks_11_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_11_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(473788416)))]; tensor blocks_11_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_11_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486895680)))]; tensor var_3343_cast_fp16 = conv(bias = blocks_11_mlp_2_bias_to_fp16, dilations = var_3343_dilations_0, groups = var_3343_groups_0, pad = var_3343_pad_0, pad_type = var_3343_pad_type_0, strides = var_3343_strides_0, weight = blocks_11_mlp_2_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("op_3343_cast_fp16")]; tensor inputs_49_cast_fp16 = add(x = inputs_47_cast_fp16, y = var_3343_cast_fp16)[name = tensor("inputs_49_cast_fp16")]; tensor var_3352 = const()[name = tensor("op_3352"), val = tensor(1)]; tensor input_123_axes_0 = const()[name = tensor("input_123_axes_0"), val = tensor([1])]; tensor input_123_gamma_0_to_fp16 = const()[name = tensor("input_123_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486898304)))]; tensor input_123_beta_0_to_fp16 = const()[name = tensor("input_123_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486900928)))]; tensor var_3368_to_fp16 = const()[name = tensor("op_3368_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_123_cast_fp16 = layer_norm(axes = input_123_axes_0, beta = input_123_beta_0_to_fp16, epsilon = var_3368_to_fp16, gamma = input_123_gamma_0_to_fp16, x = inputs_49_cast_fp16)[name = tensor("input_123_cast_fp16")]; tensor q_25_pad_type_0 = const()[name = tensor("q_25_pad_type_0"), val = tensor("valid")]; tensor q_25_strides_0 = const()[name = tensor("q_25_strides_0"), val = tensor([1, 1])]; tensor q_25_pad_0 = const()[name = tensor("q_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_25_dilations_0 = const()[name = tensor("q_25_dilations_0"), val = tensor([1, 1])]; tensor q_25_groups_0 = const()[name = tensor("q_25_groups_0"), val = tensor(1)]; tensor var_3403_weight_0_to_fp16 = const()[name = tensor("op_3403_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(486903552)))]; tensor var_3403_bias_0_to_fp16 = const()[name = tensor("op_3403_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490180416)))]; tensor var_3403_cast_fp16 = conv(bias = var_3403_bias_0_to_fp16, dilations = q_25_dilations_0, groups = q_25_groups_0, pad = q_25_pad_0, pad_type = q_25_pad_type_0, strides = q_25_strides_0, weight = var_3403_weight_0_to_fp16, x = input_123_cast_fp16)[name = tensor("op_3403_cast_fp16")]; tensor k_25_pad_type_0 = const()[name = tensor("k_25_pad_type_0"), val = tensor("valid")]; tensor k_25_strides_0 = const()[name = tensor("k_25_strides_0"), val = tensor([1, 1])]; tensor k_25_pad_0 = const()[name = tensor("k_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_25_dilations_0 = const()[name = tensor("k_25_dilations_0"), val = tensor([1, 1])]; tensor k_25_groups_0 = const()[name = tensor("k_25_groups_0"), val = tensor(1)]; tensor blocks_12_attn_key_weight_to_fp16 = const()[name = tensor("blocks_12_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490183040)))]; tensor k_25_cast_fp16 = conv(dilations = k_25_dilations_0, groups = k_25_groups_0, pad = k_25_pad_0, pad_type = k_25_pad_type_0, strides = k_25_strides_0, weight = blocks_12_attn_key_weight_to_fp16, x = input_123_cast_fp16)[name = tensor("k_25_cast_fp16")]; tensor var_3401_pad_type_0 = const()[name = tensor("op_3401_pad_type_0"), val = tensor("valid")]; tensor var_3401_strides_0 = const()[name = tensor("op_3401_strides_0"), val = tensor([1, 1])]; tensor var_3401_pad_0 = const()[name = tensor("op_3401_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3401_dilations_0 = const()[name = tensor("op_3401_dilations_0"), val = tensor([1, 1])]; tensor var_3401_groups_0 = const()[name = tensor("op_3401_groups_0"), val = tensor(1)]; tensor blocks_12_attn_value_weight_to_fp16 = const()[name = tensor("blocks_12_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493459904)))]; tensor blocks_12_attn_value_bias_to_fp16 = const()[name = tensor("blocks_12_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496736768)))]; tensor var_3401_cast_fp16 = conv(bias = blocks_12_attn_value_bias_to_fp16, dilations = var_3401_dilations_0, groups = var_3401_groups_0, pad = var_3401_pad_0, pad_type = var_3401_pad_type_0, strides = var_3401_strides_0, weight = blocks_12_attn_value_weight_to_fp16, x = input_123_cast_fp16)[name = tensor("op_3401_cast_fp16")]; tensor tile_36 = const()[name = tensor("tile_36"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3404_axis_0 = const()[name = tensor("op_3404_axis_0"), val = tensor(1)]; tensor var_3404_cast_fp16_0, tensor var_3404_cast_fp16_1, tensor var_3404_cast_fp16_2, tensor var_3404_cast_fp16_3, tensor var_3404_cast_fp16_4, tensor var_3404_cast_fp16_5, tensor var_3404_cast_fp16_6, tensor var_3404_cast_fp16_7, tensor var_3404_cast_fp16_8, tensor var_3404_cast_fp16_9, tensor var_3404_cast_fp16_10, tensor var_3404_cast_fp16_11, tensor var_3404_cast_fp16_12, tensor var_3404_cast_fp16_13, tensor var_3404_cast_fp16_14, tensor var_3404_cast_fp16_15, tensor var_3404_cast_fp16_16, tensor var_3404_cast_fp16_17, tensor var_3404_cast_fp16_18, tensor var_3404_cast_fp16_19 = split(axis = var_3404_axis_0, split_sizes = tile_36, x = var_3403_cast_fp16)[name = tensor("op_3404_cast_fp16")]; tensor var_3425_perm_0 = const()[name = tensor("op_3425_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_37 = const()[name = tensor("tile_37"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3426_axis_0 = const()[name = tensor("op_3426_axis_0"), val = tensor(3)]; tensor var_3425_cast_fp16 = transpose(perm = var_3425_perm_0, x = k_25_cast_fp16)[name = tensor("transpose_20")]; tensor var_3426_cast_fp16_0, tensor var_3426_cast_fp16_1, tensor var_3426_cast_fp16_2, tensor var_3426_cast_fp16_3, tensor var_3426_cast_fp16_4, tensor var_3426_cast_fp16_5, tensor var_3426_cast_fp16_6, tensor var_3426_cast_fp16_7, tensor var_3426_cast_fp16_8, tensor var_3426_cast_fp16_9, tensor var_3426_cast_fp16_10, tensor var_3426_cast_fp16_11, tensor var_3426_cast_fp16_12, tensor var_3426_cast_fp16_13, tensor var_3426_cast_fp16_14, tensor var_3426_cast_fp16_15, tensor var_3426_cast_fp16_16, tensor var_3426_cast_fp16_17, tensor var_3426_cast_fp16_18, tensor var_3426_cast_fp16_19 = split(axis = var_3426_axis_0, split_sizes = tile_37, x = var_3425_cast_fp16)[name = tensor("op_3426_cast_fp16")]; tensor tile_38 = const()[name = tensor("tile_38"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3447_axis_0 = const()[name = tensor("op_3447_axis_0"), val = tensor(1)]; tensor var_3447_cast_fp16_0, tensor var_3447_cast_fp16_1, tensor var_3447_cast_fp16_2, tensor var_3447_cast_fp16_3, tensor var_3447_cast_fp16_4, tensor var_3447_cast_fp16_5, tensor var_3447_cast_fp16_6, tensor var_3447_cast_fp16_7, tensor var_3447_cast_fp16_8, tensor var_3447_cast_fp16_9, tensor var_3447_cast_fp16_10, tensor var_3447_cast_fp16_11, tensor var_3447_cast_fp16_12, tensor var_3447_cast_fp16_13, tensor var_3447_cast_fp16_14, tensor var_3447_cast_fp16_15, tensor var_3447_cast_fp16_16, tensor var_3447_cast_fp16_17, tensor var_3447_cast_fp16_18, tensor var_3447_cast_fp16_19 = split(axis = var_3447_axis_0, split_sizes = tile_38, x = var_3401_cast_fp16)[name = tensor("op_3447_cast_fp16")]; tensor aw_481_equation_0 = const()[name = tensor("aw_481_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_481_cast_fp16 = einsum(equation = aw_481_equation_0, values = (var_3426_cast_fp16_0, var_3404_cast_fp16_0))[name = tensor("aw_481_cast_fp16")]; tensor aw_483_equation_0 = const()[name = tensor("aw_483_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_483_cast_fp16 = einsum(equation = aw_483_equation_0, values = (var_3426_cast_fp16_1, var_3404_cast_fp16_1))[name = tensor("aw_483_cast_fp16")]; tensor aw_485_equation_0 = const()[name = tensor("aw_485_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_485_cast_fp16 = einsum(equation = aw_485_equation_0, values = (var_3426_cast_fp16_2, var_3404_cast_fp16_2))[name = tensor("aw_485_cast_fp16")]; tensor aw_487_equation_0 = const()[name = tensor("aw_487_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_487_cast_fp16 = einsum(equation = aw_487_equation_0, values = (var_3426_cast_fp16_3, var_3404_cast_fp16_3))[name = tensor("aw_487_cast_fp16")]; tensor aw_489_equation_0 = const()[name = tensor("aw_489_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_489_cast_fp16 = einsum(equation = aw_489_equation_0, values = (var_3426_cast_fp16_4, var_3404_cast_fp16_4))[name = tensor("aw_489_cast_fp16")]; tensor aw_491_equation_0 = const()[name = tensor("aw_491_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_491_cast_fp16 = einsum(equation = aw_491_equation_0, values = (var_3426_cast_fp16_5, var_3404_cast_fp16_5))[name = tensor("aw_491_cast_fp16")]; tensor aw_493_equation_0 = const()[name = tensor("aw_493_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_493_cast_fp16 = einsum(equation = aw_493_equation_0, values = (var_3426_cast_fp16_6, var_3404_cast_fp16_6))[name = tensor("aw_493_cast_fp16")]; tensor aw_495_equation_0 = const()[name = tensor("aw_495_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_495_cast_fp16 = einsum(equation = aw_495_equation_0, values = (var_3426_cast_fp16_7, var_3404_cast_fp16_7))[name = tensor("aw_495_cast_fp16")]; tensor aw_497_equation_0 = const()[name = tensor("aw_497_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_497_cast_fp16 = einsum(equation = aw_497_equation_0, values = (var_3426_cast_fp16_8, var_3404_cast_fp16_8))[name = tensor("aw_497_cast_fp16")]; tensor aw_499_equation_0 = const()[name = tensor("aw_499_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_499_cast_fp16 = einsum(equation = aw_499_equation_0, values = (var_3426_cast_fp16_9, var_3404_cast_fp16_9))[name = tensor("aw_499_cast_fp16")]; tensor aw_501_equation_0 = const()[name = tensor("aw_501_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_501_cast_fp16 = einsum(equation = aw_501_equation_0, values = (var_3426_cast_fp16_10, var_3404_cast_fp16_10))[name = tensor("aw_501_cast_fp16")]; tensor aw_503_equation_0 = const()[name = tensor("aw_503_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_503_cast_fp16 = einsum(equation = aw_503_equation_0, values = (var_3426_cast_fp16_11, var_3404_cast_fp16_11))[name = tensor("aw_503_cast_fp16")]; tensor aw_505_equation_0 = const()[name = tensor("aw_505_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_505_cast_fp16 = einsum(equation = aw_505_equation_0, values = (var_3426_cast_fp16_12, var_3404_cast_fp16_12))[name = tensor("aw_505_cast_fp16")]; tensor aw_507_equation_0 = const()[name = tensor("aw_507_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_507_cast_fp16 = einsum(equation = aw_507_equation_0, values = (var_3426_cast_fp16_13, var_3404_cast_fp16_13))[name = tensor("aw_507_cast_fp16")]; tensor aw_509_equation_0 = const()[name = tensor("aw_509_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_509_cast_fp16 = einsum(equation = aw_509_equation_0, values = (var_3426_cast_fp16_14, var_3404_cast_fp16_14))[name = tensor("aw_509_cast_fp16")]; tensor aw_511_equation_0 = const()[name = tensor("aw_511_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_511_cast_fp16 = einsum(equation = aw_511_equation_0, values = (var_3426_cast_fp16_15, var_3404_cast_fp16_15))[name = tensor("aw_511_cast_fp16")]; tensor aw_513_equation_0 = const()[name = tensor("aw_513_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_513_cast_fp16 = einsum(equation = aw_513_equation_0, values = (var_3426_cast_fp16_16, var_3404_cast_fp16_16))[name = tensor("aw_513_cast_fp16")]; tensor aw_515_equation_0 = const()[name = tensor("aw_515_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_515_cast_fp16 = einsum(equation = aw_515_equation_0, values = (var_3426_cast_fp16_17, var_3404_cast_fp16_17))[name = tensor("aw_515_cast_fp16")]; tensor aw_517_equation_0 = const()[name = tensor("aw_517_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_517_cast_fp16 = einsum(equation = aw_517_equation_0, values = (var_3426_cast_fp16_18, var_3404_cast_fp16_18))[name = tensor("aw_517_cast_fp16")]; tensor aw_519_equation_0 = const()[name = tensor("aw_519_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_519_cast_fp16 = einsum(equation = aw_519_equation_0, values = (var_3426_cast_fp16_19, var_3404_cast_fp16_19))[name = tensor("aw_519_cast_fp16")]; tensor var_3508_cast_fp16 = softmax(axis = var_3352, x = aw_481_cast_fp16)[name = tensor("op_3508_cast_fp16")]; tensor var_3509_cast_fp16 = softmax(axis = var_3352, x = aw_483_cast_fp16)[name = tensor("op_3509_cast_fp16")]; tensor var_3510_cast_fp16 = softmax(axis = var_3352, x = aw_485_cast_fp16)[name = tensor("op_3510_cast_fp16")]; tensor var_3511_cast_fp16 = softmax(axis = var_3352, x = aw_487_cast_fp16)[name = tensor("op_3511_cast_fp16")]; tensor var_3512_cast_fp16 = softmax(axis = var_3352, x = aw_489_cast_fp16)[name = tensor("op_3512_cast_fp16")]; tensor var_3513_cast_fp16 = softmax(axis = var_3352, x = aw_491_cast_fp16)[name = tensor("op_3513_cast_fp16")]; tensor var_3514_cast_fp16 = softmax(axis = var_3352, x = aw_493_cast_fp16)[name = tensor("op_3514_cast_fp16")]; tensor var_3515_cast_fp16 = softmax(axis = var_3352, x = aw_495_cast_fp16)[name = tensor("op_3515_cast_fp16")]; tensor var_3516_cast_fp16 = softmax(axis = var_3352, x = aw_497_cast_fp16)[name = tensor("op_3516_cast_fp16")]; tensor var_3517_cast_fp16 = softmax(axis = var_3352, x = aw_499_cast_fp16)[name = tensor("op_3517_cast_fp16")]; tensor var_3518_cast_fp16 = softmax(axis = var_3352, x = aw_501_cast_fp16)[name = tensor("op_3518_cast_fp16")]; tensor var_3519_cast_fp16 = softmax(axis = var_3352, x = aw_503_cast_fp16)[name = tensor("op_3519_cast_fp16")]; tensor var_3520_cast_fp16 = softmax(axis = var_3352, x = aw_505_cast_fp16)[name = tensor("op_3520_cast_fp16")]; tensor var_3521_cast_fp16 = softmax(axis = var_3352, x = aw_507_cast_fp16)[name = tensor("op_3521_cast_fp16")]; tensor var_3522_cast_fp16 = softmax(axis = var_3352, x = aw_509_cast_fp16)[name = tensor("op_3522_cast_fp16")]; tensor var_3523_cast_fp16 = softmax(axis = var_3352, x = aw_511_cast_fp16)[name = tensor("op_3523_cast_fp16")]; tensor var_3524_cast_fp16 = softmax(axis = var_3352, x = aw_513_cast_fp16)[name = tensor("op_3524_cast_fp16")]; tensor var_3525_cast_fp16 = softmax(axis = var_3352, x = aw_515_cast_fp16)[name = tensor("op_3525_cast_fp16")]; tensor var_3526_cast_fp16 = softmax(axis = var_3352, x = aw_517_cast_fp16)[name = tensor("op_3526_cast_fp16")]; tensor var_3527_cast_fp16 = softmax(axis = var_3352, x = aw_519_cast_fp16)[name = tensor("op_3527_cast_fp16")]; tensor var_3529_equation_0 = const()[name = tensor("op_3529_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3529_cast_fp16 = einsum(equation = var_3529_equation_0, values = (var_3447_cast_fp16_0, var_3508_cast_fp16))[name = tensor("op_3529_cast_fp16")]; tensor var_3531_equation_0 = const()[name = tensor("op_3531_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3531_cast_fp16 = einsum(equation = var_3531_equation_0, values = (var_3447_cast_fp16_1, var_3509_cast_fp16))[name = tensor("op_3531_cast_fp16")]; tensor var_3533_equation_0 = const()[name = tensor("op_3533_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3533_cast_fp16 = einsum(equation = var_3533_equation_0, values = (var_3447_cast_fp16_2, var_3510_cast_fp16))[name = tensor("op_3533_cast_fp16")]; tensor var_3535_equation_0 = const()[name = tensor("op_3535_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3535_cast_fp16 = einsum(equation = var_3535_equation_0, values = (var_3447_cast_fp16_3, var_3511_cast_fp16))[name = tensor("op_3535_cast_fp16")]; tensor var_3537_equation_0 = const()[name = tensor("op_3537_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3537_cast_fp16 = einsum(equation = var_3537_equation_0, values = (var_3447_cast_fp16_4, var_3512_cast_fp16))[name = tensor("op_3537_cast_fp16")]; tensor var_3539_equation_0 = const()[name = tensor("op_3539_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3539_cast_fp16 = einsum(equation = var_3539_equation_0, values = (var_3447_cast_fp16_5, var_3513_cast_fp16))[name = tensor("op_3539_cast_fp16")]; tensor var_3541_equation_0 = const()[name = tensor("op_3541_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3541_cast_fp16 = einsum(equation = var_3541_equation_0, values = (var_3447_cast_fp16_6, var_3514_cast_fp16))[name = tensor("op_3541_cast_fp16")]; tensor var_3543_equation_0 = const()[name = tensor("op_3543_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3543_cast_fp16 = einsum(equation = var_3543_equation_0, values = (var_3447_cast_fp16_7, var_3515_cast_fp16))[name = tensor("op_3543_cast_fp16")]; tensor var_3545_equation_0 = const()[name = tensor("op_3545_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3545_cast_fp16 = einsum(equation = var_3545_equation_0, values = (var_3447_cast_fp16_8, var_3516_cast_fp16))[name = tensor("op_3545_cast_fp16")]; tensor var_3547_equation_0 = const()[name = tensor("op_3547_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3547_cast_fp16 = einsum(equation = var_3547_equation_0, values = (var_3447_cast_fp16_9, var_3517_cast_fp16))[name = tensor("op_3547_cast_fp16")]; tensor var_3549_equation_0 = const()[name = tensor("op_3549_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3549_cast_fp16 = einsum(equation = var_3549_equation_0, values = (var_3447_cast_fp16_10, var_3518_cast_fp16))[name = tensor("op_3549_cast_fp16")]; tensor var_3551_equation_0 = const()[name = tensor("op_3551_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3551_cast_fp16 = einsum(equation = var_3551_equation_0, values = (var_3447_cast_fp16_11, var_3519_cast_fp16))[name = tensor("op_3551_cast_fp16")]; tensor var_3553_equation_0 = const()[name = tensor("op_3553_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3553_cast_fp16 = einsum(equation = var_3553_equation_0, values = (var_3447_cast_fp16_12, var_3520_cast_fp16))[name = tensor("op_3553_cast_fp16")]; tensor var_3555_equation_0 = const()[name = tensor("op_3555_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3555_cast_fp16 = einsum(equation = var_3555_equation_0, values = (var_3447_cast_fp16_13, var_3521_cast_fp16))[name = tensor("op_3555_cast_fp16")]; tensor var_3557_equation_0 = const()[name = tensor("op_3557_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3557_cast_fp16 = einsum(equation = var_3557_equation_0, values = (var_3447_cast_fp16_14, var_3522_cast_fp16))[name = tensor("op_3557_cast_fp16")]; tensor var_3559_equation_0 = const()[name = tensor("op_3559_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3559_cast_fp16 = einsum(equation = var_3559_equation_0, values = (var_3447_cast_fp16_15, var_3523_cast_fp16))[name = tensor("op_3559_cast_fp16")]; tensor var_3561_equation_0 = const()[name = tensor("op_3561_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3561_cast_fp16 = einsum(equation = var_3561_equation_0, values = (var_3447_cast_fp16_16, var_3524_cast_fp16))[name = tensor("op_3561_cast_fp16")]; tensor var_3563_equation_0 = const()[name = tensor("op_3563_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3563_cast_fp16 = einsum(equation = var_3563_equation_0, values = (var_3447_cast_fp16_17, var_3525_cast_fp16))[name = tensor("op_3563_cast_fp16")]; tensor var_3565_equation_0 = const()[name = tensor("op_3565_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3565_cast_fp16 = einsum(equation = var_3565_equation_0, values = (var_3447_cast_fp16_18, var_3526_cast_fp16))[name = tensor("op_3565_cast_fp16")]; tensor var_3567_equation_0 = const()[name = tensor("op_3567_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3567_cast_fp16 = einsum(equation = var_3567_equation_0, values = (var_3447_cast_fp16_19, var_3527_cast_fp16))[name = tensor("op_3567_cast_fp16")]; tensor input_125_interleave_0 = const()[name = tensor("input_125_interleave_0"), val = tensor(false)]; tensor input_125_cast_fp16 = concat(axis = var_3352, interleave = input_125_interleave_0, values = (var_3529_cast_fp16, var_3531_cast_fp16, var_3533_cast_fp16, var_3535_cast_fp16, var_3537_cast_fp16, var_3539_cast_fp16, var_3541_cast_fp16, var_3543_cast_fp16, var_3545_cast_fp16, var_3547_cast_fp16, var_3549_cast_fp16, var_3551_cast_fp16, var_3553_cast_fp16, var_3555_cast_fp16, var_3557_cast_fp16, var_3559_cast_fp16, var_3561_cast_fp16, var_3563_cast_fp16, var_3565_cast_fp16, var_3567_cast_fp16))[name = tensor("input_125_cast_fp16")]; tensor var_3576_pad_type_0 = const()[name = tensor("op_3576_pad_type_0"), val = tensor("valid")]; tensor var_3576_strides_0 = const()[name = tensor("op_3576_strides_0"), val = tensor([1, 1])]; tensor var_3576_pad_0 = const()[name = tensor("op_3576_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3576_dilations_0 = const()[name = tensor("op_3576_dilations_0"), val = tensor([1, 1])]; tensor var_3576_groups_0 = const()[name = tensor("op_3576_groups_0"), val = tensor(1)]; tensor blocks_12_attn_out_weight_to_fp16 = const()[name = tensor("blocks_12_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496739392)))]; tensor blocks_12_attn_out_bias_to_fp16 = const()[name = tensor("blocks_12_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500016256)))]; tensor var_3576_cast_fp16 = conv(bias = blocks_12_attn_out_bias_to_fp16, dilations = var_3576_dilations_0, groups = var_3576_groups_0, pad = var_3576_pad_0, pad_type = var_3576_pad_type_0, strides = var_3576_strides_0, weight = blocks_12_attn_out_weight_to_fp16, x = input_125_cast_fp16)[name = tensor("op_3576_cast_fp16")]; tensor inputs_51_cast_fp16 = add(x = inputs_49_cast_fp16, y = var_3576_cast_fp16)[name = tensor("inputs_51_cast_fp16")]; tensor input_127_axes_0 = const()[name = tensor("input_127_axes_0"), val = tensor([1])]; tensor input_127_gamma_0_to_fp16 = const()[name = tensor("input_127_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500018880)))]; tensor input_127_beta_0_to_fp16 = const()[name = tensor("input_127_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500021504)))]; tensor var_3586_to_fp16 = const()[name = tensor("op_3586_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_127_cast_fp16 = layer_norm(axes = input_127_axes_0, beta = input_127_beta_0_to_fp16, epsilon = var_3586_to_fp16, gamma = input_127_gamma_0_to_fp16, x = inputs_51_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor input_129_pad_type_0 = const()[name = tensor("input_129_pad_type_0"), val = tensor("valid")]; tensor input_129_strides_0 = const()[name = tensor("input_129_strides_0"), val = tensor([1, 1])]; tensor input_129_pad_0 = const()[name = tensor("input_129_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_129_dilations_0 = const()[name = tensor("input_129_dilations_0"), val = tensor([1, 1])]; tensor input_129_groups_0 = const()[name = tensor("input_129_groups_0"), val = tensor(1)]; tensor blocks_12_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_12_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(500024128)))]; tensor blocks_12_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_12_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513131392)))]; tensor input_129_cast_fp16 = conv(bias = blocks_12_mlp_0_bias_to_fp16, dilations = input_129_dilations_0, groups = input_129_groups_0, pad = input_129_pad_0, pad_type = input_129_pad_type_0, strides = input_129_strides_0, weight = blocks_12_mlp_0_weight_to_fp16, x = input_127_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor input_131_mode_0 = const()[name = tensor("input_131_mode_0"), val = tensor("EXACT")]; tensor input_131_cast_fp16 = gelu(mode = input_131_mode_0, x = input_129_cast_fp16)[name = tensor("input_131_cast_fp16")]; tensor var_3612_pad_type_0 = const()[name = tensor("op_3612_pad_type_0"), val = tensor("valid")]; tensor var_3612_strides_0 = const()[name = tensor("op_3612_strides_0"), val = tensor([1, 1])]; tensor var_3612_pad_0 = const()[name = tensor("op_3612_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3612_dilations_0 = const()[name = tensor("op_3612_dilations_0"), val = tensor([1, 1])]; tensor var_3612_groups_0 = const()[name = tensor("op_3612_groups_0"), val = tensor(1)]; tensor blocks_12_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_12_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513141696)))]; tensor blocks_12_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_12_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526248960)))]; tensor var_3612_cast_fp16 = conv(bias = blocks_12_mlp_2_bias_to_fp16, dilations = var_3612_dilations_0, groups = var_3612_groups_0, pad = var_3612_pad_0, pad_type = var_3612_pad_type_0, strides = var_3612_strides_0, weight = blocks_12_mlp_2_weight_to_fp16, x = input_131_cast_fp16)[name = tensor("op_3612_cast_fp16")]; tensor inputs_53_cast_fp16 = add(x = inputs_51_cast_fp16, y = var_3612_cast_fp16)[name = tensor("inputs_53_cast_fp16")]; tensor var_3621 = const()[name = tensor("op_3621"), val = tensor(1)]; tensor input_133_axes_0 = const()[name = tensor("input_133_axes_0"), val = tensor([1])]; tensor input_133_gamma_0_to_fp16 = const()[name = tensor("input_133_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526251584)))]; tensor input_133_beta_0_to_fp16 = const()[name = tensor("input_133_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526254208)))]; tensor var_3637_to_fp16 = const()[name = tensor("op_3637_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_133_cast_fp16 = layer_norm(axes = input_133_axes_0, beta = input_133_beta_0_to_fp16, epsilon = var_3637_to_fp16, gamma = input_133_gamma_0_to_fp16, x = inputs_53_cast_fp16)[name = tensor("input_133_cast_fp16")]; tensor q_27_pad_type_0 = const()[name = tensor("q_27_pad_type_0"), val = tensor("valid")]; tensor q_27_strides_0 = const()[name = tensor("q_27_strides_0"), val = tensor([1, 1])]; tensor q_27_pad_0 = const()[name = tensor("q_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_27_dilations_0 = const()[name = tensor("q_27_dilations_0"), val = tensor([1, 1])]; tensor q_27_groups_0 = const()[name = tensor("q_27_groups_0"), val = tensor(1)]; tensor var_3672_weight_0_to_fp16 = const()[name = tensor("op_3672_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526256832)))]; tensor var_3672_bias_0_to_fp16 = const()[name = tensor("op_3672_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529533696)))]; tensor var_3672_cast_fp16 = conv(bias = var_3672_bias_0_to_fp16, dilations = q_27_dilations_0, groups = q_27_groups_0, pad = q_27_pad_0, pad_type = q_27_pad_type_0, strides = q_27_strides_0, weight = var_3672_weight_0_to_fp16, x = input_133_cast_fp16)[name = tensor("op_3672_cast_fp16")]; tensor k_27_pad_type_0 = const()[name = tensor("k_27_pad_type_0"), val = tensor("valid")]; tensor k_27_strides_0 = const()[name = tensor("k_27_strides_0"), val = tensor([1, 1])]; tensor k_27_pad_0 = const()[name = tensor("k_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_27_dilations_0 = const()[name = tensor("k_27_dilations_0"), val = tensor([1, 1])]; tensor k_27_groups_0 = const()[name = tensor("k_27_groups_0"), val = tensor(1)]; tensor blocks_13_attn_key_weight_to_fp16 = const()[name = tensor("blocks_13_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529536320)))]; tensor k_27_cast_fp16 = conv(dilations = k_27_dilations_0, groups = k_27_groups_0, pad = k_27_pad_0, pad_type = k_27_pad_type_0, strides = k_27_strides_0, weight = blocks_13_attn_key_weight_to_fp16, x = input_133_cast_fp16)[name = tensor("k_27_cast_fp16")]; tensor var_3670_pad_type_0 = const()[name = tensor("op_3670_pad_type_0"), val = tensor("valid")]; tensor var_3670_strides_0 = const()[name = tensor("op_3670_strides_0"), val = tensor([1, 1])]; tensor var_3670_pad_0 = const()[name = tensor("op_3670_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3670_dilations_0 = const()[name = tensor("op_3670_dilations_0"), val = tensor([1, 1])]; tensor var_3670_groups_0 = const()[name = tensor("op_3670_groups_0"), val = tensor(1)]; tensor blocks_13_attn_value_weight_to_fp16 = const()[name = tensor("blocks_13_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(532813184)))]; tensor blocks_13_attn_value_bias_to_fp16 = const()[name = tensor("blocks_13_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(536090048)))]; tensor var_3670_cast_fp16 = conv(bias = blocks_13_attn_value_bias_to_fp16, dilations = var_3670_dilations_0, groups = var_3670_groups_0, pad = var_3670_pad_0, pad_type = var_3670_pad_type_0, strides = var_3670_strides_0, weight = blocks_13_attn_value_weight_to_fp16, x = input_133_cast_fp16)[name = tensor("op_3670_cast_fp16")]; tensor tile_39 = const()[name = tensor("tile_39"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3673_axis_0 = const()[name = tensor("op_3673_axis_0"), val = tensor(1)]; tensor var_3673_cast_fp16_0, tensor var_3673_cast_fp16_1, tensor var_3673_cast_fp16_2, tensor var_3673_cast_fp16_3, tensor var_3673_cast_fp16_4, tensor var_3673_cast_fp16_5, tensor var_3673_cast_fp16_6, tensor var_3673_cast_fp16_7, tensor var_3673_cast_fp16_8, tensor var_3673_cast_fp16_9, tensor var_3673_cast_fp16_10, tensor var_3673_cast_fp16_11, tensor var_3673_cast_fp16_12, tensor var_3673_cast_fp16_13, tensor var_3673_cast_fp16_14, tensor var_3673_cast_fp16_15, tensor var_3673_cast_fp16_16, tensor var_3673_cast_fp16_17, tensor var_3673_cast_fp16_18, tensor var_3673_cast_fp16_19 = split(axis = var_3673_axis_0, split_sizes = tile_39, x = var_3672_cast_fp16)[name = tensor("op_3673_cast_fp16")]; tensor var_3694_perm_0 = const()[name = tensor("op_3694_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_40 = const()[name = tensor("tile_40"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3695_axis_0 = const()[name = tensor("op_3695_axis_0"), val = tensor(3)]; tensor var_3694_cast_fp16 = transpose(perm = var_3694_perm_0, x = k_27_cast_fp16)[name = tensor("transpose_19")]; tensor var_3695_cast_fp16_0, tensor var_3695_cast_fp16_1, tensor var_3695_cast_fp16_2, tensor var_3695_cast_fp16_3, tensor var_3695_cast_fp16_4, tensor var_3695_cast_fp16_5, tensor var_3695_cast_fp16_6, tensor var_3695_cast_fp16_7, tensor var_3695_cast_fp16_8, tensor var_3695_cast_fp16_9, tensor var_3695_cast_fp16_10, tensor var_3695_cast_fp16_11, tensor var_3695_cast_fp16_12, tensor var_3695_cast_fp16_13, tensor var_3695_cast_fp16_14, tensor var_3695_cast_fp16_15, tensor var_3695_cast_fp16_16, tensor var_3695_cast_fp16_17, tensor var_3695_cast_fp16_18, tensor var_3695_cast_fp16_19 = split(axis = var_3695_axis_0, split_sizes = tile_40, x = var_3694_cast_fp16)[name = tensor("op_3695_cast_fp16")]; tensor tile_41 = const()[name = tensor("tile_41"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3716_axis_0 = const()[name = tensor("op_3716_axis_0"), val = tensor(1)]; tensor var_3716_cast_fp16_0, tensor var_3716_cast_fp16_1, tensor var_3716_cast_fp16_2, tensor var_3716_cast_fp16_3, tensor var_3716_cast_fp16_4, tensor var_3716_cast_fp16_5, tensor var_3716_cast_fp16_6, tensor var_3716_cast_fp16_7, tensor var_3716_cast_fp16_8, tensor var_3716_cast_fp16_9, tensor var_3716_cast_fp16_10, tensor var_3716_cast_fp16_11, tensor var_3716_cast_fp16_12, tensor var_3716_cast_fp16_13, tensor var_3716_cast_fp16_14, tensor var_3716_cast_fp16_15, tensor var_3716_cast_fp16_16, tensor var_3716_cast_fp16_17, tensor var_3716_cast_fp16_18, tensor var_3716_cast_fp16_19 = split(axis = var_3716_axis_0, split_sizes = tile_41, x = var_3670_cast_fp16)[name = tensor("op_3716_cast_fp16")]; tensor aw_521_equation_0 = const()[name = tensor("aw_521_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_521_cast_fp16 = einsum(equation = aw_521_equation_0, values = (var_3695_cast_fp16_0, var_3673_cast_fp16_0))[name = tensor("aw_521_cast_fp16")]; tensor aw_523_equation_0 = const()[name = tensor("aw_523_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_523_cast_fp16 = einsum(equation = aw_523_equation_0, values = (var_3695_cast_fp16_1, var_3673_cast_fp16_1))[name = tensor("aw_523_cast_fp16")]; tensor aw_525_equation_0 = const()[name = tensor("aw_525_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_525_cast_fp16 = einsum(equation = aw_525_equation_0, values = (var_3695_cast_fp16_2, var_3673_cast_fp16_2))[name = tensor("aw_525_cast_fp16")]; tensor aw_527_equation_0 = const()[name = tensor("aw_527_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_527_cast_fp16 = einsum(equation = aw_527_equation_0, values = (var_3695_cast_fp16_3, var_3673_cast_fp16_3))[name = tensor("aw_527_cast_fp16")]; tensor aw_529_equation_0 = const()[name = tensor("aw_529_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_529_cast_fp16 = einsum(equation = aw_529_equation_0, values = (var_3695_cast_fp16_4, var_3673_cast_fp16_4))[name = tensor("aw_529_cast_fp16")]; tensor aw_531_equation_0 = const()[name = tensor("aw_531_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_531_cast_fp16 = einsum(equation = aw_531_equation_0, values = (var_3695_cast_fp16_5, var_3673_cast_fp16_5))[name = tensor("aw_531_cast_fp16")]; tensor aw_533_equation_0 = const()[name = tensor("aw_533_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_533_cast_fp16 = einsum(equation = aw_533_equation_0, values = (var_3695_cast_fp16_6, var_3673_cast_fp16_6))[name = tensor("aw_533_cast_fp16")]; tensor aw_535_equation_0 = const()[name = tensor("aw_535_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_535_cast_fp16 = einsum(equation = aw_535_equation_0, values = (var_3695_cast_fp16_7, var_3673_cast_fp16_7))[name = tensor("aw_535_cast_fp16")]; tensor aw_537_equation_0 = const()[name = tensor("aw_537_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_537_cast_fp16 = einsum(equation = aw_537_equation_0, values = (var_3695_cast_fp16_8, var_3673_cast_fp16_8))[name = tensor("aw_537_cast_fp16")]; tensor aw_539_equation_0 = const()[name = tensor("aw_539_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_539_cast_fp16 = einsum(equation = aw_539_equation_0, values = (var_3695_cast_fp16_9, var_3673_cast_fp16_9))[name = tensor("aw_539_cast_fp16")]; tensor aw_541_equation_0 = const()[name = tensor("aw_541_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_541_cast_fp16 = einsum(equation = aw_541_equation_0, values = (var_3695_cast_fp16_10, var_3673_cast_fp16_10))[name = tensor("aw_541_cast_fp16")]; tensor aw_543_equation_0 = const()[name = tensor("aw_543_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_543_cast_fp16 = einsum(equation = aw_543_equation_0, values = (var_3695_cast_fp16_11, var_3673_cast_fp16_11))[name = tensor("aw_543_cast_fp16")]; tensor aw_545_equation_0 = const()[name = tensor("aw_545_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_545_cast_fp16 = einsum(equation = aw_545_equation_0, values = (var_3695_cast_fp16_12, var_3673_cast_fp16_12))[name = tensor("aw_545_cast_fp16")]; tensor aw_547_equation_0 = const()[name = tensor("aw_547_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_547_cast_fp16 = einsum(equation = aw_547_equation_0, values = (var_3695_cast_fp16_13, var_3673_cast_fp16_13))[name = tensor("aw_547_cast_fp16")]; tensor aw_549_equation_0 = const()[name = tensor("aw_549_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_549_cast_fp16 = einsum(equation = aw_549_equation_0, values = (var_3695_cast_fp16_14, var_3673_cast_fp16_14))[name = tensor("aw_549_cast_fp16")]; tensor aw_551_equation_0 = const()[name = tensor("aw_551_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_551_cast_fp16 = einsum(equation = aw_551_equation_0, values = (var_3695_cast_fp16_15, var_3673_cast_fp16_15))[name = tensor("aw_551_cast_fp16")]; tensor aw_553_equation_0 = const()[name = tensor("aw_553_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_553_cast_fp16 = einsum(equation = aw_553_equation_0, values = (var_3695_cast_fp16_16, var_3673_cast_fp16_16))[name = tensor("aw_553_cast_fp16")]; tensor aw_555_equation_0 = const()[name = tensor("aw_555_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_555_cast_fp16 = einsum(equation = aw_555_equation_0, values = (var_3695_cast_fp16_17, var_3673_cast_fp16_17))[name = tensor("aw_555_cast_fp16")]; tensor aw_557_equation_0 = const()[name = tensor("aw_557_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_557_cast_fp16 = einsum(equation = aw_557_equation_0, values = (var_3695_cast_fp16_18, var_3673_cast_fp16_18))[name = tensor("aw_557_cast_fp16")]; tensor aw_559_equation_0 = const()[name = tensor("aw_559_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_559_cast_fp16 = einsum(equation = aw_559_equation_0, values = (var_3695_cast_fp16_19, var_3673_cast_fp16_19))[name = tensor("aw_559_cast_fp16")]; tensor var_3777_cast_fp16 = softmax(axis = var_3621, x = aw_521_cast_fp16)[name = tensor("op_3777_cast_fp16")]; tensor var_3778_cast_fp16 = softmax(axis = var_3621, x = aw_523_cast_fp16)[name = tensor("op_3778_cast_fp16")]; tensor var_3779_cast_fp16 = softmax(axis = var_3621, x = aw_525_cast_fp16)[name = tensor("op_3779_cast_fp16")]; tensor var_3780_cast_fp16 = softmax(axis = var_3621, x = aw_527_cast_fp16)[name = tensor("op_3780_cast_fp16")]; tensor var_3781_cast_fp16 = softmax(axis = var_3621, x = aw_529_cast_fp16)[name = tensor("op_3781_cast_fp16")]; tensor var_3782_cast_fp16 = softmax(axis = var_3621, x = aw_531_cast_fp16)[name = tensor("op_3782_cast_fp16")]; tensor var_3783_cast_fp16 = softmax(axis = var_3621, x = aw_533_cast_fp16)[name = tensor("op_3783_cast_fp16")]; tensor var_3784_cast_fp16 = softmax(axis = var_3621, x = aw_535_cast_fp16)[name = tensor("op_3784_cast_fp16")]; tensor var_3785_cast_fp16 = softmax(axis = var_3621, x = aw_537_cast_fp16)[name = tensor("op_3785_cast_fp16")]; tensor var_3786_cast_fp16 = softmax(axis = var_3621, x = aw_539_cast_fp16)[name = tensor("op_3786_cast_fp16")]; tensor var_3787_cast_fp16 = softmax(axis = var_3621, x = aw_541_cast_fp16)[name = tensor("op_3787_cast_fp16")]; tensor var_3788_cast_fp16 = softmax(axis = var_3621, x = aw_543_cast_fp16)[name = tensor("op_3788_cast_fp16")]; tensor var_3789_cast_fp16 = softmax(axis = var_3621, x = aw_545_cast_fp16)[name = tensor("op_3789_cast_fp16")]; tensor var_3790_cast_fp16 = softmax(axis = var_3621, x = aw_547_cast_fp16)[name = tensor("op_3790_cast_fp16")]; tensor var_3791_cast_fp16 = softmax(axis = var_3621, x = aw_549_cast_fp16)[name = tensor("op_3791_cast_fp16")]; tensor var_3792_cast_fp16 = softmax(axis = var_3621, x = aw_551_cast_fp16)[name = tensor("op_3792_cast_fp16")]; tensor var_3793_cast_fp16 = softmax(axis = var_3621, x = aw_553_cast_fp16)[name = tensor("op_3793_cast_fp16")]; tensor var_3794_cast_fp16 = softmax(axis = var_3621, x = aw_555_cast_fp16)[name = tensor("op_3794_cast_fp16")]; tensor var_3795_cast_fp16 = softmax(axis = var_3621, x = aw_557_cast_fp16)[name = tensor("op_3795_cast_fp16")]; tensor var_3796_cast_fp16 = softmax(axis = var_3621, x = aw_559_cast_fp16)[name = tensor("op_3796_cast_fp16")]; tensor var_3798_equation_0 = const()[name = tensor("op_3798_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3798_cast_fp16 = einsum(equation = var_3798_equation_0, values = (var_3716_cast_fp16_0, var_3777_cast_fp16))[name = tensor("op_3798_cast_fp16")]; tensor var_3800_equation_0 = const()[name = tensor("op_3800_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3800_cast_fp16 = einsum(equation = var_3800_equation_0, values = (var_3716_cast_fp16_1, var_3778_cast_fp16))[name = tensor("op_3800_cast_fp16")]; tensor var_3802_equation_0 = const()[name = tensor("op_3802_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3802_cast_fp16 = einsum(equation = var_3802_equation_0, values = (var_3716_cast_fp16_2, var_3779_cast_fp16))[name = tensor("op_3802_cast_fp16")]; tensor var_3804_equation_0 = const()[name = tensor("op_3804_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3804_cast_fp16 = einsum(equation = var_3804_equation_0, values = (var_3716_cast_fp16_3, var_3780_cast_fp16))[name = tensor("op_3804_cast_fp16")]; tensor var_3806_equation_0 = const()[name = tensor("op_3806_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3806_cast_fp16 = einsum(equation = var_3806_equation_0, values = (var_3716_cast_fp16_4, var_3781_cast_fp16))[name = tensor("op_3806_cast_fp16")]; tensor var_3808_equation_0 = const()[name = tensor("op_3808_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3808_cast_fp16 = einsum(equation = var_3808_equation_0, values = (var_3716_cast_fp16_5, var_3782_cast_fp16))[name = tensor("op_3808_cast_fp16")]; tensor var_3810_equation_0 = const()[name = tensor("op_3810_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3810_cast_fp16 = einsum(equation = var_3810_equation_0, values = (var_3716_cast_fp16_6, var_3783_cast_fp16))[name = tensor("op_3810_cast_fp16")]; tensor var_3812_equation_0 = const()[name = tensor("op_3812_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3812_cast_fp16 = einsum(equation = var_3812_equation_0, values = (var_3716_cast_fp16_7, var_3784_cast_fp16))[name = tensor("op_3812_cast_fp16")]; tensor var_3814_equation_0 = const()[name = tensor("op_3814_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3814_cast_fp16 = einsum(equation = var_3814_equation_0, values = (var_3716_cast_fp16_8, var_3785_cast_fp16))[name = tensor("op_3814_cast_fp16")]; tensor var_3816_equation_0 = const()[name = tensor("op_3816_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3816_cast_fp16 = einsum(equation = var_3816_equation_0, values = (var_3716_cast_fp16_9, var_3786_cast_fp16))[name = tensor("op_3816_cast_fp16")]; tensor var_3818_equation_0 = const()[name = tensor("op_3818_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3818_cast_fp16 = einsum(equation = var_3818_equation_0, values = (var_3716_cast_fp16_10, var_3787_cast_fp16))[name = tensor("op_3818_cast_fp16")]; tensor var_3820_equation_0 = const()[name = tensor("op_3820_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3820_cast_fp16 = einsum(equation = var_3820_equation_0, values = (var_3716_cast_fp16_11, var_3788_cast_fp16))[name = tensor("op_3820_cast_fp16")]; tensor var_3822_equation_0 = const()[name = tensor("op_3822_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3822_cast_fp16 = einsum(equation = var_3822_equation_0, values = (var_3716_cast_fp16_12, var_3789_cast_fp16))[name = tensor("op_3822_cast_fp16")]; tensor var_3824_equation_0 = const()[name = tensor("op_3824_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3824_cast_fp16 = einsum(equation = var_3824_equation_0, values = (var_3716_cast_fp16_13, var_3790_cast_fp16))[name = tensor("op_3824_cast_fp16")]; tensor var_3826_equation_0 = const()[name = tensor("op_3826_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3826_cast_fp16 = einsum(equation = var_3826_equation_0, values = (var_3716_cast_fp16_14, var_3791_cast_fp16))[name = tensor("op_3826_cast_fp16")]; tensor var_3828_equation_0 = const()[name = tensor("op_3828_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3828_cast_fp16 = einsum(equation = var_3828_equation_0, values = (var_3716_cast_fp16_15, var_3792_cast_fp16))[name = tensor("op_3828_cast_fp16")]; tensor var_3830_equation_0 = const()[name = tensor("op_3830_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3830_cast_fp16 = einsum(equation = var_3830_equation_0, values = (var_3716_cast_fp16_16, var_3793_cast_fp16))[name = tensor("op_3830_cast_fp16")]; tensor var_3832_equation_0 = const()[name = tensor("op_3832_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3832_cast_fp16 = einsum(equation = var_3832_equation_0, values = (var_3716_cast_fp16_17, var_3794_cast_fp16))[name = tensor("op_3832_cast_fp16")]; tensor var_3834_equation_0 = const()[name = tensor("op_3834_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3834_cast_fp16 = einsum(equation = var_3834_equation_0, values = (var_3716_cast_fp16_18, var_3795_cast_fp16))[name = tensor("op_3834_cast_fp16")]; tensor var_3836_equation_0 = const()[name = tensor("op_3836_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3836_cast_fp16 = einsum(equation = var_3836_equation_0, values = (var_3716_cast_fp16_19, var_3796_cast_fp16))[name = tensor("op_3836_cast_fp16")]; tensor input_135_interleave_0 = const()[name = tensor("input_135_interleave_0"), val = tensor(false)]; tensor input_135_cast_fp16 = concat(axis = var_3621, interleave = input_135_interleave_0, values = (var_3798_cast_fp16, var_3800_cast_fp16, var_3802_cast_fp16, var_3804_cast_fp16, var_3806_cast_fp16, var_3808_cast_fp16, var_3810_cast_fp16, var_3812_cast_fp16, var_3814_cast_fp16, var_3816_cast_fp16, var_3818_cast_fp16, var_3820_cast_fp16, var_3822_cast_fp16, var_3824_cast_fp16, var_3826_cast_fp16, var_3828_cast_fp16, var_3830_cast_fp16, var_3832_cast_fp16, var_3834_cast_fp16, var_3836_cast_fp16))[name = tensor("input_135_cast_fp16")]; tensor var_3845_pad_type_0 = const()[name = tensor("op_3845_pad_type_0"), val = tensor("valid")]; tensor var_3845_strides_0 = const()[name = tensor("op_3845_strides_0"), val = tensor([1, 1])]; tensor var_3845_pad_0 = const()[name = tensor("op_3845_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3845_dilations_0 = const()[name = tensor("op_3845_dilations_0"), val = tensor([1, 1])]; tensor var_3845_groups_0 = const()[name = tensor("op_3845_groups_0"), val = tensor(1)]; tensor blocks_13_attn_out_weight_to_fp16 = const()[name = tensor("blocks_13_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(536092672)))]; tensor blocks_13_attn_out_bias_to_fp16 = const()[name = tensor("blocks_13_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539369536)))]; tensor var_3845_cast_fp16 = conv(bias = blocks_13_attn_out_bias_to_fp16, dilations = var_3845_dilations_0, groups = var_3845_groups_0, pad = var_3845_pad_0, pad_type = var_3845_pad_type_0, strides = var_3845_strides_0, weight = blocks_13_attn_out_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("op_3845_cast_fp16")]; tensor inputs_55_cast_fp16 = add(x = inputs_53_cast_fp16, y = var_3845_cast_fp16)[name = tensor("inputs_55_cast_fp16")]; tensor input_137_axes_0 = const()[name = tensor("input_137_axes_0"), val = tensor([1])]; tensor input_137_gamma_0_to_fp16 = const()[name = tensor("input_137_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539372160)))]; tensor input_137_beta_0_to_fp16 = const()[name = tensor("input_137_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539374784)))]; tensor var_3855_to_fp16 = const()[name = tensor("op_3855_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_137_cast_fp16 = layer_norm(axes = input_137_axes_0, beta = input_137_beta_0_to_fp16, epsilon = var_3855_to_fp16, gamma = input_137_gamma_0_to_fp16, x = inputs_55_cast_fp16)[name = tensor("input_137_cast_fp16")]; tensor input_139_pad_type_0 = const()[name = tensor("input_139_pad_type_0"), val = tensor("valid")]; tensor input_139_strides_0 = const()[name = tensor("input_139_strides_0"), val = tensor([1, 1])]; tensor input_139_pad_0 = const()[name = tensor("input_139_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_139_dilations_0 = const()[name = tensor("input_139_dilations_0"), val = tensor([1, 1])]; tensor input_139_groups_0 = const()[name = tensor("input_139_groups_0"), val = tensor(1)]; tensor blocks_13_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_13_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(539377408)))]; tensor blocks_13_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_13_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552484672)))]; tensor input_139_cast_fp16 = conv(bias = blocks_13_mlp_0_bias_to_fp16, dilations = input_139_dilations_0, groups = input_139_groups_0, pad = input_139_pad_0, pad_type = input_139_pad_type_0, strides = input_139_strides_0, weight = blocks_13_mlp_0_weight_to_fp16, x = input_137_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor input_141_mode_0 = const()[name = tensor("input_141_mode_0"), val = tensor("EXACT")]; tensor input_141_cast_fp16 = gelu(mode = input_141_mode_0, x = input_139_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor var_3881_pad_type_0 = const()[name = tensor("op_3881_pad_type_0"), val = tensor("valid")]; tensor var_3881_strides_0 = const()[name = tensor("op_3881_strides_0"), val = tensor([1, 1])]; tensor var_3881_pad_0 = const()[name = tensor("op_3881_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3881_dilations_0 = const()[name = tensor("op_3881_dilations_0"), val = tensor([1, 1])]; tensor var_3881_groups_0 = const()[name = tensor("op_3881_groups_0"), val = tensor(1)]; tensor blocks_13_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_13_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552494976)))]; tensor blocks_13_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_13_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565602240)))]; tensor var_3881_cast_fp16 = conv(bias = blocks_13_mlp_2_bias_to_fp16, dilations = var_3881_dilations_0, groups = var_3881_groups_0, pad = var_3881_pad_0, pad_type = var_3881_pad_type_0, strides = var_3881_strides_0, weight = blocks_13_mlp_2_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("op_3881_cast_fp16")]; tensor inputs_57_cast_fp16 = add(x = inputs_55_cast_fp16, y = var_3881_cast_fp16)[name = tensor("inputs_57_cast_fp16")]; tensor var_3890 = const()[name = tensor("op_3890"), val = tensor(1)]; tensor input_143_axes_0 = const()[name = tensor("input_143_axes_0"), val = tensor([1])]; tensor input_143_gamma_0_to_fp16 = const()[name = tensor("input_143_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565604864)))]; tensor input_143_beta_0_to_fp16 = const()[name = tensor("input_143_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565607488)))]; tensor var_3906_to_fp16 = const()[name = tensor("op_3906_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_143_cast_fp16 = layer_norm(axes = input_143_axes_0, beta = input_143_beta_0_to_fp16, epsilon = var_3906_to_fp16, gamma = input_143_gamma_0_to_fp16, x = inputs_57_cast_fp16)[name = tensor("input_143_cast_fp16")]; tensor q_29_pad_type_0 = const()[name = tensor("q_29_pad_type_0"), val = tensor("valid")]; tensor q_29_strides_0 = const()[name = tensor("q_29_strides_0"), val = tensor([1, 1])]; tensor q_29_pad_0 = const()[name = tensor("q_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_29_dilations_0 = const()[name = tensor("q_29_dilations_0"), val = tensor([1, 1])]; tensor q_29_groups_0 = const()[name = tensor("q_29_groups_0"), val = tensor(1)]; tensor var_3941_weight_0_to_fp16 = const()[name = tensor("op_3941_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565610112)))]; tensor var_3941_bias_0_to_fp16 = const()[name = tensor("op_3941_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568886976)))]; tensor var_3941_cast_fp16 = conv(bias = var_3941_bias_0_to_fp16, dilations = q_29_dilations_0, groups = q_29_groups_0, pad = q_29_pad_0, pad_type = q_29_pad_type_0, strides = q_29_strides_0, weight = var_3941_weight_0_to_fp16, x = input_143_cast_fp16)[name = tensor("op_3941_cast_fp16")]; tensor k_29_pad_type_0 = const()[name = tensor("k_29_pad_type_0"), val = tensor("valid")]; tensor k_29_strides_0 = const()[name = tensor("k_29_strides_0"), val = tensor([1, 1])]; tensor k_29_pad_0 = const()[name = tensor("k_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_29_dilations_0 = const()[name = tensor("k_29_dilations_0"), val = tensor([1, 1])]; tensor k_29_groups_0 = const()[name = tensor("k_29_groups_0"), val = tensor(1)]; tensor blocks_14_attn_key_weight_to_fp16 = const()[name = tensor("blocks_14_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568889600)))]; tensor k_29_cast_fp16 = conv(dilations = k_29_dilations_0, groups = k_29_groups_0, pad = k_29_pad_0, pad_type = k_29_pad_type_0, strides = k_29_strides_0, weight = blocks_14_attn_key_weight_to_fp16, x = input_143_cast_fp16)[name = tensor("k_29_cast_fp16")]; tensor var_3939_pad_type_0 = const()[name = tensor("op_3939_pad_type_0"), val = tensor("valid")]; tensor var_3939_strides_0 = const()[name = tensor("op_3939_strides_0"), val = tensor([1, 1])]; tensor var_3939_pad_0 = const()[name = tensor("op_3939_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_3939_dilations_0 = const()[name = tensor("op_3939_dilations_0"), val = tensor([1, 1])]; tensor var_3939_groups_0 = const()[name = tensor("op_3939_groups_0"), val = tensor(1)]; tensor blocks_14_attn_value_weight_to_fp16 = const()[name = tensor("blocks_14_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572166464)))]; tensor blocks_14_attn_value_bias_to_fp16 = const()[name = tensor("blocks_14_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575443328)))]; tensor var_3939_cast_fp16 = conv(bias = blocks_14_attn_value_bias_to_fp16, dilations = var_3939_dilations_0, groups = var_3939_groups_0, pad = var_3939_pad_0, pad_type = var_3939_pad_type_0, strides = var_3939_strides_0, weight = blocks_14_attn_value_weight_to_fp16, x = input_143_cast_fp16)[name = tensor("op_3939_cast_fp16")]; tensor tile_42 = const()[name = tensor("tile_42"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3942_axis_0 = const()[name = tensor("op_3942_axis_0"), val = tensor(1)]; tensor var_3942_cast_fp16_0, tensor var_3942_cast_fp16_1, tensor var_3942_cast_fp16_2, tensor var_3942_cast_fp16_3, tensor var_3942_cast_fp16_4, tensor var_3942_cast_fp16_5, tensor var_3942_cast_fp16_6, tensor var_3942_cast_fp16_7, tensor var_3942_cast_fp16_8, tensor var_3942_cast_fp16_9, tensor var_3942_cast_fp16_10, tensor var_3942_cast_fp16_11, tensor var_3942_cast_fp16_12, tensor var_3942_cast_fp16_13, tensor var_3942_cast_fp16_14, tensor var_3942_cast_fp16_15, tensor var_3942_cast_fp16_16, tensor var_3942_cast_fp16_17, tensor var_3942_cast_fp16_18, tensor var_3942_cast_fp16_19 = split(axis = var_3942_axis_0, split_sizes = tile_42, x = var_3941_cast_fp16)[name = tensor("op_3942_cast_fp16")]; tensor var_3963_perm_0 = const()[name = tensor("op_3963_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_43 = const()[name = tensor("tile_43"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3964_axis_0 = const()[name = tensor("op_3964_axis_0"), val = tensor(3)]; tensor var_3963_cast_fp16 = transpose(perm = var_3963_perm_0, x = k_29_cast_fp16)[name = tensor("transpose_18")]; tensor var_3964_cast_fp16_0, tensor var_3964_cast_fp16_1, tensor var_3964_cast_fp16_2, tensor var_3964_cast_fp16_3, tensor var_3964_cast_fp16_4, tensor var_3964_cast_fp16_5, tensor var_3964_cast_fp16_6, tensor var_3964_cast_fp16_7, tensor var_3964_cast_fp16_8, tensor var_3964_cast_fp16_9, tensor var_3964_cast_fp16_10, tensor var_3964_cast_fp16_11, tensor var_3964_cast_fp16_12, tensor var_3964_cast_fp16_13, tensor var_3964_cast_fp16_14, tensor var_3964_cast_fp16_15, tensor var_3964_cast_fp16_16, tensor var_3964_cast_fp16_17, tensor var_3964_cast_fp16_18, tensor var_3964_cast_fp16_19 = split(axis = var_3964_axis_0, split_sizes = tile_43, x = var_3963_cast_fp16)[name = tensor("op_3964_cast_fp16")]; tensor tile_44 = const()[name = tensor("tile_44"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_3985_axis_0 = const()[name = tensor("op_3985_axis_0"), val = tensor(1)]; tensor var_3985_cast_fp16_0, tensor var_3985_cast_fp16_1, tensor var_3985_cast_fp16_2, tensor var_3985_cast_fp16_3, tensor var_3985_cast_fp16_4, tensor var_3985_cast_fp16_5, tensor var_3985_cast_fp16_6, tensor var_3985_cast_fp16_7, tensor var_3985_cast_fp16_8, tensor var_3985_cast_fp16_9, tensor var_3985_cast_fp16_10, tensor var_3985_cast_fp16_11, tensor var_3985_cast_fp16_12, tensor var_3985_cast_fp16_13, tensor var_3985_cast_fp16_14, tensor var_3985_cast_fp16_15, tensor var_3985_cast_fp16_16, tensor var_3985_cast_fp16_17, tensor var_3985_cast_fp16_18, tensor var_3985_cast_fp16_19 = split(axis = var_3985_axis_0, split_sizes = tile_44, x = var_3939_cast_fp16)[name = tensor("op_3985_cast_fp16")]; tensor aw_561_equation_0 = const()[name = tensor("aw_561_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_561_cast_fp16 = einsum(equation = aw_561_equation_0, values = (var_3964_cast_fp16_0, var_3942_cast_fp16_0))[name = tensor("aw_561_cast_fp16")]; tensor aw_563_equation_0 = const()[name = tensor("aw_563_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_563_cast_fp16 = einsum(equation = aw_563_equation_0, values = (var_3964_cast_fp16_1, var_3942_cast_fp16_1))[name = tensor("aw_563_cast_fp16")]; tensor aw_565_equation_0 = const()[name = tensor("aw_565_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_565_cast_fp16 = einsum(equation = aw_565_equation_0, values = (var_3964_cast_fp16_2, var_3942_cast_fp16_2))[name = tensor("aw_565_cast_fp16")]; tensor aw_567_equation_0 = const()[name = tensor("aw_567_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_567_cast_fp16 = einsum(equation = aw_567_equation_0, values = (var_3964_cast_fp16_3, var_3942_cast_fp16_3))[name = tensor("aw_567_cast_fp16")]; tensor aw_569_equation_0 = const()[name = tensor("aw_569_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_569_cast_fp16 = einsum(equation = aw_569_equation_0, values = (var_3964_cast_fp16_4, var_3942_cast_fp16_4))[name = tensor("aw_569_cast_fp16")]; tensor aw_571_equation_0 = const()[name = tensor("aw_571_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_571_cast_fp16 = einsum(equation = aw_571_equation_0, values = (var_3964_cast_fp16_5, var_3942_cast_fp16_5))[name = tensor("aw_571_cast_fp16")]; tensor aw_573_equation_0 = const()[name = tensor("aw_573_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_573_cast_fp16 = einsum(equation = aw_573_equation_0, values = (var_3964_cast_fp16_6, var_3942_cast_fp16_6))[name = tensor("aw_573_cast_fp16")]; tensor aw_575_equation_0 = const()[name = tensor("aw_575_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_575_cast_fp16 = einsum(equation = aw_575_equation_0, values = (var_3964_cast_fp16_7, var_3942_cast_fp16_7))[name = tensor("aw_575_cast_fp16")]; tensor aw_577_equation_0 = const()[name = tensor("aw_577_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_577_cast_fp16 = einsum(equation = aw_577_equation_0, values = (var_3964_cast_fp16_8, var_3942_cast_fp16_8))[name = tensor("aw_577_cast_fp16")]; tensor aw_579_equation_0 = const()[name = tensor("aw_579_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_579_cast_fp16 = einsum(equation = aw_579_equation_0, values = (var_3964_cast_fp16_9, var_3942_cast_fp16_9))[name = tensor("aw_579_cast_fp16")]; tensor aw_581_equation_0 = const()[name = tensor("aw_581_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_581_cast_fp16 = einsum(equation = aw_581_equation_0, values = (var_3964_cast_fp16_10, var_3942_cast_fp16_10))[name = tensor("aw_581_cast_fp16")]; tensor aw_583_equation_0 = const()[name = tensor("aw_583_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_583_cast_fp16 = einsum(equation = aw_583_equation_0, values = (var_3964_cast_fp16_11, var_3942_cast_fp16_11))[name = tensor("aw_583_cast_fp16")]; tensor aw_585_equation_0 = const()[name = tensor("aw_585_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_585_cast_fp16 = einsum(equation = aw_585_equation_0, values = (var_3964_cast_fp16_12, var_3942_cast_fp16_12))[name = tensor("aw_585_cast_fp16")]; tensor aw_587_equation_0 = const()[name = tensor("aw_587_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_587_cast_fp16 = einsum(equation = aw_587_equation_0, values = (var_3964_cast_fp16_13, var_3942_cast_fp16_13))[name = tensor("aw_587_cast_fp16")]; tensor aw_589_equation_0 = const()[name = tensor("aw_589_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_589_cast_fp16 = einsum(equation = aw_589_equation_0, values = (var_3964_cast_fp16_14, var_3942_cast_fp16_14))[name = tensor("aw_589_cast_fp16")]; tensor aw_591_equation_0 = const()[name = tensor("aw_591_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_591_cast_fp16 = einsum(equation = aw_591_equation_0, values = (var_3964_cast_fp16_15, var_3942_cast_fp16_15))[name = tensor("aw_591_cast_fp16")]; tensor aw_593_equation_0 = const()[name = tensor("aw_593_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_593_cast_fp16 = einsum(equation = aw_593_equation_0, values = (var_3964_cast_fp16_16, var_3942_cast_fp16_16))[name = tensor("aw_593_cast_fp16")]; tensor aw_595_equation_0 = const()[name = tensor("aw_595_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_595_cast_fp16 = einsum(equation = aw_595_equation_0, values = (var_3964_cast_fp16_17, var_3942_cast_fp16_17))[name = tensor("aw_595_cast_fp16")]; tensor aw_597_equation_0 = const()[name = tensor("aw_597_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_597_cast_fp16 = einsum(equation = aw_597_equation_0, values = (var_3964_cast_fp16_18, var_3942_cast_fp16_18))[name = tensor("aw_597_cast_fp16")]; tensor aw_599_equation_0 = const()[name = tensor("aw_599_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_599_cast_fp16 = einsum(equation = aw_599_equation_0, values = (var_3964_cast_fp16_19, var_3942_cast_fp16_19))[name = tensor("aw_599_cast_fp16")]; tensor var_4046_cast_fp16 = softmax(axis = var_3890, x = aw_561_cast_fp16)[name = tensor("op_4046_cast_fp16")]; tensor var_4047_cast_fp16 = softmax(axis = var_3890, x = aw_563_cast_fp16)[name = tensor("op_4047_cast_fp16")]; tensor var_4048_cast_fp16 = softmax(axis = var_3890, x = aw_565_cast_fp16)[name = tensor("op_4048_cast_fp16")]; tensor var_4049_cast_fp16 = softmax(axis = var_3890, x = aw_567_cast_fp16)[name = tensor("op_4049_cast_fp16")]; tensor var_4050_cast_fp16 = softmax(axis = var_3890, x = aw_569_cast_fp16)[name = tensor("op_4050_cast_fp16")]; tensor var_4051_cast_fp16 = softmax(axis = var_3890, x = aw_571_cast_fp16)[name = tensor("op_4051_cast_fp16")]; tensor var_4052_cast_fp16 = softmax(axis = var_3890, x = aw_573_cast_fp16)[name = tensor("op_4052_cast_fp16")]; tensor var_4053_cast_fp16 = softmax(axis = var_3890, x = aw_575_cast_fp16)[name = tensor("op_4053_cast_fp16")]; tensor var_4054_cast_fp16 = softmax(axis = var_3890, x = aw_577_cast_fp16)[name = tensor("op_4054_cast_fp16")]; tensor var_4055_cast_fp16 = softmax(axis = var_3890, x = aw_579_cast_fp16)[name = tensor("op_4055_cast_fp16")]; tensor var_4056_cast_fp16 = softmax(axis = var_3890, x = aw_581_cast_fp16)[name = tensor("op_4056_cast_fp16")]; tensor var_4057_cast_fp16 = softmax(axis = var_3890, x = aw_583_cast_fp16)[name = tensor("op_4057_cast_fp16")]; tensor var_4058_cast_fp16 = softmax(axis = var_3890, x = aw_585_cast_fp16)[name = tensor("op_4058_cast_fp16")]; tensor var_4059_cast_fp16 = softmax(axis = var_3890, x = aw_587_cast_fp16)[name = tensor("op_4059_cast_fp16")]; tensor var_4060_cast_fp16 = softmax(axis = var_3890, x = aw_589_cast_fp16)[name = tensor("op_4060_cast_fp16")]; tensor var_4061_cast_fp16 = softmax(axis = var_3890, x = aw_591_cast_fp16)[name = tensor("op_4061_cast_fp16")]; tensor var_4062_cast_fp16 = softmax(axis = var_3890, x = aw_593_cast_fp16)[name = tensor("op_4062_cast_fp16")]; tensor var_4063_cast_fp16 = softmax(axis = var_3890, x = aw_595_cast_fp16)[name = tensor("op_4063_cast_fp16")]; tensor var_4064_cast_fp16 = softmax(axis = var_3890, x = aw_597_cast_fp16)[name = tensor("op_4064_cast_fp16")]; tensor var_4065_cast_fp16 = softmax(axis = var_3890, x = aw_599_cast_fp16)[name = tensor("op_4065_cast_fp16")]; tensor var_4067_equation_0 = const()[name = tensor("op_4067_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4067_cast_fp16 = einsum(equation = var_4067_equation_0, values = (var_3985_cast_fp16_0, var_4046_cast_fp16))[name = tensor("op_4067_cast_fp16")]; tensor var_4069_equation_0 = const()[name = tensor("op_4069_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4069_cast_fp16 = einsum(equation = var_4069_equation_0, values = (var_3985_cast_fp16_1, var_4047_cast_fp16))[name = tensor("op_4069_cast_fp16")]; tensor var_4071_equation_0 = const()[name = tensor("op_4071_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4071_cast_fp16 = einsum(equation = var_4071_equation_0, values = (var_3985_cast_fp16_2, var_4048_cast_fp16))[name = tensor("op_4071_cast_fp16")]; tensor var_4073_equation_0 = const()[name = tensor("op_4073_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4073_cast_fp16 = einsum(equation = var_4073_equation_0, values = (var_3985_cast_fp16_3, var_4049_cast_fp16))[name = tensor("op_4073_cast_fp16")]; tensor var_4075_equation_0 = const()[name = tensor("op_4075_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4075_cast_fp16 = einsum(equation = var_4075_equation_0, values = (var_3985_cast_fp16_4, var_4050_cast_fp16))[name = tensor("op_4075_cast_fp16")]; tensor var_4077_equation_0 = const()[name = tensor("op_4077_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4077_cast_fp16 = einsum(equation = var_4077_equation_0, values = (var_3985_cast_fp16_5, var_4051_cast_fp16))[name = tensor("op_4077_cast_fp16")]; tensor var_4079_equation_0 = const()[name = tensor("op_4079_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4079_cast_fp16 = einsum(equation = var_4079_equation_0, values = (var_3985_cast_fp16_6, var_4052_cast_fp16))[name = tensor("op_4079_cast_fp16")]; tensor var_4081_equation_0 = const()[name = tensor("op_4081_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4081_cast_fp16 = einsum(equation = var_4081_equation_0, values = (var_3985_cast_fp16_7, var_4053_cast_fp16))[name = tensor("op_4081_cast_fp16")]; tensor var_4083_equation_0 = const()[name = tensor("op_4083_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4083_cast_fp16 = einsum(equation = var_4083_equation_0, values = (var_3985_cast_fp16_8, var_4054_cast_fp16))[name = tensor("op_4083_cast_fp16")]; tensor var_4085_equation_0 = const()[name = tensor("op_4085_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4085_cast_fp16 = einsum(equation = var_4085_equation_0, values = (var_3985_cast_fp16_9, var_4055_cast_fp16))[name = tensor("op_4085_cast_fp16")]; tensor var_4087_equation_0 = const()[name = tensor("op_4087_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4087_cast_fp16 = einsum(equation = var_4087_equation_0, values = (var_3985_cast_fp16_10, var_4056_cast_fp16))[name = tensor("op_4087_cast_fp16")]; tensor var_4089_equation_0 = const()[name = tensor("op_4089_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4089_cast_fp16 = einsum(equation = var_4089_equation_0, values = (var_3985_cast_fp16_11, var_4057_cast_fp16))[name = tensor("op_4089_cast_fp16")]; tensor var_4091_equation_0 = const()[name = tensor("op_4091_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4091_cast_fp16 = einsum(equation = var_4091_equation_0, values = (var_3985_cast_fp16_12, var_4058_cast_fp16))[name = tensor("op_4091_cast_fp16")]; tensor var_4093_equation_0 = const()[name = tensor("op_4093_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4093_cast_fp16 = einsum(equation = var_4093_equation_0, values = (var_3985_cast_fp16_13, var_4059_cast_fp16))[name = tensor("op_4093_cast_fp16")]; tensor var_4095_equation_0 = const()[name = tensor("op_4095_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4095_cast_fp16 = einsum(equation = var_4095_equation_0, values = (var_3985_cast_fp16_14, var_4060_cast_fp16))[name = tensor("op_4095_cast_fp16")]; tensor var_4097_equation_0 = const()[name = tensor("op_4097_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4097_cast_fp16 = einsum(equation = var_4097_equation_0, values = (var_3985_cast_fp16_15, var_4061_cast_fp16))[name = tensor("op_4097_cast_fp16")]; tensor var_4099_equation_0 = const()[name = tensor("op_4099_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4099_cast_fp16 = einsum(equation = var_4099_equation_0, values = (var_3985_cast_fp16_16, var_4062_cast_fp16))[name = tensor("op_4099_cast_fp16")]; tensor var_4101_equation_0 = const()[name = tensor("op_4101_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4101_cast_fp16 = einsum(equation = var_4101_equation_0, values = (var_3985_cast_fp16_17, var_4063_cast_fp16))[name = tensor("op_4101_cast_fp16")]; tensor var_4103_equation_0 = const()[name = tensor("op_4103_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4103_cast_fp16 = einsum(equation = var_4103_equation_0, values = (var_3985_cast_fp16_18, var_4064_cast_fp16))[name = tensor("op_4103_cast_fp16")]; tensor var_4105_equation_0 = const()[name = tensor("op_4105_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4105_cast_fp16 = einsum(equation = var_4105_equation_0, values = (var_3985_cast_fp16_19, var_4065_cast_fp16))[name = tensor("op_4105_cast_fp16")]; tensor input_145_interleave_0 = const()[name = tensor("input_145_interleave_0"), val = tensor(false)]; tensor input_145_cast_fp16 = concat(axis = var_3890, interleave = input_145_interleave_0, values = (var_4067_cast_fp16, var_4069_cast_fp16, var_4071_cast_fp16, var_4073_cast_fp16, var_4075_cast_fp16, var_4077_cast_fp16, var_4079_cast_fp16, var_4081_cast_fp16, var_4083_cast_fp16, var_4085_cast_fp16, var_4087_cast_fp16, var_4089_cast_fp16, var_4091_cast_fp16, var_4093_cast_fp16, var_4095_cast_fp16, var_4097_cast_fp16, var_4099_cast_fp16, var_4101_cast_fp16, var_4103_cast_fp16, var_4105_cast_fp16))[name = tensor("input_145_cast_fp16")]; tensor var_4114_pad_type_0 = const()[name = tensor("op_4114_pad_type_0"), val = tensor("valid")]; tensor var_4114_strides_0 = const()[name = tensor("op_4114_strides_0"), val = tensor([1, 1])]; tensor var_4114_pad_0 = const()[name = tensor("op_4114_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4114_dilations_0 = const()[name = tensor("op_4114_dilations_0"), val = tensor([1, 1])]; tensor var_4114_groups_0 = const()[name = tensor("op_4114_groups_0"), val = tensor(1)]; tensor blocks_14_attn_out_weight_to_fp16 = const()[name = tensor("blocks_14_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575445952)))]; tensor blocks_14_attn_out_bias_to_fp16 = const()[name = tensor("blocks_14_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578722816)))]; tensor var_4114_cast_fp16 = conv(bias = blocks_14_attn_out_bias_to_fp16, dilations = var_4114_dilations_0, groups = var_4114_groups_0, pad = var_4114_pad_0, pad_type = var_4114_pad_type_0, strides = var_4114_strides_0, weight = blocks_14_attn_out_weight_to_fp16, x = input_145_cast_fp16)[name = tensor("op_4114_cast_fp16")]; tensor inputs_59_cast_fp16 = add(x = inputs_57_cast_fp16, y = var_4114_cast_fp16)[name = tensor("inputs_59_cast_fp16")]; tensor input_147_axes_0 = const()[name = tensor("input_147_axes_0"), val = tensor([1])]; tensor input_147_gamma_0_to_fp16 = const()[name = tensor("input_147_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578725440)))]; tensor input_147_beta_0_to_fp16 = const()[name = tensor("input_147_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578728064)))]; tensor var_4124_to_fp16 = const()[name = tensor("op_4124_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_147_cast_fp16 = layer_norm(axes = input_147_axes_0, beta = input_147_beta_0_to_fp16, epsilon = var_4124_to_fp16, gamma = input_147_gamma_0_to_fp16, x = inputs_59_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor input_149_pad_type_0 = const()[name = tensor("input_149_pad_type_0"), val = tensor("valid")]; tensor input_149_strides_0 = const()[name = tensor("input_149_strides_0"), val = tensor([1, 1])]; tensor input_149_pad_0 = const()[name = tensor("input_149_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_149_dilations_0 = const()[name = tensor("input_149_dilations_0"), val = tensor([1, 1])]; tensor input_149_groups_0 = const()[name = tensor("input_149_groups_0"), val = tensor(1)]; tensor blocks_14_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_14_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578730688)))]; tensor blocks_14_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_14_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591837952)))]; tensor input_149_cast_fp16 = conv(bias = blocks_14_mlp_0_bias_to_fp16, dilations = input_149_dilations_0, groups = input_149_groups_0, pad = input_149_pad_0, pad_type = input_149_pad_type_0, strides = input_149_strides_0, weight = blocks_14_mlp_0_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("input_149_cast_fp16")]; tensor input_151_mode_0 = const()[name = tensor("input_151_mode_0"), val = tensor("EXACT")]; tensor input_151_cast_fp16 = gelu(mode = input_151_mode_0, x = input_149_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor var_4150_pad_type_0 = const()[name = tensor("op_4150_pad_type_0"), val = tensor("valid")]; tensor var_4150_strides_0 = const()[name = tensor("op_4150_strides_0"), val = tensor([1, 1])]; tensor var_4150_pad_0 = const()[name = tensor("op_4150_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4150_dilations_0 = const()[name = tensor("op_4150_dilations_0"), val = tensor([1, 1])]; tensor var_4150_groups_0 = const()[name = tensor("op_4150_groups_0"), val = tensor(1)]; tensor blocks_14_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_14_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591848256)))]; tensor blocks_14_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_14_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604955520)))]; tensor var_4150_cast_fp16 = conv(bias = blocks_14_mlp_2_bias_to_fp16, dilations = var_4150_dilations_0, groups = var_4150_groups_0, pad = var_4150_pad_0, pad_type = var_4150_pad_type_0, strides = var_4150_strides_0, weight = blocks_14_mlp_2_weight_to_fp16, x = input_151_cast_fp16)[name = tensor("op_4150_cast_fp16")]; tensor inputs_61_cast_fp16 = add(x = inputs_59_cast_fp16, y = var_4150_cast_fp16)[name = tensor("inputs_61_cast_fp16")]; tensor var_4159 = const()[name = tensor("op_4159"), val = tensor(1)]; tensor input_153_axes_0 = const()[name = tensor("input_153_axes_0"), val = tensor([1])]; tensor input_153_gamma_0_to_fp16 = const()[name = tensor("input_153_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604958144)))]; tensor input_153_beta_0_to_fp16 = const()[name = tensor("input_153_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604960768)))]; tensor var_4175_to_fp16 = const()[name = tensor("op_4175_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_153_cast_fp16 = layer_norm(axes = input_153_axes_0, beta = input_153_beta_0_to_fp16, epsilon = var_4175_to_fp16, gamma = input_153_gamma_0_to_fp16, x = inputs_61_cast_fp16)[name = tensor("input_153_cast_fp16")]; tensor q_31_pad_type_0 = const()[name = tensor("q_31_pad_type_0"), val = tensor("valid")]; tensor q_31_strides_0 = const()[name = tensor("q_31_strides_0"), val = tensor([1, 1])]; tensor q_31_pad_0 = const()[name = tensor("q_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_31_dilations_0 = const()[name = tensor("q_31_dilations_0"), val = tensor([1, 1])]; tensor q_31_groups_0 = const()[name = tensor("q_31_groups_0"), val = tensor(1)]; tensor var_4210_weight_0_to_fp16 = const()[name = tensor("op_4210_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604963392)))]; tensor var_4210_bias_0_to_fp16 = const()[name = tensor("op_4210_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(608240256)))]; tensor var_4210_cast_fp16 = conv(bias = var_4210_bias_0_to_fp16, dilations = q_31_dilations_0, groups = q_31_groups_0, pad = q_31_pad_0, pad_type = q_31_pad_type_0, strides = q_31_strides_0, weight = var_4210_weight_0_to_fp16, x = input_153_cast_fp16)[name = tensor("op_4210_cast_fp16")]; tensor k_31_pad_type_0 = const()[name = tensor("k_31_pad_type_0"), val = tensor("valid")]; tensor k_31_strides_0 = const()[name = tensor("k_31_strides_0"), val = tensor([1, 1])]; tensor k_31_pad_0 = const()[name = tensor("k_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_31_dilations_0 = const()[name = tensor("k_31_dilations_0"), val = tensor([1, 1])]; tensor k_31_groups_0 = const()[name = tensor("k_31_groups_0"), val = tensor(1)]; tensor blocks_15_attn_key_weight_to_fp16 = const()[name = tensor("blocks_15_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(608242880)))]; tensor k_31_cast_fp16 = conv(dilations = k_31_dilations_0, groups = k_31_groups_0, pad = k_31_pad_0, pad_type = k_31_pad_type_0, strides = k_31_strides_0, weight = blocks_15_attn_key_weight_to_fp16, x = input_153_cast_fp16)[name = tensor("k_31_cast_fp16")]; tensor var_4208_pad_type_0 = const()[name = tensor("op_4208_pad_type_0"), val = tensor("valid")]; tensor var_4208_strides_0 = const()[name = tensor("op_4208_strides_0"), val = tensor([1, 1])]; tensor var_4208_pad_0 = const()[name = tensor("op_4208_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4208_dilations_0 = const()[name = tensor("op_4208_dilations_0"), val = tensor([1, 1])]; tensor var_4208_groups_0 = const()[name = tensor("op_4208_groups_0"), val = tensor(1)]; tensor blocks_15_attn_value_weight_to_fp16 = const()[name = tensor("blocks_15_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(611519744)))]; tensor blocks_15_attn_value_bias_to_fp16 = const()[name = tensor("blocks_15_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614796608)))]; tensor var_4208_cast_fp16 = conv(bias = blocks_15_attn_value_bias_to_fp16, dilations = var_4208_dilations_0, groups = var_4208_groups_0, pad = var_4208_pad_0, pad_type = var_4208_pad_type_0, strides = var_4208_strides_0, weight = blocks_15_attn_value_weight_to_fp16, x = input_153_cast_fp16)[name = tensor("op_4208_cast_fp16")]; tensor tile_45 = const()[name = tensor("tile_45"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4211_axis_0 = const()[name = tensor("op_4211_axis_0"), val = tensor(1)]; tensor var_4211_cast_fp16_0, tensor var_4211_cast_fp16_1, tensor var_4211_cast_fp16_2, tensor var_4211_cast_fp16_3, tensor var_4211_cast_fp16_4, tensor var_4211_cast_fp16_5, tensor var_4211_cast_fp16_6, tensor var_4211_cast_fp16_7, tensor var_4211_cast_fp16_8, tensor var_4211_cast_fp16_9, tensor var_4211_cast_fp16_10, tensor var_4211_cast_fp16_11, tensor var_4211_cast_fp16_12, tensor var_4211_cast_fp16_13, tensor var_4211_cast_fp16_14, tensor var_4211_cast_fp16_15, tensor var_4211_cast_fp16_16, tensor var_4211_cast_fp16_17, tensor var_4211_cast_fp16_18, tensor var_4211_cast_fp16_19 = split(axis = var_4211_axis_0, split_sizes = tile_45, x = var_4210_cast_fp16)[name = tensor("op_4211_cast_fp16")]; tensor var_4232_perm_0 = const()[name = tensor("op_4232_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_46 = const()[name = tensor("tile_46"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4233_axis_0 = const()[name = tensor("op_4233_axis_0"), val = tensor(3)]; tensor var_4232_cast_fp16 = transpose(perm = var_4232_perm_0, x = k_31_cast_fp16)[name = tensor("transpose_17")]; tensor var_4233_cast_fp16_0, tensor var_4233_cast_fp16_1, tensor var_4233_cast_fp16_2, tensor var_4233_cast_fp16_3, tensor var_4233_cast_fp16_4, tensor var_4233_cast_fp16_5, tensor var_4233_cast_fp16_6, tensor var_4233_cast_fp16_7, tensor var_4233_cast_fp16_8, tensor var_4233_cast_fp16_9, tensor var_4233_cast_fp16_10, tensor var_4233_cast_fp16_11, tensor var_4233_cast_fp16_12, tensor var_4233_cast_fp16_13, tensor var_4233_cast_fp16_14, tensor var_4233_cast_fp16_15, tensor var_4233_cast_fp16_16, tensor var_4233_cast_fp16_17, tensor var_4233_cast_fp16_18, tensor var_4233_cast_fp16_19 = split(axis = var_4233_axis_0, split_sizes = tile_46, x = var_4232_cast_fp16)[name = tensor("op_4233_cast_fp16")]; tensor tile_47 = const()[name = tensor("tile_47"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4254_axis_0 = const()[name = tensor("op_4254_axis_0"), val = tensor(1)]; tensor var_4254_cast_fp16_0, tensor var_4254_cast_fp16_1, tensor var_4254_cast_fp16_2, tensor var_4254_cast_fp16_3, tensor var_4254_cast_fp16_4, tensor var_4254_cast_fp16_5, tensor var_4254_cast_fp16_6, tensor var_4254_cast_fp16_7, tensor var_4254_cast_fp16_8, tensor var_4254_cast_fp16_9, tensor var_4254_cast_fp16_10, tensor var_4254_cast_fp16_11, tensor var_4254_cast_fp16_12, tensor var_4254_cast_fp16_13, tensor var_4254_cast_fp16_14, tensor var_4254_cast_fp16_15, tensor var_4254_cast_fp16_16, tensor var_4254_cast_fp16_17, tensor var_4254_cast_fp16_18, tensor var_4254_cast_fp16_19 = split(axis = var_4254_axis_0, split_sizes = tile_47, x = var_4208_cast_fp16)[name = tensor("op_4254_cast_fp16")]; tensor aw_601_equation_0 = const()[name = tensor("aw_601_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_601_cast_fp16 = einsum(equation = aw_601_equation_0, values = (var_4233_cast_fp16_0, var_4211_cast_fp16_0))[name = tensor("aw_601_cast_fp16")]; tensor aw_603_equation_0 = const()[name = tensor("aw_603_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_603_cast_fp16 = einsum(equation = aw_603_equation_0, values = (var_4233_cast_fp16_1, var_4211_cast_fp16_1))[name = tensor("aw_603_cast_fp16")]; tensor aw_605_equation_0 = const()[name = tensor("aw_605_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_605_cast_fp16 = einsum(equation = aw_605_equation_0, values = (var_4233_cast_fp16_2, var_4211_cast_fp16_2))[name = tensor("aw_605_cast_fp16")]; tensor aw_607_equation_0 = const()[name = tensor("aw_607_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_607_cast_fp16 = einsum(equation = aw_607_equation_0, values = (var_4233_cast_fp16_3, var_4211_cast_fp16_3))[name = tensor("aw_607_cast_fp16")]; tensor aw_609_equation_0 = const()[name = tensor("aw_609_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_609_cast_fp16 = einsum(equation = aw_609_equation_0, values = (var_4233_cast_fp16_4, var_4211_cast_fp16_4))[name = tensor("aw_609_cast_fp16")]; tensor aw_611_equation_0 = const()[name = tensor("aw_611_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_611_cast_fp16 = einsum(equation = aw_611_equation_0, values = (var_4233_cast_fp16_5, var_4211_cast_fp16_5))[name = tensor("aw_611_cast_fp16")]; tensor aw_613_equation_0 = const()[name = tensor("aw_613_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_613_cast_fp16 = einsum(equation = aw_613_equation_0, values = (var_4233_cast_fp16_6, var_4211_cast_fp16_6))[name = tensor("aw_613_cast_fp16")]; tensor aw_615_equation_0 = const()[name = tensor("aw_615_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_615_cast_fp16 = einsum(equation = aw_615_equation_0, values = (var_4233_cast_fp16_7, var_4211_cast_fp16_7))[name = tensor("aw_615_cast_fp16")]; tensor aw_617_equation_0 = const()[name = tensor("aw_617_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_617_cast_fp16 = einsum(equation = aw_617_equation_0, values = (var_4233_cast_fp16_8, var_4211_cast_fp16_8))[name = tensor("aw_617_cast_fp16")]; tensor aw_619_equation_0 = const()[name = tensor("aw_619_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_619_cast_fp16 = einsum(equation = aw_619_equation_0, values = (var_4233_cast_fp16_9, var_4211_cast_fp16_9))[name = tensor("aw_619_cast_fp16")]; tensor aw_621_equation_0 = const()[name = tensor("aw_621_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_621_cast_fp16 = einsum(equation = aw_621_equation_0, values = (var_4233_cast_fp16_10, var_4211_cast_fp16_10))[name = tensor("aw_621_cast_fp16")]; tensor aw_623_equation_0 = const()[name = tensor("aw_623_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_623_cast_fp16 = einsum(equation = aw_623_equation_0, values = (var_4233_cast_fp16_11, var_4211_cast_fp16_11))[name = tensor("aw_623_cast_fp16")]; tensor aw_625_equation_0 = const()[name = tensor("aw_625_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_625_cast_fp16 = einsum(equation = aw_625_equation_0, values = (var_4233_cast_fp16_12, var_4211_cast_fp16_12))[name = tensor("aw_625_cast_fp16")]; tensor aw_627_equation_0 = const()[name = tensor("aw_627_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_627_cast_fp16 = einsum(equation = aw_627_equation_0, values = (var_4233_cast_fp16_13, var_4211_cast_fp16_13))[name = tensor("aw_627_cast_fp16")]; tensor aw_629_equation_0 = const()[name = tensor("aw_629_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_629_cast_fp16 = einsum(equation = aw_629_equation_0, values = (var_4233_cast_fp16_14, var_4211_cast_fp16_14))[name = tensor("aw_629_cast_fp16")]; tensor aw_631_equation_0 = const()[name = tensor("aw_631_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_631_cast_fp16 = einsum(equation = aw_631_equation_0, values = (var_4233_cast_fp16_15, var_4211_cast_fp16_15))[name = tensor("aw_631_cast_fp16")]; tensor aw_633_equation_0 = const()[name = tensor("aw_633_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_633_cast_fp16 = einsum(equation = aw_633_equation_0, values = (var_4233_cast_fp16_16, var_4211_cast_fp16_16))[name = tensor("aw_633_cast_fp16")]; tensor aw_635_equation_0 = const()[name = tensor("aw_635_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_635_cast_fp16 = einsum(equation = aw_635_equation_0, values = (var_4233_cast_fp16_17, var_4211_cast_fp16_17))[name = tensor("aw_635_cast_fp16")]; tensor aw_637_equation_0 = const()[name = tensor("aw_637_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_637_cast_fp16 = einsum(equation = aw_637_equation_0, values = (var_4233_cast_fp16_18, var_4211_cast_fp16_18))[name = tensor("aw_637_cast_fp16")]; tensor aw_639_equation_0 = const()[name = tensor("aw_639_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_639_cast_fp16 = einsum(equation = aw_639_equation_0, values = (var_4233_cast_fp16_19, var_4211_cast_fp16_19))[name = tensor("aw_639_cast_fp16")]; tensor var_4315_cast_fp16 = softmax(axis = var_4159, x = aw_601_cast_fp16)[name = tensor("op_4315_cast_fp16")]; tensor var_4316_cast_fp16 = softmax(axis = var_4159, x = aw_603_cast_fp16)[name = tensor("op_4316_cast_fp16")]; tensor var_4317_cast_fp16 = softmax(axis = var_4159, x = aw_605_cast_fp16)[name = tensor("op_4317_cast_fp16")]; tensor var_4318_cast_fp16 = softmax(axis = var_4159, x = aw_607_cast_fp16)[name = tensor("op_4318_cast_fp16")]; tensor var_4319_cast_fp16 = softmax(axis = var_4159, x = aw_609_cast_fp16)[name = tensor("op_4319_cast_fp16")]; tensor var_4320_cast_fp16 = softmax(axis = var_4159, x = aw_611_cast_fp16)[name = tensor("op_4320_cast_fp16")]; tensor var_4321_cast_fp16 = softmax(axis = var_4159, x = aw_613_cast_fp16)[name = tensor("op_4321_cast_fp16")]; tensor var_4322_cast_fp16 = softmax(axis = var_4159, x = aw_615_cast_fp16)[name = tensor("op_4322_cast_fp16")]; tensor var_4323_cast_fp16 = softmax(axis = var_4159, x = aw_617_cast_fp16)[name = tensor("op_4323_cast_fp16")]; tensor var_4324_cast_fp16 = softmax(axis = var_4159, x = aw_619_cast_fp16)[name = tensor("op_4324_cast_fp16")]; tensor var_4325_cast_fp16 = softmax(axis = var_4159, x = aw_621_cast_fp16)[name = tensor("op_4325_cast_fp16")]; tensor var_4326_cast_fp16 = softmax(axis = var_4159, x = aw_623_cast_fp16)[name = tensor("op_4326_cast_fp16")]; tensor var_4327_cast_fp16 = softmax(axis = var_4159, x = aw_625_cast_fp16)[name = tensor("op_4327_cast_fp16")]; tensor var_4328_cast_fp16 = softmax(axis = var_4159, x = aw_627_cast_fp16)[name = tensor("op_4328_cast_fp16")]; tensor var_4329_cast_fp16 = softmax(axis = var_4159, x = aw_629_cast_fp16)[name = tensor("op_4329_cast_fp16")]; tensor var_4330_cast_fp16 = softmax(axis = var_4159, x = aw_631_cast_fp16)[name = tensor("op_4330_cast_fp16")]; tensor var_4331_cast_fp16 = softmax(axis = var_4159, x = aw_633_cast_fp16)[name = tensor("op_4331_cast_fp16")]; tensor var_4332_cast_fp16 = softmax(axis = var_4159, x = aw_635_cast_fp16)[name = tensor("op_4332_cast_fp16")]; tensor var_4333_cast_fp16 = softmax(axis = var_4159, x = aw_637_cast_fp16)[name = tensor("op_4333_cast_fp16")]; tensor var_4334_cast_fp16 = softmax(axis = var_4159, x = aw_639_cast_fp16)[name = tensor("op_4334_cast_fp16")]; tensor var_4336_equation_0 = const()[name = tensor("op_4336_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4336_cast_fp16 = einsum(equation = var_4336_equation_0, values = (var_4254_cast_fp16_0, var_4315_cast_fp16))[name = tensor("op_4336_cast_fp16")]; tensor var_4338_equation_0 = const()[name = tensor("op_4338_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4338_cast_fp16 = einsum(equation = var_4338_equation_0, values = (var_4254_cast_fp16_1, var_4316_cast_fp16))[name = tensor("op_4338_cast_fp16")]; tensor var_4340_equation_0 = const()[name = tensor("op_4340_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4340_cast_fp16 = einsum(equation = var_4340_equation_0, values = (var_4254_cast_fp16_2, var_4317_cast_fp16))[name = tensor("op_4340_cast_fp16")]; tensor var_4342_equation_0 = const()[name = tensor("op_4342_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4342_cast_fp16 = einsum(equation = var_4342_equation_0, values = (var_4254_cast_fp16_3, var_4318_cast_fp16))[name = tensor("op_4342_cast_fp16")]; tensor var_4344_equation_0 = const()[name = tensor("op_4344_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4344_cast_fp16 = einsum(equation = var_4344_equation_0, values = (var_4254_cast_fp16_4, var_4319_cast_fp16))[name = tensor("op_4344_cast_fp16")]; tensor var_4346_equation_0 = const()[name = tensor("op_4346_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4346_cast_fp16 = einsum(equation = var_4346_equation_0, values = (var_4254_cast_fp16_5, var_4320_cast_fp16))[name = tensor("op_4346_cast_fp16")]; tensor var_4348_equation_0 = const()[name = tensor("op_4348_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4348_cast_fp16 = einsum(equation = var_4348_equation_0, values = (var_4254_cast_fp16_6, var_4321_cast_fp16))[name = tensor("op_4348_cast_fp16")]; tensor var_4350_equation_0 = const()[name = tensor("op_4350_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4350_cast_fp16 = einsum(equation = var_4350_equation_0, values = (var_4254_cast_fp16_7, var_4322_cast_fp16))[name = tensor("op_4350_cast_fp16")]; tensor var_4352_equation_0 = const()[name = tensor("op_4352_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4352_cast_fp16 = einsum(equation = var_4352_equation_0, values = (var_4254_cast_fp16_8, var_4323_cast_fp16))[name = tensor("op_4352_cast_fp16")]; tensor var_4354_equation_0 = const()[name = tensor("op_4354_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4354_cast_fp16 = einsum(equation = var_4354_equation_0, values = (var_4254_cast_fp16_9, var_4324_cast_fp16))[name = tensor("op_4354_cast_fp16")]; tensor var_4356_equation_0 = const()[name = tensor("op_4356_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4356_cast_fp16 = einsum(equation = var_4356_equation_0, values = (var_4254_cast_fp16_10, var_4325_cast_fp16))[name = tensor("op_4356_cast_fp16")]; tensor var_4358_equation_0 = const()[name = tensor("op_4358_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4358_cast_fp16 = einsum(equation = var_4358_equation_0, values = (var_4254_cast_fp16_11, var_4326_cast_fp16))[name = tensor("op_4358_cast_fp16")]; tensor var_4360_equation_0 = const()[name = tensor("op_4360_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4360_cast_fp16 = einsum(equation = var_4360_equation_0, values = (var_4254_cast_fp16_12, var_4327_cast_fp16))[name = tensor("op_4360_cast_fp16")]; tensor var_4362_equation_0 = const()[name = tensor("op_4362_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4362_cast_fp16 = einsum(equation = var_4362_equation_0, values = (var_4254_cast_fp16_13, var_4328_cast_fp16))[name = tensor("op_4362_cast_fp16")]; tensor var_4364_equation_0 = const()[name = tensor("op_4364_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4364_cast_fp16 = einsum(equation = var_4364_equation_0, values = (var_4254_cast_fp16_14, var_4329_cast_fp16))[name = tensor("op_4364_cast_fp16")]; tensor var_4366_equation_0 = const()[name = tensor("op_4366_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4366_cast_fp16 = einsum(equation = var_4366_equation_0, values = (var_4254_cast_fp16_15, var_4330_cast_fp16))[name = tensor("op_4366_cast_fp16")]; tensor var_4368_equation_0 = const()[name = tensor("op_4368_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4368_cast_fp16 = einsum(equation = var_4368_equation_0, values = (var_4254_cast_fp16_16, var_4331_cast_fp16))[name = tensor("op_4368_cast_fp16")]; tensor var_4370_equation_0 = const()[name = tensor("op_4370_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4370_cast_fp16 = einsum(equation = var_4370_equation_0, values = (var_4254_cast_fp16_17, var_4332_cast_fp16))[name = tensor("op_4370_cast_fp16")]; tensor var_4372_equation_0 = const()[name = tensor("op_4372_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4372_cast_fp16 = einsum(equation = var_4372_equation_0, values = (var_4254_cast_fp16_18, var_4333_cast_fp16))[name = tensor("op_4372_cast_fp16")]; tensor var_4374_equation_0 = const()[name = tensor("op_4374_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4374_cast_fp16 = einsum(equation = var_4374_equation_0, values = (var_4254_cast_fp16_19, var_4334_cast_fp16))[name = tensor("op_4374_cast_fp16")]; tensor input_155_interleave_0 = const()[name = tensor("input_155_interleave_0"), val = tensor(false)]; tensor input_155_cast_fp16 = concat(axis = var_4159, interleave = input_155_interleave_0, values = (var_4336_cast_fp16, var_4338_cast_fp16, var_4340_cast_fp16, var_4342_cast_fp16, var_4344_cast_fp16, var_4346_cast_fp16, var_4348_cast_fp16, var_4350_cast_fp16, var_4352_cast_fp16, var_4354_cast_fp16, var_4356_cast_fp16, var_4358_cast_fp16, var_4360_cast_fp16, var_4362_cast_fp16, var_4364_cast_fp16, var_4366_cast_fp16, var_4368_cast_fp16, var_4370_cast_fp16, var_4372_cast_fp16, var_4374_cast_fp16))[name = tensor("input_155_cast_fp16")]; tensor var_4383_pad_type_0 = const()[name = tensor("op_4383_pad_type_0"), val = tensor("valid")]; tensor var_4383_strides_0 = const()[name = tensor("op_4383_strides_0"), val = tensor([1, 1])]; tensor var_4383_pad_0 = const()[name = tensor("op_4383_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4383_dilations_0 = const()[name = tensor("op_4383_dilations_0"), val = tensor([1, 1])]; tensor var_4383_groups_0 = const()[name = tensor("op_4383_groups_0"), val = tensor(1)]; tensor blocks_15_attn_out_weight_to_fp16 = const()[name = tensor("blocks_15_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614799232)))]; tensor blocks_15_attn_out_bias_to_fp16 = const()[name = tensor("blocks_15_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618076096)))]; tensor var_4383_cast_fp16 = conv(bias = blocks_15_attn_out_bias_to_fp16, dilations = var_4383_dilations_0, groups = var_4383_groups_0, pad = var_4383_pad_0, pad_type = var_4383_pad_type_0, strides = var_4383_strides_0, weight = blocks_15_attn_out_weight_to_fp16, x = input_155_cast_fp16)[name = tensor("op_4383_cast_fp16")]; tensor inputs_63_cast_fp16 = add(x = inputs_61_cast_fp16, y = var_4383_cast_fp16)[name = tensor("inputs_63_cast_fp16")]; tensor input_157_axes_0 = const()[name = tensor("input_157_axes_0"), val = tensor([1])]; tensor input_157_gamma_0_to_fp16 = const()[name = tensor("input_157_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618078720)))]; tensor input_157_beta_0_to_fp16 = const()[name = tensor("input_157_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618081344)))]; tensor var_4393_to_fp16 = const()[name = tensor("op_4393_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_157_cast_fp16 = layer_norm(axes = input_157_axes_0, beta = input_157_beta_0_to_fp16, epsilon = var_4393_to_fp16, gamma = input_157_gamma_0_to_fp16, x = inputs_63_cast_fp16)[name = tensor("input_157_cast_fp16")]; tensor input_159_pad_type_0 = const()[name = tensor("input_159_pad_type_0"), val = tensor("valid")]; tensor input_159_strides_0 = const()[name = tensor("input_159_strides_0"), val = tensor([1, 1])]; tensor input_159_pad_0 = const()[name = tensor("input_159_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_159_dilations_0 = const()[name = tensor("input_159_dilations_0"), val = tensor([1, 1])]; tensor input_159_groups_0 = const()[name = tensor("input_159_groups_0"), val = tensor(1)]; tensor blocks_15_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_15_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(618083968)))]; tensor blocks_15_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_15_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(631191232)))]; tensor input_159_cast_fp16 = conv(bias = blocks_15_mlp_0_bias_to_fp16, dilations = input_159_dilations_0, groups = input_159_groups_0, pad = input_159_pad_0, pad_type = input_159_pad_type_0, strides = input_159_strides_0, weight = blocks_15_mlp_0_weight_to_fp16, x = input_157_cast_fp16)[name = tensor("input_159_cast_fp16")]; tensor input_161_mode_0 = const()[name = tensor("input_161_mode_0"), val = tensor("EXACT")]; tensor input_161_cast_fp16 = gelu(mode = input_161_mode_0, x = input_159_cast_fp16)[name = tensor("input_161_cast_fp16")]; tensor var_4419_pad_type_0 = const()[name = tensor("op_4419_pad_type_0"), val = tensor("valid")]; tensor var_4419_strides_0 = const()[name = tensor("op_4419_strides_0"), val = tensor([1, 1])]; tensor var_4419_pad_0 = const()[name = tensor("op_4419_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4419_dilations_0 = const()[name = tensor("op_4419_dilations_0"), val = tensor([1, 1])]; tensor var_4419_groups_0 = const()[name = tensor("op_4419_groups_0"), val = tensor(1)]; tensor blocks_15_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_15_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(631201536)))]; tensor blocks_15_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_15_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644308800)))]; tensor var_4419_cast_fp16 = conv(bias = blocks_15_mlp_2_bias_to_fp16, dilations = var_4419_dilations_0, groups = var_4419_groups_0, pad = var_4419_pad_0, pad_type = var_4419_pad_type_0, strides = var_4419_strides_0, weight = blocks_15_mlp_2_weight_to_fp16, x = input_161_cast_fp16)[name = tensor("op_4419_cast_fp16")]; tensor inputs_65_cast_fp16 = add(x = inputs_63_cast_fp16, y = var_4419_cast_fp16)[name = tensor("inputs_65_cast_fp16")]; tensor var_4428 = const()[name = tensor("op_4428"), val = tensor(1)]; tensor input_163_axes_0 = const()[name = tensor("input_163_axes_0"), val = tensor([1])]; tensor input_163_gamma_0_to_fp16 = const()[name = tensor("input_163_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644311424)))]; tensor input_163_beta_0_to_fp16 = const()[name = tensor("input_163_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644314048)))]; tensor var_4444_to_fp16 = const()[name = tensor("op_4444_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_163_cast_fp16 = layer_norm(axes = input_163_axes_0, beta = input_163_beta_0_to_fp16, epsilon = var_4444_to_fp16, gamma = input_163_gamma_0_to_fp16, x = inputs_65_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor q_33_pad_type_0 = const()[name = tensor("q_33_pad_type_0"), val = tensor("valid")]; tensor q_33_strides_0 = const()[name = tensor("q_33_strides_0"), val = tensor([1, 1])]; tensor q_33_pad_0 = const()[name = tensor("q_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_33_dilations_0 = const()[name = tensor("q_33_dilations_0"), val = tensor([1, 1])]; tensor q_33_groups_0 = const()[name = tensor("q_33_groups_0"), val = tensor(1)]; tensor var_4479_weight_0_to_fp16 = const()[name = tensor("op_4479_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644316672)))]; tensor var_4479_bias_0_to_fp16 = const()[name = tensor("op_4479_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647593536)))]; tensor var_4479_cast_fp16 = conv(bias = var_4479_bias_0_to_fp16, dilations = q_33_dilations_0, groups = q_33_groups_0, pad = q_33_pad_0, pad_type = q_33_pad_type_0, strides = q_33_strides_0, weight = var_4479_weight_0_to_fp16, x = input_163_cast_fp16)[name = tensor("op_4479_cast_fp16")]; tensor k_33_pad_type_0 = const()[name = tensor("k_33_pad_type_0"), val = tensor("valid")]; tensor k_33_strides_0 = const()[name = tensor("k_33_strides_0"), val = tensor([1, 1])]; tensor k_33_pad_0 = const()[name = tensor("k_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_33_dilations_0 = const()[name = tensor("k_33_dilations_0"), val = tensor([1, 1])]; tensor k_33_groups_0 = const()[name = tensor("k_33_groups_0"), val = tensor(1)]; tensor blocks_16_attn_key_weight_to_fp16 = const()[name = tensor("blocks_16_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647596160)))]; tensor k_33_cast_fp16 = conv(dilations = k_33_dilations_0, groups = k_33_groups_0, pad = k_33_pad_0, pad_type = k_33_pad_type_0, strides = k_33_strides_0, weight = blocks_16_attn_key_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("k_33_cast_fp16")]; tensor var_4477_pad_type_0 = const()[name = tensor("op_4477_pad_type_0"), val = tensor("valid")]; tensor var_4477_strides_0 = const()[name = tensor("op_4477_strides_0"), val = tensor([1, 1])]; tensor var_4477_pad_0 = const()[name = tensor("op_4477_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4477_dilations_0 = const()[name = tensor("op_4477_dilations_0"), val = tensor([1, 1])]; tensor var_4477_groups_0 = const()[name = tensor("op_4477_groups_0"), val = tensor(1)]; tensor blocks_16_attn_value_weight_to_fp16 = const()[name = tensor("blocks_16_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(650873024)))]; tensor blocks_16_attn_value_bias_to_fp16 = const()[name = tensor("blocks_16_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(654149888)))]; tensor var_4477_cast_fp16 = conv(bias = blocks_16_attn_value_bias_to_fp16, dilations = var_4477_dilations_0, groups = var_4477_groups_0, pad = var_4477_pad_0, pad_type = var_4477_pad_type_0, strides = var_4477_strides_0, weight = blocks_16_attn_value_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("op_4477_cast_fp16")]; tensor tile_48 = const()[name = tensor("tile_48"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4480_axis_0 = const()[name = tensor("op_4480_axis_0"), val = tensor(1)]; tensor var_4480_cast_fp16_0, tensor var_4480_cast_fp16_1, tensor var_4480_cast_fp16_2, tensor var_4480_cast_fp16_3, tensor var_4480_cast_fp16_4, tensor var_4480_cast_fp16_5, tensor var_4480_cast_fp16_6, tensor var_4480_cast_fp16_7, tensor var_4480_cast_fp16_8, tensor var_4480_cast_fp16_9, tensor var_4480_cast_fp16_10, tensor var_4480_cast_fp16_11, tensor var_4480_cast_fp16_12, tensor var_4480_cast_fp16_13, tensor var_4480_cast_fp16_14, tensor var_4480_cast_fp16_15, tensor var_4480_cast_fp16_16, tensor var_4480_cast_fp16_17, tensor var_4480_cast_fp16_18, tensor var_4480_cast_fp16_19 = split(axis = var_4480_axis_0, split_sizes = tile_48, x = var_4479_cast_fp16)[name = tensor("op_4480_cast_fp16")]; tensor var_4501_perm_0 = const()[name = tensor("op_4501_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_49 = const()[name = tensor("tile_49"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4502_axis_0 = const()[name = tensor("op_4502_axis_0"), val = tensor(3)]; tensor var_4501_cast_fp16 = transpose(perm = var_4501_perm_0, x = k_33_cast_fp16)[name = tensor("transpose_16")]; tensor var_4502_cast_fp16_0, tensor var_4502_cast_fp16_1, tensor var_4502_cast_fp16_2, tensor var_4502_cast_fp16_3, tensor var_4502_cast_fp16_4, tensor var_4502_cast_fp16_5, tensor var_4502_cast_fp16_6, tensor var_4502_cast_fp16_7, tensor var_4502_cast_fp16_8, tensor var_4502_cast_fp16_9, tensor var_4502_cast_fp16_10, tensor var_4502_cast_fp16_11, tensor var_4502_cast_fp16_12, tensor var_4502_cast_fp16_13, tensor var_4502_cast_fp16_14, tensor var_4502_cast_fp16_15, tensor var_4502_cast_fp16_16, tensor var_4502_cast_fp16_17, tensor var_4502_cast_fp16_18, tensor var_4502_cast_fp16_19 = split(axis = var_4502_axis_0, split_sizes = tile_49, x = var_4501_cast_fp16)[name = tensor("op_4502_cast_fp16")]; tensor tile_50 = const()[name = tensor("tile_50"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4523_axis_0 = const()[name = tensor("op_4523_axis_0"), val = tensor(1)]; tensor var_4523_cast_fp16_0, tensor var_4523_cast_fp16_1, tensor var_4523_cast_fp16_2, tensor var_4523_cast_fp16_3, tensor var_4523_cast_fp16_4, tensor var_4523_cast_fp16_5, tensor var_4523_cast_fp16_6, tensor var_4523_cast_fp16_7, tensor var_4523_cast_fp16_8, tensor var_4523_cast_fp16_9, tensor var_4523_cast_fp16_10, tensor var_4523_cast_fp16_11, tensor var_4523_cast_fp16_12, tensor var_4523_cast_fp16_13, tensor var_4523_cast_fp16_14, tensor var_4523_cast_fp16_15, tensor var_4523_cast_fp16_16, tensor var_4523_cast_fp16_17, tensor var_4523_cast_fp16_18, tensor var_4523_cast_fp16_19 = split(axis = var_4523_axis_0, split_sizes = tile_50, x = var_4477_cast_fp16)[name = tensor("op_4523_cast_fp16")]; tensor aw_641_equation_0 = const()[name = tensor("aw_641_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_641_cast_fp16 = einsum(equation = aw_641_equation_0, values = (var_4502_cast_fp16_0, var_4480_cast_fp16_0))[name = tensor("aw_641_cast_fp16")]; tensor aw_643_equation_0 = const()[name = tensor("aw_643_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_643_cast_fp16 = einsum(equation = aw_643_equation_0, values = (var_4502_cast_fp16_1, var_4480_cast_fp16_1))[name = tensor("aw_643_cast_fp16")]; tensor aw_645_equation_0 = const()[name = tensor("aw_645_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_645_cast_fp16 = einsum(equation = aw_645_equation_0, values = (var_4502_cast_fp16_2, var_4480_cast_fp16_2))[name = tensor("aw_645_cast_fp16")]; tensor aw_647_equation_0 = const()[name = tensor("aw_647_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_647_cast_fp16 = einsum(equation = aw_647_equation_0, values = (var_4502_cast_fp16_3, var_4480_cast_fp16_3))[name = tensor("aw_647_cast_fp16")]; tensor aw_649_equation_0 = const()[name = tensor("aw_649_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_649_cast_fp16 = einsum(equation = aw_649_equation_0, values = (var_4502_cast_fp16_4, var_4480_cast_fp16_4))[name = tensor("aw_649_cast_fp16")]; tensor aw_651_equation_0 = const()[name = tensor("aw_651_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_651_cast_fp16 = einsum(equation = aw_651_equation_0, values = (var_4502_cast_fp16_5, var_4480_cast_fp16_5))[name = tensor("aw_651_cast_fp16")]; tensor aw_653_equation_0 = const()[name = tensor("aw_653_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_653_cast_fp16 = einsum(equation = aw_653_equation_0, values = (var_4502_cast_fp16_6, var_4480_cast_fp16_6))[name = tensor("aw_653_cast_fp16")]; tensor aw_655_equation_0 = const()[name = tensor("aw_655_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_655_cast_fp16 = einsum(equation = aw_655_equation_0, values = (var_4502_cast_fp16_7, var_4480_cast_fp16_7))[name = tensor("aw_655_cast_fp16")]; tensor aw_657_equation_0 = const()[name = tensor("aw_657_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_657_cast_fp16 = einsum(equation = aw_657_equation_0, values = (var_4502_cast_fp16_8, var_4480_cast_fp16_8))[name = tensor("aw_657_cast_fp16")]; tensor aw_659_equation_0 = const()[name = tensor("aw_659_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_659_cast_fp16 = einsum(equation = aw_659_equation_0, values = (var_4502_cast_fp16_9, var_4480_cast_fp16_9))[name = tensor("aw_659_cast_fp16")]; tensor aw_661_equation_0 = const()[name = tensor("aw_661_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_661_cast_fp16 = einsum(equation = aw_661_equation_0, values = (var_4502_cast_fp16_10, var_4480_cast_fp16_10))[name = tensor("aw_661_cast_fp16")]; tensor aw_663_equation_0 = const()[name = tensor("aw_663_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_663_cast_fp16 = einsum(equation = aw_663_equation_0, values = (var_4502_cast_fp16_11, var_4480_cast_fp16_11))[name = tensor("aw_663_cast_fp16")]; tensor aw_665_equation_0 = const()[name = tensor("aw_665_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_665_cast_fp16 = einsum(equation = aw_665_equation_0, values = (var_4502_cast_fp16_12, var_4480_cast_fp16_12))[name = tensor("aw_665_cast_fp16")]; tensor aw_667_equation_0 = const()[name = tensor("aw_667_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_667_cast_fp16 = einsum(equation = aw_667_equation_0, values = (var_4502_cast_fp16_13, var_4480_cast_fp16_13))[name = tensor("aw_667_cast_fp16")]; tensor aw_669_equation_0 = const()[name = tensor("aw_669_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_669_cast_fp16 = einsum(equation = aw_669_equation_0, values = (var_4502_cast_fp16_14, var_4480_cast_fp16_14))[name = tensor("aw_669_cast_fp16")]; tensor aw_671_equation_0 = const()[name = tensor("aw_671_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_671_cast_fp16 = einsum(equation = aw_671_equation_0, values = (var_4502_cast_fp16_15, var_4480_cast_fp16_15))[name = tensor("aw_671_cast_fp16")]; tensor aw_673_equation_0 = const()[name = tensor("aw_673_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_673_cast_fp16 = einsum(equation = aw_673_equation_0, values = (var_4502_cast_fp16_16, var_4480_cast_fp16_16))[name = tensor("aw_673_cast_fp16")]; tensor aw_675_equation_0 = const()[name = tensor("aw_675_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_675_cast_fp16 = einsum(equation = aw_675_equation_0, values = (var_4502_cast_fp16_17, var_4480_cast_fp16_17))[name = tensor("aw_675_cast_fp16")]; tensor aw_677_equation_0 = const()[name = tensor("aw_677_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_677_cast_fp16 = einsum(equation = aw_677_equation_0, values = (var_4502_cast_fp16_18, var_4480_cast_fp16_18))[name = tensor("aw_677_cast_fp16")]; tensor aw_679_equation_0 = const()[name = tensor("aw_679_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_679_cast_fp16 = einsum(equation = aw_679_equation_0, values = (var_4502_cast_fp16_19, var_4480_cast_fp16_19))[name = tensor("aw_679_cast_fp16")]; tensor var_4584_cast_fp16 = softmax(axis = var_4428, x = aw_641_cast_fp16)[name = tensor("op_4584_cast_fp16")]; tensor var_4585_cast_fp16 = softmax(axis = var_4428, x = aw_643_cast_fp16)[name = tensor("op_4585_cast_fp16")]; tensor var_4586_cast_fp16 = softmax(axis = var_4428, x = aw_645_cast_fp16)[name = tensor("op_4586_cast_fp16")]; tensor var_4587_cast_fp16 = softmax(axis = var_4428, x = aw_647_cast_fp16)[name = tensor("op_4587_cast_fp16")]; tensor var_4588_cast_fp16 = softmax(axis = var_4428, x = aw_649_cast_fp16)[name = tensor("op_4588_cast_fp16")]; tensor var_4589_cast_fp16 = softmax(axis = var_4428, x = aw_651_cast_fp16)[name = tensor("op_4589_cast_fp16")]; tensor var_4590_cast_fp16 = softmax(axis = var_4428, x = aw_653_cast_fp16)[name = tensor("op_4590_cast_fp16")]; tensor var_4591_cast_fp16 = softmax(axis = var_4428, x = aw_655_cast_fp16)[name = tensor("op_4591_cast_fp16")]; tensor var_4592_cast_fp16 = softmax(axis = var_4428, x = aw_657_cast_fp16)[name = tensor("op_4592_cast_fp16")]; tensor var_4593_cast_fp16 = softmax(axis = var_4428, x = aw_659_cast_fp16)[name = tensor("op_4593_cast_fp16")]; tensor var_4594_cast_fp16 = softmax(axis = var_4428, x = aw_661_cast_fp16)[name = tensor("op_4594_cast_fp16")]; tensor var_4595_cast_fp16 = softmax(axis = var_4428, x = aw_663_cast_fp16)[name = tensor("op_4595_cast_fp16")]; tensor var_4596_cast_fp16 = softmax(axis = var_4428, x = aw_665_cast_fp16)[name = tensor("op_4596_cast_fp16")]; tensor var_4597_cast_fp16 = softmax(axis = var_4428, x = aw_667_cast_fp16)[name = tensor("op_4597_cast_fp16")]; tensor var_4598_cast_fp16 = softmax(axis = var_4428, x = aw_669_cast_fp16)[name = tensor("op_4598_cast_fp16")]; tensor var_4599_cast_fp16 = softmax(axis = var_4428, x = aw_671_cast_fp16)[name = tensor("op_4599_cast_fp16")]; tensor var_4600_cast_fp16 = softmax(axis = var_4428, x = aw_673_cast_fp16)[name = tensor("op_4600_cast_fp16")]; tensor var_4601_cast_fp16 = softmax(axis = var_4428, x = aw_675_cast_fp16)[name = tensor("op_4601_cast_fp16")]; tensor var_4602_cast_fp16 = softmax(axis = var_4428, x = aw_677_cast_fp16)[name = tensor("op_4602_cast_fp16")]; tensor var_4603_cast_fp16 = softmax(axis = var_4428, x = aw_679_cast_fp16)[name = tensor("op_4603_cast_fp16")]; tensor var_4605_equation_0 = const()[name = tensor("op_4605_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4605_cast_fp16 = einsum(equation = var_4605_equation_0, values = (var_4523_cast_fp16_0, var_4584_cast_fp16))[name = tensor("op_4605_cast_fp16")]; tensor var_4607_equation_0 = const()[name = tensor("op_4607_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4607_cast_fp16 = einsum(equation = var_4607_equation_0, values = (var_4523_cast_fp16_1, var_4585_cast_fp16))[name = tensor("op_4607_cast_fp16")]; tensor var_4609_equation_0 = const()[name = tensor("op_4609_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4609_cast_fp16 = einsum(equation = var_4609_equation_0, values = (var_4523_cast_fp16_2, var_4586_cast_fp16))[name = tensor("op_4609_cast_fp16")]; tensor var_4611_equation_0 = const()[name = tensor("op_4611_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4611_cast_fp16 = einsum(equation = var_4611_equation_0, values = (var_4523_cast_fp16_3, var_4587_cast_fp16))[name = tensor("op_4611_cast_fp16")]; tensor var_4613_equation_0 = const()[name = tensor("op_4613_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4613_cast_fp16 = einsum(equation = var_4613_equation_0, values = (var_4523_cast_fp16_4, var_4588_cast_fp16))[name = tensor("op_4613_cast_fp16")]; tensor var_4615_equation_0 = const()[name = tensor("op_4615_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4615_cast_fp16 = einsum(equation = var_4615_equation_0, values = (var_4523_cast_fp16_5, var_4589_cast_fp16))[name = tensor("op_4615_cast_fp16")]; tensor var_4617_equation_0 = const()[name = tensor("op_4617_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4617_cast_fp16 = einsum(equation = var_4617_equation_0, values = (var_4523_cast_fp16_6, var_4590_cast_fp16))[name = tensor("op_4617_cast_fp16")]; tensor var_4619_equation_0 = const()[name = tensor("op_4619_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4619_cast_fp16 = einsum(equation = var_4619_equation_0, values = (var_4523_cast_fp16_7, var_4591_cast_fp16))[name = tensor("op_4619_cast_fp16")]; tensor var_4621_equation_0 = const()[name = tensor("op_4621_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4621_cast_fp16 = einsum(equation = var_4621_equation_0, values = (var_4523_cast_fp16_8, var_4592_cast_fp16))[name = tensor("op_4621_cast_fp16")]; tensor var_4623_equation_0 = const()[name = tensor("op_4623_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4623_cast_fp16 = einsum(equation = var_4623_equation_0, values = (var_4523_cast_fp16_9, var_4593_cast_fp16))[name = tensor("op_4623_cast_fp16")]; tensor var_4625_equation_0 = const()[name = tensor("op_4625_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4625_cast_fp16 = einsum(equation = var_4625_equation_0, values = (var_4523_cast_fp16_10, var_4594_cast_fp16))[name = tensor("op_4625_cast_fp16")]; tensor var_4627_equation_0 = const()[name = tensor("op_4627_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4627_cast_fp16 = einsum(equation = var_4627_equation_0, values = (var_4523_cast_fp16_11, var_4595_cast_fp16))[name = tensor("op_4627_cast_fp16")]; tensor var_4629_equation_0 = const()[name = tensor("op_4629_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4629_cast_fp16 = einsum(equation = var_4629_equation_0, values = (var_4523_cast_fp16_12, var_4596_cast_fp16))[name = tensor("op_4629_cast_fp16")]; tensor var_4631_equation_0 = const()[name = tensor("op_4631_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4631_cast_fp16 = einsum(equation = var_4631_equation_0, values = (var_4523_cast_fp16_13, var_4597_cast_fp16))[name = tensor("op_4631_cast_fp16")]; tensor var_4633_equation_0 = const()[name = tensor("op_4633_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4633_cast_fp16 = einsum(equation = var_4633_equation_0, values = (var_4523_cast_fp16_14, var_4598_cast_fp16))[name = tensor("op_4633_cast_fp16")]; tensor var_4635_equation_0 = const()[name = tensor("op_4635_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4635_cast_fp16 = einsum(equation = var_4635_equation_0, values = (var_4523_cast_fp16_15, var_4599_cast_fp16))[name = tensor("op_4635_cast_fp16")]; tensor var_4637_equation_0 = const()[name = tensor("op_4637_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4637_cast_fp16 = einsum(equation = var_4637_equation_0, values = (var_4523_cast_fp16_16, var_4600_cast_fp16))[name = tensor("op_4637_cast_fp16")]; tensor var_4639_equation_0 = const()[name = tensor("op_4639_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4639_cast_fp16 = einsum(equation = var_4639_equation_0, values = (var_4523_cast_fp16_17, var_4601_cast_fp16))[name = tensor("op_4639_cast_fp16")]; tensor var_4641_equation_0 = const()[name = tensor("op_4641_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4641_cast_fp16 = einsum(equation = var_4641_equation_0, values = (var_4523_cast_fp16_18, var_4602_cast_fp16))[name = tensor("op_4641_cast_fp16")]; tensor var_4643_equation_0 = const()[name = tensor("op_4643_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4643_cast_fp16 = einsum(equation = var_4643_equation_0, values = (var_4523_cast_fp16_19, var_4603_cast_fp16))[name = tensor("op_4643_cast_fp16")]; tensor input_165_interleave_0 = const()[name = tensor("input_165_interleave_0"), val = tensor(false)]; tensor input_165_cast_fp16 = concat(axis = var_4428, interleave = input_165_interleave_0, values = (var_4605_cast_fp16, var_4607_cast_fp16, var_4609_cast_fp16, var_4611_cast_fp16, var_4613_cast_fp16, var_4615_cast_fp16, var_4617_cast_fp16, var_4619_cast_fp16, var_4621_cast_fp16, var_4623_cast_fp16, var_4625_cast_fp16, var_4627_cast_fp16, var_4629_cast_fp16, var_4631_cast_fp16, var_4633_cast_fp16, var_4635_cast_fp16, var_4637_cast_fp16, var_4639_cast_fp16, var_4641_cast_fp16, var_4643_cast_fp16))[name = tensor("input_165_cast_fp16")]; tensor var_4652_pad_type_0 = const()[name = tensor("op_4652_pad_type_0"), val = tensor("valid")]; tensor var_4652_strides_0 = const()[name = tensor("op_4652_strides_0"), val = tensor([1, 1])]; tensor var_4652_pad_0 = const()[name = tensor("op_4652_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4652_dilations_0 = const()[name = tensor("op_4652_dilations_0"), val = tensor([1, 1])]; tensor var_4652_groups_0 = const()[name = tensor("op_4652_groups_0"), val = tensor(1)]; tensor blocks_16_attn_out_weight_to_fp16 = const()[name = tensor("blocks_16_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(654152512)))]; tensor blocks_16_attn_out_bias_to_fp16 = const()[name = tensor("blocks_16_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657429376)))]; tensor var_4652_cast_fp16 = conv(bias = blocks_16_attn_out_bias_to_fp16, dilations = var_4652_dilations_0, groups = var_4652_groups_0, pad = var_4652_pad_0, pad_type = var_4652_pad_type_0, strides = var_4652_strides_0, weight = blocks_16_attn_out_weight_to_fp16, x = input_165_cast_fp16)[name = tensor("op_4652_cast_fp16")]; tensor inputs_67_cast_fp16 = add(x = inputs_65_cast_fp16, y = var_4652_cast_fp16)[name = tensor("inputs_67_cast_fp16")]; tensor input_167_axes_0 = const()[name = tensor("input_167_axes_0"), val = tensor([1])]; tensor input_167_gamma_0_to_fp16 = const()[name = tensor("input_167_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657432000)))]; tensor input_167_beta_0_to_fp16 = const()[name = tensor("input_167_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657434624)))]; tensor var_4662_to_fp16 = const()[name = tensor("op_4662_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_167_cast_fp16 = layer_norm(axes = input_167_axes_0, beta = input_167_beta_0_to_fp16, epsilon = var_4662_to_fp16, gamma = input_167_gamma_0_to_fp16, x = inputs_67_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor input_169_pad_type_0 = const()[name = tensor("input_169_pad_type_0"), val = tensor("valid")]; tensor input_169_strides_0 = const()[name = tensor("input_169_strides_0"), val = tensor([1, 1])]; tensor input_169_pad_0 = const()[name = tensor("input_169_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_169_dilations_0 = const()[name = tensor("input_169_dilations_0"), val = tensor([1, 1])]; tensor input_169_groups_0 = const()[name = tensor("input_169_groups_0"), val = tensor(1)]; tensor blocks_16_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_16_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(657437248)))]; tensor blocks_16_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_16_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670544512)))]; tensor input_169_cast_fp16 = conv(bias = blocks_16_mlp_0_bias_to_fp16, dilations = input_169_dilations_0, groups = input_169_groups_0, pad = input_169_pad_0, pad_type = input_169_pad_type_0, strides = input_169_strides_0, weight = blocks_16_mlp_0_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor input_171_mode_0 = const()[name = tensor("input_171_mode_0"), val = tensor("EXACT")]; tensor input_171_cast_fp16 = gelu(mode = input_171_mode_0, x = input_169_cast_fp16)[name = tensor("input_171_cast_fp16")]; tensor var_4688_pad_type_0 = const()[name = tensor("op_4688_pad_type_0"), val = tensor("valid")]; tensor var_4688_strides_0 = const()[name = tensor("op_4688_strides_0"), val = tensor([1, 1])]; tensor var_4688_pad_0 = const()[name = tensor("op_4688_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4688_dilations_0 = const()[name = tensor("op_4688_dilations_0"), val = tensor([1, 1])]; tensor var_4688_groups_0 = const()[name = tensor("op_4688_groups_0"), val = tensor(1)]; tensor blocks_16_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_16_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670554816)))]; tensor blocks_16_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_16_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683662080)))]; tensor var_4688_cast_fp16 = conv(bias = blocks_16_mlp_2_bias_to_fp16, dilations = var_4688_dilations_0, groups = var_4688_groups_0, pad = var_4688_pad_0, pad_type = var_4688_pad_type_0, strides = var_4688_strides_0, weight = blocks_16_mlp_2_weight_to_fp16, x = input_171_cast_fp16)[name = tensor("op_4688_cast_fp16")]; tensor inputs_69_cast_fp16 = add(x = inputs_67_cast_fp16, y = var_4688_cast_fp16)[name = tensor("inputs_69_cast_fp16")]; tensor var_4697 = const()[name = tensor("op_4697"), val = tensor(1)]; tensor input_173_axes_0 = const()[name = tensor("input_173_axes_0"), val = tensor([1])]; tensor input_173_gamma_0_to_fp16 = const()[name = tensor("input_173_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683664704)))]; tensor input_173_beta_0_to_fp16 = const()[name = tensor("input_173_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683667328)))]; tensor var_4713_to_fp16 = const()[name = tensor("op_4713_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_173_cast_fp16 = layer_norm(axes = input_173_axes_0, beta = input_173_beta_0_to_fp16, epsilon = var_4713_to_fp16, gamma = input_173_gamma_0_to_fp16, x = inputs_69_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor q_35_pad_type_0 = const()[name = tensor("q_35_pad_type_0"), val = tensor("valid")]; tensor q_35_strides_0 = const()[name = tensor("q_35_strides_0"), val = tensor([1, 1])]; tensor q_35_pad_0 = const()[name = tensor("q_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_35_dilations_0 = const()[name = tensor("q_35_dilations_0"), val = tensor([1, 1])]; tensor q_35_groups_0 = const()[name = tensor("q_35_groups_0"), val = tensor(1)]; tensor var_4748_weight_0_to_fp16 = const()[name = tensor("op_4748_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683669952)))]; tensor var_4748_bias_0_to_fp16 = const()[name = tensor("op_4748_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686946816)))]; tensor var_4748_cast_fp16 = conv(bias = var_4748_bias_0_to_fp16, dilations = q_35_dilations_0, groups = q_35_groups_0, pad = q_35_pad_0, pad_type = q_35_pad_type_0, strides = q_35_strides_0, weight = var_4748_weight_0_to_fp16, x = input_173_cast_fp16)[name = tensor("op_4748_cast_fp16")]; tensor k_35_pad_type_0 = const()[name = tensor("k_35_pad_type_0"), val = tensor("valid")]; tensor k_35_strides_0 = const()[name = tensor("k_35_strides_0"), val = tensor([1, 1])]; tensor k_35_pad_0 = const()[name = tensor("k_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_35_dilations_0 = const()[name = tensor("k_35_dilations_0"), val = tensor([1, 1])]; tensor k_35_groups_0 = const()[name = tensor("k_35_groups_0"), val = tensor(1)]; tensor blocks_17_attn_key_weight_to_fp16 = const()[name = tensor("blocks_17_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686949440)))]; tensor k_35_cast_fp16 = conv(dilations = k_35_dilations_0, groups = k_35_groups_0, pad = k_35_pad_0, pad_type = k_35_pad_type_0, strides = k_35_strides_0, weight = blocks_17_attn_key_weight_to_fp16, x = input_173_cast_fp16)[name = tensor("k_35_cast_fp16")]; tensor var_4746_pad_type_0 = const()[name = tensor("op_4746_pad_type_0"), val = tensor("valid")]; tensor var_4746_strides_0 = const()[name = tensor("op_4746_strides_0"), val = tensor([1, 1])]; tensor var_4746_pad_0 = const()[name = tensor("op_4746_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4746_dilations_0 = const()[name = tensor("op_4746_dilations_0"), val = tensor([1, 1])]; tensor var_4746_groups_0 = const()[name = tensor("op_4746_groups_0"), val = tensor(1)]; tensor blocks_17_attn_value_weight_to_fp16 = const()[name = tensor("blocks_17_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(690226304)))]; tensor blocks_17_attn_value_bias_to_fp16 = const()[name = tensor("blocks_17_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693503168)))]; tensor var_4746_cast_fp16 = conv(bias = blocks_17_attn_value_bias_to_fp16, dilations = var_4746_dilations_0, groups = var_4746_groups_0, pad = var_4746_pad_0, pad_type = var_4746_pad_type_0, strides = var_4746_strides_0, weight = blocks_17_attn_value_weight_to_fp16, x = input_173_cast_fp16)[name = tensor("op_4746_cast_fp16")]; tensor tile_51 = const()[name = tensor("tile_51"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4749_axis_0 = const()[name = tensor("op_4749_axis_0"), val = tensor(1)]; tensor var_4749_cast_fp16_0, tensor var_4749_cast_fp16_1, tensor var_4749_cast_fp16_2, tensor var_4749_cast_fp16_3, tensor var_4749_cast_fp16_4, tensor var_4749_cast_fp16_5, tensor var_4749_cast_fp16_6, tensor var_4749_cast_fp16_7, tensor var_4749_cast_fp16_8, tensor var_4749_cast_fp16_9, tensor var_4749_cast_fp16_10, tensor var_4749_cast_fp16_11, tensor var_4749_cast_fp16_12, tensor var_4749_cast_fp16_13, tensor var_4749_cast_fp16_14, tensor var_4749_cast_fp16_15, tensor var_4749_cast_fp16_16, tensor var_4749_cast_fp16_17, tensor var_4749_cast_fp16_18, tensor var_4749_cast_fp16_19 = split(axis = var_4749_axis_0, split_sizes = tile_51, x = var_4748_cast_fp16)[name = tensor("op_4749_cast_fp16")]; tensor var_4770_perm_0 = const()[name = tensor("op_4770_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_52 = const()[name = tensor("tile_52"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4771_axis_0 = const()[name = tensor("op_4771_axis_0"), val = tensor(3)]; tensor var_4770_cast_fp16 = transpose(perm = var_4770_perm_0, x = k_35_cast_fp16)[name = tensor("transpose_15")]; tensor var_4771_cast_fp16_0, tensor var_4771_cast_fp16_1, tensor var_4771_cast_fp16_2, tensor var_4771_cast_fp16_3, tensor var_4771_cast_fp16_4, tensor var_4771_cast_fp16_5, tensor var_4771_cast_fp16_6, tensor var_4771_cast_fp16_7, tensor var_4771_cast_fp16_8, tensor var_4771_cast_fp16_9, tensor var_4771_cast_fp16_10, tensor var_4771_cast_fp16_11, tensor var_4771_cast_fp16_12, tensor var_4771_cast_fp16_13, tensor var_4771_cast_fp16_14, tensor var_4771_cast_fp16_15, tensor var_4771_cast_fp16_16, tensor var_4771_cast_fp16_17, tensor var_4771_cast_fp16_18, tensor var_4771_cast_fp16_19 = split(axis = var_4771_axis_0, split_sizes = tile_52, x = var_4770_cast_fp16)[name = tensor("op_4771_cast_fp16")]; tensor tile_53 = const()[name = tensor("tile_53"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_4792_axis_0 = const()[name = tensor("op_4792_axis_0"), val = tensor(1)]; tensor var_4792_cast_fp16_0, tensor var_4792_cast_fp16_1, tensor var_4792_cast_fp16_2, tensor var_4792_cast_fp16_3, tensor var_4792_cast_fp16_4, tensor var_4792_cast_fp16_5, tensor var_4792_cast_fp16_6, tensor var_4792_cast_fp16_7, tensor var_4792_cast_fp16_8, tensor var_4792_cast_fp16_9, tensor var_4792_cast_fp16_10, tensor var_4792_cast_fp16_11, tensor var_4792_cast_fp16_12, tensor var_4792_cast_fp16_13, tensor var_4792_cast_fp16_14, tensor var_4792_cast_fp16_15, tensor var_4792_cast_fp16_16, tensor var_4792_cast_fp16_17, tensor var_4792_cast_fp16_18, tensor var_4792_cast_fp16_19 = split(axis = var_4792_axis_0, split_sizes = tile_53, x = var_4746_cast_fp16)[name = tensor("op_4792_cast_fp16")]; tensor aw_681_equation_0 = const()[name = tensor("aw_681_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_681_cast_fp16 = einsum(equation = aw_681_equation_0, values = (var_4771_cast_fp16_0, var_4749_cast_fp16_0))[name = tensor("aw_681_cast_fp16")]; tensor aw_683_equation_0 = const()[name = tensor("aw_683_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_683_cast_fp16 = einsum(equation = aw_683_equation_0, values = (var_4771_cast_fp16_1, var_4749_cast_fp16_1))[name = tensor("aw_683_cast_fp16")]; tensor aw_685_equation_0 = const()[name = tensor("aw_685_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_685_cast_fp16 = einsum(equation = aw_685_equation_0, values = (var_4771_cast_fp16_2, var_4749_cast_fp16_2))[name = tensor("aw_685_cast_fp16")]; tensor aw_687_equation_0 = const()[name = tensor("aw_687_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_687_cast_fp16 = einsum(equation = aw_687_equation_0, values = (var_4771_cast_fp16_3, var_4749_cast_fp16_3))[name = tensor("aw_687_cast_fp16")]; tensor aw_689_equation_0 = const()[name = tensor("aw_689_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_689_cast_fp16 = einsum(equation = aw_689_equation_0, values = (var_4771_cast_fp16_4, var_4749_cast_fp16_4))[name = tensor("aw_689_cast_fp16")]; tensor aw_691_equation_0 = const()[name = tensor("aw_691_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_691_cast_fp16 = einsum(equation = aw_691_equation_0, values = (var_4771_cast_fp16_5, var_4749_cast_fp16_5))[name = tensor("aw_691_cast_fp16")]; tensor aw_693_equation_0 = const()[name = tensor("aw_693_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_693_cast_fp16 = einsum(equation = aw_693_equation_0, values = (var_4771_cast_fp16_6, var_4749_cast_fp16_6))[name = tensor("aw_693_cast_fp16")]; tensor aw_695_equation_0 = const()[name = tensor("aw_695_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_695_cast_fp16 = einsum(equation = aw_695_equation_0, values = (var_4771_cast_fp16_7, var_4749_cast_fp16_7))[name = tensor("aw_695_cast_fp16")]; tensor aw_697_equation_0 = const()[name = tensor("aw_697_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_697_cast_fp16 = einsum(equation = aw_697_equation_0, values = (var_4771_cast_fp16_8, var_4749_cast_fp16_8))[name = tensor("aw_697_cast_fp16")]; tensor aw_699_equation_0 = const()[name = tensor("aw_699_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_699_cast_fp16 = einsum(equation = aw_699_equation_0, values = (var_4771_cast_fp16_9, var_4749_cast_fp16_9))[name = tensor("aw_699_cast_fp16")]; tensor aw_701_equation_0 = const()[name = tensor("aw_701_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_701_cast_fp16 = einsum(equation = aw_701_equation_0, values = (var_4771_cast_fp16_10, var_4749_cast_fp16_10))[name = tensor("aw_701_cast_fp16")]; tensor aw_703_equation_0 = const()[name = tensor("aw_703_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_703_cast_fp16 = einsum(equation = aw_703_equation_0, values = (var_4771_cast_fp16_11, var_4749_cast_fp16_11))[name = tensor("aw_703_cast_fp16")]; tensor aw_705_equation_0 = const()[name = tensor("aw_705_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_705_cast_fp16 = einsum(equation = aw_705_equation_0, values = (var_4771_cast_fp16_12, var_4749_cast_fp16_12))[name = tensor("aw_705_cast_fp16")]; tensor aw_707_equation_0 = const()[name = tensor("aw_707_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_707_cast_fp16 = einsum(equation = aw_707_equation_0, values = (var_4771_cast_fp16_13, var_4749_cast_fp16_13))[name = tensor("aw_707_cast_fp16")]; tensor aw_709_equation_0 = const()[name = tensor("aw_709_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_709_cast_fp16 = einsum(equation = aw_709_equation_0, values = (var_4771_cast_fp16_14, var_4749_cast_fp16_14))[name = tensor("aw_709_cast_fp16")]; tensor aw_711_equation_0 = const()[name = tensor("aw_711_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_711_cast_fp16 = einsum(equation = aw_711_equation_0, values = (var_4771_cast_fp16_15, var_4749_cast_fp16_15))[name = tensor("aw_711_cast_fp16")]; tensor aw_713_equation_0 = const()[name = tensor("aw_713_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_713_cast_fp16 = einsum(equation = aw_713_equation_0, values = (var_4771_cast_fp16_16, var_4749_cast_fp16_16))[name = tensor("aw_713_cast_fp16")]; tensor aw_715_equation_0 = const()[name = tensor("aw_715_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_715_cast_fp16 = einsum(equation = aw_715_equation_0, values = (var_4771_cast_fp16_17, var_4749_cast_fp16_17))[name = tensor("aw_715_cast_fp16")]; tensor aw_717_equation_0 = const()[name = tensor("aw_717_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_717_cast_fp16 = einsum(equation = aw_717_equation_0, values = (var_4771_cast_fp16_18, var_4749_cast_fp16_18))[name = tensor("aw_717_cast_fp16")]; tensor aw_719_equation_0 = const()[name = tensor("aw_719_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_719_cast_fp16 = einsum(equation = aw_719_equation_0, values = (var_4771_cast_fp16_19, var_4749_cast_fp16_19))[name = tensor("aw_719_cast_fp16")]; tensor var_4853_cast_fp16 = softmax(axis = var_4697, x = aw_681_cast_fp16)[name = tensor("op_4853_cast_fp16")]; tensor var_4854_cast_fp16 = softmax(axis = var_4697, x = aw_683_cast_fp16)[name = tensor("op_4854_cast_fp16")]; tensor var_4855_cast_fp16 = softmax(axis = var_4697, x = aw_685_cast_fp16)[name = tensor("op_4855_cast_fp16")]; tensor var_4856_cast_fp16 = softmax(axis = var_4697, x = aw_687_cast_fp16)[name = tensor("op_4856_cast_fp16")]; tensor var_4857_cast_fp16 = softmax(axis = var_4697, x = aw_689_cast_fp16)[name = tensor("op_4857_cast_fp16")]; tensor var_4858_cast_fp16 = softmax(axis = var_4697, x = aw_691_cast_fp16)[name = tensor("op_4858_cast_fp16")]; tensor var_4859_cast_fp16 = softmax(axis = var_4697, x = aw_693_cast_fp16)[name = tensor("op_4859_cast_fp16")]; tensor var_4860_cast_fp16 = softmax(axis = var_4697, x = aw_695_cast_fp16)[name = tensor("op_4860_cast_fp16")]; tensor var_4861_cast_fp16 = softmax(axis = var_4697, x = aw_697_cast_fp16)[name = tensor("op_4861_cast_fp16")]; tensor var_4862_cast_fp16 = softmax(axis = var_4697, x = aw_699_cast_fp16)[name = tensor("op_4862_cast_fp16")]; tensor var_4863_cast_fp16 = softmax(axis = var_4697, x = aw_701_cast_fp16)[name = tensor("op_4863_cast_fp16")]; tensor var_4864_cast_fp16 = softmax(axis = var_4697, x = aw_703_cast_fp16)[name = tensor("op_4864_cast_fp16")]; tensor var_4865_cast_fp16 = softmax(axis = var_4697, x = aw_705_cast_fp16)[name = tensor("op_4865_cast_fp16")]; tensor var_4866_cast_fp16 = softmax(axis = var_4697, x = aw_707_cast_fp16)[name = tensor("op_4866_cast_fp16")]; tensor var_4867_cast_fp16 = softmax(axis = var_4697, x = aw_709_cast_fp16)[name = tensor("op_4867_cast_fp16")]; tensor var_4868_cast_fp16 = softmax(axis = var_4697, x = aw_711_cast_fp16)[name = tensor("op_4868_cast_fp16")]; tensor var_4869_cast_fp16 = softmax(axis = var_4697, x = aw_713_cast_fp16)[name = tensor("op_4869_cast_fp16")]; tensor var_4870_cast_fp16 = softmax(axis = var_4697, x = aw_715_cast_fp16)[name = tensor("op_4870_cast_fp16")]; tensor var_4871_cast_fp16 = softmax(axis = var_4697, x = aw_717_cast_fp16)[name = tensor("op_4871_cast_fp16")]; tensor var_4872_cast_fp16 = softmax(axis = var_4697, x = aw_719_cast_fp16)[name = tensor("op_4872_cast_fp16")]; tensor var_4874_equation_0 = const()[name = tensor("op_4874_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4874_cast_fp16 = einsum(equation = var_4874_equation_0, values = (var_4792_cast_fp16_0, var_4853_cast_fp16))[name = tensor("op_4874_cast_fp16")]; tensor var_4876_equation_0 = const()[name = tensor("op_4876_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4876_cast_fp16 = einsum(equation = var_4876_equation_0, values = (var_4792_cast_fp16_1, var_4854_cast_fp16))[name = tensor("op_4876_cast_fp16")]; tensor var_4878_equation_0 = const()[name = tensor("op_4878_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4878_cast_fp16 = einsum(equation = var_4878_equation_0, values = (var_4792_cast_fp16_2, var_4855_cast_fp16))[name = tensor("op_4878_cast_fp16")]; tensor var_4880_equation_0 = const()[name = tensor("op_4880_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4880_cast_fp16 = einsum(equation = var_4880_equation_0, values = (var_4792_cast_fp16_3, var_4856_cast_fp16))[name = tensor("op_4880_cast_fp16")]; tensor var_4882_equation_0 = const()[name = tensor("op_4882_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4882_cast_fp16 = einsum(equation = var_4882_equation_0, values = (var_4792_cast_fp16_4, var_4857_cast_fp16))[name = tensor("op_4882_cast_fp16")]; tensor var_4884_equation_0 = const()[name = tensor("op_4884_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4884_cast_fp16 = einsum(equation = var_4884_equation_0, values = (var_4792_cast_fp16_5, var_4858_cast_fp16))[name = tensor("op_4884_cast_fp16")]; tensor var_4886_equation_0 = const()[name = tensor("op_4886_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4886_cast_fp16 = einsum(equation = var_4886_equation_0, values = (var_4792_cast_fp16_6, var_4859_cast_fp16))[name = tensor("op_4886_cast_fp16")]; tensor var_4888_equation_0 = const()[name = tensor("op_4888_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4888_cast_fp16 = einsum(equation = var_4888_equation_0, values = (var_4792_cast_fp16_7, var_4860_cast_fp16))[name = tensor("op_4888_cast_fp16")]; tensor var_4890_equation_0 = const()[name = tensor("op_4890_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4890_cast_fp16 = einsum(equation = var_4890_equation_0, values = (var_4792_cast_fp16_8, var_4861_cast_fp16))[name = tensor("op_4890_cast_fp16")]; tensor var_4892_equation_0 = const()[name = tensor("op_4892_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4892_cast_fp16 = einsum(equation = var_4892_equation_0, values = (var_4792_cast_fp16_9, var_4862_cast_fp16))[name = tensor("op_4892_cast_fp16")]; tensor var_4894_equation_0 = const()[name = tensor("op_4894_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4894_cast_fp16 = einsum(equation = var_4894_equation_0, values = (var_4792_cast_fp16_10, var_4863_cast_fp16))[name = tensor("op_4894_cast_fp16")]; tensor var_4896_equation_0 = const()[name = tensor("op_4896_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4896_cast_fp16 = einsum(equation = var_4896_equation_0, values = (var_4792_cast_fp16_11, var_4864_cast_fp16))[name = tensor("op_4896_cast_fp16")]; tensor var_4898_equation_0 = const()[name = tensor("op_4898_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4898_cast_fp16 = einsum(equation = var_4898_equation_0, values = (var_4792_cast_fp16_12, var_4865_cast_fp16))[name = tensor("op_4898_cast_fp16")]; tensor var_4900_equation_0 = const()[name = tensor("op_4900_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4900_cast_fp16 = einsum(equation = var_4900_equation_0, values = (var_4792_cast_fp16_13, var_4866_cast_fp16))[name = tensor("op_4900_cast_fp16")]; tensor var_4902_equation_0 = const()[name = tensor("op_4902_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4902_cast_fp16 = einsum(equation = var_4902_equation_0, values = (var_4792_cast_fp16_14, var_4867_cast_fp16))[name = tensor("op_4902_cast_fp16")]; tensor var_4904_equation_0 = const()[name = tensor("op_4904_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4904_cast_fp16 = einsum(equation = var_4904_equation_0, values = (var_4792_cast_fp16_15, var_4868_cast_fp16))[name = tensor("op_4904_cast_fp16")]; tensor var_4906_equation_0 = const()[name = tensor("op_4906_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4906_cast_fp16 = einsum(equation = var_4906_equation_0, values = (var_4792_cast_fp16_16, var_4869_cast_fp16))[name = tensor("op_4906_cast_fp16")]; tensor var_4908_equation_0 = const()[name = tensor("op_4908_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4908_cast_fp16 = einsum(equation = var_4908_equation_0, values = (var_4792_cast_fp16_17, var_4870_cast_fp16))[name = tensor("op_4908_cast_fp16")]; tensor var_4910_equation_0 = const()[name = tensor("op_4910_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4910_cast_fp16 = einsum(equation = var_4910_equation_0, values = (var_4792_cast_fp16_18, var_4871_cast_fp16))[name = tensor("op_4910_cast_fp16")]; tensor var_4912_equation_0 = const()[name = tensor("op_4912_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4912_cast_fp16 = einsum(equation = var_4912_equation_0, values = (var_4792_cast_fp16_19, var_4872_cast_fp16))[name = tensor("op_4912_cast_fp16")]; tensor input_175_interleave_0 = const()[name = tensor("input_175_interleave_0"), val = tensor(false)]; tensor input_175_cast_fp16 = concat(axis = var_4697, interleave = input_175_interleave_0, values = (var_4874_cast_fp16, var_4876_cast_fp16, var_4878_cast_fp16, var_4880_cast_fp16, var_4882_cast_fp16, var_4884_cast_fp16, var_4886_cast_fp16, var_4888_cast_fp16, var_4890_cast_fp16, var_4892_cast_fp16, var_4894_cast_fp16, var_4896_cast_fp16, var_4898_cast_fp16, var_4900_cast_fp16, var_4902_cast_fp16, var_4904_cast_fp16, var_4906_cast_fp16, var_4908_cast_fp16, var_4910_cast_fp16, var_4912_cast_fp16))[name = tensor("input_175_cast_fp16")]; tensor var_4921_pad_type_0 = const()[name = tensor("op_4921_pad_type_0"), val = tensor("valid")]; tensor var_4921_strides_0 = const()[name = tensor("op_4921_strides_0"), val = tensor([1, 1])]; tensor var_4921_pad_0 = const()[name = tensor("op_4921_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4921_dilations_0 = const()[name = tensor("op_4921_dilations_0"), val = tensor([1, 1])]; tensor var_4921_groups_0 = const()[name = tensor("op_4921_groups_0"), val = tensor(1)]; tensor blocks_17_attn_out_weight_to_fp16 = const()[name = tensor("blocks_17_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693505792)))]; tensor blocks_17_attn_out_bias_to_fp16 = const()[name = tensor("blocks_17_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696782656)))]; tensor var_4921_cast_fp16 = conv(bias = blocks_17_attn_out_bias_to_fp16, dilations = var_4921_dilations_0, groups = var_4921_groups_0, pad = var_4921_pad_0, pad_type = var_4921_pad_type_0, strides = var_4921_strides_0, weight = blocks_17_attn_out_weight_to_fp16, x = input_175_cast_fp16)[name = tensor("op_4921_cast_fp16")]; tensor inputs_71_cast_fp16 = add(x = inputs_69_cast_fp16, y = var_4921_cast_fp16)[name = tensor("inputs_71_cast_fp16")]; tensor input_177_axes_0 = const()[name = tensor("input_177_axes_0"), val = tensor([1])]; tensor input_177_gamma_0_to_fp16 = const()[name = tensor("input_177_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696785280)))]; tensor input_177_beta_0_to_fp16 = const()[name = tensor("input_177_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696787904)))]; tensor var_4931_to_fp16 = const()[name = tensor("op_4931_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_177_cast_fp16 = layer_norm(axes = input_177_axes_0, beta = input_177_beta_0_to_fp16, epsilon = var_4931_to_fp16, gamma = input_177_gamma_0_to_fp16, x = inputs_71_cast_fp16)[name = tensor("input_177_cast_fp16")]; tensor input_179_pad_type_0 = const()[name = tensor("input_179_pad_type_0"), val = tensor("valid")]; tensor input_179_strides_0 = const()[name = tensor("input_179_strides_0"), val = tensor([1, 1])]; tensor input_179_pad_0 = const()[name = tensor("input_179_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_179_dilations_0 = const()[name = tensor("input_179_dilations_0"), val = tensor([1, 1])]; tensor input_179_groups_0 = const()[name = tensor("input_179_groups_0"), val = tensor(1)]; tensor blocks_17_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_17_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696790528)))]; tensor blocks_17_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_17_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(709897792)))]; tensor input_179_cast_fp16 = conv(bias = blocks_17_mlp_0_bias_to_fp16, dilations = input_179_dilations_0, groups = input_179_groups_0, pad = input_179_pad_0, pad_type = input_179_pad_type_0, strides = input_179_strides_0, weight = blocks_17_mlp_0_weight_to_fp16, x = input_177_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor input_181_mode_0 = const()[name = tensor("input_181_mode_0"), val = tensor("EXACT")]; tensor input_181_cast_fp16 = gelu(mode = input_181_mode_0, x = input_179_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor var_4957_pad_type_0 = const()[name = tensor("op_4957_pad_type_0"), val = tensor("valid")]; tensor var_4957_strides_0 = const()[name = tensor("op_4957_strides_0"), val = tensor([1, 1])]; tensor var_4957_pad_0 = const()[name = tensor("op_4957_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_4957_dilations_0 = const()[name = tensor("op_4957_dilations_0"), val = tensor([1, 1])]; tensor var_4957_groups_0 = const()[name = tensor("op_4957_groups_0"), val = tensor(1)]; tensor blocks_17_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_17_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(709908096)))]; tensor blocks_17_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_17_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723015360)))]; tensor var_4957_cast_fp16 = conv(bias = blocks_17_mlp_2_bias_to_fp16, dilations = var_4957_dilations_0, groups = var_4957_groups_0, pad = var_4957_pad_0, pad_type = var_4957_pad_type_0, strides = var_4957_strides_0, weight = blocks_17_mlp_2_weight_to_fp16, x = input_181_cast_fp16)[name = tensor("op_4957_cast_fp16")]; tensor inputs_73_cast_fp16 = add(x = inputs_71_cast_fp16, y = var_4957_cast_fp16)[name = tensor("inputs_73_cast_fp16")]; tensor var_4966 = const()[name = tensor("op_4966"), val = tensor(1)]; tensor input_183_axes_0 = const()[name = tensor("input_183_axes_0"), val = tensor([1])]; tensor input_183_gamma_0_to_fp16 = const()[name = tensor("input_183_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723017984)))]; tensor input_183_beta_0_to_fp16 = const()[name = tensor("input_183_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723020608)))]; tensor var_4982_to_fp16 = const()[name = tensor("op_4982_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_183_cast_fp16 = layer_norm(axes = input_183_axes_0, beta = input_183_beta_0_to_fp16, epsilon = var_4982_to_fp16, gamma = input_183_gamma_0_to_fp16, x = inputs_73_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor q_37_pad_type_0 = const()[name = tensor("q_37_pad_type_0"), val = tensor("valid")]; tensor q_37_strides_0 = const()[name = tensor("q_37_strides_0"), val = tensor([1, 1])]; tensor q_37_pad_0 = const()[name = tensor("q_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_37_dilations_0 = const()[name = tensor("q_37_dilations_0"), val = tensor([1, 1])]; tensor q_37_groups_0 = const()[name = tensor("q_37_groups_0"), val = tensor(1)]; tensor var_5017_weight_0_to_fp16 = const()[name = tensor("op_5017_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(723023232)))]; tensor var_5017_bias_0_to_fp16 = const()[name = tensor("op_5017_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(726300096)))]; tensor var_5017_cast_fp16 = conv(bias = var_5017_bias_0_to_fp16, dilations = q_37_dilations_0, groups = q_37_groups_0, pad = q_37_pad_0, pad_type = q_37_pad_type_0, strides = q_37_strides_0, weight = var_5017_weight_0_to_fp16, x = input_183_cast_fp16)[name = tensor("op_5017_cast_fp16")]; tensor k_37_pad_type_0 = const()[name = tensor("k_37_pad_type_0"), val = tensor("valid")]; tensor k_37_strides_0 = const()[name = tensor("k_37_strides_0"), val = tensor([1, 1])]; tensor k_37_pad_0 = const()[name = tensor("k_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_37_dilations_0 = const()[name = tensor("k_37_dilations_0"), val = tensor([1, 1])]; tensor k_37_groups_0 = const()[name = tensor("k_37_groups_0"), val = tensor(1)]; tensor blocks_18_attn_key_weight_to_fp16 = const()[name = tensor("blocks_18_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(726302720)))]; tensor k_37_cast_fp16 = conv(dilations = k_37_dilations_0, groups = k_37_groups_0, pad = k_37_pad_0, pad_type = k_37_pad_type_0, strides = k_37_strides_0, weight = blocks_18_attn_key_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("k_37_cast_fp16")]; tensor var_5015_pad_type_0 = const()[name = tensor("op_5015_pad_type_0"), val = tensor("valid")]; tensor var_5015_strides_0 = const()[name = tensor("op_5015_strides_0"), val = tensor([1, 1])]; tensor var_5015_pad_0 = const()[name = tensor("op_5015_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5015_dilations_0 = const()[name = tensor("op_5015_dilations_0"), val = tensor([1, 1])]; tensor var_5015_groups_0 = const()[name = tensor("op_5015_groups_0"), val = tensor(1)]; tensor blocks_18_attn_value_weight_to_fp16 = const()[name = tensor("blocks_18_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(729579584)))]; tensor blocks_18_attn_value_bias_to_fp16 = const()[name = tensor("blocks_18_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(732856448)))]; tensor var_5015_cast_fp16 = conv(bias = blocks_18_attn_value_bias_to_fp16, dilations = var_5015_dilations_0, groups = var_5015_groups_0, pad = var_5015_pad_0, pad_type = var_5015_pad_type_0, strides = var_5015_strides_0, weight = blocks_18_attn_value_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("op_5015_cast_fp16")]; tensor tile_54 = const()[name = tensor("tile_54"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5018_axis_0 = const()[name = tensor("op_5018_axis_0"), val = tensor(1)]; tensor var_5018_cast_fp16_0, tensor var_5018_cast_fp16_1, tensor var_5018_cast_fp16_2, tensor var_5018_cast_fp16_3, tensor var_5018_cast_fp16_4, tensor var_5018_cast_fp16_5, tensor var_5018_cast_fp16_6, tensor var_5018_cast_fp16_7, tensor var_5018_cast_fp16_8, tensor var_5018_cast_fp16_9, tensor var_5018_cast_fp16_10, tensor var_5018_cast_fp16_11, tensor var_5018_cast_fp16_12, tensor var_5018_cast_fp16_13, tensor var_5018_cast_fp16_14, tensor var_5018_cast_fp16_15, tensor var_5018_cast_fp16_16, tensor var_5018_cast_fp16_17, tensor var_5018_cast_fp16_18, tensor var_5018_cast_fp16_19 = split(axis = var_5018_axis_0, split_sizes = tile_54, x = var_5017_cast_fp16)[name = tensor("op_5018_cast_fp16")]; tensor var_5039_perm_0 = const()[name = tensor("op_5039_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_55 = const()[name = tensor("tile_55"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5040_axis_0 = const()[name = tensor("op_5040_axis_0"), val = tensor(3)]; tensor var_5039_cast_fp16 = transpose(perm = var_5039_perm_0, x = k_37_cast_fp16)[name = tensor("transpose_14")]; tensor var_5040_cast_fp16_0, tensor var_5040_cast_fp16_1, tensor var_5040_cast_fp16_2, tensor var_5040_cast_fp16_3, tensor var_5040_cast_fp16_4, tensor var_5040_cast_fp16_5, tensor var_5040_cast_fp16_6, tensor var_5040_cast_fp16_7, tensor var_5040_cast_fp16_8, tensor var_5040_cast_fp16_9, tensor var_5040_cast_fp16_10, tensor var_5040_cast_fp16_11, tensor var_5040_cast_fp16_12, tensor var_5040_cast_fp16_13, tensor var_5040_cast_fp16_14, tensor var_5040_cast_fp16_15, tensor var_5040_cast_fp16_16, tensor var_5040_cast_fp16_17, tensor var_5040_cast_fp16_18, tensor var_5040_cast_fp16_19 = split(axis = var_5040_axis_0, split_sizes = tile_55, x = var_5039_cast_fp16)[name = tensor("op_5040_cast_fp16")]; tensor tile_56 = const()[name = tensor("tile_56"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5061_axis_0 = const()[name = tensor("op_5061_axis_0"), val = tensor(1)]; tensor var_5061_cast_fp16_0, tensor var_5061_cast_fp16_1, tensor var_5061_cast_fp16_2, tensor var_5061_cast_fp16_3, tensor var_5061_cast_fp16_4, tensor var_5061_cast_fp16_5, tensor var_5061_cast_fp16_6, tensor var_5061_cast_fp16_7, tensor var_5061_cast_fp16_8, tensor var_5061_cast_fp16_9, tensor var_5061_cast_fp16_10, tensor var_5061_cast_fp16_11, tensor var_5061_cast_fp16_12, tensor var_5061_cast_fp16_13, tensor var_5061_cast_fp16_14, tensor var_5061_cast_fp16_15, tensor var_5061_cast_fp16_16, tensor var_5061_cast_fp16_17, tensor var_5061_cast_fp16_18, tensor var_5061_cast_fp16_19 = split(axis = var_5061_axis_0, split_sizes = tile_56, x = var_5015_cast_fp16)[name = tensor("op_5061_cast_fp16")]; tensor aw_721_equation_0 = const()[name = tensor("aw_721_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_721_cast_fp16 = einsum(equation = aw_721_equation_0, values = (var_5040_cast_fp16_0, var_5018_cast_fp16_0))[name = tensor("aw_721_cast_fp16")]; tensor aw_723_equation_0 = const()[name = tensor("aw_723_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_723_cast_fp16 = einsum(equation = aw_723_equation_0, values = (var_5040_cast_fp16_1, var_5018_cast_fp16_1))[name = tensor("aw_723_cast_fp16")]; tensor aw_725_equation_0 = const()[name = tensor("aw_725_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_725_cast_fp16 = einsum(equation = aw_725_equation_0, values = (var_5040_cast_fp16_2, var_5018_cast_fp16_2))[name = tensor("aw_725_cast_fp16")]; tensor aw_727_equation_0 = const()[name = tensor("aw_727_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_727_cast_fp16 = einsum(equation = aw_727_equation_0, values = (var_5040_cast_fp16_3, var_5018_cast_fp16_3))[name = tensor("aw_727_cast_fp16")]; tensor aw_729_equation_0 = const()[name = tensor("aw_729_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_729_cast_fp16 = einsum(equation = aw_729_equation_0, values = (var_5040_cast_fp16_4, var_5018_cast_fp16_4))[name = tensor("aw_729_cast_fp16")]; tensor aw_731_equation_0 = const()[name = tensor("aw_731_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_731_cast_fp16 = einsum(equation = aw_731_equation_0, values = (var_5040_cast_fp16_5, var_5018_cast_fp16_5))[name = tensor("aw_731_cast_fp16")]; tensor aw_733_equation_0 = const()[name = tensor("aw_733_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_733_cast_fp16 = einsum(equation = aw_733_equation_0, values = (var_5040_cast_fp16_6, var_5018_cast_fp16_6))[name = tensor("aw_733_cast_fp16")]; tensor aw_735_equation_0 = const()[name = tensor("aw_735_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_735_cast_fp16 = einsum(equation = aw_735_equation_0, values = (var_5040_cast_fp16_7, var_5018_cast_fp16_7))[name = tensor("aw_735_cast_fp16")]; tensor aw_737_equation_0 = const()[name = tensor("aw_737_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_737_cast_fp16 = einsum(equation = aw_737_equation_0, values = (var_5040_cast_fp16_8, var_5018_cast_fp16_8))[name = tensor("aw_737_cast_fp16")]; tensor aw_739_equation_0 = const()[name = tensor("aw_739_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_739_cast_fp16 = einsum(equation = aw_739_equation_0, values = (var_5040_cast_fp16_9, var_5018_cast_fp16_9))[name = tensor("aw_739_cast_fp16")]; tensor aw_741_equation_0 = const()[name = tensor("aw_741_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_741_cast_fp16 = einsum(equation = aw_741_equation_0, values = (var_5040_cast_fp16_10, var_5018_cast_fp16_10))[name = tensor("aw_741_cast_fp16")]; tensor aw_743_equation_0 = const()[name = tensor("aw_743_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_743_cast_fp16 = einsum(equation = aw_743_equation_0, values = (var_5040_cast_fp16_11, var_5018_cast_fp16_11))[name = tensor("aw_743_cast_fp16")]; tensor aw_745_equation_0 = const()[name = tensor("aw_745_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_745_cast_fp16 = einsum(equation = aw_745_equation_0, values = (var_5040_cast_fp16_12, var_5018_cast_fp16_12))[name = tensor("aw_745_cast_fp16")]; tensor aw_747_equation_0 = const()[name = tensor("aw_747_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_747_cast_fp16 = einsum(equation = aw_747_equation_0, values = (var_5040_cast_fp16_13, var_5018_cast_fp16_13))[name = tensor("aw_747_cast_fp16")]; tensor aw_749_equation_0 = const()[name = tensor("aw_749_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_749_cast_fp16 = einsum(equation = aw_749_equation_0, values = (var_5040_cast_fp16_14, var_5018_cast_fp16_14))[name = tensor("aw_749_cast_fp16")]; tensor aw_751_equation_0 = const()[name = tensor("aw_751_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_751_cast_fp16 = einsum(equation = aw_751_equation_0, values = (var_5040_cast_fp16_15, var_5018_cast_fp16_15))[name = tensor("aw_751_cast_fp16")]; tensor aw_753_equation_0 = const()[name = tensor("aw_753_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_753_cast_fp16 = einsum(equation = aw_753_equation_0, values = (var_5040_cast_fp16_16, var_5018_cast_fp16_16))[name = tensor("aw_753_cast_fp16")]; tensor aw_755_equation_0 = const()[name = tensor("aw_755_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_755_cast_fp16 = einsum(equation = aw_755_equation_0, values = (var_5040_cast_fp16_17, var_5018_cast_fp16_17))[name = tensor("aw_755_cast_fp16")]; tensor aw_757_equation_0 = const()[name = tensor("aw_757_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_757_cast_fp16 = einsum(equation = aw_757_equation_0, values = (var_5040_cast_fp16_18, var_5018_cast_fp16_18))[name = tensor("aw_757_cast_fp16")]; tensor aw_759_equation_0 = const()[name = tensor("aw_759_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_759_cast_fp16 = einsum(equation = aw_759_equation_0, values = (var_5040_cast_fp16_19, var_5018_cast_fp16_19))[name = tensor("aw_759_cast_fp16")]; tensor var_5122_cast_fp16 = softmax(axis = var_4966, x = aw_721_cast_fp16)[name = tensor("op_5122_cast_fp16")]; tensor var_5123_cast_fp16 = softmax(axis = var_4966, x = aw_723_cast_fp16)[name = tensor("op_5123_cast_fp16")]; tensor var_5124_cast_fp16 = softmax(axis = var_4966, x = aw_725_cast_fp16)[name = tensor("op_5124_cast_fp16")]; tensor var_5125_cast_fp16 = softmax(axis = var_4966, x = aw_727_cast_fp16)[name = tensor("op_5125_cast_fp16")]; tensor var_5126_cast_fp16 = softmax(axis = var_4966, x = aw_729_cast_fp16)[name = tensor("op_5126_cast_fp16")]; tensor var_5127_cast_fp16 = softmax(axis = var_4966, x = aw_731_cast_fp16)[name = tensor("op_5127_cast_fp16")]; tensor var_5128_cast_fp16 = softmax(axis = var_4966, x = aw_733_cast_fp16)[name = tensor("op_5128_cast_fp16")]; tensor var_5129_cast_fp16 = softmax(axis = var_4966, x = aw_735_cast_fp16)[name = tensor("op_5129_cast_fp16")]; tensor var_5130_cast_fp16 = softmax(axis = var_4966, x = aw_737_cast_fp16)[name = tensor("op_5130_cast_fp16")]; tensor var_5131_cast_fp16 = softmax(axis = var_4966, x = aw_739_cast_fp16)[name = tensor("op_5131_cast_fp16")]; tensor var_5132_cast_fp16 = softmax(axis = var_4966, x = aw_741_cast_fp16)[name = tensor("op_5132_cast_fp16")]; tensor var_5133_cast_fp16 = softmax(axis = var_4966, x = aw_743_cast_fp16)[name = tensor("op_5133_cast_fp16")]; tensor var_5134_cast_fp16 = softmax(axis = var_4966, x = aw_745_cast_fp16)[name = tensor("op_5134_cast_fp16")]; tensor var_5135_cast_fp16 = softmax(axis = var_4966, x = aw_747_cast_fp16)[name = tensor("op_5135_cast_fp16")]; tensor var_5136_cast_fp16 = softmax(axis = var_4966, x = aw_749_cast_fp16)[name = tensor("op_5136_cast_fp16")]; tensor var_5137_cast_fp16 = softmax(axis = var_4966, x = aw_751_cast_fp16)[name = tensor("op_5137_cast_fp16")]; tensor var_5138_cast_fp16 = softmax(axis = var_4966, x = aw_753_cast_fp16)[name = tensor("op_5138_cast_fp16")]; tensor var_5139_cast_fp16 = softmax(axis = var_4966, x = aw_755_cast_fp16)[name = tensor("op_5139_cast_fp16")]; tensor var_5140_cast_fp16 = softmax(axis = var_4966, x = aw_757_cast_fp16)[name = tensor("op_5140_cast_fp16")]; tensor var_5141_cast_fp16 = softmax(axis = var_4966, x = aw_759_cast_fp16)[name = tensor("op_5141_cast_fp16")]; tensor var_5143_equation_0 = const()[name = tensor("op_5143_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5143_cast_fp16 = einsum(equation = var_5143_equation_0, values = (var_5061_cast_fp16_0, var_5122_cast_fp16))[name = tensor("op_5143_cast_fp16")]; tensor var_5145_equation_0 = const()[name = tensor("op_5145_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5145_cast_fp16 = einsum(equation = var_5145_equation_0, values = (var_5061_cast_fp16_1, var_5123_cast_fp16))[name = tensor("op_5145_cast_fp16")]; tensor var_5147_equation_0 = const()[name = tensor("op_5147_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5147_cast_fp16 = einsum(equation = var_5147_equation_0, values = (var_5061_cast_fp16_2, var_5124_cast_fp16))[name = tensor("op_5147_cast_fp16")]; tensor var_5149_equation_0 = const()[name = tensor("op_5149_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5149_cast_fp16 = einsum(equation = var_5149_equation_0, values = (var_5061_cast_fp16_3, var_5125_cast_fp16))[name = tensor("op_5149_cast_fp16")]; tensor var_5151_equation_0 = const()[name = tensor("op_5151_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5151_cast_fp16 = einsum(equation = var_5151_equation_0, values = (var_5061_cast_fp16_4, var_5126_cast_fp16))[name = tensor("op_5151_cast_fp16")]; tensor var_5153_equation_0 = const()[name = tensor("op_5153_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5153_cast_fp16 = einsum(equation = var_5153_equation_0, values = (var_5061_cast_fp16_5, var_5127_cast_fp16))[name = tensor("op_5153_cast_fp16")]; tensor var_5155_equation_0 = const()[name = tensor("op_5155_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5155_cast_fp16 = einsum(equation = var_5155_equation_0, values = (var_5061_cast_fp16_6, var_5128_cast_fp16))[name = tensor("op_5155_cast_fp16")]; tensor var_5157_equation_0 = const()[name = tensor("op_5157_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5157_cast_fp16 = einsum(equation = var_5157_equation_0, values = (var_5061_cast_fp16_7, var_5129_cast_fp16))[name = tensor("op_5157_cast_fp16")]; tensor var_5159_equation_0 = const()[name = tensor("op_5159_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5159_cast_fp16 = einsum(equation = var_5159_equation_0, values = (var_5061_cast_fp16_8, var_5130_cast_fp16))[name = tensor("op_5159_cast_fp16")]; tensor var_5161_equation_0 = const()[name = tensor("op_5161_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5161_cast_fp16 = einsum(equation = var_5161_equation_0, values = (var_5061_cast_fp16_9, var_5131_cast_fp16))[name = tensor("op_5161_cast_fp16")]; tensor var_5163_equation_0 = const()[name = tensor("op_5163_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5163_cast_fp16 = einsum(equation = var_5163_equation_0, values = (var_5061_cast_fp16_10, var_5132_cast_fp16))[name = tensor("op_5163_cast_fp16")]; tensor var_5165_equation_0 = const()[name = tensor("op_5165_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5165_cast_fp16 = einsum(equation = var_5165_equation_0, values = (var_5061_cast_fp16_11, var_5133_cast_fp16))[name = tensor("op_5165_cast_fp16")]; tensor var_5167_equation_0 = const()[name = tensor("op_5167_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5167_cast_fp16 = einsum(equation = var_5167_equation_0, values = (var_5061_cast_fp16_12, var_5134_cast_fp16))[name = tensor("op_5167_cast_fp16")]; tensor var_5169_equation_0 = const()[name = tensor("op_5169_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5169_cast_fp16 = einsum(equation = var_5169_equation_0, values = (var_5061_cast_fp16_13, var_5135_cast_fp16))[name = tensor("op_5169_cast_fp16")]; tensor var_5171_equation_0 = const()[name = tensor("op_5171_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5171_cast_fp16 = einsum(equation = var_5171_equation_0, values = (var_5061_cast_fp16_14, var_5136_cast_fp16))[name = tensor("op_5171_cast_fp16")]; tensor var_5173_equation_0 = const()[name = tensor("op_5173_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5173_cast_fp16 = einsum(equation = var_5173_equation_0, values = (var_5061_cast_fp16_15, var_5137_cast_fp16))[name = tensor("op_5173_cast_fp16")]; tensor var_5175_equation_0 = const()[name = tensor("op_5175_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5175_cast_fp16 = einsum(equation = var_5175_equation_0, values = (var_5061_cast_fp16_16, var_5138_cast_fp16))[name = tensor("op_5175_cast_fp16")]; tensor var_5177_equation_0 = const()[name = tensor("op_5177_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5177_cast_fp16 = einsum(equation = var_5177_equation_0, values = (var_5061_cast_fp16_17, var_5139_cast_fp16))[name = tensor("op_5177_cast_fp16")]; tensor var_5179_equation_0 = const()[name = tensor("op_5179_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5179_cast_fp16 = einsum(equation = var_5179_equation_0, values = (var_5061_cast_fp16_18, var_5140_cast_fp16))[name = tensor("op_5179_cast_fp16")]; tensor var_5181_equation_0 = const()[name = tensor("op_5181_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5181_cast_fp16 = einsum(equation = var_5181_equation_0, values = (var_5061_cast_fp16_19, var_5141_cast_fp16))[name = tensor("op_5181_cast_fp16")]; tensor input_185_interleave_0 = const()[name = tensor("input_185_interleave_0"), val = tensor(false)]; tensor input_185_cast_fp16 = concat(axis = var_4966, interleave = input_185_interleave_0, values = (var_5143_cast_fp16, var_5145_cast_fp16, var_5147_cast_fp16, var_5149_cast_fp16, var_5151_cast_fp16, var_5153_cast_fp16, var_5155_cast_fp16, var_5157_cast_fp16, var_5159_cast_fp16, var_5161_cast_fp16, var_5163_cast_fp16, var_5165_cast_fp16, var_5167_cast_fp16, var_5169_cast_fp16, var_5171_cast_fp16, var_5173_cast_fp16, var_5175_cast_fp16, var_5177_cast_fp16, var_5179_cast_fp16, var_5181_cast_fp16))[name = tensor("input_185_cast_fp16")]; tensor var_5190_pad_type_0 = const()[name = tensor("op_5190_pad_type_0"), val = tensor("valid")]; tensor var_5190_strides_0 = const()[name = tensor("op_5190_strides_0"), val = tensor([1, 1])]; tensor var_5190_pad_0 = const()[name = tensor("op_5190_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5190_dilations_0 = const()[name = tensor("op_5190_dilations_0"), val = tensor([1, 1])]; tensor var_5190_groups_0 = const()[name = tensor("op_5190_groups_0"), val = tensor(1)]; tensor blocks_18_attn_out_weight_to_fp16 = const()[name = tensor("blocks_18_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(732859072)))]; tensor blocks_18_attn_out_bias_to_fp16 = const()[name = tensor("blocks_18_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736135936)))]; tensor var_5190_cast_fp16 = conv(bias = blocks_18_attn_out_bias_to_fp16, dilations = var_5190_dilations_0, groups = var_5190_groups_0, pad = var_5190_pad_0, pad_type = var_5190_pad_type_0, strides = var_5190_strides_0, weight = blocks_18_attn_out_weight_to_fp16, x = input_185_cast_fp16)[name = tensor("op_5190_cast_fp16")]; tensor inputs_75_cast_fp16 = add(x = inputs_73_cast_fp16, y = var_5190_cast_fp16)[name = tensor("inputs_75_cast_fp16")]; tensor input_187_axes_0 = const()[name = tensor("input_187_axes_0"), val = tensor([1])]; tensor input_187_gamma_0_to_fp16 = const()[name = tensor("input_187_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736138560)))]; tensor input_187_beta_0_to_fp16 = const()[name = tensor("input_187_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736141184)))]; tensor var_5200_to_fp16 = const()[name = tensor("op_5200_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_187_cast_fp16 = layer_norm(axes = input_187_axes_0, beta = input_187_beta_0_to_fp16, epsilon = var_5200_to_fp16, gamma = input_187_gamma_0_to_fp16, x = inputs_75_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor input_189_pad_type_0 = const()[name = tensor("input_189_pad_type_0"), val = tensor("valid")]; tensor input_189_strides_0 = const()[name = tensor("input_189_strides_0"), val = tensor([1, 1])]; tensor input_189_pad_0 = const()[name = tensor("input_189_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_189_dilations_0 = const()[name = tensor("input_189_dilations_0"), val = tensor([1, 1])]; tensor input_189_groups_0 = const()[name = tensor("input_189_groups_0"), val = tensor(1)]; tensor blocks_18_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_18_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736143808)))]; tensor blocks_18_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_18_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(749251072)))]; tensor input_189_cast_fp16 = conv(bias = blocks_18_mlp_0_bias_to_fp16, dilations = input_189_dilations_0, groups = input_189_groups_0, pad = input_189_pad_0, pad_type = input_189_pad_type_0, strides = input_189_strides_0, weight = blocks_18_mlp_0_weight_to_fp16, x = input_187_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor input_191_mode_0 = const()[name = tensor("input_191_mode_0"), val = tensor("EXACT")]; tensor input_191_cast_fp16 = gelu(mode = input_191_mode_0, x = input_189_cast_fp16)[name = tensor("input_191_cast_fp16")]; tensor var_5226_pad_type_0 = const()[name = tensor("op_5226_pad_type_0"), val = tensor("valid")]; tensor var_5226_strides_0 = const()[name = tensor("op_5226_strides_0"), val = tensor([1, 1])]; tensor var_5226_pad_0 = const()[name = tensor("op_5226_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5226_dilations_0 = const()[name = tensor("op_5226_dilations_0"), val = tensor([1, 1])]; tensor var_5226_groups_0 = const()[name = tensor("op_5226_groups_0"), val = tensor(1)]; tensor blocks_18_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_18_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(749261376)))]; tensor blocks_18_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_18_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762368640)))]; tensor var_5226_cast_fp16 = conv(bias = blocks_18_mlp_2_bias_to_fp16, dilations = var_5226_dilations_0, groups = var_5226_groups_0, pad = var_5226_pad_0, pad_type = var_5226_pad_type_0, strides = var_5226_strides_0, weight = blocks_18_mlp_2_weight_to_fp16, x = input_191_cast_fp16)[name = tensor("op_5226_cast_fp16")]; tensor inputs_77_cast_fp16 = add(x = inputs_75_cast_fp16, y = var_5226_cast_fp16)[name = tensor("inputs_77_cast_fp16")]; tensor var_5235 = const()[name = tensor("op_5235"), val = tensor(1)]; tensor input_193_axes_0 = const()[name = tensor("input_193_axes_0"), val = tensor([1])]; tensor input_193_gamma_0_to_fp16 = const()[name = tensor("input_193_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762371264)))]; tensor input_193_beta_0_to_fp16 = const()[name = tensor("input_193_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762373888)))]; tensor var_5251_to_fp16 = const()[name = tensor("op_5251_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_193_cast_fp16 = layer_norm(axes = input_193_axes_0, beta = input_193_beta_0_to_fp16, epsilon = var_5251_to_fp16, gamma = input_193_gamma_0_to_fp16, x = inputs_77_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor q_39_pad_type_0 = const()[name = tensor("q_39_pad_type_0"), val = tensor("valid")]; tensor q_39_strides_0 = const()[name = tensor("q_39_strides_0"), val = tensor([1, 1])]; tensor q_39_pad_0 = const()[name = tensor("q_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_39_dilations_0 = const()[name = tensor("q_39_dilations_0"), val = tensor([1, 1])]; tensor q_39_groups_0 = const()[name = tensor("q_39_groups_0"), val = tensor(1)]; tensor var_5286_weight_0_to_fp16 = const()[name = tensor("op_5286_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762376512)))]; tensor var_5286_bias_0_to_fp16 = const()[name = tensor("op_5286_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765653376)))]; tensor var_5286_cast_fp16 = conv(bias = var_5286_bias_0_to_fp16, dilations = q_39_dilations_0, groups = q_39_groups_0, pad = q_39_pad_0, pad_type = q_39_pad_type_0, strides = q_39_strides_0, weight = var_5286_weight_0_to_fp16, x = input_193_cast_fp16)[name = tensor("op_5286_cast_fp16")]; tensor k_39_pad_type_0 = const()[name = tensor("k_39_pad_type_0"), val = tensor("valid")]; tensor k_39_strides_0 = const()[name = tensor("k_39_strides_0"), val = tensor([1, 1])]; tensor k_39_pad_0 = const()[name = tensor("k_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_39_dilations_0 = const()[name = tensor("k_39_dilations_0"), val = tensor([1, 1])]; tensor k_39_groups_0 = const()[name = tensor("k_39_groups_0"), val = tensor(1)]; tensor blocks_19_attn_key_weight_to_fp16 = const()[name = tensor("blocks_19_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765656000)))]; tensor k_39_cast_fp16 = conv(dilations = k_39_dilations_0, groups = k_39_groups_0, pad = k_39_pad_0, pad_type = k_39_pad_type_0, strides = k_39_strides_0, weight = blocks_19_attn_key_weight_to_fp16, x = input_193_cast_fp16)[name = tensor("k_39_cast_fp16")]; tensor var_5284_pad_type_0 = const()[name = tensor("op_5284_pad_type_0"), val = tensor("valid")]; tensor var_5284_strides_0 = const()[name = tensor("op_5284_strides_0"), val = tensor([1, 1])]; tensor var_5284_pad_0 = const()[name = tensor("op_5284_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5284_dilations_0 = const()[name = tensor("op_5284_dilations_0"), val = tensor([1, 1])]; tensor var_5284_groups_0 = const()[name = tensor("op_5284_groups_0"), val = tensor(1)]; tensor blocks_19_attn_value_weight_to_fp16 = const()[name = tensor("blocks_19_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(768932864)))]; tensor blocks_19_attn_value_bias_to_fp16 = const()[name = tensor("blocks_19_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772209728)))]; tensor var_5284_cast_fp16 = conv(bias = blocks_19_attn_value_bias_to_fp16, dilations = var_5284_dilations_0, groups = var_5284_groups_0, pad = var_5284_pad_0, pad_type = var_5284_pad_type_0, strides = var_5284_strides_0, weight = blocks_19_attn_value_weight_to_fp16, x = input_193_cast_fp16)[name = tensor("op_5284_cast_fp16")]; tensor tile_57 = const()[name = tensor("tile_57"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5287_axis_0 = const()[name = tensor("op_5287_axis_0"), val = tensor(1)]; tensor var_5287_cast_fp16_0, tensor var_5287_cast_fp16_1, tensor var_5287_cast_fp16_2, tensor var_5287_cast_fp16_3, tensor var_5287_cast_fp16_4, tensor var_5287_cast_fp16_5, tensor var_5287_cast_fp16_6, tensor var_5287_cast_fp16_7, tensor var_5287_cast_fp16_8, tensor var_5287_cast_fp16_9, tensor var_5287_cast_fp16_10, tensor var_5287_cast_fp16_11, tensor var_5287_cast_fp16_12, tensor var_5287_cast_fp16_13, tensor var_5287_cast_fp16_14, tensor var_5287_cast_fp16_15, tensor var_5287_cast_fp16_16, tensor var_5287_cast_fp16_17, tensor var_5287_cast_fp16_18, tensor var_5287_cast_fp16_19 = split(axis = var_5287_axis_0, split_sizes = tile_57, x = var_5286_cast_fp16)[name = tensor("op_5287_cast_fp16")]; tensor var_5308_perm_0 = const()[name = tensor("op_5308_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_58 = const()[name = tensor("tile_58"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5309_axis_0 = const()[name = tensor("op_5309_axis_0"), val = tensor(3)]; tensor var_5308_cast_fp16 = transpose(perm = var_5308_perm_0, x = k_39_cast_fp16)[name = tensor("transpose_13")]; tensor var_5309_cast_fp16_0, tensor var_5309_cast_fp16_1, tensor var_5309_cast_fp16_2, tensor var_5309_cast_fp16_3, tensor var_5309_cast_fp16_4, tensor var_5309_cast_fp16_5, tensor var_5309_cast_fp16_6, tensor var_5309_cast_fp16_7, tensor var_5309_cast_fp16_8, tensor var_5309_cast_fp16_9, tensor var_5309_cast_fp16_10, tensor var_5309_cast_fp16_11, tensor var_5309_cast_fp16_12, tensor var_5309_cast_fp16_13, tensor var_5309_cast_fp16_14, tensor var_5309_cast_fp16_15, tensor var_5309_cast_fp16_16, tensor var_5309_cast_fp16_17, tensor var_5309_cast_fp16_18, tensor var_5309_cast_fp16_19 = split(axis = var_5309_axis_0, split_sizes = tile_58, x = var_5308_cast_fp16)[name = tensor("op_5309_cast_fp16")]; tensor tile_59 = const()[name = tensor("tile_59"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5330_axis_0 = const()[name = tensor("op_5330_axis_0"), val = tensor(1)]; tensor var_5330_cast_fp16_0, tensor var_5330_cast_fp16_1, tensor var_5330_cast_fp16_2, tensor var_5330_cast_fp16_3, tensor var_5330_cast_fp16_4, tensor var_5330_cast_fp16_5, tensor var_5330_cast_fp16_6, tensor var_5330_cast_fp16_7, tensor var_5330_cast_fp16_8, tensor var_5330_cast_fp16_9, tensor var_5330_cast_fp16_10, tensor var_5330_cast_fp16_11, tensor var_5330_cast_fp16_12, tensor var_5330_cast_fp16_13, tensor var_5330_cast_fp16_14, tensor var_5330_cast_fp16_15, tensor var_5330_cast_fp16_16, tensor var_5330_cast_fp16_17, tensor var_5330_cast_fp16_18, tensor var_5330_cast_fp16_19 = split(axis = var_5330_axis_0, split_sizes = tile_59, x = var_5284_cast_fp16)[name = tensor("op_5330_cast_fp16")]; tensor aw_761_equation_0 = const()[name = tensor("aw_761_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_761_cast_fp16 = einsum(equation = aw_761_equation_0, values = (var_5309_cast_fp16_0, var_5287_cast_fp16_0))[name = tensor("aw_761_cast_fp16")]; tensor aw_763_equation_0 = const()[name = tensor("aw_763_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_763_cast_fp16 = einsum(equation = aw_763_equation_0, values = (var_5309_cast_fp16_1, var_5287_cast_fp16_1))[name = tensor("aw_763_cast_fp16")]; tensor aw_765_equation_0 = const()[name = tensor("aw_765_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_765_cast_fp16 = einsum(equation = aw_765_equation_0, values = (var_5309_cast_fp16_2, var_5287_cast_fp16_2))[name = tensor("aw_765_cast_fp16")]; tensor aw_767_equation_0 = const()[name = tensor("aw_767_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_767_cast_fp16 = einsum(equation = aw_767_equation_0, values = (var_5309_cast_fp16_3, var_5287_cast_fp16_3))[name = tensor("aw_767_cast_fp16")]; tensor aw_769_equation_0 = const()[name = tensor("aw_769_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_769_cast_fp16 = einsum(equation = aw_769_equation_0, values = (var_5309_cast_fp16_4, var_5287_cast_fp16_4))[name = tensor("aw_769_cast_fp16")]; tensor aw_771_equation_0 = const()[name = tensor("aw_771_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_771_cast_fp16 = einsum(equation = aw_771_equation_0, values = (var_5309_cast_fp16_5, var_5287_cast_fp16_5))[name = tensor("aw_771_cast_fp16")]; tensor aw_773_equation_0 = const()[name = tensor("aw_773_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_773_cast_fp16 = einsum(equation = aw_773_equation_0, values = (var_5309_cast_fp16_6, var_5287_cast_fp16_6))[name = tensor("aw_773_cast_fp16")]; tensor aw_775_equation_0 = const()[name = tensor("aw_775_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_775_cast_fp16 = einsum(equation = aw_775_equation_0, values = (var_5309_cast_fp16_7, var_5287_cast_fp16_7))[name = tensor("aw_775_cast_fp16")]; tensor aw_777_equation_0 = const()[name = tensor("aw_777_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_777_cast_fp16 = einsum(equation = aw_777_equation_0, values = (var_5309_cast_fp16_8, var_5287_cast_fp16_8))[name = tensor("aw_777_cast_fp16")]; tensor aw_779_equation_0 = const()[name = tensor("aw_779_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_779_cast_fp16 = einsum(equation = aw_779_equation_0, values = (var_5309_cast_fp16_9, var_5287_cast_fp16_9))[name = tensor("aw_779_cast_fp16")]; tensor aw_781_equation_0 = const()[name = tensor("aw_781_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_781_cast_fp16 = einsum(equation = aw_781_equation_0, values = (var_5309_cast_fp16_10, var_5287_cast_fp16_10))[name = tensor("aw_781_cast_fp16")]; tensor aw_783_equation_0 = const()[name = tensor("aw_783_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_783_cast_fp16 = einsum(equation = aw_783_equation_0, values = (var_5309_cast_fp16_11, var_5287_cast_fp16_11))[name = tensor("aw_783_cast_fp16")]; tensor aw_785_equation_0 = const()[name = tensor("aw_785_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_785_cast_fp16 = einsum(equation = aw_785_equation_0, values = (var_5309_cast_fp16_12, var_5287_cast_fp16_12))[name = tensor("aw_785_cast_fp16")]; tensor aw_787_equation_0 = const()[name = tensor("aw_787_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_787_cast_fp16 = einsum(equation = aw_787_equation_0, values = (var_5309_cast_fp16_13, var_5287_cast_fp16_13))[name = tensor("aw_787_cast_fp16")]; tensor aw_789_equation_0 = const()[name = tensor("aw_789_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_789_cast_fp16 = einsum(equation = aw_789_equation_0, values = (var_5309_cast_fp16_14, var_5287_cast_fp16_14))[name = tensor("aw_789_cast_fp16")]; tensor aw_791_equation_0 = const()[name = tensor("aw_791_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_791_cast_fp16 = einsum(equation = aw_791_equation_0, values = (var_5309_cast_fp16_15, var_5287_cast_fp16_15))[name = tensor("aw_791_cast_fp16")]; tensor aw_793_equation_0 = const()[name = tensor("aw_793_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_793_cast_fp16 = einsum(equation = aw_793_equation_0, values = (var_5309_cast_fp16_16, var_5287_cast_fp16_16))[name = tensor("aw_793_cast_fp16")]; tensor aw_795_equation_0 = const()[name = tensor("aw_795_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_795_cast_fp16 = einsum(equation = aw_795_equation_0, values = (var_5309_cast_fp16_17, var_5287_cast_fp16_17))[name = tensor("aw_795_cast_fp16")]; tensor aw_797_equation_0 = const()[name = tensor("aw_797_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_797_cast_fp16 = einsum(equation = aw_797_equation_0, values = (var_5309_cast_fp16_18, var_5287_cast_fp16_18))[name = tensor("aw_797_cast_fp16")]; tensor aw_799_equation_0 = const()[name = tensor("aw_799_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_799_cast_fp16 = einsum(equation = aw_799_equation_0, values = (var_5309_cast_fp16_19, var_5287_cast_fp16_19))[name = tensor("aw_799_cast_fp16")]; tensor var_5391_cast_fp16 = softmax(axis = var_5235, x = aw_761_cast_fp16)[name = tensor("op_5391_cast_fp16")]; tensor var_5392_cast_fp16 = softmax(axis = var_5235, x = aw_763_cast_fp16)[name = tensor("op_5392_cast_fp16")]; tensor var_5393_cast_fp16 = softmax(axis = var_5235, x = aw_765_cast_fp16)[name = tensor("op_5393_cast_fp16")]; tensor var_5394_cast_fp16 = softmax(axis = var_5235, x = aw_767_cast_fp16)[name = tensor("op_5394_cast_fp16")]; tensor var_5395_cast_fp16 = softmax(axis = var_5235, x = aw_769_cast_fp16)[name = tensor("op_5395_cast_fp16")]; tensor var_5396_cast_fp16 = softmax(axis = var_5235, x = aw_771_cast_fp16)[name = tensor("op_5396_cast_fp16")]; tensor var_5397_cast_fp16 = softmax(axis = var_5235, x = aw_773_cast_fp16)[name = tensor("op_5397_cast_fp16")]; tensor var_5398_cast_fp16 = softmax(axis = var_5235, x = aw_775_cast_fp16)[name = tensor("op_5398_cast_fp16")]; tensor var_5399_cast_fp16 = softmax(axis = var_5235, x = aw_777_cast_fp16)[name = tensor("op_5399_cast_fp16")]; tensor var_5400_cast_fp16 = softmax(axis = var_5235, x = aw_779_cast_fp16)[name = tensor("op_5400_cast_fp16")]; tensor var_5401_cast_fp16 = softmax(axis = var_5235, x = aw_781_cast_fp16)[name = tensor("op_5401_cast_fp16")]; tensor var_5402_cast_fp16 = softmax(axis = var_5235, x = aw_783_cast_fp16)[name = tensor("op_5402_cast_fp16")]; tensor var_5403_cast_fp16 = softmax(axis = var_5235, x = aw_785_cast_fp16)[name = tensor("op_5403_cast_fp16")]; tensor var_5404_cast_fp16 = softmax(axis = var_5235, x = aw_787_cast_fp16)[name = tensor("op_5404_cast_fp16")]; tensor var_5405_cast_fp16 = softmax(axis = var_5235, x = aw_789_cast_fp16)[name = tensor("op_5405_cast_fp16")]; tensor var_5406_cast_fp16 = softmax(axis = var_5235, x = aw_791_cast_fp16)[name = tensor("op_5406_cast_fp16")]; tensor var_5407_cast_fp16 = softmax(axis = var_5235, x = aw_793_cast_fp16)[name = tensor("op_5407_cast_fp16")]; tensor var_5408_cast_fp16 = softmax(axis = var_5235, x = aw_795_cast_fp16)[name = tensor("op_5408_cast_fp16")]; tensor var_5409_cast_fp16 = softmax(axis = var_5235, x = aw_797_cast_fp16)[name = tensor("op_5409_cast_fp16")]; tensor var_5410_cast_fp16 = softmax(axis = var_5235, x = aw_799_cast_fp16)[name = tensor("op_5410_cast_fp16")]; tensor var_5412_equation_0 = const()[name = tensor("op_5412_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5412_cast_fp16 = einsum(equation = var_5412_equation_0, values = (var_5330_cast_fp16_0, var_5391_cast_fp16))[name = tensor("op_5412_cast_fp16")]; tensor var_5414_equation_0 = const()[name = tensor("op_5414_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5414_cast_fp16 = einsum(equation = var_5414_equation_0, values = (var_5330_cast_fp16_1, var_5392_cast_fp16))[name = tensor("op_5414_cast_fp16")]; tensor var_5416_equation_0 = const()[name = tensor("op_5416_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5416_cast_fp16 = einsum(equation = var_5416_equation_0, values = (var_5330_cast_fp16_2, var_5393_cast_fp16))[name = tensor("op_5416_cast_fp16")]; tensor var_5418_equation_0 = const()[name = tensor("op_5418_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5418_cast_fp16 = einsum(equation = var_5418_equation_0, values = (var_5330_cast_fp16_3, var_5394_cast_fp16))[name = tensor("op_5418_cast_fp16")]; tensor var_5420_equation_0 = const()[name = tensor("op_5420_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5420_cast_fp16 = einsum(equation = var_5420_equation_0, values = (var_5330_cast_fp16_4, var_5395_cast_fp16))[name = tensor("op_5420_cast_fp16")]; tensor var_5422_equation_0 = const()[name = tensor("op_5422_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5422_cast_fp16 = einsum(equation = var_5422_equation_0, values = (var_5330_cast_fp16_5, var_5396_cast_fp16))[name = tensor("op_5422_cast_fp16")]; tensor var_5424_equation_0 = const()[name = tensor("op_5424_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5424_cast_fp16 = einsum(equation = var_5424_equation_0, values = (var_5330_cast_fp16_6, var_5397_cast_fp16))[name = tensor("op_5424_cast_fp16")]; tensor var_5426_equation_0 = const()[name = tensor("op_5426_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5426_cast_fp16 = einsum(equation = var_5426_equation_0, values = (var_5330_cast_fp16_7, var_5398_cast_fp16))[name = tensor("op_5426_cast_fp16")]; tensor var_5428_equation_0 = const()[name = tensor("op_5428_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5428_cast_fp16 = einsum(equation = var_5428_equation_0, values = (var_5330_cast_fp16_8, var_5399_cast_fp16))[name = tensor("op_5428_cast_fp16")]; tensor var_5430_equation_0 = const()[name = tensor("op_5430_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5430_cast_fp16 = einsum(equation = var_5430_equation_0, values = (var_5330_cast_fp16_9, var_5400_cast_fp16))[name = tensor("op_5430_cast_fp16")]; tensor var_5432_equation_0 = const()[name = tensor("op_5432_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5432_cast_fp16 = einsum(equation = var_5432_equation_0, values = (var_5330_cast_fp16_10, var_5401_cast_fp16))[name = tensor("op_5432_cast_fp16")]; tensor var_5434_equation_0 = const()[name = tensor("op_5434_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5434_cast_fp16 = einsum(equation = var_5434_equation_0, values = (var_5330_cast_fp16_11, var_5402_cast_fp16))[name = tensor("op_5434_cast_fp16")]; tensor var_5436_equation_0 = const()[name = tensor("op_5436_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5436_cast_fp16 = einsum(equation = var_5436_equation_0, values = (var_5330_cast_fp16_12, var_5403_cast_fp16))[name = tensor("op_5436_cast_fp16")]; tensor var_5438_equation_0 = const()[name = tensor("op_5438_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5438_cast_fp16 = einsum(equation = var_5438_equation_0, values = (var_5330_cast_fp16_13, var_5404_cast_fp16))[name = tensor("op_5438_cast_fp16")]; tensor var_5440_equation_0 = const()[name = tensor("op_5440_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5440_cast_fp16 = einsum(equation = var_5440_equation_0, values = (var_5330_cast_fp16_14, var_5405_cast_fp16))[name = tensor("op_5440_cast_fp16")]; tensor var_5442_equation_0 = const()[name = tensor("op_5442_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5442_cast_fp16 = einsum(equation = var_5442_equation_0, values = (var_5330_cast_fp16_15, var_5406_cast_fp16))[name = tensor("op_5442_cast_fp16")]; tensor var_5444_equation_0 = const()[name = tensor("op_5444_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5444_cast_fp16 = einsum(equation = var_5444_equation_0, values = (var_5330_cast_fp16_16, var_5407_cast_fp16))[name = tensor("op_5444_cast_fp16")]; tensor var_5446_equation_0 = const()[name = tensor("op_5446_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5446_cast_fp16 = einsum(equation = var_5446_equation_0, values = (var_5330_cast_fp16_17, var_5408_cast_fp16))[name = tensor("op_5446_cast_fp16")]; tensor var_5448_equation_0 = const()[name = tensor("op_5448_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5448_cast_fp16 = einsum(equation = var_5448_equation_0, values = (var_5330_cast_fp16_18, var_5409_cast_fp16))[name = tensor("op_5448_cast_fp16")]; tensor var_5450_equation_0 = const()[name = tensor("op_5450_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5450_cast_fp16 = einsum(equation = var_5450_equation_0, values = (var_5330_cast_fp16_19, var_5410_cast_fp16))[name = tensor("op_5450_cast_fp16")]; tensor input_195_interleave_0 = const()[name = tensor("input_195_interleave_0"), val = tensor(false)]; tensor input_195_cast_fp16 = concat(axis = var_5235, interleave = input_195_interleave_0, values = (var_5412_cast_fp16, var_5414_cast_fp16, var_5416_cast_fp16, var_5418_cast_fp16, var_5420_cast_fp16, var_5422_cast_fp16, var_5424_cast_fp16, var_5426_cast_fp16, var_5428_cast_fp16, var_5430_cast_fp16, var_5432_cast_fp16, var_5434_cast_fp16, var_5436_cast_fp16, var_5438_cast_fp16, var_5440_cast_fp16, var_5442_cast_fp16, var_5444_cast_fp16, var_5446_cast_fp16, var_5448_cast_fp16, var_5450_cast_fp16))[name = tensor("input_195_cast_fp16")]; tensor var_5459_pad_type_0 = const()[name = tensor("op_5459_pad_type_0"), val = tensor("valid")]; tensor var_5459_strides_0 = const()[name = tensor("op_5459_strides_0"), val = tensor([1, 1])]; tensor var_5459_pad_0 = const()[name = tensor("op_5459_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5459_dilations_0 = const()[name = tensor("op_5459_dilations_0"), val = tensor([1, 1])]; tensor var_5459_groups_0 = const()[name = tensor("op_5459_groups_0"), val = tensor(1)]; tensor blocks_19_attn_out_weight_to_fp16 = const()[name = tensor("blocks_19_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772212352)))]; tensor blocks_19_attn_out_bias_to_fp16 = const()[name = tensor("blocks_19_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775489216)))]; tensor var_5459_cast_fp16 = conv(bias = blocks_19_attn_out_bias_to_fp16, dilations = var_5459_dilations_0, groups = var_5459_groups_0, pad = var_5459_pad_0, pad_type = var_5459_pad_type_0, strides = var_5459_strides_0, weight = blocks_19_attn_out_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("op_5459_cast_fp16")]; tensor inputs_79_cast_fp16 = add(x = inputs_77_cast_fp16, y = var_5459_cast_fp16)[name = tensor("inputs_79_cast_fp16")]; tensor input_197_axes_0 = const()[name = tensor("input_197_axes_0"), val = tensor([1])]; tensor input_197_gamma_0_to_fp16 = const()[name = tensor("input_197_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775491840)))]; tensor input_197_beta_0_to_fp16 = const()[name = tensor("input_197_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775494464)))]; tensor var_5469_to_fp16 = const()[name = tensor("op_5469_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_197_cast_fp16 = layer_norm(axes = input_197_axes_0, beta = input_197_beta_0_to_fp16, epsilon = var_5469_to_fp16, gamma = input_197_gamma_0_to_fp16, x = inputs_79_cast_fp16)[name = tensor("input_197_cast_fp16")]; tensor input_199_pad_type_0 = const()[name = tensor("input_199_pad_type_0"), val = tensor("valid")]; tensor input_199_strides_0 = const()[name = tensor("input_199_strides_0"), val = tensor([1, 1])]; tensor input_199_pad_0 = const()[name = tensor("input_199_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_199_dilations_0 = const()[name = tensor("input_199_dilations_0"), val = tensor([1, 1])]; tensor input_199_groups_0 = const()[name = tensor("input_199_groups_0"), val = tensor(1)]; tensor blocks_19_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_19_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(775497088)))]; tensor blocks_19_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_19_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(788604352)))]; tensor input_199_cast_fp16 = conv(bias = blocks_19_mlp_0_bias_to_fp16, dilations = input_199_dilations_0, groups = input_199_groups_0, pad = input_199_pad_0, pad_type = input_199_pad_type_0, strides = input_199_strides_0, weight = blocks_19_mlp_0_weight_to_fp16, x = input_197_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor input_201_mode_0 = const()[name = tensor("input_201_mode_0"), val = tensor("EXACT")]; tensor input_201_cast_fp16 = gelu(mode = input_201_mode_0, x = input_199_cast_fp16)[name = tensor("input_201_cast_fp16")]; tensor var_5495_pad_type_0 = const()[name = tensor("op_5495_pad_type_0"), val = tensor("valid")]; tensor var_5495_strides_0 = const()[name = tensor("op_5495_strides_0"), val = tensor([1, 1])]; tensor var_5495_pad_0 = const()[name = tensor("op_5495_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5495_dilations_0 = const()[name = tensor("op_5495_dilations_0"), val = tensor([1, 1])]; tensor var_5495_groups_0 = const()[name = tensor("op_5495_groups_0"), val = tensor(1)]; tensor blocks_19_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_19_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(788614656)))]; tensor blocks_19_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_19_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801721920)))]; tensor var_5495_cast_fp16 = conv(bias = blocks_19_mlp_2_bias_to_fp16, dilations = var_5495_dilations_0, groups = var_5495_groups_0, pad = var_5495_pad_0, pad_type = var_5495_pad_type_0, strides = var_5495_strides_0, weight = blocks_19_mlp_2_weight_to_fp16, x = input_201_cast_fp16)[name = tensor("op_5495_cast_fp16")]; tensor inputs_81_cast_fp16 = add(x = inputs_79_cast_fp16, y = var_5495_cast_fp16)[name = tensor("inputs_81_cast_fp16")]; tensor var_5504 = const()[name = tensor("op_5504"), val = tensor(1)]; tensor input_203_axes_0 = const()[name = tensor("input_203_axes_0"), val = tensor([1])]; tensor input_203_gamma_0_to_fp16 = const()[name = tensor("input_203_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801724544)))]; tensor input_203_beta_0_to_fp16 = const()[name = tensor("input_203_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801727168)))]; tensor var_5520_to_fp16 = const()[name = tensor("op_5520_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_203_cast_fp16 = layer_norm(axes = input_203_axes_0, beta = input_203_beta_0_to_fp16, epsilon = var_5520_to_fp16, gamma = input_203_gamma_0_to_fp16, x = inputs_81_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor q_41_pad_type_0 = const()[name = tensor("q_41_pad_type_0"), val = tensor("valid")]; tensor q_41_strides_0 = const()[name = tensor("q_41_strides_0"), val = tensor([1, 1])]; tensor q_41_pad_0 = const()[name = tensor("q_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_41_dilations_0 = const()[name = tensor("q_41_dilations_0"), val = tensor([1, 1])]; tensor q_41_groups_0 = const()[name = tensor("q_41_groups_0"), val = tensor(1)]; tensor var_5555_weight_0_to_fp16 = const()[name = tensor("op_5555_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801729792)))]; tensor var_5555_bias_0_to_fp16 = const()[name = tensor("op_5555_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(805006656)))]; tensor var_5555_cast_fp16 = conv(bias = var_5555_bias_0_to_fp16, dilations = q_41_dilations_0, groups = q_41_groups_0, pad = q_41_pad_0, pad_type = q_41_pad_type_0, strides = q_41_strides_0, weight = var_5555_weight_0_to_fp16, x = input_203_cast_fp16)[name = tensor("op_5555_cast_fp16")]; tensor k_41_pad_type_0 = const()[name = tensor("k_41_pad_type_0"), val = tensor("valid")]; tensor k_41_strides_0 = const()[name = tensor("k_41_strides_0"), val = tensor([1, 1])]; tensor k_41_pad_0 = const()[name = tensor("k_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_41_dilations_0 = const()[name = tensor("k_41_dilations_0"), val = tensor([1, 1])]; tensor k_41_groups_0 = const()[name = tensor("k_41_groups_0"), val = tensor(1)]; tensor blocks_20_attn_key_weight_to_fp16 = const()[name = tensor("blocks_20_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(805009280)))]; tensor k_41_cast_fp16 = conv(dilations = k_41_dilations_0, groups = k_41_groups_0, pad = k_41_pad_0, pad_type = k_41_pad_type_0, strides = k_41_strides_0, weight = blocks_20_attn_key_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("k_41_cast_fp16")]; tensor var_5553_pad_type_0 = const()[name = tensor("op_5553_pad_type_0"), val = tensor("valid")]; tensor var_5553_strides_0 = const()[name = tensor("op_5553_strides_0"), val = tensor([1, 1])]; tensor var_5553_pad_0 = const()[name = tensor("op_5553_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5553_dilations_0 = const()[name = tensor("op_5553_dilations_0"), val = tensor([1, 1])]; tensor var_5553_groups_0 = const()[name = tensor("op_5553_groups_0"), val = tensor(1)]; tensor blocks_20_attn_value_weight_to_fp16 = const()[name = tensor("blocks_20_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(808286144)))]; tensor blocks_20_attn_value_bias_to_fp16 = const()[name = tensor("blocks_20_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(811563008)))]; tensor var_5553_cast_fp16 = conv(bias = blocks_20_attn_value_bias_to_fp16, dilations = var_5553_dilations_0, groups = var_5553_groups_0, pad = var_5553_pad_0, pad_type = var_5553_pad_type_0, strides = var_5553_strides_0, weight = blocks_20_attn_value_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("op_5553_cast_fp16")]; tensor tile_60 = const()[name = tensor("tile_60"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5556_axis_0 = const()[name = tensor("op_5556_axis_0"), val = tensor(1)]; tensor var_5556_cast_fp16_0, tensor var_5556_cast_fp16_1, tensor var_5556_cast_fp16_2, tensor var_5556_cast_fp16_3, tensor var_5556_cast_fp16_4, tensor var_5556_cast_fp16_5, tensor var_5556_cast_fp16_6, tensor var_5556_cast_fp16_7, tensor var_5556_cast_fp16_8, tensor var_5556_cast_fp16_9, tensor var_5556_cast_fp16_10, tensor var_5556_cast_fp16_11, tensor var_5556_cast_fp16_12, tensor var_5556_cast_fp16_13, tensor var_5556_cast_fp16_14, tensor var_5556_cast_fp16_15, tensor var_5556_cast_fp16_16, tensor var_5556_cast_fp16_17, tensor var_5556_cast_fp16_18, tensor var_5556_cast_fp16_19 = split(axis = var_5556_axis_0, split_sizes = tile_60, x = var_5555_cast_fp16)[name = tensor("op_5556_cast_fp16")]; tensor var_5577_perm_0 = const()[name = tensor("op_5577_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_61 = const()[name = tensor("tile_61"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5578_axis_0 = const()[name = tensor("op_5578_axis_0"), val = tensor(3)]; tensor var_5577_cast_fp16 = transpose(perm = var_5577_perm_0, x = k_41_cast_fp16)[name = tensor("transpose_12")]; tensor var_5578_cast_fp16_0, tensor var_5578_cast_fp16_1, tensor var_5578_cast_fp16_2, tensor var_5578_cast_fp16_3, tensor var_5578_cast_fp16_4, tensor var_5578_cast_fp16_5, tensor var_5578_cast_fp16_6, tensor var_5578_cast_fp16_7, tensor var_5578_cast_fp16_8, tensor var_5578_cast_fp16_9, tensor var_5578_cast_fp16_10, tensor var_5578_cast_fp16_11, tensor var_5578_cast_fp16_12, tensor var_5578_cast_fp16_13, tensor var_5578_cast_fp16_14, tensor var_5578_cast_fp16_15, tensor var_5578_cast_fp16_16, tensor var_5578_cast_fp16_17, tensor var_5578_cast_fp16_18, tensor var_5578_cast_fp16_19 = split(axis = var_5578_axis_0, split_sizes = tile_61, x = var_5577_cast_fp16)[name = tensor("op_5578_cast_fp16")]; tensor tile_62 = const()[name = tensor("tile_62"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5599_axis_0 = const()[name = tensor("op_5599_axis_0"), val = tensor(1)]; tensor var_5599_cast_fp16_0, tensor var_5599_cast_fp16_1, tensor var_5599_cast_fp16_2, tensor var_5599_cast_fp16_3, tensor var_5599_cast_fp16_4, tensor var_5599_cast_fp16_5, tensor var_5599_cast_fp16_6, tensor var_5599_cast_fp16_7, tensor var_5599_cast_fp16_8, tensor var_5599_cast_fp16_9, tensor var_5599_cast_fp16_10, tensor var_5599_cast_fp16_11, tensor var_5599_cast_fp16_12, tensor var_5599_cast_fp16_13, tensor var_5599_cast_fp16_14, tensor var_5599_cast_fp16_15, tensor var_5599_cast_fp16_16, tensor var_5599_cast_fp16_17, tensor var_5599_cast_fp16_18, tensor var_5599_cast_fp16_19 = split(axis = var_5599_axis_0, split_sizes = tile_62, x = var_5553_cast_fp16)[name = tensor("op_5599_cast_fp16")]; tensor aw_801_equation_0 = const()[name = tensor("aw_801_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_801_cast_fp16 = einsum(equation = aw_801_equation_0, values = (var_5578_cast_fp16_0, var_5556_cast_fp16_0))[name = tensor("aw_801_cast_fp16")]; tensor aw_803_equation_0 = const()[name = tensor("aw_803_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_803_cast_fp16 = einsum(equation = aw_803_equation_0, values = (var_5578_cast_fp16_1, var_5556_cast_fp16_1))[name = tensor("aw_803_cast_fp16")]; tensor aw_805_equation_0 = const()[name = tensor("aw_805_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_805_cast_fp16 = einsum(equation = aw_805_equation_0, values = (var_5578_cast_fp16_2, var_5556_cast_fp16_2))[name = tensor("aw_805_cast_fp16")]; tensor aw_807_equation_0 = const()[name = tensor("aw_807_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_807_cast_fp16 = einsum(equation = aw_807_equation_0, values = (var_5578_cast_fp16_3, var_5556_cast_fp16_3))[name = tensor("aw_807_cast_fp16")]; tensor aw_809_equation_0 = const()[name = tensor("aw_809_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_809_cast_fp16 = einsum(equation = aw_809_equation_0, values = (var_5578_cast_fp16_4, var_5556_cast_fp16_4))[name = tensor("aw_809_cast_fp16")]; tensor aw_811_equation_0 = const()[name = tensor("aw_811_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_811_cast_fp16 = einsum(equation = aw_811_equation_0, values = (var_5578_cast_fp16_5, var_5556_cast_fp16_5))[name = tensor("aw_811_cast_fp16")]; tensor aw_813_equation_0 = const()[name = tensor("aw_813_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_813_cast_fp16 = einsum(equation = aw_813_equation_0, values = (var_5578_cast_fp16_6, var_5556_cast_fp16_6))[name = tensor("aw_813_cast_fp16")]; tensor aw_815_equation_0 = const()[name = tensor("aw_815_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_815_cast_fp16 = einsum(equation = aw_815_equation_0, values = (var_5578_cast_fp16_7, var_5556_cast_fp16_7))[name = tensor("aw_815_cast_fp16")]; tensor aw_817_equation_0 = const()[name = tensor("aw_817_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_817_cast_fp16 = einsum(equation = aw_817_equation_0, values = (var_5578_cast_fp16_8, var_5556_cast_fp16_8))[name = tensor("aw_817_cast_fp16")]; tensor aw_819_equation_0 = const()[name = tensor("aw_819_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_819_cast_fp16 = einsum(equation = aw_819_equation_0, values = (var_5578_cast_fp16_9, var_5556_cast_fp16_9))[name = tensor("aw_819_cast_fp16")]; tensor aw_821_equation_0 = const()[name = tensor("aw_821_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_821_cast_fp16 = einsum(equation = aw_821_equation_0, values = (var_5578_cast_fp16_10, var_5556_cast_fp16_10))[name = tensor("aw_821_cast_fp16")]; tensor aw_823_equation_0 = const()[name = tensor("aw_823_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_823_cast_fp16 = einsum(equation = aw_823_equation_0, values = (var_5578_cast_fp16_11, var_5556_cast_fp16_11))[name = tensor("aw_823_cast_fp16")]; tensor aw_825_equation_0 = const()[name = tensor("aw_825_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_825_cast_fp16 = einsum(equation = aw_825_equation_0, values = (var_5578_cast_fp16_12, var_5556_cast_fp16_12))[name = tensor("aw_825_cast_fp16")]; tensor aw_827_equation_0 = const()[name = tensor("aw_827_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_827_cast_fp16 = einsum(equation = aw_827_equation_0, values = (var_5578_cast_fp16_13, var_5556_cast_fp16_13))[name = tensor("aw_827_cast_fp16")]; tensor aw_829_equation_0 = const()[name = tensor("aw_829_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_829_cast_fp16 = einsum(equation = aw_829_equation_0, values = (var_5578_cast_fp16_14, var_5556_cast_fp16_14))[name = tensor("aw_829_cast_fp16")]; tensor aw_831_equation_0 = const()[name = tensor("aw_831_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_831_cast_fp16 = einsum(equation = aw_831_equation_0, values = (var_5578_cast_fp16_15, var_5556_cast_fp16_15))[name = tensor("aw_831_cast_fp16")]; tensor aw_833_equation_0 = const()[name = tensor("aw_833_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_833_cast_fp16 = einsum(equation = aw_833_equation_0, values = (var_5578_cast_fp16_16, var_5556_cast_fp16_16))[name = tensor("aw_833_cast_fp16")]; tensor aw_835_equation_0 = const()[name = tensor("aw_835_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_835_cast_fp16 = einsum(equation = aw_835_equation_0, values = (var_5578_cast_fp16_17, var_5556_cast_fp16_17))[name = tensor("aw_835_cast_fp16")]; tensor aw_837_equation_0 = const()[name = tensor("aw_837_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_837_cast_fp16 = einsum(equation = aw_837_equation_0, values = (var_5578_cast_fp16_18, var_5556_cast_fp16_18))[name = tensor("aw_837_cast_fp16")]; tensor aw_839_equation_0 = const()[name = tensor("aw_839_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_839_cast_fp16 = einsum(equation = aw_839_equation_0, values = (var_5578_cast_fp16_19, var_5556_cast_fp16_19))[name = tensor("aw_839_cast_fp16")]; tensor var_5660_cast_fp16 = softmax(axis = var_5504, x = aw_801_cast_fp16)[name = tensor("op_5660_cast_fp16")]; tensor var_5661_cast_fp16 = softmax(axis = var_5504, x = aw_803_cast_fp16)[name = tensor("op_5661_cast_fp16")]; tensor var_5662_cast_fp16 = softmax(axis = var_5504, x = aw_805_cast_fp16)[name = tensor("op_5662_cast_fp16")]; tensor var_5663_cast_fp16 = softmax(axis = var_5504, x = aw_807_cast_fp16)[name = tensor("op_5663_cast_fp16")]; tensor var_5664_cast_fp16 = softmax(axis = var_5504, x = aw_809_cast_fp16)[name = tensor("op_5664_cast_fp16")]; tensor var_5665_cast_fp16 = softmax(axis = var_5504, x = aw_811_cast_fp16)[name = tensor("op_5665_cast_fp16")]; tensor var_5666_cast_fp16 = softmax(axis = var_5504, x = aw_813_cast_fp16)[name = tensor("op_5666_cast_fp16")]; tensor var_5667_cast_fp16 = softmax(axis = var_5504, x = aw_815_cast_fp16)[name = tensor("op_5667_cast_fp16")]; tensor var_5668_cast_fp16 = softmax(axis = var_5504, x = aw_817_cast_fp16)[name = tensor("op_5668_cast_fp16")]; tensor var_5669_cast_fp16 = softmax(axis = var_5504, x = aw_819_cast_fp16)[name = tensor("op_5669_cast_fp16")]; tensor var_5670_cast_fp16 = softmax(axis = var_5504, x = aw_821_cast_fp16)[name = tensor("op_5670_cast_fp16")]; tensor var_5671_cast_fp16 = softmax(axis = var_5504, x = aw_823_cast_fp16)[name = tensor("op_5671_cast_fp16")]; tensor var_5672_cast_fp16 = softmax(axis = var_5504, x = aw_825_cast_fp16)[name = tensor("op_5672_cast_fp16")]; tensor var_5673_cast_fp16 = softmax(axis = var_5504, x = aw_827_cast_fp16)[name = tensor("op_5673_cast_fp16")]; tensor var_5674_cast_fp16 = softmax(axis = var_5504, x = aw_829_cast_fp16)[name = tensor("op_5674_cast_fp16")]; tensor var_5675_cast_fp16 = softmax(axis = var_5504, x = aw_831_cast_fp16)[name = tensor("op_5675_cast_fp16")]; tensor var_5676_cast_fp16 = softmax(axis = var_5504, x = aw_833_cast_fp16)[name = tensor("op_5676_cast_fp16")]; tensor var_5677_cast_fp16 = softmax(axis = var_5504, x = aw_835_cast_fp16)[name = tensor("op_5677_cast_fp16")]; tensor var_5678_cast_fp16 = softmax(axis = var_5504, x = aw_837_cast_fp16)[name = tensor("op_5678_cast_fp16")]; tensor var_5679_cast_fp16 = softmax(axis = var_5504, x = aw_839_cast_fp16)[name = tensor("op_5679_cast_fp16")]; tensor var_5681_equation_0 = const()[name = tensor("op_5681_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5681_cast_fp16 = einsum(equation = var_5681_equation_0, values = (var_5599_cast_fp16_0, var_5660_cast_fp16))[name = tensor("op_5681_cast_fp16")]; tensor var_5683_equation_0 = const()[name = tensor("op_5683_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5683_cast_fp16 = einsum(equation = var_5683_equation_0, values = (var_5599_cast_fp16_1, var_5661_cast_fp16))[name = tensor("op_5683_cast_fp16")]; tensor var_5685_equation_0 = const()[name = tensor("op_5685_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5685_cast_fp16 = einsum(equation = var_5685_equation_0, values = (var_5599_cast_fp16_2, var_5662_cast_fp16))[name = tensor("op_5685_cast_fp16")]; tensor var_5687_equation_0 = const()[name = tensor("op_5687_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5687_cast_fp16 = einsum(equation = var_5687_equation_0, values = (var_5599_cast_fp16_3, var_5663_cast_fp16))[name = tensor("op_5687_cast_fp16")]; tensor var_5689_equation_0 = const()[name = tensor("op_5689_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5689_cast_fp16 = einsum(equation = var_5689_equation_0, values = (var_5599_cast_fp16_4, var_5664_cast_fp16))[name = tensor("op_5689_cast_fp16")]; tensor var_5691_equation_0 = const()[name = tensor("op_5691_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5691_cast_fp16 = einsum(equation = var_5691_equation_0, values = (var_5599_cast_fp16_5, var_5665_cast_fp16))[name = tensor("op_5691_cast_fp16")]; tensor var_5693_equation_0 = const()[name = tensor("op_5693_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5693_cast_fp16 = einsum(equation = var_5693_equation_0, values = (var_5599_cast_fp16_6, var_5666_cast_fp16))[name = tensor("op_5693_cast_fp16")]; tensor var_5695_equation_0 = const()[name = tensor("op_5695_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5695_cast_fp16 = einsum(equation = var_5695_equation_0, values = (var_5599_cast_fp16_7, var_5667_cast_fp16))[name = tensor("op_5695_cast_fp16")]; tensor var_5697_equation_0 = const()[name = tensor("op_5697_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5697_cast_fp16 = einsum(equation = var_5697_equation_0, values = (var_5599_cast_fp16_8, var_5668_cast_fp16))[name = tensor("op_5697_cast_fp16")]; tensor var_5699_equation_0 = const()[name = tensor("op_5699_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5699_cast_fp16 = einsum(equation = var_5699_equation_0, values = (var_5599_cast_fp16_9, var_5669_cast_fp16))[name = tensor("op_5699_cast_fp16")]; tensor var_5701_equation_0 = const()[name = tensor("op_5701_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5701_cast_fp16 = einsum(equation = var_5701_equation_0, values = (var_5599_cast_fp16_10, var_5670_cast_fp16))[name = tensor("op_5701_cast_fp16")]; tensor var_5703_equation_0 = const()[name = tensor("op_5703_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5703_cast_fp16 = einsum(equation = var_5703_equation_0, values = (var_5599_cast_fp16_11, var_5671_cast_fp16))[name = tensor("op_5703_cast_fp16")]; tensor var_5705_equation_0 = const()[name = tensor("op_5705_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5705_cast_fp16 = einsum(equation = var_5705_equation_0, values = (var_5599_cast_fp16_12, var_5672_cast_fp16))[name = tensor("op_5705_cast_fp16")]; tensor var_5707_equation_0 = const()[name = tensor("op_5707_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5707_cast_fp16 = einsum(equation = var_5707_equation_0, values = (var_5599_cast_fp16_13, var_5673_cast_fp16))[name = tensor("op_5707_cast_fp16")]; tensor var_5709_equation_0 = const()[name = tensor("op_5709_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5709_cast_fp16 = einsum(equation = var_5709_equation_0, values = (var_5599_cast_fp16_14, var_5674_cast_fp16))[name = tensor("op_5709_cast_fp16")]; tensor var_5711_equation_0 = const()[name = tensor("op_5711_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5711_cast_fp16 = einsum(equation = var_5711_equation_0, values = (var_5599_cast_fp16_15, var_5675_cast_fp16))[name = tensor("op_5711_cast_fp16")]; tensor var_5713_equation_0 = const()[name = tensor("op_5713_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5713_cast_fp16 = einsum(equation = var_5713_equation_0, values = (var_5599_cast_fp16_16, var_5676_cast_fp16))[name = tensor("op_5713_cast_fp16")]; tensor var_5715_equation_0 = const()[name = tensor("op_5715_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5715_cast_fp16 = einsum(equation = var_5715_equation_0, values = (var_5599_cast_fp16_17, var_5677_cast_fp16))[name = tensor("op_5715_cast_fp16")]; tensor var_5717_equation_0 = const()[name = tensor("op_5717_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5717_cast_fp16 = einsum(equation = var_5717_equation_0, values = (var_5599_cast_fp16_18, var_5678_cast_fp16))[name = tensor("op_5717_cast_fp16")]; tensor var_5719_equation_0 = const()[name = tensor("op_5719_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5719_cast_fp16 = einsum(equation = var_5719_equation_0, values = (var_5599_cast_fp16_19, var_5679_cast_fp16))[name = tensor("op_5719_cast_fp16")]; tensor input_205_interleave_0 = const()[name = tensor("input_205_interleave_0"), val = tensor(false)]; tensor input_205_cast_fp16 = concat(axis = var_5504, interleave = input_205_interleave_0, values = (var_5681_cast_fp16, var_5683_cast_fp16, var_5685_cast_fp16, var_5687_cast_fp16, var_5689_cast_fp16, var_5691_cast_fp16, var_5693_cast_fp16, var_5695_cast_fp16, var_5697_cast_fp16, var_5699_cast_fp16, var_5701_cast_fp16, var_5703_cast_fp16, var_5705_cast_fp16, var_5707_cast_fp16, var_5709_cast_fp16, var_5711_cast_fp16, var_5713_cast_fp16, var_5715_cast_fp16, var_5717_cast_fp16, var_5719_cast_fp16))[name = tensor("input_205_cast_fp16")]; tensor var_5728_pad_type_0 = const()[name = tensor("op_5728_pad_type_0"), val = tensor("valid")]; tensor var_5728_strides_0 = const()[name = tensor("op_5728_strides_0"), val = tensor([1, 1])]; tensor var_5728_pad_0 = const()[name = tensor("op_5728_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5728_dilations_0 = const()[name = tensor("op_5728_dilations_0"), val = tensor([1, 1])]; tensor var_5728_groups_0 = const()[name = tensor("op_5728_groups_0"), val = tensor(1)]; tensor blocks_20_attn_out_weight_to_fp16 = const()[name = tensor("blocks_20_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(811565632)))]; tensor blocks_20_attn_out_bias_to_fp16 = const()[name = tensor("blocks_20_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814842496)))]; tensor var_5728_cast_fp16 = conv(bias = blocks_20_attn_out_bias_to_fp16, dilations = var_5728_dilations_0, groups = var_5728_groups_0, pad = var_5728_pad_0, pad_type = var_5728_pad_type_0, strides = var_5728_strides_0, weight = blocks_20_attn_out_weight_to_fp16, x = input_205_cast_fp16)[name = tensor("op_5728_cast_fp16")]; tensor inputs_83_cast_fp16 = add(x = inputs_81_cast_fp16, y = var_5728_cast_fp16)[name = tensor("inputs_83_cast_fp16")]; tensor input_207_axes_0 = const()[name = tensor("input_207_axes_0"), val = tensor([1])]; tensor input_207_gamma_0_to_fp16 = const()[name = tensor("input_207_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814845120)))]; tensor input_207_beta_0_to_fp16 = const()[name = tensor("input_207_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814847744)))]; tensor var_5738_to_fp16 = const()[name = tensor("op_5738_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_207_cast_fp16 = layer_norm(axes = input_207_axes_0, beta = input_207_beta_0_to_fp16, epsilon = var_5738_to_fp16, gamma = input_207_gamma_0_to_fp16, x = inputs_83_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor input_209_pad_type_0 = const()[name = tensor("input_209_pad_type_0"), val = tensor("valid")]; tensor input_209_strides_0 = const()[name = tensor("input_209_strides_0"), val = tensor([1, 1])]; tensor input_209_pad_0 = const()[name = tensor("input_209_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_209_dilations_0 = const()[name = tensor("input_209_dilations_0"), val = tensor([1, 1])]; tensor input_209_groups_0 = const()[name = tensor("input_209_groups_0"), val = tensor(1)]; tensor blocks_20_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_20_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(814850368)))]; tensor blocks_20_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_20_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(827957632)))]; tensor input_209_cast_fp16 = conv(bias = blocks_20_mlp_0_bias_to_fp16, dilations = input_209_dilations_0, groups = input_209_groups_0, pad = input_209_pad_0, pad_type = input_209_pad_type_0, strides = input_209_strides_0, weight = blocks_20_mlp_0_weight_to_fp16, x = input_207_cast_fp16)[name = tensor("input_209_cast_fp16")]; tensor input_211_mode_0 = const()[name = tensor("input_211_mode_0"), val = tensor("EXACT")]; tensor input_211_cast_fp16 = gelu(mode = input_211_mode_0, x = input_209_cast_fp16)[name = tensor("input_211_cast_fp16")]; tensor var_5764_pad_type_0 = const()[name = tensor("op_5764_pad_type_0"), val = tensor("valid")]; tensor var_5764_strides_0 = const()[name = tensor("op_5764_strides_0"), val = tensor([1, 1])]; tensor var_5764_pad_0 = const()[name = tensor("op_5764_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5764_dilations_0 = const()[name = tensor("op_5764_dilations_0"), val = tensor([1, 1])]; tensor var_5764_groups_0 = const()[name = tensor("op_5764_groups_0"), val = tensor(1)]; tensor blocks_20_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_20_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(827967936)))]; tensor blocks_20_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_20_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841075200)))]; tensor var_5764_cast_fp16 = conv(bias = blocks_20_mlp_2_bias_to_fp16, dilations = var_5764_dilations_0, groups = var_5764_groups_0, pad = var_5764_pad_0, pad_type = var_5764_pad_type_0, strides = var_5764_strides_0, weight = blocks_20_mlp_2_weight_to_fp16, x = input_211_cast_fp16)[name = tensor("op_5764_cast_fp16")]; tensor inputs_85_cast_fp16 = add(x = inputs_83_cast_fp16, y = var_5764_cast_fp16)[name = tensor("inputs_85_cast_fp16")]; tensor var_5773 = const()[name = tensor("op_5773"), val = tensor(1)]; tensor input_213_axes_0 = const()[name = tensor("input_213_axes_0"), val = tensor([1])]; tensor input_213_gamma_0_to_fp16 = const()[name = tensor("input_213_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841077824)))]; tensor input_213_beta_0_to_fp16 = const()[name = tensor("input_213_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841080448)))]; tensor var_5789_to_fp16 = const()[name = tensor("op_5789_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_213_cast_fp16 = layer_norm(axes = input_213_axes_0, beta = input_213_beta_0_to_fp16, epsilon = var_5789_to_fp16, gamma = input_213_gamma_0_to_fp16, x = inputs_85_cast_fp16)[name = tensor("input_213_cast_fp16")]; tensor q_43_pad_type_0 = const()[name = tensor("q_43_pad_type_0"), val = tensor("valid")]; tensor q_43_strides_0 = const()[name = tensor("q_43_strides_0"), val = tensor([1, 1])]; tensor q_43_pad_0 = const()[name = tensor("q_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_43_dilations_0 = const()[name = tensor("q_43_dilations_0"), val = tensor([1, 1])]; tensor q_43_groups_0 = const()[name = tensor("q_43_groups_0"), val = tensor(1)]; tensor var_5824_weight_0_to_fp16 = const()[name = tensor("op_5824_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841083072)))]; tensor var_5824_bias_0_to_fp16 = const()[name = tensor("op_5824_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844359936)))]; tensor var_5824_cast_fp16 = conv(bias = var_5824_bias_0_to_fp16, dilations = q_43_dilations_0, groups = q_43_groups_0, pad = q_43_pad_0, pad_type = q_43_pad_type_0, strides = q_43_strides_0, weight = var_5824_weight_0_to_fp16, x = input_213_cast_fp16)[name = tensor("op_5824_cast_fp16")]; tensor k_43_pad_type_0 = const()[name = tensor("k_43_pad_type_0"), val = tensor("valid")]; tensor k_43_strides_0 = const()[name = tensor("k_43_strides_0"), val = tensor([1, 1])]; tensor k_43_pad_0 = const()[name = tensor("k_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_43_dilations_0 = const()[name = tensor("k_43_dilations_0"), val = tensor([1, 1])]; tensor k_43_groups_0 = const()[name = tensor("k_43_groups_0"), val = tensor(1)]; tensor blocks_21_attn_key_weight_to_fp16 = const()[name = tensor("blocks_21_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844362560)))]; tensor k_43_cast_fp16 = conv(dilations = k_43_dilations_0, groups = k_43_groups_0, pad = k_43_pad_0, pad_type = k_43_pad_type_0, strides = k_43_strides_0, weight = blocks_21_attn_key_weight_to_fp16, x = input_213_cast_fp16)[name = tensor("k_43_cast_fp16")]; tensor var_5822_pad_type_0 = const()[name = tensor("op_5822_pad_type_0"), val = tensor("valid")]; tensor var_5822_strides_0 = const()[name = tensor("op_5822_strides_0"), val = tensor([1, 1])]; tensor var_5822_pad_0 = const()[name = tensor("op_5822_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5822_dilations_0 = const()[name = tensor("op_5822_dilations_0"), val = tensor([1, 1])]; tensor var_5822_groups_0 = const()[name = tensor("op_5822_groups_0"), val = tensor(1)]; tensor blocks_21_attn_value_weight_to_fp16 = const()[name = tensor("blocks_21_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(847639424)))]; tensor blocks_21_attn_value_bias_to_fp16 = const()[name = tensor("blocks_21_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(850916288)))]; tensor var_5822_cast_fp16 = conv(bias = blocks_21_attn_value_bias_to_fp16, dilations = var_5822_dilations_0, groups = var_5822_groups_0, pad = var_5822_pad_0, pad_type = var_5822_pad_type_0, strides = var_5822_strides_0, weight = blocks_21_attn_value_weight_to_fp16, x = input_213_cast_fp16)[name = tensor("op_5822_cast_fp16")]; tensor tile_63 = const()[name = tensor("tile_63"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5825_axis_0 = const()[name = tensor("op_5825_axis_0"), val = tensor(1)]; tensor var_5825_cast_fp16_0, tensor var_5825_cast_fp16_1, tensor var_5825_cast_fp16_2, tensor var_5825_cast_fp16_3, tensor var_5825_cast_fp16_4, tensor var_5825_cast_fp16_5, tensor var_5825_cast_fp16_6, tensor var_5825_cast_fp16_7, tensor var_5825_cast_fp16_8, tensor var_5825_cast_fp16_9, tensor var_5825_cast_fp16_10, tensor var_5825_cast_fp16_11, tensor var_5825_cast_fp16_12, tensor var_5825_cast_fp16_13, tensor var_5825_cast_fp16_14, tensor var_5825_cast_fp16_15, tensor var_5825_cast_fp16_16, tensor var_5825_cast_fp16_17, tensor var_5825_cast_fp16_18, tensor var_5825_cast_fp16_19 = split(axis = var_5825_axis_0, split_sizes = tile_63, x = var_5824_cast_fp16)[name = tensor("op_5825_cast_fp16")]; tensor var_5846_perm_0 = const()[name = tensor("op_5846_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_64 = const()[name = tensor("tile_64"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5847_axis_0 = const()[name = tensor("op_5847_axis_0"), val = tensor(3)]; tensor var_5846_cast_fp16 = transpose(perm = var_5846_perm_0, x = k_43_cast_fp16)[name = tensor("transpose_11")]; tensor var_5847_cast_fp16_0, tensor var_5847_cast_fp16_1, tensor var_5847_cast_fp16_2, tensor var_5847_cast_fp16_3, tensor var_5847_cast_fp16_4, tensor var_5847_cast_fp16_5, tensor var_5847_cast_fp16_6, tensor var_5847_cast_fp16_7, tensor var_5847_cast_fp16_8, tensor var_5847_cast_fp16_9, tensor var_5847_cast_fp16_10, tensor var_5847_cast_fp16_11, tensor var_5847_cast_fp16_12, tensor var_5847_cast_fp16_13, tensor var_5847_cast_fp16_14, tensor var_5847_cast_fp16_15, tensor var_5847_cast_fp16_16, tensor var_5847_cast_fp16_17, tensor var_5847_cast_fp16_18, tensor var_5847_cast_fp16_19 = split(axis = var_5847_axis_0, split_sizes = tile_64, x = var_5846_cast_fp16)[name = tensor("op_5847_cast_fp16")]; tensor tile_65 = const()[name = tensor("tile_65"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_5868_axis_0 = const()[name = tensor("op_5868_axis_0"), val = tensor(1)]; tensor var_5868_cast_fp16_0, tensor var_5868_cast_fp16_1, tensor var_5868_cast_fp16_2, tensor var_5868_cast_fp16_3, tensor var_5868_cast_fp16_4, tensor var_5868_cast_fp16_5, tensor var_5868_cast_fp16_6, tensor var_5868_cast_fp16_7, tensor var_5868_cast_fp16_8, tensor var_5868_cast_fp16_9, tensor var_5868_cast_fp16_10, tensor var_5868_cast_fp16_11, tensor var_5868_cast_fp16_12, tensor var_5868_cast_fp16_13, tensor var_5868_cast_fp16_14, tensor var_5868_cast_fp16_15, tensor var_5868_cast_fp16_16, tensor var_5868_cast_fp16_17, tensor var_5868_cast_fp16_18, tensor var_5868_cast_fp16_19 = split(axis = var_5868_axis_0, split_sizes = tile_65, x = var_5822_cast_fp16)[name = tensor("op_5868_cast_fp16")]; tensor aw_841_equation_0 = const()[name = tensor("aw_841_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_841_cast_fp16 = einsum(equation = aw_841_equation_0, values = (var_5847_cast_fp16_0, var_5825_cast_fp16_0))[name = tensor("aw_841_cast_fp16")]; tensor aw_843_equation_0 = const()[name = tensor("aw_843_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_843_cast_fp16 = einsum(equation = aw_843_equation_0, values = (var_5847_cast_fp16_1, var_5825_cast_fp16_1))[name = tensor("aw_843_cast_fp16")]; tensor aw_845_equation_0 = const()[name = tensor("aw_845_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_845_cast_fp16 = einsum(equation = aw_845_equation_0, values = (var_5847_cast_fp16_2, var_5825_cast_fp16_2))[name = tensor("aw_845_cast_fp16")]; tensor aw_847_equation_0 = const()[name = tensor("aw_847_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_847_cast_fp16 = einsum(equation = aw_847_equation_0, values = (var_5847_cast_fp16_3, var_5825_cast_fp16_3))[name = tensor("aw_847_cast_fp16")]; tensor aw_849_equation_0 = const()[name = tensor("aw_849_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_849_cast_fp16 = einsum(equation = aw_849_equation_0, values = (var_5847_cast_fp16_4, var_5825_cast_fp16_4))[name = tensor("aw_849_cast_fp16")]; tensor aw_851_equation_0 = const()[name = tensor("aw_851_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_851_cast_fp16 = einsum(equation = aw_851_equation_0, values = (var_5847_cast_fp16_5, var_5825_cast_fp16_5))[name = tensor("aw_851_cast_fp16")]; tensor aw_853_equation_0 = const()[name = tensor("aw_853_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_853_cast_fp16 = einsum(equation = aw_853_equation_0, values = (var_5847_cast_fp16_6, var_5825_cast_fp16_6))[name = tensor("aw_853_cast_fp16")]; tensor aw_855_equation_0 = const()[name = tensor("aw_855_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_855_cast_fp16 = einsum(equation = aw_855_equation_0, values = (var_5847_cast_fp16_7, var_5825_cast_fp16_7))[name = tensor("aw_855_cast_fp16")]; tensor aw_857_equation_0 = const()[name = tensor("aw_857_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_857_cast_fp16 = einsum(equation = aw_857_equation_0, values = (var_5847_cast_fp16_8, var_5825_cast_fp16_8))[name = tensor("aw_857_cast_fp16")]; tensor aw_859_equation_0 = const()[name = tensor("aw_859_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_859_cast_fp16 = einsum(equation = aw_859_equation_0, values = (var_5847_cast_fp16_9, var_5825_cast_fp16_9))[name = tensor("aw_859_cast_fp16")]; tensor aw_861_equation_0 = const()[name = tensor("aw_861_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_861_cast_fp16 = einsum(equation = aw_861_equation_0, values = (var_5847_cast_fp16_10, var_5825_cast_fp16_10))[name = tensor("aw_861_cast_fp16")]; tensor aw_863_equation_0 = const()[name = tensor("aw_863_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_863_cast_fp16 = einsum(equation = aw_863_equation_0, values = (var_5847_cast_fp16_11, var_5825_cast_fp16_11))[name = tensor("aw_863_cast_fp16")]; tensor aw_865_equation_0 = const()[name = tensor("aw_865_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_865_cast_fp16 = einsum(equation = aw_865_equation_0, values = (var_5847_cast_fp16_12, var_5825_cast_fp16_12))[name = tensor("aw_865_cast_fp16")]; tensor aw_867_equation_0 = const()[name = tensor("aw_867_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_867_cast_fp16 = einsum(equation = aw_867_equation_0, values = (var_5847_cast_fp16_13, var_5825_cast_fp16_13))[name = tensor("aw_867_cast_fp16")]; tensor aw_869_equation_0 = const()[name = tensor("aw_869_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_869_cast_fp16 = einsum(equation = aw_869_equation_0, values = (var_5847_cast_fp16_14, var_5825_cast_fp16_14))[name = tensor("aw_869_cast_fp16")]; tensor aw_871_equation_0 = const()[name = tensor("aw_871_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_871_cast_fp16 = einsum(equation = aw_871_equation_0, values = (var_5847_cast_fp16_15, var_5825_cast_fp16_15))[name = tensor("aw_871_cast_fp16")]; tensor aw_873_equation_0 = const()[name = tensor("aw_873_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_873_cast_fp16 = einsum(equation = aw_873_equation_0, values = (var_5847_cast_fp16_16, var_5825_cast_fp16_16))[name = tensor("aw_873_cast_fp16")]; tensor aw_875_equation_0 = const()[name = tensor("aw_875_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_875_cast_fp16 = einsum(equation = aw_875_equation_0, values = (var_5847_cast_fp16_17, var_5825_cast_fp16_17))[name = tensor("aw_875_cast_fp16")]; tensor aw_877_equation_0 = const()[name = tensor("aw_877_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_877_cast_fp16 = einsum(equation = aw_877_equation_0, values = (var_5847_cast_fp16_18, var_5825_cast_fp16_18))[name = tensor("aw_877_cast_fp16")]; tensor aw_879_equation_0 = const()[name = tensor("aw_879_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_879_cast_fp16 = einsum(equation = aw_879_equation_0, values = (var_5847_cast_fp16_19, var_5825_cast_fp16_19))[name = tensor("aw_879_cast_fp16")]; tensor var_5929_cast_fp16 = softmax(axis = var_5773, x = aw_841_cast_fp16)[name = tensor("op_5929_cast_fp16")]; tensor var_5930_cast_fp16 = softmax(axis = var_5773, x = aw_843_cast_fp16)[name = tensor("op_5930_cast_fp16")]; tensor var_5931_cast_fp16 = softmax(axis = var_5773, x = aw_845_cast_fp16)[name = tensor("op_5931_cast_fp16")]; tensor var_5932_cast_fp16 = softmax(axis = var_5773, x = aw_847_cast_fp16)[name = tensor("op_5932_cast_fp16")]; tensor var_5933_cast_fp16 = softmax(axis = var_5773, x = aw_849_cast_fp16)[name = tensor("op_5933_cast_fp16")]; tensor var_5934_cast_fp16 = softmax(axis = var_5773, x = aw_851_cast_fp16)[name = tensor("op_5934_cast_fp16")]; tensor var_5935_cast_fp16 = softmax(axis = var_5773, x = aw_853_cast_fp16)[name = tensor("op_5935_cast_fp16")]; tensor var_5936_cast_fp16 = softmax(axis = var_5773, x = aw_855_cast_fp16)[name = tensor("op_5936_cast_fp16")]; tensor var_5937_cast_fp16 = softmax(axis = var_5773, x = aw_857_cast_fp16)[name = tensor("op_5937_cast_fp16")]; tensor var_5938_cast_fp16 = softmax(axis = var_5773, x = aw_859_cast_fp16)[name = tensor("op_5938_cast_fp16")]; tensor var_5939_cast_fp16 = softmax(axis = var_5773, x = aw_861_cast_fp16)[name = tensor("op_5939_cast_fp16")]; tensor var_5940_cast_fp16 = softmax(axis = var_5773, x = aw_863_cast_fp16)[name = tensor("op_5940_cast_fp16")]; tensor var_5941_cast_fp16 = softmax(axis = var_5773, x = aw_865_cast_fp16)[name = tensor("op_5941_cast_fp16")]; tensor var_5942_cast_fp16 = softmax(axis = var_5773, x = aw_867_cast_fp16)[name = tensor("op_5942_cast_fp16")]; tensor var_5943_cast_fp16 = softmax(axis = var_5773, x = aw_869_cast_fp16)[name = tensor("op_5943_cast_fp16")]; tensor var_5944_cast_fp16 = softmax(axis = var_5773, x = aw_871_cast_fp16)[name = tensor("op_5944_cast_fp16")]; tensor var_5945_cast_fp16 = softmax(axis = var_5773, x = aw_873_cast_fp16)[name = tensor("op_5945_cast_fp16")]; tensor var_5946_cast_fp16 = softmax(axis = var_5773, x = aw_875_cast_fp16)[name = tensor("op_5946_cast_fp16")]; tensor var_5947_cast_fp16 = softmax(axis = var_5773, x = aw_877_cast_fp16)[name = tensor("op_5947_cast_fp16")]; tensor var_5948_cast_fp16 = softmax(axis = var_5773, x = aw_879_cast_fp16)[name = tensor("op_5948_cast_fp16")]; tensor var_5950_equation_0 = const()[name = tensor("op_5950_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5950_cast_fp16 = einsum(equation = var_5950_equation_0, values = (var_5868_cast_fp16_0, var_5929_cast_fp16))[name = tensor("op_5950_cast_fp16")]; tensor var_5952_equation_0 = const()[name = tensor("op_5952_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5952_cast_fp16 = einsum(equation = var_5952_equation_0, values = (var_5868_cast_fp16_1, var_5930_cast_fp16))[name = tensor("op_5952_cast_fp16")]; tensor var_5954_equation_0 = const()[name = tensor("op_5954_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5954_cast_fp16 = einsum(equation = var_5954_equation_0, values = (var_5868_cast_fp16_2, var_5931_cast_fp16))[name = tensor("op_5954_cast_fp16")]; tensor var_5956_equation_0 = const()[name = tensor("op_5956_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5956_cast_fp16 = einsum(equation = var_5956_equation_0, values = (var_5868_cast_fp16_3, var_5932_cast_fp16))[name = tensor("op_5956_cast_fp16")]; tensor var_5958_equation_0 = const()[name = tensor("op_5958_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5958_cast_fp16 = einsum(equation = var_5958_equation_0, values = (var_5868_cast_fp16_4, var_5933_cast_fp16))[name = tensor("op_5958_cast_fp16")]; tensor var_5960_equation_0 = const()[name = tensor("op_5960_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5960_cast_fp16 = einsum(equation = var_5960_equation_0, values = (var_5868_cast_fp16_5, var_5934_cast_fp16))[name = tensor("op_5960_cast_fp16")]; tensor var_5962_equation_0 = const()[name = tensor("op_5962_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5962_cast_fp16 = einsum(equation = var_5962_equation_0, values = (var_5868_cast_fp16_6, var_5935_cast_fp16))[name = tensor("op_5962_cast_fp16")]; tensor var_5964_equation_0 = const()[name = tensor("op_5964_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5964_cast_fp16 = einsum(equation = var_5964_equation_0, values = (var_5868_cast_fp16_7, var_5936_cast_fp16))[name = tensor("op_5964_cast_fp16")]; tensor var_5966_equation_0 = const()[name = tensor("op_5966_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5966_cast_fp16 = einsum(equation = var_5966_equation_0, values = (var_5868_cast_fp16_8, var_5937_cast_fp16))[name = tensor("op_5966_cast_fp16")]; tensor var_5968_equation_0 = const()[name = tensor("op_5968_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5968_cast_fp16 = einsum(equation = var_5968_equation_0, values = (var_5868_cast_fp16_9, var_5938_cast_fp16))[name = tensor("op_5968_cast_fp16")]; tensor var_5970_equation_0 = const()[name = tensor("op_5970_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5970_cast_fp16 = einsum(equation = var_5970_equation_0, values = (var_5868_cast_fp16_10, var_5939_cast_fp16))[name = tensor("op_5970_cast_fp16")]; tensor var_5972_equation_0 = const()[name = tensor("op_5972_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5972_cast_fp16 = einsum(equation = var_5972_equation_0, values = (var_5868_cast_fp16_11, var_5940_cast_fp16))[name = tensor("op_5972_cast_fp16")]; tensor var_5974_equation_0 = const()[name = tensor("op_5974_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5974_cast_fp16 = einsum(equation = var_5974_equation_0, values = (var_5868_cast_fp16_12, var_5941_cast_fp16))[name = tensor("op_5974_cast_fp16")]; tensor var_5976_equation_0 = const()[name = tensor("op_5976_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5976_cast_fp16 = einsum(equation = var_5976_equation_0, values = (var_5868_cast_fp16_13, var_5942_cast_fp16))[name = tensor("op_5976_cast_fp16")]; tensor var_5978_equation_0 = const()[name = tensor("op_5978_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5978_cast_fp16 = einsum(equation = var_5978_equation_0, values = (var_5868_cast_fp16_14, var_5943_cast_fp16))[name = tensor("op_5978_cast_fp16")]; tensor var_5980_equation_0 = const()[name = tensor("op_5980_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5980_cast_fp16 = einsum(equation = var_5980_equation_0, values = (var_5868_cast_fp16_15, var_5944_cast_fp16))[name = tensor("op_5980_cast_fp16")]; tensor var_5982_equation_0 = const()[name = tensor("op_5982_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5982_cast_fp16 = einsum(equation = var_5982_equation_0, values = (var_5868_cast_fp16_16, var_5945_cast_fp16))[name = tensor("op_5982_cast_fp16")]; tensor var_5984_equation_0 = const()[name = tensor("op_5984_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5984_cast_fp16 = einsum(equation = var_5984_equation_0, values = (var_5868_cast_fp16_17, var_5946_cast_fp16))[name = tensor("op_5984_cast_fp16")]; tensor var_5986_equation_0 = const()[name = tensor("op_5986_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5986_cast_fp16 = einsum(equation = var_5986_equation_0, values = (var_5868_cast_fp16_18, var_5947_cast_fp16))[name = tensor("op_5986_cast_fp16")]; tensor var_5988_equation_0 = const()[name = tensor("op_5988_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5988_cast_fp16 = einsum(equation = var_5988_equation_0, values = (var_5868_cast_fp16_19, var_5948_cast_fp16))[name = tensor("op_5988_cast_fp16")]; tensor input_215_interleave_0 = const()[name = tensor("input_215_interleave_0"), val = tensor(false)]; tensor input_215_cast_fp16 = concat(axis = var_5773, interleave = input_215_interleave_0, values = (var_5950_cast_fp16, var_5952_cast_fp16, var_5954_cast_fp16, var_5956_cast_fp16, var_5958_cast_fp16, var_5960_cast_fp16, var_5962_cast_fp16, var_5964_cast_fp16, var_5966_cast_fp16, var_5968_cast_fp16, var_5970_cast_fp16, var_5972_cast_fp16, var_5974_cast_fp16, var_5976_cast_fp16, var_5978_cast_fp16, var_5980_cast_fp16, var_5982_cast_fp16, var_5984_cast_fp16, var_5986_cast_fp16, var_5988_cast_fp16))[name = tensor("input_215_cast_fp16")]; tensor var_5997_pad_type_0 = const()[name = tensor("op_5997_pad_type_0"), val = tensor("valid")]; tensor var_5997_strides_0 = const()[name = tensor("op_5997_strides_0"), val = tensor([1, 1])]; tensor var_5997_pad_0 = const()[name = tensor("op_5997_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_5997_dilations_0 = const()[name = tensor("op_5997_dilations_0"), val = tensor([1, 1])]; tensor var_5997_groups_0 = const()[name = tensor("op_5997_groups_0"), val = tensor(1)]; tensor blocks_21_attn_out_weight_to_fp16 = const()[name = tensor("blocks_21_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(850918912)))]; tensor blocks_21_attn_out_bias_to_fp16 = const()[name = tensor("blocks_21_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854195776)))]; tensor var_5997_cast_fp16 = conv(bias = blocks_21_attn_out_bias_to_fp16, dilations = var_5997_dilations_0, groups = var_5997_groups_0, pad = var_5997_pad_0, pad_type = var_5997_pad_type_0, strides = var_5997_strides_0, weight = blocks_21_attn_out_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("op_5997_cast_fp16")]; tensor inputs_87_cast_fp16 = add(x = inputs_85_cast_fp16, y = var_5997_cast_fp16)[name = tensor("inputs_87_cast_fp16")]; tensor input_217_axes_0 = const()[name = tensor("input_217_axes_0"), val = tensor([1])]; tensor input_217_gamma_0_to_fp16 = const()[name = tensor("input_217_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854198400)))]; tensor input_217_beta_0_to_fp16 = const()[name = tensor("input_217_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854201024)))]; tensor var_6007_to_fp16 = const()[name = tensor("op_6007_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_217_cast_fp16 = layer_norm(axes = input_217_axes_0, beta = input_217_beta_0_to_fp16, epsilon = var_6007_to_fp16, gamma = input_217_gamma_0_to_fp16, x = inputs_87_cast_fp16)[name = tensor("input_217_cast_fp16")]; tensor input_219_pad_type_0 = const()[name = tensor("input_219_pad_type_0"), val = tensor("valid")]; tensor input_219_strides_0 = const()[name = tensor("input_219_strides_0"), val = tensor([1, 1])]; tensor input_219_pad_0 = const()[name = tensor("input_219_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_219_dilations_0 = const()[name = tensor("input_219_dilations_0"), val = tensor([1, 1])]; tensor input_219_groups_0 = const()[name = tensor("input_219_groups_0"), val = tensor(1)]; tensor blocks_21_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_21_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(854203648)))]; tensor blocks_21_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_21_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(867310912)))]; tensor input_219_cast_fp16 = conv(bias = blocks_21_mlp_0_bias_to_fp16, dilations = input_219_dilations_0, groups = input_219_groups_0, pad = input_219_pad_0, pad_type = input_219_pad_type_0, strides = input_219_strides_0, weight = blocks_21_mlp_0_weight_to_fp16, x = input_217_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor input_221_mode_0 = const()[name = tensor("input_221_mode_0"), val = tensor("EXACT")]; tensor input_221_cast_fp16 = gelu(mode = input_221_mode_0, x = input_219_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor var_6033_pad_type_0 = const()[name = tensor("op_6033_pad_type_0"), val = tensor("valid")]; tensor var_6033_strides_0 = const()[name = tensor("op_6033_strides_0"), val = tensor([1, 1])]; tensor var_6033_pad_0 = const()[name = tensor("op_6033_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6033_dilations_0 = const()[name = tensor("op_6033_dilations_0"), val = tensor([1, 1])]; tensor var_6033_groups_0 = const()[name = tensor("op_6033_groups_0"), val = tensor(1)]; tensor blocks_21_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_21_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(867321216)))]; tensor blocks_21_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_21_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880428480)))]; tensor var_6033_cast_fp16 = conv(bias = blocks_21_mlp_2_bias_to_fp16, dilations = var_6033_dilations_0, groups = var_6033_groups_0, pad = var_6033_pad_0, pad_type = var_6033_pad_type_0, strides = var_6033_strides_0, weight = blocks_21_mlp_2_weight_to_fp16, x = input_221_cast_fp16)[name = tensor("op_6033_cast_fp16")]; tensor inputs_89_cast_fp16 = add(x = inputs_87_cast_fp16, y = var_6033_cast_fp16)[name = tensor("inputs_89_cast_fp16")]; tensor var_6042 = const()[name = tensor("op_6042"), val = tensor(1)]; tensor input_223_axes_0 = const()[name = tensor("input_223_axes_0"), val = tensor([1])]; tensor input_223_gamma_0_to_fp16 = const()[name = tensor("input_223_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880431104)))]; tensor input_223_beta_0_to_fp16 = const()[name = tensor("input_223_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880433728)))]; tensor var_6058_to_fp16 = const()[name = tensor("op_6058_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_223_cast_fp16 = layer_norm(axes = input_223_axes_0, beta = input_223_beta_0_to_fp16, epsilon = var_6058_to_fp16, gamma = input_223_gamma_0_to_fp16, x = inputs_89_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor q_45_pad_type_0 = const()[name = tensor("q_45_pad_type_0"), val = tensor("valid")]; tensor q_45_strides_0 = const()[name = tensor("q_45_strides_0"), val = tensor([1, 1])]; tensor q_45_pad_0 = const()[name = tensor("q_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_45_dilations_0 = const()[name = tensor("q_45_dilations_0"), val = tensor([1, 1])]; tensor q_45_groups_0 = const()[name = tensor("q_45_groups_0"), val = tensor(1)]; tensor var_6093_weight_0_to_fp16 = const()[name = tensor("op_6093_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880436352)))]; tensor var_6093_bias_0_to_fp16 = const()[name = tensor("op_6093_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883713216)))]; tensor var_6093_cast_fp16 = conv(bias = var_6093_bias_0_to_fp16, dilations = q_45_dilations_0, groups = q_45_groups_0, pad = q_45_pad_0, pad_type = q_45_pad_type_0, strides = q_45_strides_0, weight = var_6093_weight_0_to_fp16, x = input_223_cast_fp16)[name = tensor("op_6093_cast_fp16")]; tensor k_45_pad_type_0 = const()[name = tensor("k_45_pad_type_0"), val = tensor("valid")]; tensor k_45_strides_0 = const()[name = tensor("k_45_strides_0"), val = tensor([1, 1])]; tensor k_45_pad_0 = const()[name = tensor("k_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_45_dilations_0 = const()[name = tensor("k_45_dilations_0"), val = tensor([1, 1])]; tensor k_45_groups_0 = const()[name = tensor("k_45_groups_0"), val = tensor(1)]; tensor blocks_22_attn_key_weight_to_fp16 = const()[name = tensor("blocks_22_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883715840)))]; tensor k_45_cast_fp16 = conv(dilations = k_45_dilations_0, groups = k_45_groups_0, pad = k_45_pad_0, pad_type = k_45_pad_type_0, strides = k_45_strides_0, weight = blocks_22_attn_key_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("k_45_cast_fp16")]; tensor var_6091_pad_type_0 = const()[name = tensor("op_6091_pad_type_0"), val = tensor("valid")]; tensor var_6091_strides_0 = const()[name = tensor("op_6091_strides_0"), val = tensor([1, 1])]; tensor var_6091_pad_0 = const()[name = tensor("op_6091_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6091_dilations_0 = const()[name = tensor("op_6091_dilations_0"), val = tensor([1, 1])]; tensor var_6091_groups_0 = const()[name = tensor("op_6091_groups_0"), val = tensor(1)]; tensor blocks_22_attn_value_weight_to_fp16 = const()[name = tensor("blocks_22_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(886992704)))]; tensor blocks_22_attn_value_bias_to_fp16 = const()[name = tensor("blocks_22_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(890269568)))]; tensor var_6091_cast_fp16 = conv(bias = blocks_22_attn_value_bias_to_fp16, dilations = var_6091_dilations_0, groups = var_6091_groups_0, pad = var_6091_pad_0, pad_type = var_6091_pad_type_0, strides = var_6091_strides_0, weight = blocks_22_attn_value_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("op_6091_cast_fp16")]; tensor tile_66 = const()[name = tensor("tile_66"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6094_axis_0 = const()[name = tensor("op_6094_axis_0"), val = tensor(1)]; tensor var_6094_cast_fp16_0, tensor var_6094_cast_fp16_1, tensor var_6094_cast_fp16_2, tensor var_6094_cast_fp16_3, tensor var_6094_cast_fp16_4, tensor var_6094_cast_fp16_5, tensor var_6094_cast_fp16_6, tensor var_6094_cast_fp16_7, tensor var_6094_cast_fp16_8, tensor var_6094_cast_fp16_9, tensor var_6094_cast_fp16_10, tensor var_6094_cast_fp16_11, tensor var_6094_cast_fp16_12, tensor var_6094_cast_fp16_13, tensor var_6094_cast_fp16_14, tensor var_6094_cast_fp16_15, tensor var_6094_cast_fp16_16, tensor var_6094_cast_fp16_17, tensor var_6094_cast_fp16_18, tensor var_6094_cast_fp16_19 = split(axis = var_6094_axis_0, split_sizes = tile_66, x = var_6093_cast_fp16)[name = tensor("op_6094_cast_fp16")]; tensor var_6115_perm_0 = const()[name = tensor("op_6115_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_67 = const()[name = tensor("tile_67"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6116_axis_0 = const()[name = tensor("op_6116_axis_0"), val = tensor(3)]; tensor var_6115_cast_fp16 = transpose(perm = var_6115_perm_0, x = k_45_cast_fp16)[name = tensor("transpose_10")]; tensor var_6116_cast_fp16_0, tensor var_6116_cast_fp16_1, tensor var_6116_cast_fp16_2, tensor var_6116_cast_fp16_3, tensor var_6116_cast_fp16_4, tensor var_6116_cast_fp16_5, tensor var_6116_cast_fp16_6, tensor var_6116_cast_fp16_7, tensor var_6116_cast_fp16_8, tensor var_6116_cast_fp16_9, tensor var_6116_cast_fp16_10, tensor var_6116_cast_fp16_11, tensor var_6116_cast_fp16_12, tensor var_6116_cast_fp16_13, tensor var_6116_cast_fp16_14, tensor var_6116_cast_fp16_15, tensor var_6116_cast_fp16_16, tensor var_6116_cast_fp16_17, tensor var_6116_cast_fp16_18, tensor var_6116_cast_fp16_19 = split(axis = var_6116_axis_0, split_sizes = tile_67, x = var_6115_cast_fp16)[name = tensor("op_6116_cast_fp16")]; tensor tile_68 = const()[name = tensor("tile_68"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6137_axis_0 = const()[name = tensor("op_6137_axis_0"), val = tensor(1)]; tensor var_6137_cast_fp16_0, tensor var_6137_cast_fp16_1, tensor var_6137_cast_fp16_2, tensor var_6137_cast_fp16_3, tensor var_6137_cast_fp16_4, tensor var_6137_cast_fp16_5, tensor var_6137_cast_fp16_6, tensor var_6137_cast_fp16_7, tensor var_6137_cast_fp16_8, tensor var_6137_cast_fp16_9, tensor var_6137_cast_fp16_10, tensor var_6137_cast_fp16_11, tensor var_6137_cast_fp16_12, tensor var_6137_cast_fp16_13, tensor var_6137_cast_fp16_14, tensor var_6137_cast_fp16_15, tensor var_6137_cast_fp16_16, tensor var_6137_cast_fp16_17, tensor var_6137_cast_fp16_18, tensor var_6137_cast_fp16_19 = split(axis = var_6137_axis_0, split_sizes = tile_68, x = var_6091_cast_fp16)[name = tensor("op_6137_cast_fp16")]; tensor aw_881_equation_0 = const()[name = tensor("aw_881_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_881_cast_fp16 = einsum(equation = aw_881_equation_0, values = (var_6116_cast_fp16_0, var_6094_cast_fp16_0))[name = tensor("aw_881_cast_fp16")]; tensor aw_883_equation_0 = const()[name = tensor("aw_883_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_883_cast_fp16 = einsum(equation = aw_883_equation_0, values = (var_6116_cast_fp16_1, var_6094_cast_fp16_1))[name = tensor("aw_883_cast_fp16")]; tensor aw_885_equation_0 = const()[name = tensor("aw_885_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_885_cast_fp16 = einsum(equation = aw_885_equation_0, values = (var_6116_cast_fp16_2, var_6094_cast_fp16_2))[name = tensor("aw_885_cast_fp16")]; tensor aw_887_equation_0 = const()[name = tensor("aw_887_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_887_cast_fp16 = einsum(equation = aw_887_equation_0, values = (var_6116_cast_fp16_3, var_6094_cast_fp16_3))[name = tensor("aw_887_cast_fp16")]; tensor aw_889_equation_0 = const()[name = tensor("aw_889_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_889_cast_fp16 = einsum(equation = aw_889_equation_0, values = (var_6116_cast_fp16_4, var_6094_cast_fp16_4))[name = tensor("aw_889_cast_fp16")]; tensor aw_891_equation_0 = const()[name = tensor("aw_891_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_891_cast_fp16 = einsum(equation = aw_891_equation_0, values = (var_6116_cast_fp16_5, var_6094_cast_fp16_5))[name = tensor("aw_891_cast_fp16")]; tensor aw_893_equation_0 = const()[name = tensor("aw_893_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_893_cast_fp16 = einsum(equation = aw_893_equation_0, values = (var_6116_cast_fp16_6, var_6094_cast_fp16_6))[name = tensor("aw_893_cast_fp16")]; tensor aw_895_equation_0 = const()[name = tensor("aw_895_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_895_cast_fp16 = einsum(equation = aw_895_equation_0, values = (var_6116_cast_fp16_7, var_6094_cast_fp16_7))[name = tensor("aw_895_cast_fp16")]; tensor aw_897_equation_0 = const()[name = tensor("aw_897_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_897_cast_fp16 = einsum(equation = aw_897_equation_0, values = (var_6116_cast_fp16_8, var_6094_cast_fp16_8))[name = tensor("aw_897_cast_fp16")]; tensor aw_899_equation_0 = const()[name = tensor("aw_899_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_899_cast_fp16 = einsum(equation = aw_899_equation_0, values = (var_6116_cast_fp16_9, var_6094_cast_fp16_9))[name = tensor("aw_899_cast_fp16")]; tensor aw_901_equation_0 = const()[name = tensor("aw_901_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_901_cast_fp16 = einsum(equation = aw_901_equation_0, values = (var_6116_cast_fp16_10, var_6094_cast_fp16_10))[name = tensor("aw_901_cast_fp16")]; tensor aw_903_equation_0 = const()[name = tensor("aw_903_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_903_cast_fp16 = einsum(equation = aw_903_equation_0, values = (var_6116_cast_fp16_11, var_6094_cast_fp16_11))[name = tensor("aw_903_cast_fp16")]; tensor aw_905_equation_0 = const()[name = tensor("aw_905_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_905_cast_fp16 = einsum(equation = aw_905_equation_0, values = (var_6116_cast_fp16_12, var_6094_cast_fp16_12))[name = tensor("aw_905_cast_fp16")]; tensor aw_907_equation_0 = const()[name = tensor("aw_907_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_907_cast_fp16 = einsum(equation = aw_907_equation_0, values = (var_6116_cast_fp16_13, var_6094_cast_fp16_13))[name = tensor("aw_907_cast_fp16")]; tensor aw_909_equation_0 = const()[name = tensor("aw_909_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_909_cast_fp16 = einsum(equation = aw_909_equation_0, values = (var_6116_cast_fp16_14, var_6094_cast_fp16_14))[name = tensor("aw_909_cast_fp16")]; tensor aw_911_equation_0 = const()[name = tensor("aw_911_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_911_cast_fp16 = einsum(equation = aw_911_equation_0, values = (var_6116_cast_fp16_15, var_6094_cast_fp16_15))[name = tensor("aw_911_cast_fp16")]; tensor aw_913_equation_0 = const()[name = tensor("aw_913_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_913_cast_fp16 = einsum(equation = aw_913_equation_0, values = (var_6116_cast_fp16_16, var_6094_cast_fp16_16))[name = tensor("aw_913_cast_fp16")]; tensor aw_915_equation_0 = const()[name = tensor("aw_915_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_915_cast_fp16 = einsum(equation = aw_915_equation_0, values = (var_6116_cast_fp16_17, var_6094_cast_fp16_17))[name = tensor("aw_915_cast_fp16")]; tensor aw_917_equation_0 = const()[name = tensor("aw_917_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_917_cast_fp16 = einsum(equation = aw_917_equation_0, values = (var_6116_cast_fp16_18, var_6094_cast_fp16_18))[name = tensor("aw_917_cast_fp16")]; tensor aw_919_equation_0 = const()[name = tensor("aw_919_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_919_cast_fp16 = einsum(equation = aw_919_equation_0, values = (var_6116_cast_fp16_19, var_6094_cast_fp16_19))[name = tensor("aw_919_cast_fp16")]; tensor var_6198_cast_fp16 = softmax(axis = var_6042, x = aw_881_cast_fp16)[name = tensor("op_6198_cast_fp16")]; tensor var_6199_cast_fp16 = softmax(axis = var_6042, x = aw_883_cast_fp16)[name = tensor("op_6199_cast_fp16")]; tensor var_6200_cast_fp16 = softmax(axis = var_6042, x = aw_885_cast_fp16)[name = tensor("op_6200_cast_fp16")]; tensor var_6201_cast_fp16 = softmax(axis = var_6042, x = aw_887_cast_fp16)[name = tensor("op_6201_cast_fp16")]; tensor var_6202_cast_fp16 = softmax(axis = var_6042, x = aw_889_cast_fp16)[name = tensor("op_6202_cast_fp16")]; tensor var_6203_cast_fp16 = softmax(axis = var_6042, x = aw_891_cast_fp16)[name = tensor("op_6203_cast_fp16")]; tensor var_6204_cast_fp16 = softmax(axis = var_6042, x = aw_893_cast_fp16)[name = tensor("op_6204_cast_fp16")]; tensor var_6205_cast_fp16 = softmax(axis = var_6042, x = aw_895_cast_fp16)[name = tensor("op_6205_cast_fp16")]; tensor var_6206_cast_fp16 = softmax(axis = var_6042, x = aw_897_cast_fp16)[name = tensor("op_6206_cast_fp16")]; tensor var_6207_cast_fp16 = softmax(axis = var_6042, x = aw_899_cast_fp16)[name = tensor("op_6207_cast_fp16")]; tensor var_6208_cast_fp16 = softmax(axis = var_6042, x = aw_901_cast_fp16)[name = tensor("op_6208_cast_fp16")]; tensor var_6209_cast_fp16 = softmax(axis = var_6042, x = aw_903_cast_fp16)[name = tensor("op_6209_cast_fp16")]; tensor var_6210_cast_fp16 = softmax(axis = var_6042, x = aw_905_cast_fp16)[name = tensor("op_6210_cast_fp16")]; tensor var_6211_cast_fp16 = softmax(axis = var_6042, x = aw_907_cast_fp16)[name = tensor("op_6211_cast_fp16")]; tensor var_6212_cast_fp16 = softmax(axis = var_6042, x = aw_909_cast_fp16)[name = tensor("op_6212_cast_fp16")]; tensor var_6213_cast_fp16 = softmax(axis = var_6042, x = aw_911_cast_fp16)[name = tensor("op_6213_cast_fp16")]; tensor var_6214_cast_fp16 = softmax(axis = var_6042, x = aw_913_cast_fp16)[name = tensor("op_6214_cast_fp16")]; tensor var_6215_cast_fp16 = softmax(axis = var_6042, x = aw_915_cast_fp16)[name = tensor("op_6215_cast_fp16")]; tensor var_6216_cast_fp16 = softmax(axis = var_6042, x = aw_917_cast_fp16)[name = tensor("op_6216_cast_fp16")]; tensor var_6217_cast_fp16 = softmax(axis = var_6042, x = aw_919_cast_fp16)[name = tensor("op_6217_cast_fp16")]; tensor var_6219_equation_0 = const()[name = tensor("op_6219_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6219_cast_fp16 = einsum(equation = var_6219_equation_0, values = (var_6137_cast_fp16_0, var_6198_cast_fp16))[name = tensor("op_6219_cast_fp16")]; tensor var_6221_equation_0 = const()[name = tensor("op_6221_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6221_cast_fp16 = einsum(equation = var_6221_equation_0, values = (var_6137_cast_fp16_1, var_6199_cast_fp16))[name = tensor("op_6221_cast_fp16")]; tensor var_6223_equation_0 = const()[name = tensor("op_6223_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6223_cast_fp16 = einsum(equation = var_6223_equation_0, values = (var_6137_cast_fp16_2, var_6200_cast_fp16))[name = tensor("op_6223_cast_fp16")]; tensor var_6225_equation_0 = const()[name = tensor("op_6225_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6225_cast_fp16 = einsum(equation = var_6225_equation_0, values = (var_6137_cast_fp16_3, var_6201_cast_fp16))[name = tensor("op_6225_cast_fp16")]; tensor var_6227_equation_0 = const()[name = tensor("op_6227_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6227_cast_fp16 = einsum(equation = var_6227_equation_0, values = (var_6137_cast_fp16_4, var_6202_cast_fp16))[name = tensor("op_6227_cast_fp16")]; tensor var_6229_equation_0 = const()[name = tensor("op_6229_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6229_cast_fp16 = einsum(equation = var_6229_equation_0, values = (var_6137_cast_fp16_5, var_6203_cast_fp16))[name = tensor("op_6229_cast_fp16")]; tensor var_6231_equation_0 = const()[name = tensor("op_6231_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6231_cast_fp16 = einsum(equation = var_6231_equation_0, values = (var_6137_cast_fp16_6, var_6204_cast_fp16))[name = tensor("op_6231_cast_fp16")]; tensor var_6233_equation_0 = const()[name = tensor("op_6233_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6233_cast_fp16 = einsum(equation = var_6233_equation_0, values = (var_6137_cast_fp16_7, var_6205_cast_fp16))[name = tensor("op_6233_cast_fp16")]; tensor var_6235_equation_0 = const()[name = tensor("op_6235_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6235_cast_fp16 = einsum(equation = var_6235_equation_0, values = (var_6137_cast_fp16_8, var_6206_cast_fp16))[name = tensor("op_6235_cast_fp16")]; tensor var_6237_equation_0 = const()[name = tensor("op_6237_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6237_cast_fp16 = einsum(equation = var_6237_equation_0, values = (var_6137_cast_fp16_9, var_6207_cast_fp16))[name = tensor("op_6237_cast_fp16")]; tensor var_6239_equation_0 = const()[name = tensor("op_6239_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6239_cast_fp16 = einsum(equation = var_6239_equation_0, values = (var_6137_cast_fp16_10, var_6208_cast_fp16))[name = tensor("op_6239_cast_fp16")]; tensor var_6241_equation_0 = const()[name = tensor("op_6241_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6241_cast_fp16 = einsum(equation = var_6241_equation_0, values = (var_6137_cast_fp16_11, var_6209_cast_fp16))[name = tensor("op_6241_cast_fp16")]; tensor var_6243_equation_0 = const()[name = tensor("op_6243_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6243_cast_fp16 = einsum(equation = var_6243_equation_0, values = (var_6137_cast_fp16_12, var_6210_cast_fp16))[name = tensor("op_6243_cast_fp16")]; tensor var_6245_equation_0 = const()[name = tensor("op_6245_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6245_cast_fp16 = einsum(equation = var_6245_equation_0, values = (var_6137_cast_fp16_13, var_6211_cast_fp16))[name = tensor("op_6245_cast_fp16")]; tensor var_6247_equation_0 = const()[name = tensor("op_6247_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6247_cast_fp16 = einsum(equation = var_6247_equation_0, values = (var_6137_cast_fp16_14, var_6212_cast_fp16))[name = tensor("op_6247_cast_fp16")]; tensor var_6249_equation_0 = const()[name = tensor("op_6249_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6249_cast_fp16 = einsum(equation = var_6249_equation_0, values = (var_6137_cast_fp16_15, var_6213_cast_fp16))[name = tensor("op_6249_cast_fp16")]; tensor var_6251_equation_0 = const()[name = tensor("op_6251_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6251_cast_fp16 = einsum(equation = var_6251_equation_0, values = (var_6137_cast_fp16_16, var_6214_cast_fp16))[name = tensor("op_6251_cast_fp16")]; tensor var_6253_equation_0 = const()[name = tensor("op_6253_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6253_cast_fp16 = einsum(equation = var_6253_equation_0, values = (var_6137_cast_fp16_17, var_6215_cast_fp16))[name = tensor("op_6253_cast_fp16")]; tensor var_6255_equation_0 = const()[name = tensor("op_6255_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6255_cast_fp16 = einsum(equation = var_6255_equation_0, values = (var_6137_cast_fp16_18, var_6216_cast_fp16))[name = tensor("op_6255_cast_fp16")]; tensor var_6257_equation_0 = const()[name = tensor("op_6257_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6257_cast_fp16 = einsum(equation = var_6257_equation_0, values = (var_6137_cast_fp16_19, var_6217_cast_fp16))[name = tensor("op_6257_cast_fp16")]; tensor input_225_interleave_0 = const()[name = tensor("input_225_interleave_0"), val = tensor(false)]; tensor input_225_cast_fp16 = concat(axis = var_6042, interleave = input_225_interleave_0, values = (var_6219_cast_fp16, var_6221_cast_fp16, var_6223_cast_fp16, var_6225_cast_fp16, var_6227_cast_fp16, var_6229_cast_fp16, var_6231_cast_fp16, var_6233_cast_fp16, var_6235_cast_fp16, var_6237_cast_fp16, var_6239_cast_fp16, var_6241_cast_fp16, var_6243_cast_fp16, var_6245_cast_fp16, var_6247_cast_fp16, var_6249_cast_fp16, var_6251_cast_fp16, var_6253_cast_fp16, var_6255_cast_fp16, var_6257_cast_fp16))[name = tensor("input_225_cast_fp16")]; tensor var_6266_pad_type_0 = const()[name = tensor("op_6266_pad_type_0"), val = tensor("valid")]; tensor var_6266_strides_0 = const()[name = tensor("op_6266_strides_0"), val = tensor([1, 1])]; tensor var_6266_pad_0 = const()[name = tensor("op_6266_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6266_dilations_0 = const()[name = tensor("op_6266_dilations_0"), val = tensor([1, 1])]; tensor var_6266_groups_0 = const()[name = tensor("op_6266_groups_0"), val = tensor(1)]; tensor blocks_22_attn_out_weight_to_fp16 = const()[name = tensor("blocks_22_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(890272192)))]; tensor blocks_22_attn_out_bias_to_fp16 = const()[name = tensor("blocks_22_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893549056)))]; tensor var_6266_cast_fp16 = conv(bias = blocks_22_attn_out_bias_to_fp16, dilations = var_6266_dilations_0, groups = var_6266_groups_0, pad = var_6266_pad_0, pad_type = var_6266_pad_type_0, strides = var_6266_strides_0, weight = blocks_22_attn_out_weight_to_fp16, x = input_225_cast_fp16)[name = tensor("op_6266_cast_fp16")]; tensor inputs_91_cast_fp16 = add(x = inputs_89_cast_fp16, y = var_6266_cast_fp16)[name = tensor("inputs_91_cast_fp16")]; tensor input_227_axes_0 = const()[name = tensor("input_227_axes_0"), val = tensor([1])]; tensor input_227_gamma_0_to_fp16 = const()[name = tensor("input_227_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893551680)))]; tensor input_227_beta_0_to_fp16 = const()[name = tensor("input_227_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893554304)))]; tensor var_6276_to_fp16 = const()[name = tensor("op_6276_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_227_cast_fp16 = layer_norm(axes = input_227_axes_0, beta = input_227_beta_0_to_fp16, epsilon = var_6276_to_fp16, gamma = input_227_gamma_0_to_fp16, x = inputs_91_cast_fp16)[name = tensor("input_227_cast_fp16")]; tensor input_229_pad_type_0 = const()[name = tensor("input_229_pad_type_0"), val = tensor("valid")]; tensor input_229_strides_0 = const()[name = tensor("input_229_strides_0"), val = tensor([1, 1])]; tensor input_229_pad_0 = const()[name = tensor("input_229_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_229_dilations_0 = const()[name = tensor("input_229_dilations_0"), val = tensor([1, 1])]; tensor input_229_groups_0 = const()[name = tensor("input_229_groups_0"), val = tensor(1)]; tensor blocks_22_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_22_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893556928)))]; tensor blocks_22_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_22_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(906664192)))]; tensor input_229_cast_fp16 = conv(bias = blocks_22_mlp_0_bias_to_fp16, dilations = input_229_dilations_0, groups = input_229_groups_0, pad = input_229_pad_0, pad_type = input_229_pad_type_0, strides = input_229_strides_0, weight = blocks_22_mlp_0_weight_to_fp16, x = input_227_cast_fp16)[name = tensor("input_229_cast_fp16")]; tensor input_231_mode_0 = const()[name = tensor("input_231_mode_0"), val = tensor("EXACT")]; tensor input_231_cast_fp16 = gelu(mode = input_231_mode_0, x = input_229_cast_fp16)[name = tensor("input_231_cast_fp16")]; tensor var_6302_pad_type_0 = const()[name = tensor("op_6302_pad_type_0"), val = tensor("valid")]; tensor var_6302_strides_0 = const()[name = tensor("op_6302_strides_0"), val = tensor([1, 1])]; tensor var_6302_pad_0 = const()[name = tensor("op_6302_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6302_dilations_0 = const()[name = tensor("op_6302_dilations_0"), val = tensor([1, 1])]; tensor var_6302_groups_0 = const()[name = tensor("op_6302_groups_0"), val = tensor(1)]; tensor blocks_22_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_22_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(906674496)))]; tensor blocks_22_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_22_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919781760)))]; tensor var_6302_cast_fp16 = conv(bias = blocks_22_mlp_2_bias_to_fp16, dilations = var_6302_dilations_0, groups = var_6302_groups_0, pad = var_6302_pad_0, pad_type = var_6302_pad_type_0, strides = var_6302_strides_0, weight = blocks_22_mlp_2_weight_to_fp16, x = input_231_cast_fp16)[name = tensor("op_6302_cast_fp16")]; tensor inputs_93_cast_fp16 = add(x = inputs_91_cast_fp16, y = var_6302_cast_fp16)[name = tensor("inputs_93_cast_fp16")]; tensor var_6311 = const()[name = tensor("op_6311"), val = tensor(1)]; tensor input_233_axes_0 = const()[name = tensor("input_233_axes_0"), val = tensor([1])]; tensor input_233_gamma_0_to_fp16 = const()[name = tensor("input_233_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919784384)))]; tensor input_233_beta_0_to_fp16 = const()[name = tensor("input_233_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919787008)))]; tensor var_6327_to_fp16 = const()[name = tensor("op_6327_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_233_cast_fp16 = layer_norm(axes = input_233_axes_0, beta = input_233_beta_0_to_fp16, epsilon = var_6327_to_fp16, gamma = input_233_gamma_0_to_fp16, x = inputs_93_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor q_47_pad_type_0 = const()[name = tensor("q_47_pad_type_0"), val = tensor("valid")]; tensor q_47_strides_0 = const()[name = tensor("q_47_strides_0"), val = tensor([1, 1])]; tensor q_47_pad_0 = const()[name = tensor("q_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_47_dilations_0 = const()[name = tensor("q_47_dilations_0"), val = tensor([1, 1])]; tensor q_47_groups_0 = const()[name = tensor("q_47_groups_0"), val = tensor(1)]; tensor var_6362_weight_0_to_fp16 = const()[name = tensor("op_6362_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919789632)))]; tensor var_6362_bias_0_to_fp16 = const()[name = tensor("op_6362_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(923066496)))]; tensor var_6362_cast_fp16 = conv(bias = var_6362_bias_0_to_fp16, dilations = q_47_dilations_0, groups = q_47_groups_0, pad = q_47_pad_0, pad_type = q_47_pad_type_0, strides = q_47_strides_0, weight = var_6362_weight_0_to_fp16, x = input_233_cast_fp16)[name = tensor("op_6362_cast_fp16")]; tensor k_47_pad_type_0 = const()[name = tensor("k_47_pad_type_0"), val = tensor("valid")]; tensor k_47_strides_0 = const()[name = tensor("k_47_strides_0"), val = tensor([1, 1])]; tensor k_47_pad_0 = const()[name = tensor("k_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_47_dilations_0 = const()[name = tensor("k_47_dilations_0"), val = tensor([1, 1])]; tensor k_47_groups_0 = const()[name = tensor("k_47_groups_0"), val = tensor(1)]; tensor blocks_23_attn_key_weight_to_fp16 = const()[name = tensor("blocks_23_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(923069120)))]; tensor k_47_cast_fp16 = conv(dilations = k_47_dilations_0, groups = k_47_groups_0, pad = k_47_pad_0, pad_type = k_47_pad_type_0, strides = k_47_strides_0, weight = blocks_23_attn_key_weight_to_fp16, x = input_233_cast_fp16)[name = tensor("k_47_cast_fp16")]; tensor var_6360_pad_type_0 = const()[name = tensor("op_6360_pad_type_0"), val = tensor("valid")]; tensor var_6360_strides_0 = const()[name = tensor("op_6360_strides_0"), val = tensor([1, 1])]; tensor var_6360_pad_0 = const()[name = tensor("op_6360_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6360_dilations_0 = const()[name = tensor("op_6360_dilations_0"), val = tensor([1, 1])]; tensor var_6360_groups_0 = const()[name = tensor("op_6360_groups_0"), val = tensor(1)]; tensor blocks_23_attn_value_weight_to_fp16 = const()[name = tensor("blocks_23_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(926345984)))]; tensor blocks_23_attn_value_bias_to_fp16 = const()[name = tensor("blocks_23_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(929622848)))]; tensor var_6360_cast_fp16 = conv(bias = blocks_23_attn_value_bias_to_fp16, dilations = var_6360_dilations_0, groups = var_6360_groups_0, pad = var_6360_pad_0, pad_type = var_6360_pad_type_0, strides = var_6360_strides_0, weight = blocks_23_attn_value_weight_to_fp16, x = input_233_cast_fp16)[name = tensor("op_6360_cast_fp16")]; tensor tile_69 = const()[name = tensor("tile_69"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6363_axis_0 = const()[name = tensor("op_6363_axis_0"), val = tensor(1)]; tensor var_6363_cast_fp16_0, tensor var_6363_cast_fp16_1, tensor var_6363_cast_fp16_2, tensor var_6363_cast_fp16_3, tensor var_6363_cast_fp16_4, tensor var_6363_cast_fp16_5, tensor var_6363_cast_fp16_6, tensor var_6363_cast_fp16_7, tensor var_6363_cast_fp16_8, tensor var_6363_cast_fp16_9, tensor var_6363_cast_fp16_10, tensor var_6363_cast_fp16_11, tensor var_6363_cast_fp16_12, tensor var_6363_cast_fp16_13, tensor var_6363_cast_fp16_14, tensor var_6363_cast_fp16_15, tensor var_6363_cast_fp16_16, tensor var_6363_cast_fp16_17, tensor var_6363_cast_fp16_18, tensor var_6363_cast_fp16_19 = split(axis = var_6363_axis_0, split_sizes = tile_69, x = var_6362_cast_fp16)[name = tensor("op_6363_cast_fp16")]; tensor var_6384_perm_0 = const()[name = tensor("op_6384_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_70 = const()[name = tensor("tile_70"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6385_axis_0 = const()[name = tensor("op_6385_axis_0"), val = tensor(3)]; tensor var_6384_cast_fp16 = transpose(perm = var_6384_perm_0, x = k_47_cast_fp16)[name = tensor("transpose_9")]; tensor var_6385_cast_fp16_0, tensor var_6385_cast_fp16_1, tensor var_6385_cast_fp16_2, tensor var_6385_cast_fp16_3, tensor var_6385_cast_fp16_4, tensor var_6385_cast_fp16_5, tensor var_6385_cast_fp16_6, tensor var_6385_cast_fp16_7, tensor var_6385_cast_fp16_8, tensor var_6385_cast_fp16_9, tensor var_6385_cast_fp16_10, tensor var_6385_cast_fp16_11, tensor var_6385_cast_fp16_12, tensor var_6385_cast_fp16_13, tensor var_6385_cast_fp16_14, tensor var_6385_cast_fp16_15, tensor var_6385_cast_fp16_16, tensor var_6385_cast_fp16_17, tensor var_6385_cast_fp16_18, tensor var_6385_cast_fp16_19 = split(axis = var_6385_axis_0, split_sizes = tile_70, x = var_6384_cast_fp16)[name = tensor("op_6385_cast_fp16")]; tensor tile_71 = const()[name = tensor("tile_71"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6406_axis_0 = const()[name = tensor("op_6406_axis_0"), val = tensor(1)]; tensor var_6406_cast_fp16_0, tensor var_6406_cast_fp16_1, tensor var_6406_cast_fp16_2, tensor var_6406_cast_fp16_3, tensor var_6406_cast_fp16_4, tensor var_6406_cast_fp16_5, tensor var_6406_cast_fp16_6, tensor var_6406_cast_fp16_7, tensor var_6406_cast_fp16_8, tensor var_6406_cast_fp16_9, tensor var_6406_cast_fp16_10, tensor var_6406_cast_fp16_11, tensor var_6406_cast_fp16_12, tensor var_6406_cast_fp16_13, tensor var_6406_cast_fp16_14, tensor var_6406_cast_fp16_15, tensor var_6406_cast_fp16_16, tensor var_6406_cast_fp16_17, tensor var_6406_cast_fp16_18, tensor var_6406_cast_fp16_19 = split(axis = var_6406_axis_0, split_sizes = tile_71, x = var_6360_cast_fp16)[name = tensor("op_6406_cast_fp16")]; tensor aw_921_equation_0 = const()[name = tensor("aw_921_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_921_cast_fp16 = einsum(equation = aw_921_equation_0, values = (var_6385_cast_fp16_0, var_6363_cast_fp16_0))[name = tensor("aw_921_cast_fp16")]; tensor aw_923_equation_0 = const()[name = tensor("aw_923_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_923_cast_fp16 = einsum(equation = aw_923_equation_0, values = (var_6385_cast_fp16_1, var_6363_cast_fp16_1))[name = tensor("aw_923_cast_fp16")]; tensor aw_925_equation_0 = const()[name = tensor("aw_925_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_925_cast_fp16 = einsum(equation = aw_925_equation_0, values = (var_6385_cast_fp16_2, var_6363_cast_fp16_2))[name = tensor("aw_925_cast_fp16")]; tensor aw_927_equation_0 = const()[name = tensor("aw_927_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_927_cast_fp16 = einsum(equation = aw_927_equation_0, values = (var_6385_cast_fp16_3, var_6363_cast_fp16_3))[name = tensor("aw_927_cast_fp16")]; tensor aw_929_equation_0 = const()[name = tensor("aw_929_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_929_cast_fp16 = einsum(equation = aw_929_equation_0, values = (var_6385_cast_fp16_4, var_6363_cast_fp16_4))[name = tensor("aw_929_cast_fp16")]; tensor aw_931_equation_0 = const()[name = tensor("aw_931_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_931_cast_fp16 = einsum(equation = aw_931_equation_0, values = (var_6385_cast_fp16_5, var_6363_cast_fp16_5))[name = tensor("aw_931_cast_fp16")]; tensor aw_933_equation_0 = const()[name = tensor("aw_933_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_933_cast_fp16 = einsum(equation = aw_933_equation_0, values = (var_6385_cast_fp16_6, var_6363_cast_fp16_6))[name = tensor("aw_933_cast_fp16")]; tensor aw_935_equation_0 = const()[name = tensor("aw_935_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_935_cast_fp16 = einsum(equation = aw_935_equation_0, values = (var_6385_cast_fp16_7, var_6363_cast_fp16_7))[name = tensor("aw_935_cast_fp16")]; tensor aw_937_equation_0 = const()[name = tensor("aw_937_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_937_cast_fp16 = einsum(equation = aw_937_equation_0, values = (var_6385_cast_fp16_8, var_6363_cast_fp16_8))[name = tensor("aw_937_cast_fp16")]; tensor aw_939_equation_0 = const()[name = tensor("aw_939_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_939_cast_fp16 = einsum(equation = aw_939_equation_0, values = (var_6385_cast_fp16_9, var_6363_cast_fp16_9))[name = tensor("aw_939_cast_fp16")]; tensor aw_941_equation_0 = const()[name = tensor("aw_941_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_941_cast_fp16 = einsum(equation = aw_941_equation_0, values = (var_6385_cast_fp16_10, var_6363_cast_fp16_10))[name = tensor("aw_941_cast_fp16")]; tensor aw_943_equation_0 = const()[name = tensor("aw_943_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_943_cast_fp16 = einsum(equation = aw_943_equation_0, values = (var_6385_cast_fp16_11, var_6363_cast_fp16_11))[name = tensor("aw_943_cast_fp16")]; tensor aw_945_equation_0 = const()[name = tensor("aw_945_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_945_cast_fp16 = einsum(equation = aw_945_equation_0, values = (var_6385_cast_fp16_12, var_6363_cast_fp16_12))[name = tensor("aw_945_cast_fp16")]; tensor aw_947_equation_0 = const()[name = tensor("aw_947_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_947_cast_fp16 = einsum(equation = aw_947_equation_0, values = (var_6385_cast_fp16_13, var_6363_cast_fp16_13))[name = tensor("aw_947_cast_fp16")]; tensor aw_949_equation_0 = const()[name = tensor("aw_949_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_949_cast_fp16 = einsum(equation = aw_949_equation_0, values = (var_6385_cast_fp16_14, var_6363_cast_fp16_14))[name = tensor("aw_949_cast_fp16")]; tensor aw_951_equation_0 = const()[name = tensor("aw_951_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_951_cast_fp16 = einsum(equation = aw_951_equation_0, values = (var_6385_cast_fp16_15, var_6363_cast_fp16_15))[name = tensor("aw_951_cast_fp16")]; tensor aw_953_equation_0 = const()[name = tensor("aw_953_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_953_cast_fp16 = einsum(equation = aw_953_equation_0, values = (var_6385_cast_fp16_16, var_6363_cast_fp16_16))[name = tensor("aw_953_cast_fp16")]; tensor aw_955_equation_0 = const()[name = tensor("aw_955_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_955_cast_fp16 = einsum(equation = aw_955_equation_0, values = (var_6385_cast_fp16_17, var_6363_cast_fp16_17))[name = tensor("aw_955_cast_fp16")]; tensor aw_957_equation_0 = const()[name = tensor("aw_957_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_957_cast_fp16 = einsum(equation = aw_957_equation_0, values = (var_6385_cast_fp16_18, var_6363_cast_fp16_18))[name = tensor("aw_957_cast_fp16")]; tensor aw_959_equation_0 = const()[name = tensor("aw_959_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_959_cast_fp16 = einsum(equation = aw_959_equation_0, values = (var_6385_cast_fp16_19, var_6363_cast_fp16_19))[name = tensor("aw_959_cast_fp16")]; tensor var_6467_cast_fp16 = softmax(axis = var_6311, x = aw_921_cast_fp16)[name = tensor("op_6467_cast_fp16")]; tensor var_6468_cast_fp16 = softmax(axis = var_6311, x = aw_923_cast_fp16)[name = tensor("op_6468_cast_fp16")]; tensor var_6469_cast_fp16 = softmax(axis = var_6311, x = aw_925_cast_fp16)[name = tensor("op_6469_cast_fp16")]; tensor var_6470_cast_fp16 = softmax(axis = var_6311, x = aw_927_cast_fp16)[name = tensor("op_6470_cast_fp16")]; tensor var_6471_cast_fp16 = softmax(axis = var_6311, x = aw_929_cast_fp16)[name = tensor("op_6471_cast_fp16")]; tensor var_6472_cast_fp16 = softmax(axis = var_6311, x = aw_931_cast_fp16)[name = tensor("op_6472_cast_fp16")]; tensor var_6473_cast_fp16 = softmax(axis = var_6311, x = aw_933_cast_fp16)[name = tensor("op_6473_cast_fp16")]; tensor var_6474_cast_fp16 = softmax(axis = var_6311, x = aw_935_cast_fp16)[name = tensor("op_6474_cast_fp16")]; tensor var_6475_cast_fp16 = softmax(axis = var_6311, x = aw_937_cast_fp16)[name = tensor("op_6475_cast_fp16")]; tensor var_6476_cast_fp16 = softmax(axis = var_6311, x = aw_939_cast_fp16)[name = tensor("op_6476_cast_fp16")]; tensor var_6477_cast_fp16 = softmax(axis = var_6311, x = aw_941_cast_fp16)[name = tensor("op_6477_cast_fp16")]; tensor var_6478_cast_fp16 = softmax(axis = var_6311, x = aw_943_cast_fp16)[name = tensor("op_6478_cast_fp16")]; tensor var_6479_cast_fp16 = softmax(axis = var_6311, x = aw_945_cast_fp16)[name = tensor("op_6479_cast_fp16")]; tensor var_6480_cast_fp16 = softmax(axis = var_6311, x = aw_947_cast_fp16)[name = tensor("op_6480_cast_fp16")]; tensor var_6481_cast_fp16 = softmax(axis = var_6311, x = aw_949_cast_fp16)[name = tensor("op_6481_cast_fp16")]; tensor var_6482_cast_fp16 = softmax(axis = var_6311, x = aw_951_cast_fp16)[name = tensor("op_6482_cast_fp16")]; tensor var_6483_cast_fp16 = softmax(axis = var_6311, x = aw_953_cast_fp16)[name = tensor("op_6483_cast_fp16")]; tensor var_6484_cast_fp16 = softmax(axis = var_6311, x = aw_955_cast_fp16)[name = tensor("op_6484_cast_fp16")]; tensor var_6485_cast_fp16 = softmax(axis = var_6311, x = aw_957_cast_fp16)[name = tensor("op_6485_cast_fp16")]; tensor var_6486_cast_fp16 = softmax(axis = var_6311, x = aw_959_cast_fp16)[name = tensor("op_6486_cast_fp16")]; tensor var_6488_equation_0 = const()[name = tensor("op_6488_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6488_cast_fp16 = einsum(equation = var_6488_equation_0, values = (var_6406_cast_fp16_0, var_6467_cast_fp16))[name = tensor("op_6488_cast_fp16")]; tensor var_6490_equation_0 = const()[name = tensor("op_6490_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6490_cast_fp16 = einsum(equation = var_6490_equation_0, values = (var_6406_cast_fp16_1, var_6468_cast_fp16))[name = tensor("op_6490_cast_fp16")]; tensor var_6492_equation_0 = const()[name = tensor("op_6492_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6492_cast_fp16 = einsum(equation = var_6492_equation_0, values = (var_6406_cast_fp16_2, var_6469_cast_fp16))[name = tensor("op_6492_cast_fp16")]; tensor var_6494_equation_0 = const()[name = tensor("op_6494_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6494_cast_fp16 = einsum(equation = var_6494_equation_0, values = (var_6406_cast_fp16_3, var_6470_cast_fp16))[name = tensor("op_6494_cast_fp16")]; tensor var_6496_equation_0 = const()[name = tensor("op_6496_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6496_cast_fp16 = einsum(equation = var_6496_equation_0, values = (var_6406_cast_fp16_4, var_6471_cast_fp16))[name = tensor("op_6496_cast_fp16")]; tensor var_6498_equation_0 = const()[name = tensor("op_6498_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6498_cast_fp16 = einsum(equation = var_6498_equation_0, values = (var_6406_cast_fp16_5, var_6472_cast_fp16))[name = tensor("op_6498_cast_fp16")]; tensor var_6500_equation_0 = const()[name = tensor("op_6500_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6500_cast_fp16 = einsum(equation = var_6500_equation_0, values = (var_6406_cast_fp16_6, var_6473_cast_fp16))[name = tensor("op_6500_cast_fp16")]; tensor var_6502_equation_0 = const()[name = tensor("op_6502_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6502_cast_fp16 = einsum(equation = var_6502_equation_0, values = (var_6406_cast_fp16_7, var_6474_cast_fp16))[name = tensor("op_6502_cast_fp16")]; tensor var_6504_equation_0 = const()[name = tensor("op_6504_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6504_cast_fp16 = einsum(equation = var_6504_equation_0, values = (var_6406_cast_fp16_8, var_6475_cast_fp16))[name = tensor("op_6504_cast_fp16")]; tensor var_6506_equation_0 = const()[name = tensor("op_6506_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6506_cast_fp16 = einsum(equation = var_6506_equation_0, values = (var_6406_cast_fp16_9, var_6476_cast_fp16))[name = tensor("op_6506_cast_fp16")]; tensor var_6508_equation_0 = const()[name = tensor("op_6508_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6508_cast_fp16 = einsum(equation = var_6508_equation_0, values = (var_6406_cast_fp16_10, var_6477_cast_fp16))[name = tensor("op_6508_cast_fp16")]; tensor var_6510_equation_0 = const()[name = tensor("op_6510_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6510_cast_fp16 = einsum(equation = var_6510_equation_0, values = (var_6406_cast_fp16_11, var_6478_cast_fp16))[name = tensor("op_6510_cast_fp16")]; tensor var_6512_equation_0 = const()[name = tensor("op_6512_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6512_cast_fp16 = einsum(equation = var_6512_equation_0, values = (var_6406_cast_fp16_12, var_6479_cast_fp16))[name = tensor("op_6512_cast_fp16")]; tensor var_6514_equation_0 = const()[name = tensor("op_6514_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6514_cast_fp16 = einsum(equation = var_6514_equation_0, values = (var_6406_cast_fp16_13, var_6480_cast_fp16))[name = tensor("op_6514_cast_fp16")]; tensor var_6516_equation_0 = const()[name = tensor("op_6516_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6516_cast_fp16 = einsum(equation = var_6516_equation_0, values = (var_6406_cast_fp16_14, var_6481_cast_fp16))[name = tensor("op_6516_cast_fp16")]; tensor var_6518_equation_0 = const()[name = tensor("op_6518_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6518_cast_fp16 = einsum(equation = var_6518_equation_0, values = (var_6406_cast_fp16_15, var_6482_cast_fp16))[name = tensor("op_6518_cast_fp16")]; tensor var_6520_equation_0 = const()[name = tensor("op_6520_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6520_cast_fp16 = einsum(equation = var_6520_equation_0, values = (var_6406_cast_fp16_16, var_6483_cast_fp16))[name = tensor("op_6520_cast_fp16")]; tensor var_6522_equation_0 = const()[name = tensor("op_6522_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6522_cast_fp16 = einsum(equation = var_6522_equation_0, values = (var_6406_cast_fp16_17, var_6484_cast_fp16))[name = tensor("op_6522_cast_fp16")]; tensor var_6524_equation_0 = const()[name = tensor("op_6524_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6524_cast_fp16 = einsum(equation = var_6524_equation_0, values = (var_6406_cast_fp16_18, var_6485_cast_fp16))[name = tensor("op_6524_cast_fp16")]; tensor var_6526_equation_0 = const()[name = tensor("op_6526_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6526_cast_fp16 = einsum(equation = var_6526_equation_0, values = (var_6406_cast_fp16_19, var_6486_cast_fp16))[name = tensor("op_6526_cast_fp16")]; tensor input_235_interleave_0 = const()[name = tensor("input_235_interleave_0"), val = tensor(false)]; tensor input_235_cast_fp16 = concat(axis = var_6311, interleave = input_235_interleave_0, values = (var_6488_cast_fp16, var_6490_cast_fp16, var_6492_cast_fp16, var_6494_cast_fp16, var_6496_cast_fp16, var_6498_cast_fp16, var_6500_cast_fp16, var_6502_cast_fp16, var_6504_cast_fp16, var_6506_cast_fp16, var_6508_cast_fp16, var_6510_cast_fp16, var_6512_cast_fp16, var_6514_cast_fp16, var_6516_cast_fp16, var_6518_cast_fp16, var_6520_cast_fp16, var_6522_cast_fp16, var_6524_cast_fp16, var_6526_cast_fp16))[name = tensor("input_235_cast_fp16")]; tensor var_6535_pad_type_0 = const()[name = tensor("op_6535_pad_type_0"), val = tensor("valid")]; tensor var_6535_strides_0 = const()[name = tensor("op_6535_strides_0"), val = tensor([1, 1])]; tensor var_6535_pad_0 = const()[name = tensor("op_6535_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6535_dilations_0 = const()[name = tensor("op_6535_dilations_0"), val = tensor([1, 1])]; tensor var_6535_groups_0 = const()[name = tensor("op_6535_groups_0"), val = tensor(1)]; tensor blocks_23_attn_out_weight_to_fp16 = const()[name = tensor("blocks_23_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(929625472)))]; tensor blocks_23_attn_out_bias_to_fp16 = const()[name = tensor("blocks_23_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932902336)))]; tensor var_6535_cast_fp16 = conv(bias = blocks_23_attn_out_bias_to_fp16, dilations = var_6535_dilations_0, groups = var_6535_groups_0, pad = var_6535_pad_0, pad_type = var_6535_pad_type_0, strides = var_6535_strides_0, weight = blocks_23_attn_out_weight_to_fp16, x = input_235_cast_fp16)[name = tensor("op_6535_cast_fp16")]; tensor inputs_95_cast_fp16 = add(x = inputs_93_cast_fp16, y = var_6535_cast_fp16)[name = tensor("inputs_95_cast_fp16")]; tensor input_237_axes_0 = const()[name = tensor("input_237_axes_0"), val = tensor([1])]; tensor input_237_gamma_0_to_fp16 = const()[name = tensor("input_237_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932904960)))]; tensor input_237_beta_0_to_fp16 = const()[name = tensor("input_237_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932907584)))]; tensor var_6545_to_fp16 = const()[name = tensor("op_6545_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_237_cast_fp16 = layer_norm(axes = input_237_axes_0, beta = input_237_beta_0_to_fp16, epsilon = var_6545_to_fp16, gamma = input_237_gamma_0_to_fp16, x = inputs_95_cast_fp16)[name = tensor("input_237_cast_fp16")]; tensor input_239_pad_type_0 = const()[name = tensor("input_239_pad_type_0"), val = tensor("valid")]; tensor input_239_strides_0 = const()[name = tensor("input_239_strides_0"), val = tensor([1, 1])]; tensor input_239_pad_0 = const()[name = tensor("input_239_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_239_dilations_0 = const()[name = tensor("input_239_dilations_0"), val = tensor([1, 1])]; tensor input_239_groups_0 = const()[name = tensor("input_239_groups_0"), val = tensor(1)]; tensor blocks_23_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_23_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(932910208)))]; tensor blocks_23_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_23_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(946017472)))]; tensor input_239_cast_fp16 = conv(bias = blocks_23_mlp_0_bias_to_fp16, dilations = input_239_dilations_0, groups = input_239_groups_0, pad = input_239_pad_0, pad_type = input_239_pad_type_0, strides = input_239_strides_0, weight = blocks_23_mlp_0_weight_to_fp16, x = input_237_cast_fp16)[name = tensor("input_239_cast_fp16")]; tensor input_241_mode_0 = const()[name = tensor("input_241_mode_0"), val = tensor("EXACT")]; tensor input_241_cast_fp16 = gelu(mode = input_241_mode_0, x = input_239_cast_fp16)[name = tensor("input_241_cast_fp16")]; tensor var_6571_pad_type_0 = const()[name = tensor("op_6571_pad_type_0"), val = tensor("valid")]; tensor var_6571_strides_0 = const()[name = tensor("op_6571_strides_0"), val = tensor([1, 1])]; tensor var_6571_pad_0 = const()[name = tensor("op_6571_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6571_dilations_0 = const()[name = tensor("op_6571_dilations_0"), val = tensor([1, 1])]; tensor var_6571_groups_0 = const()[name = tensor("op_6571_groups_0"), val = tensor(1)]; tensor blocks_23_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_23_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(946027776)))]; tensor blocks_23_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_23_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959135040)))]; tensor var_6571_cast_fp16 = conv(bias = blocks_23_mlp_2_bias_to_fp16, dilations = var_6571_dilations_0, groups = var_6571_groups_0, pad = var_6571_pad_0, pad_type = var_6571_pad_type_0, strides = var_6571_strides_0, weight = blocks_23_mlp_2_weight_to_fp16, x = input_241_cast_fp16)[name = tensor("op_6571_cast_fp16")]; tensor inputs_97_cast_fp16 = add(x = inputs_95_cast_fp16, y = var_6571_cast_fp16)[name = tensor("inputs_97_cast_fp16")]; tensor var_6580 = const()[name = tensor("op_6580"), val = tensor(1)]; tensor input_243_axes_0 = const()[name = tensor("input_243_axes_0"), val = tensor([1])]; tensor input_243_gamma_0_to_fp16 = const()[name = tensor("input_243_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959137664)))]; tensor input_243_beta_0_to_fp16 = const()[name = tensor("input_243_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959140288)))]; tensor var_6596_to_fp16 = const()[name = tensor("op_6596_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_243_cast_fp16 = layer_norm(axes = input_243_axes_0, beta = input_243_beta_0_to_fp16, epsilon = var_6596_to_fp16, gamma = input_243_gamma_0_to_fp16, x = inputs_97_cast_fp16)[name = tensor("input_243_cast_fp16")]; tensor q_49_pad_type_0 = const()[name = tensor("q_49_pad_type_0"), val = tensor("valid")]; tensor q_49_strides_0 = const()[name = tensor("q_49_strides_0"), val = tensor([1, 1])]; tensor q_49_pad_0 = const()[name = tensor("q_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_49_dilations_0 = const()[name = tensor("q_49_dilations_0"), val = tensor([1, 1])]; tensor q_49_groups_0 = const()[name = tensor("q_49_groups_0"), val = tensor(1)]; tensor var_6631_weight_0_to_fp16 = const()[name = tensor("op_6631_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959142912)))]; tensor var_6631_bias_0_to_fp16 = const()[name = tensor("op_6631_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962419776)))]; tensor var_6631_cast_fp16 = conv(bias = var_6631_bias_0_to_fp16, dilations = q_49_dilations_0, groups = q_49_groups_0, pad = q_49_pad_0, pad_type = q_49_pad_type_0, strides = q_49_strides_0, weight = var_6631_weight_0_to_fp16, x = input_243_cast_fp16)[name = tensor("op_6631_cast_fp16")]; tensor k_49_pad_type_0 = const()[name = tensor("k_49_pad_type_0"), val = tensor("valid")]; tensor k_49_strides_0 = const()[name = tensor("k_49_strides_0"), val = tensor([1, 1])]; tensor k_49_pad_0 = const()[name = tensor("k_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_49_dilations_0 = const()[name = tensor("k_49_dilations_0"), val = tensor([1, 1])]; tensor k_49_groups_0 = const()[name = tensor("k_49_groups_0"), val = tensor(1)]; tensor blocks_24_attn_key_weight_to_fp16 = const()[name = tensor("blocks_24_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962422400)))]; tensor k_49_cast_fp16 = conv(dilations = k_49_dilations_0, groups = k_49_groups_0, pad = k_49_pad_0, pad_type = k_49_pad_type_0, strides = k_49_strides_0, weight = blocks_24_attn_key_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("k_49_cast_fp16")]; tensor var_6629_pad_type_0 = const()[name = tensor("op_6629_pad_type_0"), val = tensor("valid")]; tensor var_6629_strides_0 = const()[name = tensor("op_6629_strides_0"), val = tensor([1, 1])]; tensor var_6629_pad_0 = const()[name = tensor("op_6629_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6629_dilations_0 = const()[name = tensor("op_6629_dilations_0"), val = tensor([1, 1])]; tensor var_6629_groups_0 = const()[name = tensor("op_6629_groups_0"), val = tensor(1)]; tensor blocks_24_attn_value_weight_to_fp16 = const()[name = tensor("blocks_24_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(965699264)))]; tensor blocks_24_attn_value_bias_to_fp16 = const()[name = tensor("blocks_24_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(968976128)))]; tensor var_6629_cast_fp16 = conv(bias = blocks_24_attn_value_bias_to_fp16, dilations = var_6629_dilations_0, groups = var_6629_groups_0, pad = var_6629_pad_0, pad_type = var_6629_pad_type_0, strides = var_6629_strides_0, weight = blocks_24_attn_value_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("op_6629_cast_fp16")]; tensor tile_72 = const()[name = tensor("tile_72"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6632_axis_0 = const()[name = tensor("op_6632_axis_0"), val = tensor(1)]; tensor var_6632_cast_fp16_0, tensor var_6632_cast_fp16_1, tensor var_6632_cast_fp16_2, tensor var_6632_cast_fp16_3, tensor var_6632_cast_fp16_4, tensor var_6632_cast_fp16_5, tensor var_6632_cast_fp16_6, tensor var_6632_cast_fp16_7, tensor var_6632_cast_fp16_8, tensor var_6632_cast_fp16_9, tensor var_6632_cast_fp16_10, tensor var_6632_cast_fp16_11, tensor var_6632_cast_fp16_12, tensor var_6632_cast_fp16_13, tensor var_6632_cast_fp16_14, tensor var_6632_cast_fp16_15, tensor var_6632_cast_fp16_16, tensor var_6632_cast_fp16_17, tensor var_6632_cast_fp16_18, tensor var_6632_cast_fp16_19 = split(axis = var_6632_axis_0, split_sizes = tile_72, x = var_6631_cast_fp16)[name = tensor("op_6632_cast_fp16")]; tensor var_6653_perm_0 = const()[name = tensor("op_6653_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_73 = const()[name = tensor("tile_73"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6654_axis_0 = const()[name = tensor("op_6654_axis_0"), val = tensor(3)]; tensor var_6653_cast_fp16 = transpose(perm = var_6653_perm_0, x = k_49_cast_fp16)[name = tensor("transpose_8")]; tensor var_6654_cast_fp16_0, tensor var_6654_cast_fp16_1, tensor var_6654_cast_fp16_2, tensor var_6654_cast_fp16_3, tensor var_6654_cast_fp16_4, tensor var_6654_cast_fp16_5, tensor var_6654_cast_fp16_6, tensor var_6654_cast_fp16_7, tensor var_6654_cast_fp16_8, tensor var_6654_cast_fp16_9, tensor var_6654_cast_fp16_10, tensor var_6654_cast_fp16_11, tensor var_6654_cast_fp16_12, tensor var_6654_cast_fp16_13, tensor var_6654_cast_fp16_14, tensor var_6654_cast_fp16_15, tensor var_6654_cast_fp16_16, tensor var_6654_cast_fp16_17, tensor var_6654_cast_fp16_18, tensor var_6654_cast_fp16_19 = split(axis = var_6654_axis_0, split_sizes = tile_73, x = var_6653_cast_fp16)[name = tensor("op_6654_cast_fp16")]; tensor tile_74 = const()[name = tensor("tile_74"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6675_axis_0 = const()[name = tensor("op_6675_axis_0"), val = tensor(1)]; tensor var_6675_cast_fp16_0, tensor var_6675_cast_fp16_1, tensor var_6675_cast_fp16_2, tensor var_6675_cast_fp16_3, tensor var_6675_cast_fp16_4, tensor var_6675_cast_fp16_5, tensor var_6675_cast_fp16_6, tensor var_6675_cast_fp16_7, tensor var_6675_cast_fp16_8, tensor var_6675_cast_fp16_9, tensor var_6675_cast_fp16_10, tensor var_6675_cast_fp16_11, tensor var_6675_cast_fp16_12, tensor var_6675_cast_fp16_13, tensor var_6675_cast_fp16_14, tensor var_6675_cast_fp16_15, tensor var_6675_cast_fp16_16, tensor var_6675_cast_fp16_17, tensor var_6675_cast_fp16_18, tensor var_6675_cast_fp16_19 = split(axis = var_6675_axis_0, split_sizes = tile_74, x = var_6629_cast_fp16)[name = tensor("op_6675_cast_fp16")]; tensor aw_961_equation_0 = const()[name = tensor("aw_961_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_961_cast_fp16 = einsum(equation = aw_961_equation_0, values = (var_6654_cast_fp16_0, var_6632_cast_fp16_0))[name = tensor("aw_961_cast_fp16")]; tensor aw_963_equation_0 = const()[name = tensor("aw_963_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_963_cast_fp16 = einsum(equation = aw_963_equation_0, values = (var_6654_cast_fp16_1, var_6632_cast_fp16_1))[name = tensor("aw_963_cast_fp16")]; tensor aw_965_equation_0 = const()[name = tensor("aw_965_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_965_cast_fp16 = einsum(equation = aw_965_equation_0, values = (var_6654_cast_fp16_2, var_6632_cast_fp16_2))[name = tensor("aw_965_cast_fp16")]; tensor aw_967_equation_0 = const()[name = tensor("aw_967_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_967_cast_fp16 = einsum(equation = aw_967_equation_0, values = (var_6654_cast_fp16_3, var_6632_cast_fp16_3))[name = tensor("aw_967_cast_fp16")]; tensor aw_969_equation_0 = const()[name = tensor("aw_969_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_969_cast_fp16 = einsum(equation = aw_969_equation_0, values = (var_6654_cast_fp16_4, var_6632_cast_fp16_4))[name = tensor("aw_969_cast_fp16")]; tensor aw_971_equation_0 = const()[name = tensor("aw_971_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_971_cast_fp16 = einsum(equation = aw_971_equation_0, values = (var_6654_cast_fp16_5, var_6632_cast_fp16_5))[name = tensor("aw_971_cast_fp16")]; tensor aw_973_equation_0 = const()[name = tensor("aw_973_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_973_cast_fp16 = einsum(equation = aw_973_equation_0, values = (var_6654_cast_fp16_6, var_6632_cast_fp16_6))[name = tensor("aw_973_cast_fp16")]; tensor aw_975_equation_0 = const()[name = tensor("aw_975_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_975_cast_fp16 = einsum(equation = aw_975_equation_0, values = (var_6654_cast_fp16_7, var_6632_cast_fp16_7))[name = tensor("aw_975_cast_fp16")]; tensor aw_977_equation_0 = const()[name = tensor("aw_977_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_977_cast_fp16 = einsum(equation = aw_977_equation_0, values = (var_6654_cast_fp16_8, var_6632_cast_fp16_8))[name = tensor("aw_977_cast_fp16")]; tensor aw_979_equation_0 = const()[name = tensor("aw_979_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_979_cast_fp16 = einsum(equation = aw_979_equation_0, values = (var_6654_cast_fp16_9, var_6632_cast_fp16_9))[name = tensor("aw_979_cast_fp16")]; tensor aw_981_equation_0 = const()[name = tensor("aw_981_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_981_cast_fp16 = einsum(equation = aw_981_equation_0, values = (var_6654_cast_fp16_10, var_6632_cast_fp16_10))[name = tensor("aw_981_cast_fp16")]; tensor aw_983_equation_0 = const()[name = tensor("aw_983_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_983_cast_fp16 = einsum(equation = aw_983_equation_0, values = (var_6654_cast_fp16_11, var_6632_cast_fp16_11))[name = tensor("aw_983_cast_fp16")]; tensor aw_985_equation_0 = const()[name = tensor("aw_985_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_985_cast_fp16 = einsum(equation = aw_985_equation_0, values = (var_6654_cast_fp16_12, var_6632_cast_fp16_12))[name = tensor("aw_985_cast_fp16")]; tensor aw_987_equation_0 = const()[name = tensor("aw_987_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_987_cast_fp16 = einsum(equation = aw_987_equation_0, values = (var_6654_cast_fp16_13, var_6632_cast_fp16_13))[name = tensor("aw_987_cast_fp16")]; tensor aw_989_equation_0 = const()[name = tensor("aw_989_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_989_cast_fp16 = einsum(equation = aw_989_equation_0, values = (var_6654_cast_fp16_14, var_6632_cast_fp16_14))[name = tensor("aw_989_cast_fp16")]; tensor aw_991_equation_0 = const()[name = tensor("aw_991_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_991_cast_fp16 = einsum(equation = aw_991_equation_0, values = (var_6654_cast_fp16_15, var_6632_cast_fp16_15))[name = tensor("aw_991_cast_fp16")]; tensor aw_993_equation_0 = const()[name = tensor("aw_993_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_993_cast_fp16 = einsum(equation = aw_993_equation_0, values = (var_6654_cast_fp16_16, var_6632_cast_fp16_16))[name = tensor("aw_993_cast_fp16")]; tensor aw_995_equation_0 = const()[name = tensor("aw_995_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_995_cast_fp16 = einsum(equation = aw_995_equation_0, values = (var_6654_cast_fp16_17, var_6632_cast_fp16_17))[name = tensor("aw_995_cast_fp16")]; tensor aw_997_equation_0 = const()[name = tensor("aw_997_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_997_cast_fp16 = einsum(equation = aw_997_equation_0, values = (var_6654_cast_fp16_18, var_6632_cast_fp16_18))[name = tensor("aw_997_cast_fp16")]; tensor aw_999_equation_0 = const()[name = tensor("aw_999_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_999_cast_fp16 = einsum(equation = aw_999_equation_0, values = (var_6654_cast_fp16_19, var_6632_cast_fp16_19))[name = tensor("aw_999_cast_fp16")]; tensor var_6736_cast_fp16 = softmax(axis = var_6580, x = aw_961_cast_fp16)[name = tensor("op_6736_cast_fp16")]; tensor var_6737_cast_fp16 = softmax(axis = var_6580, x = aw_963_cast_fp16)[name = tensor("op_6737_cast_fp16")]; tensor var_6738_cast_fp16 = softmax(axis = var_6580, x = aw_965_cast_fp16)[name = tensor("op_6738_cast_fp16")]; tensor var_6739_cast_fp16 = softmax(axis = var_6580, x = aw_967_cast_fp16)[name = tensor("op_6739_cast_fp16")]; tensor var_6740_cast_fp16 = softmax(axis = var_6580, x = aw_969_cast_fp16)[name = tensor("op_6740_cast_fp16")]; tensor var_6741_cast_fp16 = softmax(axis = var_6580, x = aw_971_cast_fp16)[name = tensor("op_6741_cast_fp16")]; tensor var_6742_cast_fp16 = softmax(axis = var_6580, x = aw_973_cast_fp16)[name = tensor("op_6742_cast_fp16")]; tensor var_6743_cast_fp16 = softmax(axis = var_6580, x = aw_975_cast_fp16)[name = tensor("op_6743_cast_fp16")]; tensor var_6744_cast_fp16 = softmax(axis = var_6580, x = aw_977_cast_fp16)[name = tensor("op_6744_cast_fp16")]; tensor var_6745_cast_fp16 = softmax(axis = var_6580, x = aw_979_cast_fp16)[name = tensor("op_6745_cast_fp16")]; tensor var_6746_cast_fp16 = softmax(axis = var_6580, x = aw_981_cast_fp16)[name = tensor("op_6746_cast_fp16")]; tensor var_6747_cast_fp16 = softmax(axis = var_6580, x = aw_983_cast_fp16)[name = tensor("op_6747_cast_fp16")]; tensor var_6748_cast_fp16 = softmax(axis = var_6580, x = aw_985_cast_fp16)[name = tensor("op_6748_cast_fp16")]; tensor var_6749_cast_fp16 = softmax(axis = var_6580, x = aw_987_cast_fp16)[name = tensor("op_6749_cast_fp16")]; tensor var_6750_cast_fp16 = softmax(axis = var_6580, x = aw_989_cast_fp16)[name = tensor("op_6750_cast_fp16")]; tensor var_6751_cast_fp16 = softmax(axis = var_6580, x = aw_991_cast_fp16)[name = tensor("op_6751_cast_fp16")]; tensor var_6752_cast_fp16 = softmax(axis = var_6580, x = aw_993_cast_fp16)[name = tensor("op_6752_cast_fp16")]; tensor var_6753_cast_fp16 = softmax(axis = var_6580, x = aw_995_cast_fp16)[name = tensor("op_6753_cast_fp16")]; tensor var_6754_cast_fp16 = softmax(axis = var_6580, x = aw_997_cast_fp16)[name = tensor("op_6754_cast_fp16")]; tensor var_6755_cast_fp16 = softmax(axis = var_6580, x = aw_999_cast_fp16)[name = tensor("op_6755_cast_fp16")]; tensor var_6757_equation_0 = const()[name = tensor("op_6757_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6757_cast_fp16 = einsum(equation = var_6757_equation_0, values = (var_6675_cast_fp16_0, var_6736_cast_fp16))[name = tensor("op_6757_cast_fp16")]; tensor var_6759_equation_0 = const()[name = tensor("op_6759_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6759_cast_fp16 = einsum(equation = var_6759_equation_0, values = (var_6675_cast_fp16_1, var_6737_cast_fp16))[name = tensor("op_6759_cast_fp16")]; tensor var_6761_equation_0 = const()[name = tensor("op_6761_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6761_cast_fp16 = einsum(equation = var_6761_equation_0, values = (var_6675_cast_fp16_2, var_6738_cast_fp16))[name = tensor("op_6761_cast_fp16")]; tensor var_6763_equation_0 = const()[name = tensor("op_6763_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6763_cast_fp16 = einsum(equation = var_6763_equation_0, values = (var_6675_cast_fp16_3, var_6739_cast_fp16))[name = tensor("op_6763_cast_fp16")]; tensor var_6765_equation_0 = const()[name = tensor("op_6765_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6765_cast_fp16 = einsum(equation = var_6765_equation_0, values = (var_6675_cast_fp16_4, var_6740_cast_fp16))[name = tensor("op_6765_cast_fp16")]; tensor var_6767_equation_0 = const()[name = tensor("op_6767_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6767_cast_fp16 = einsum(equation = var_6767_equation_0, values = (var_6675_cast_fp16_5, var_6741_cast_fp16))[name = tensor("op_6767_cast_fp16")]; tensor var_6769_equation_0 = const()[name = tensor("op_6769_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6769_cast_fp16 = einsum(equation = var_6769_equation_0, values = (var_6675_cast_fp16_6, var_6742_cast_fp16))[name = tensor("op_6769_cast_fp16")]; tensor var_6771_equation_0 = const()[name = tensor("op_6771_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6771_cast_fp16 = einsum(equation = var_6771_equation_0, values = (var_6675_cast_fp16_7, var_6743_cast_fp16))[name = tensor("op_6771_cast_fp16")]; tensor var_6773_equation_0 = const()[name = tensor("op_6773_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6773_cast_fp16 = einsum(equation = var_6773_equation_0, values = (var_6675_cast_fp16_8, var_6744_cast_fp16))[name = tensor("op_6773_cast_fp16")]; tensor var_6775_equation_0 = const()[name = tensor("op_6775_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6775_cast_fp16 = einsum(equation = var_6775_equation_0, values = (var_6675_cast_fp16_9, var_6745_cast_fp16))[name = tensor("op_6775_cast_fp16")]; tensor var_6777_equation_0 = const()[name = tensor("op_6777_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6777_cast_fp16 = einsum(equation = var_6777_equation_0, values = (var_6675_cast_fp16_10, var_6746_cast_fp16))[name = tensor("op_6777_cast_fp16")]; tensor var_6779_equation_0 = const()[name = tensor("op_6779_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6779_cast_fp16 = einsum(equation = var_6779_equation_0, values = (var_6675_cast_fp16_11, var_6747_cast_fp16))[name = tensor("op_6779_cast_fp16")]; tensor var_6781_equation_0 = const()[name = tensor("op_6781_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6781_cast_fp16 = einsum(equation = var_6781_equation_0, values = (var_6675_cast_fp16_12, var_6748_cast_fp16))[name = tensor("op_6781_cast_fp16")]; tensor var_6783_equation_0 = const()[name = tensor("op_6783_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6783_cast_fp16 = einsum(equation = var_6783_equation_0, values = (var_6675_cast_fp16_13, var_6749_cast_fp16))[name = tensor("op_6783_cast_fp16")]; tensor var_6785_equation_0 = const()[name = tensor("op_6785_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6785_cast_fp16 = einsum(equation = var_6785_equation_0, values = (var_6675_cast_fp16_14, var_6750_cast_fp16))[name = tensor("op_6785_cast_fp16")]; tensor var_6787_equation_0 = const()[name = tensor("op_6787_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6787_cast_fp16 = einsum(equation = var_6787_equation_0, values = (var_6675_cast_fp16_15, var_6751_cast_fp16))[name = tensor("op_6787_cast_fp16")]; tensor var_6789_equation_0 = const()[name = tensor("op_6789_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6789_cast_fp16 = einsum(equation = var_6789_equation_0, values = (var_6675_cast_fp16_16, var_6752_cast_fp16))[name = tensor("op_6789_cast_fp16")]; tensor var_6791_equation_0 = const()[name = tensor("op_6791_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6791_cast_fp16 = einsum(equation = var_6791_equation_0, values = (var_6675_cast_fp16_17, var_6753_cast_fp16))[name = tensor("op_6791_cast_fp16")]; tensor var_6793_equation_0 = const()[name = tensor("op_6793_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6793_cast_fp16 = einsum(equation = var_6793_equation_0, values = (var_6675_cast_fp16_18, var_6754_cast_fp16))[name = tensor("op_6793_cast_fp16")]; tensor var_6795_equation_0 = const()[name = tensor("op_6795_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_6795_cast_fp16 = einsum(equation = var_6795_equation_0, values = (var_6675_cast_fp16_19, var_6755_cast_fp16))[name = tensor("op_6795_cast_fp16")]; tensor input_245_interleave_0 = const()[name = tensor("input_245_interleave_0"), val = tensor(false)]; tensor input_245_cast_fp16 = concat(axis = var_6580, interleave = input_245_interleave_0, values = (var_6757_cast_fp16, var_6759_cast_fp16, var_6761_cast_fp16, var_6763_cast_fp16, var_6765_cast_fp16, var_6767_cast_fp16, var_6769_cast_fp16, var_6771_cast_fp16, var_6773_cast_fp16, var_6775_cast_fp16, var_6777_cast_fp16, var_6779_cast_fp16, var_6781_cast_fp16, var_6783_cast_fp16, var_6785_cast_fp16, var_6787_cast_fp16, var_6789_cast_fp16, var_6791_cast_fp16, var_6793_cast_fp16, var_6795_cast_fp16))[name = tensor("input_245_cast_fp16")]; tensor var_6804_pad_type_0 = const()[name = tensor("op_6804_pad_type_0"), val = tensor("valid")]; tensor var_6804_strides_0 = const()[name = tensor("op_6804_strides_0"), val = tensor([1, 1])]; tensor var_6804_pad_0 = const()[name = tensor("op_6804_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6804_dilations_0 = const()[name = tensor("op_6804_dilations_0"), val = tensor([1, 1])]; tensor var_6804_groups_0 = const()[name = tensor("op_6804_groups_0"), val = tensor(1)]; tensor blocks_24_attn_out_weight_to_fp16 = const()[name = tensor("blocks_24_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(968978752)))]; tensor blocks_24_attn_out_bias_to_fp16 = const()[name = tensor("blocks_24_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972255616)))]; tensor var_6804_cast_fp16 = conv(bias = blocks_24_attn_out_bias_to_fp16, dilations = var_6804_dilations_0, groups = var_6804_groups_0, pad = var_6804_pad_0, pad_type = var_6804_pad_type_0, strides = var_6804_strides_0, weight = blocks_24_attn_out_weight_to_fp16, x = input_245_cast_fp16)[name = tensor("op_6804_cast_fp16")]; tensor inputs_99_cast_fp16 = add(x = inputs_97_cast_fp16, y = var_6804_cast_fp16)[name = tensor("inputs_99_cast_fp16")]; tensor input_247_axes_0 = const()[name = tensor("input_247_axes_0"), val = tensor([1])]; tensor input_247_gamma_0_to_fp16 = const()[name = tensor("input_247_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972258240)))]; tensor input_247_beta_0_to_fp16 = const()[name = tensor("input_247_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972260864)))]; tensor var_6814_to_fp16 = const()[name = tensor("op_6814_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_247_cast_fp16 = layer_norm(axes = input_247_axes_0, beta = input_247_beta_0_to_fp16, epsilon = var_6814_to_fp16, gamma = input_247_gamma_0_to_fp16, x = inputs_99_cast_fp16)[name = tensor("input_247_cast_fp16")]; tensor input_249_pad_type_0 = const()[name = tensor("input_249_pad_type_0"), val = tensor("valid")]; tensor input_249_strides_0 = const()[name = tensor("input_249_strides_0"), val = tensor([1, 1])]; tensor input_249_pad_0 = const()[name = tensor("input_249_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_249_dilations_0 = const()[name = tensor("input_249_dilations_0"), val = tensor([1, 1])]; tensor input_249_groups_0 = const()[name = tensor("input_249_groups_0"), val = tensor(1)]; tensor blocks_24_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_24_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(972263488)))]; tensor blocks_24_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_24_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(985370752)))]; tensor input_249_cast_fp16 = conv(bias = blocks_24_mlp_0_bias_to_fp16, dilations = input_249_dilations_0, groups = input_249_groups_0, pad = input_249_pad_0, pad_type = input_249_pad_type_0, strides = input_249_strides_0, weight = blocks_24_mlp_0_weight_to_fp16, x = input_247_cast_fp16)[name = tensor("input_249_cast_fp16")]; tensor input_251_mode_0 = const()[name = tensor("input_251_mode_0"), val = tensor("EXACT")]; tensor input_251_cast_fp16 = gelu(mode = input_251_mode_0, x = input_249_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor var_6840_pad_type_0 = const()[name = tensor("op_6840_pad_type_0"), val = tensor("valid")]; tensor var_6840_strides_0 = const()[name = tensor("op_6840_strides_0"), val = tensor([1, 1])]; tensor var_6840_pad_0 = const()[name = tensor("op_6840_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6840_dilations_0 = const()[name = tensor("op_6840_dilations_0"), val = tensor([1, 1])]; tensor var_6840_groups_0 = const()[name = tensor("op_6840_groups_0"), val = tensor(1)]; tensor blocks_24_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_24_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(985381056)))]; tensor blocks_24_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_24_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998488320)))]; tensor var_6840_cast_fp16 = conv(bias = blocks_24_mlp_2_bias_to_fp16, dilations = var_6840_dilations_0, groups = var_6840_groups_0, pad = var_6840_pad_0, pad_type = var_6840_pad_type_0, strides = var_6840_strides_0, weight = blocks_24_mlp_2_weight_to_fp16, x = input_251_cast_fp16)[name = tensor("op_6840_cast_fp16")]; tensor inputs_101_cast_fp16 = add(x = inputs_99_cast_fp16, y = var_6840_cast_fp16)[name = tensor("inputs_101_cast_fp16")]; tensor var_6849 = const()[name = tensor("op_6849"), val = tensor(1)]; tensor input_253_axes_0 = const()[name = tensor("input_253_axes_0"), val = tensor([1])]; tensor input_253_gamma_0_to_fp16 = const()[name = tensor("input_253_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998490944)))]; tensor input_253_beta_0_to_fp16 = const()[name = tensor("input_253_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998493568)))]; tensor var_6865_to_fp16 = const()[name = tensor("op_6865_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_253_cast_fp16 = layer_norm(axes = input_253_axes_0, beta = input_253_beta_0_to_fp16, epsilon = var_6865_to_fp16, gamma = input_253_gamma_0_to_fp16, x = inputs_101_cast_fp16)[name = tensor("input_253_cast_fp16")]; tensor q_51_pad_type_0 = const()[name = tensor("q_51_pad_type_0"), val = tensor("valid")]; tensor q_51_strides_0 = const()[name = tensor("q_51_strides_0"), val = tensor([1, 1])]; tensor q_51_pad_0 = const()[name = tensor("q_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_51_dilations_0 = const()[name = tensor("q_51_dilations_0"), val = tensor([1, 1])]; tensor q_51_groups_0 = const()[name = tensor("q_51_groups_0"), val = tensor(1)]; tensor var_6900_weight_0_to_fp16 = const()[name = tensor("op_6900_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998496192)))]; tensor var_6900_bias_0_to_fp16 = const()[name = tensor("op_6900_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1001773056)))]; tensor var_6900_cast_fp16 = conv(bias = var_6900_bias_0_to_fp16, dilations = q_51_dilations_0, groups = q_51_groups_0, pad = q_51_pad_0, pad_type = q_51_pad_type_0, strides = q_51_strides_0, weight = var_6900_weight_0_to_fp16, x = input_253_cast_fp16)[name = tensor("op_6900_cast_fp16")]; tensor k_51_pad_type_0 = const()[name = tensor("k_51_pad_type_0"), val = tensor("valid")]; tensor k_51_strides_0 = const()[name = tensor("k_51_strides_0"), val = tensor([1, 1])]; tensor k_51_pad_0 = const()[name = tensor("k_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_51_dilations_0 = const()[name = tensor("k_51_dilations_0"), val = tensor([1, 1])]; tensor k_51_groups_0 = const()[name = tensor("k_51_groups_0"), val = tensor(1)]; tensor blocks_25_attn_key_weight_to_fp16 = const()[name = tensor("blocks_25_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1001775680)))]; tensor k_51_cast_fp16 = conv(dilations = k_51_dilations_0, groups = k_51_groups_0, pad = k_51_pad_0, pad_type = k_51_pad_type_0, strides = k_51_strides_0, weight = blocks_25_attn_key_weight_to_fp16, x = input_253_cast_fp16)[name = tensor("k_51_cast_fp16")]; tensor var_6898_pad_type_0 = const()[name = tensor("op_6898_pad_type_0"), val = tensor("valid")]; tensor var_6898_strides_0 = const()[name = tensor("op_6898_strides_0"), val = tensor([1, 1])]; tensor var_6898_pad_0 = const()[name = tensor("op_6898_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_6898_dilations_0 = const()[name = tensor("op_6898_dilations_0"), val = tensor([1, 1])]; tensor var_6898_groups_0 = const()[name = tensor("op_6898_groups_0"), val = tensor(1)]; tensor blocks_25_attn_value_weight_to_fp16 = const()[name = tensor("blocks_25_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1005052544)))]; tensor blocks_25_attn_value_bias_to_fp16 = const()[name = tensor("blocks_25_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1008329408)))]; tensor var_6898_cast_fp16 = conv(bias = blocks_25_attn_value_bias_to_fp16, dilations = var_6898_dilations_0, groups = var_6898_groups_0, pad = var_6898_pad_0, pad_type = var_6898_pad_type_0, strides = var_6898_strides_0, weight = blocks_25_attn_value_weight_to_fp16, x = input_253_cast_fp16)[name = tensor("op_6898_cast_fp16")]; tensor tile_75 = const()[name = tensor("tile_75"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6901_axis_0 = const()[name = tensor("op_6901_axis_0"), val = tensor(1)]; tensor var_6901_cast_fp16_0, tensor var_6901_cast_fp16_1, tensor var_6901_cast_fp16_2, tensor var_6901_cast_fp16_3, tensor var_6901_cast_fp16_4, tensor var_6901_cast_fp16_5, tensor var_6901_cast_fp16_6, tensor var_6901_cast_fp16_7, tensor var_6901_cast_fp16_8, tensor var_6901_cast_fp16_9, tensor var_6901_cast_fp16_10, tensor var_6901_cast_fp16_11, tensor var_6901_cast_fp16_12, tensor var_6901_cast_fp16_13, tensor var_6901_cast_fp16_14, tensor var_6901_cast_fp16_15, tensor var_6901_cast_fp16_16, tensor var_6901_cast_fp16_17, tensor var_6901_cast_fp16_18, tensor var_6901_cast_fp16_19 = split(axis = var_6901_axis_0, split_sizes = tile_75, x = var_6900_cast_fp16)[name = tensor("op_6901_cast_fp16")]; tensor var_6922_perm_0 = const()[name = tensor("op_6922_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_76 = const()[name = tensor("tile_76"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6923_axis_0 = const()[name = tensor("op_6923_axis_0"), val = tensor(3)]; tensor var_6922_cast_fp16 = transpose(perm = var_6922_perm_0, x = k_51_cast_fp16)[name = tensor("transpose_7")]; tensor var_6923_cast_fp16_0, tensor var_6923_cast_fp16_1, tensor var_6923_cast_fp16_2, tensor var_6923_cast_fp16_3, tensor var_6923_cast_fp16_4, tensor var_6923_cast_fp16_5, tensor var_6923_cast_fp16_6, tensor var_6923_cast_fp16_7, tensor var_6923_cast_fp16_8, tensor var_6923_cast_fp16_9, tensor var_6923_cast_fp16_10, tensor var_6923_cast_fp16_11, tensor var_6923_cast_fp16_12, tensor var_6923_cast_fp16_13, tensor var_6923_cast_fp16_14, tensor var_6923_cast_fp16_15, tensor var_6923_cast_fp16_16, tensor var_6923_cast_fp16_17, tensor var_6923_cast_fp16_18, tensor var_6923_cast_fp16_19 = split(axis = var_6923_axis_0, split_sizes = tile_76, x = var_6922_cast_fp16)[name = tensor("op_6923_cast_fp16")]; tensor tile_77 = const()[name = tensor("tile_77"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_6944_axis_0 = const()[name = tensor("op_6944_axis_0"), val = tensor(1)]; tensor var_6944_cast_fp16_0, tensor var_6944_cast_fp16_1, tensor var_6944_cast_fp16_2, tensor var_6944_cast_fp16_3, tensor var_6944_cast_fp16_4, tensor var_6944_cast_fp16_5, tensor var_6944_cast_fp16_6, tensor var_6944_cast_fp16_7, tensor var_6944_cast_fp16_8, tensor var_6944_cast_fp16_9, tensor var_6944_cast_fp16_10, tensor var_6944_cast_fp16_11, tensor var_6944_cast_fp16_12, tensor var_6944_cast_fp16_13, tensor var_6944_cast_fp16_14, tensor var_6944_cast_fp16_15, tensor var_6944_cast_fp16_16, tensor var_6944_cast_fp16_17, tensor var_6944_cast_fp16_18, tensor var_6944_cast_fp16_19 = split(axis = var_6944_axis_0, split_sizes = tile_77, x = var_6898_cast_fp16)[name = tensor("op_6944_cast_fp16")]; tensor aw_1001_equation_0 = const()[name = tensor("aw_1001_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1001_cast_fp16 = einsum(equation = aw_1001_equation_0, values = (var_6923_cast_fp16_0, var_6901_cast_fp16_0))[name = tensor("aw_1001_cast_fp16")]; tensor aw_1003_equation_0 = const()[name = tensor("aw_1003_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1003_cast_fp16 = einsum(equation = aw_1003_equation_0, values = (var_6923_cast_fp16_1, var_6901_cast_fp16_1))[name = tensor("aw_1003_cast_fp16")]; tensor aw_1005_equation_0 = const()[name = tensor("aw_1005_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1005_cast_fp16 = einsum(equation = aw_1005_equation_0, values = (var_6923_cast_fp16_2, var_6901_cast_fp16_2))[name = tensor("aw_1005_cast_fp16")]; tensor aw_1007_equation_0 = const()[name = tensor("aw_1007_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1007_cast_fp16 = einsum(equation = aw_1007_equation_0, values = (var_6923_cast_fp16_3, var_6901_cast_fp16_3))[name = tensor("aw_1007_cast_fp16")]; tensor aw_1009_equation_0 = const()[name = tensor("aw_1009_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1009_cast_fp16 = einsum(equation = aw_1009_equation_0, values = (var_6923_cast_fp16_4, var_6901_cast_fp16_4))[name = tensor("aw_1009_cast_fp16")]; tensor aw_1011_equation_0 = const()[name = tensor("aw_1011_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1011_cast_fp16 = einsum(equation = aw_1011_equation_0, values = (var_6923_cast_fp16_5, var_6901_cast_fp16_5))[name = tensor("aw_1011_cast_fp16")]; tensor aw_1013_equation_0 = const()[name = tensor("aw_1013_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1013_cast_fp16 = einsum(equation = aw_1013_equation_0, values = (var_6923_cast_fp16_6, var_6901_cast_fp16_6))[name = tensor("aw_1013_cast_fp16")]; tensor aw_1015_equation_0 = const()[name = tensor("aw_1015_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1015_cast_fp16 = einsum(equation = aw_1015_equation_0, values = (var_6923_cast_fp16_7, var_6901_cast_fp16_7))[name = tensor("aw_1015_cast_fp16")]; tensor aw_1017_equation_0 = const()[name = tensor("aw_1017_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1017_cast_fp16 = einsum(equation = aw_1017_equation_0, values = (var_6923_cast_fp16_8, var_6901_cast_fp16_8))[name = tensor("aw_1017_cast_fp16")]; tensor aw_1019_equation_0 = const()[name = tensor("aw_1019_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1019_cast_fp16 = einsum(equation = aw_1019_equation_0, values = (var_6923_cast_fp16_9, var_6901_cast_fp16_9))[name = tensor("aw_1019_cast_fp16")]; tensor aw_1021_equation_0 = const()[name = tensor("aw_1021_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1021_cast_fp16 = einsum(equation = aw_1021_equation_0, values = (var_6923_cast_fp16_10, var_6901_cast_fp16_10))[name = tensor("aw_1021_cast_fp16")]; tensor aw_1023_equation_0 = const()[name = tensor("aw_1023_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1023_cast_fp16 = einsum(equation = aw_1023_equation_0, values = (var_6923_cast_fp16_11, var_6901_cast_fp16_11))[name = tensor("aw_1023_cast_fp16")]; tensor aw_1025_equation_0 = const()[name = tensor("aw_1025_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1025_cast_fp16 = einsum(equation = aw_1025_equation_0, values = (var_6923_cast_fp16_12, var_6901_cast_fp16_12))[name = tensor("aw_1025_cast_fp16")]; tensor aw_1027_equation_0 = const()[name = tensor("aw_1027_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1027_cast_fp16 = einsum(equation = aw_1027_equation_0, values = (var_6923_cast_fp16_13, var_6901_cast_fp16_13))[name = tensor("aw_1027_cast_fp16")]; tensor aw_1029_equation_0 = const()[name = tensor("aw_1029_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1029_cast_fp16 = einsum(equation = aw_1029_equation_0, values = (var_6923_cast_fp16_14, var_6901_cast_fp16_14))[name = tensor("aw_1029_cast_fp16")]; tensor aw_1031_equation_0 = const()[name = tensor("aw_1031_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1031_cast_fp16 = einsum(equation = aw_1031_equation_0, values = (var_6923_cast_fp16_15, var_6901_cast_fp16_15))[name = tensor("aw_1031_cast_fp16")]; tensor aw_1033_equation_0 = const()[name = tensor("aw_1033_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1033_cast_fp16 = einsum(equation = aw_1033_equation_0, values = (var_6923_cast_fp16_16, var_6901_cast_fp16_16))[name = tensor("aw_1033_cast_fp16")]; tensor aw_1035_equation_0 = const()[name = tensor("aw_1035_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1035_cast_fp16 = einsum(equation = aw_1035_equation_0, values = (var_6923_cast_fp16_17, var_6901_cast_fp16_17))[name = tensor("aw_1035_cast_fp16")]; tensor aw_1037_equation_0 = const()[name = tensor("aw_1037_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1037_cast_fp16 = einsum(equation = aw_1037_equation_0, values = (var_6923_cast_fp16_18, var_6901_cast_fp16_18))[name = tensor("aw_1037_cast_fp16")]; tensor aw_1039_equation_0 = const()[name = tensor("aw_1039_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1039_cast_fp16 = einsum(equation = aw_1039_equation_0, values = (var_6923_cast_fp16_19, var_6901_cast_fp16_19))[name = tensor("aw_1039_cast_fp16")]; tensor var_7005_cast_fp16 = softmax(axis = var_6849, x = aw_1001_cast_fp16)[name = tensor("op_7005_cast_fp16")]; tensor var_7006_cast_fp16 = softmax(axis = var_6849, x = aw_1003_cast_fp16)[name = tensor("op_7006_cast_fp16")]; tensor var_7007_cast_fp16 = softmax(axis = var_6849, x = aw_1005_cast_fp16)[name = tensor("op_7007_cast_fp16")]; tensor var_7008_cast_fp16 = softmax(axis = var_6849, x = aw_1007_cast_fp16)[name = tensor("op_7008_cast_fp16")]; tensor var_7009_cast_fp16 = softmax(axis = var_6849, x = aw_1009_cast_fp16)[name = tensor("op_7009_cast_fp16")]; tensor var_7010_cast_fp16 = softmax(axis = var_6849, x = aw_1011_cast_fp16)[name = tensor("op_7010_cast_fp16")]; tensor var_7011_cast_fp16 = softmax(axis = var_6849, x = aw_1013_cast_fp16)[name = tensor("op_7011_cast_fp16")]; tensor var_7012_cast_fp16 = softmax(axis = var_6849, x = aw_1015_cast_fp16)[name = tensor("op_7012_cast_fp16")]; tensor var_7013_cast_fp16 = softmax(axis = var_6849, x = aw_1017_cast_fp16)[name = tensor("op_7013_cast_fp16")]; tensor var_7014_cast_fp16 = softmax(axis = var_6849, x = aw_1019_cast_fp16)[name = tensor("op_7014_cast_fp16")]; tensor var_7015_cast_fp16 = softmax(axis = var_6849, x = aw_1021_cast_fp16)[name = tensor("op_7015_cast_fp16")]; tensor var_7016_cast_fp16 = softmax(axis = var_6849, x = aw_1023_cast_fp16)[name = tensor("op_7016_cast_fp16")]; tensor var_7017_cast_fp16 = softmax(axis = var_6849, x = aw_1025_cast_fp16)[name = tensor("op_7017_cast_fp16")]; tensor var_7018_cast_fp16 = softmax(axis = var_6849, x = aw_1027_cast_fp16)[name = tensor("op_7018_cast_fp16")]; tensor var_7019_cast_fp16 = softmax(axis = var_6849, x = aw_1029_cast_fp16)[name = tensor("op_7019_cast_fp16")]; tensor var_7020_cast_fp16 = softmax(axis = var_6849, x = aw_1031_cast_fp16)[name = tensor("op_7020_cast_fp16")]; tensor var_7021_cast_fp16 = softmax(axis = var_6849, x = aw_1033_cast_fp16)[name = tensor("op_7021_cast_fp16")]; tensor var_7022_cast_fp16 = softmax(axis = var_6849, x = aw_1035_cast_fp16)[name = tensor("op_7022_cast_fp16")]; tensor var_7023_cast_fp16 = softmax(axis = var_6849, x = aw_1037_cast_fp16)[name = tensor("op_7023_cast_fp16")]; tensor var_7024_cast_fp16 = softmax(axis = var_6849, x = aw_1039_cast_fp16)[name = tensor("op_7024_cast_fp16")]; tensor var_7026_equation_0 = const()[name = tensor("op_7026_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7026_cast_fp16 = einsum(equation = var_7026_equation_0, values = (var_6944_cast_fp16_0, var_7005_cast_fp16))[name = tensor("op_7026_cast_fp16")]; tensor var_7028_equation_0 = const()[name = tensor("op_7028_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7028_cast_fp16 = einsum(equation = var_7028_equation_0, values = (var_6944_cast_fp16_1, var_7006_cast_fp16))[name = tensor("op_7028_cast_fp16")]; tensor var_7030_equation_0 = const()[name = tensor("op_7030_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7030_cast_fp16 = einsum(equation = var_7030_equation_0, values = (var_6944_cast_fp16_2, var_7007_cast_fp16))[name = tensor("op_7030_cast_fp16")]; tensor var_7032_equation_0 = const()[name = tensor("op_7032_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7032_cast_fp16 = einsum(equation = var_7032_equation_0, values = (var_6944_cast_fp16_3, var_7008_cast_fp16))[name = tensor("op_7032_cast_fp16")]; tensor var_7034_equation_0 = const()[name = tensor("op_7034_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7034_cast_fp16 = einsum(equation = var_7034_equation_0, values = (var_6944_cast_fp16_4, var_7009_cast_fp16))[name = tensor("op_7034_cast_fp16")]; tensor var_7036_equation_0 = const()[name = tensor("op_7036_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7036_cast_fp16 = einsum(equation = var_7036_equation_0, values = (var_6944_cast_fp16_5, var_7010_cast_fp16))[name = tensor("op_7036_cast_fp16")]; tensor var_7038_equation_0 = const()[name = tensor("op_7038_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7038_cast_fp16 = einsum(equation = var_7038_equation_0, values = (var_6944_cast_fp16_6, var_7011_cast_fp16))[name = tensor("op_7038_cast_fp16")]; tensor var_7040_equation_0 = const()[name = tensor("op_7040_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7040_cast_fp16 = einsum(equation = var_7040_equation_0, values = (var_6944_cast_fp16_7, var_7012_cast_fp16))[name = tensor("op_7040_cast_fp16")]; tensor var_7042_equation_0 = const()[name = tensor("op_7042_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7042_cast_fp16 = einsum(equation = var_7042_equation_0, values = (var_6944_cast_fp16_8, var_7013_cast_fp16))[name = tensor("op_7042_cast_fp16")]; tensor var_7044_equation_0 = const()[name = tensor("op_7044_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7044_cast_fp16 = einsum(equation = var_7044_equation_0, values = (var_6944_cast_fp16_9, var_7014_cast_fp16))[name = tensor("op_7044_cast_fp16")]; tensor var_7046_equation_0 = const()[name = tensor("op_7046_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7046_cast_fp16 = einsum(equation = var_7046_equation_0, values = (var_6944_cast_fp16_10, var_7015_cast_fp16))[name = tensor("op_7046_cast_fp16")]; tensor var_7048_equation_0 = const()[name = tensor("op_7048_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7048_cast_fp16 = einsum(equation = var_7048_equation_0, values = (var_6944_cast_fp16_11, var_7016_cast_fp16))[name = tensor("op_7048_cast_fp16")]; tensor var_7050_equation_0 = const()[name = tensor("op_7050_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7050_cast_fp16 = einsum(equation = var_7050_equation_0, values = (var_6944_cast_fp16_12, var_7017_cast_fp16))[name = tensor("op_7050_cast_fp16")]; tensor var_7052_equation_0 = const()[name = tensor("op_7052_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7052_cast_fp16 = einsum(equation = var_7052_equation_0, values = (var_6944_cast_fp16_13, var_7018_cast_fp16))[name = tensor("op_7052_cast_fp16")]; tensor var_7054_equation_0 = const()[name = tensor("op_7054_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7054_cast_fp16 = einsum(equation = var_7054_equation_0, values = (var_6944_cast_fp16_14, var_7019_cast_fp16))[name = tensor("op_7054_cast_fp16")]; tensor var_7056_equation_0 = const()[name = tensor("op_7056_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7056_cast_fp16 = einsum(equation = var_7056_equation_0, values = (var_6944_cast_fp16_15, var_7020_cast_fp16))[name = tensor("op_7056_cast_fp16")]; tensor var_7058_equation_0 = const()[name = tensor("op_7058_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7058_cast_fp16 = einsum(equation = var_7058_equation_0, values = (var_6944_cast_fp16_16, var_7021_cast_fp16))[name = tensor("op_7058_cast_fp16")]; tensor var_7060_equation_0 = const()[name = tensor("op_7060_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7060_cast_fp16 = einsum(equation = var_7060_equation_0, values = (var_6944_cast_fp16_17, var_7022_cast_fp16))[name = tensor("op_7060_cast_fp16")]; tensor var_7062_equation_0 = const()[name = tensor("op_7062_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7062_cast_fp16 = einsum(equation = var_7062_equation_0, values = (var_6944_cast_fp16_18, var_7023_cast_fp16))[name = tensor("op_7062_cast_fp16")]; tensor var_7064_equation_0 = const()[name = tensor("op_7064_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7064_cast_fp16 = einsum(equation = var_7064_equation_0, values = (var_6944_cast_fp16_19, var_7024_cast_fp16))[name = tensor("op_7064_cast_fp16")]; tensor input_255_interleave_0 = const()[name = tensor("input_255_interleave_0"), val = tensor(false)]; tensor input_255_cast_fp16 = concat(axis = var_6849, interleave = input_255_interleave_0, values = (var_7026_cast_fp16, var_7028_cast_fp16, var_7030_cast_fp16, var_7032_cast_fp16, var_7034_cast_fp16, var_7036_cast_fp16, var_7038_cast_fp16, var_7040_cast_fp16, var_7042_cast_fp16, var_7044_cast_fp16, var_7046_cast_fp16, var_7048_cast_fp16, var_7050_cast_fp16, var_7052_cast_fp16, var_7054_cast_fp16, var_7056_cast_fp16, var_7058_cast_fp16, var_7060_cast_fp16, var_7062_cast_fp16, var_7064_cast_fp16))[name = tensor("input_255_cast_fp16")]; tensor var_7073_pad_type_0 = const()[name = tensor("op_7073_pad_type_0"), val = tensor("valid")]; tensor var_7073_strides_0 = const()[name = tensor("op_7073_strides_0"), val = tensor([1, 1])]; tensor var_7073_pad_0 = const()[name = tensor("op_7073_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7073_dilations_0 = const()[name = tensor("op_7073_dilations_0"), val = tensor([1, 1])]; tensor var_7073_groups_0 = const()[name = tensor("op_7073_groups_0"), val = tensor(1)]; tensor blocks_25_attn_out_weight_to_fp16 = const()[name = tensor("blocks_25_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1008332032)))]; tensor blocks_25_attn_out_bias_to_fp16 = const()[name = tensor("blocks_25_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011608896)))]; tensor var_7073_cast_fp16 = conv(bias = blocks_25_attn_out_bias_to_fp16, dilations = var_7073_dilations_0, groups = var_7073_groups_0, pad = var_7073_pad_0, pad_type = var_7073_pad_type_0, strides = var_7073_strides_0, weight = blocks_25_attn_out_weight_to_fp16, x = input_255_cast_fp16)[name = tensor("op_7073_cast_fp16")]; tensor inputs_103_cast_fp16 = add(x = inputs_101_cast_fp16, y = var_7073_cast_fp16)[name = tensor("inputs_103_cast_fp16")]; tensor input_257_axes_0 = const()[name = tensor("input_257_axes_0"), val = tensor([1])]; tensor input_257_gamma_0_to_fp16 = const()[name = tensor("input_257_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011611520)))]; tensor input_257_beta_0_to_fp16 = const()[name = tensor("input_257_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011614144)))]; tensor var_7083_to_fp16 = const()[name = tensor("op_7083_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_257_cast_fp16 = layer_norm(axes = input_257_axes_0, beta = input_257_beta_0_to_fp16, epsilon = var_7083_to_fp16, gamma = input_257_gamma_0_to_fp16, x = inputs_103_cast_fp16)[name = tensor("input_257_cast_fp16")]; tensor input_259_pad_type_0 = const()[name = tensor("input_259_pad_type_0"), val = tensor("valid")]; tensor input_259_strides_0 = const()[name = tensor("input_259_strides_0"), val = tensor([1, 1])]; tensor input_259_pad_0 = const()[name = tensor("input_259_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_259_dilations_0 = const()[name = tensor("input_259_dilations_0"), val = tensor([1, 1])]; tensor input_259_groups_0 = const()[name = tensor("input_259_groups_0"), val = tensor(1)]; tensor blocks_25_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_25_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1011616768)))]; tensor blocks_25_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_25_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1024724032)))]; tensor input_259_cast_fp16 = conv(bias = blocks_25_mlp_0_bias_to_fp16, dilations = input_259_dilations_0, groups = input_259_groups_0, pad = input_259_pad_0, pad_type = input_259_pad_type_0, strides = input_259_strides_0, weight = blocks_25_mlp_0_weight_to_fp16, x = input_257_cast_fp16)[name = tensor("input_259_cast_fp16")]; tensor input_261_mode_0 = const()[name = tensor("input_261_mode_0"), val = tensor("EXACT")]; tensor input_261_cast_fp16 = gelu(mode = input_261_mode_0, x = input_259_cast_fp16)[name = tensor("input_261_cast_fp16")]; tensor var_7109_pad_type_0 = const()[name = tensor("op_7109_pad_type_0"), val = tensor("valid")]; tensor var_7109_strides_0 = const()[name = tensor("op_7109_strides_0"), val = tensor([1, 1])]; tensor var_7109_pad_0 = const()[name = tensor("op_7109_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7109_dilations_0 = const()[name = tensor("op_7109_dilations_0"), val = tensor([1, 1])]; tensor var_7109_groups_0 = const()[name = tensor("op_7109_groups_0"), val = tensor(1)]; tensor blocks_25_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_25_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1024734336)))]; tensor blocks_25_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_25_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037841600)))]; tensor var_7109_cast_fp16 = conv(bias = blocks_25_mlp_2_bias_to_fp16, dilations = var_7109_dilations_0, groups = var_7109_groups_0, pad = var_7109_pad_0, pad_type = var_7109_pad_type_0, strides = var_7109_strides_0, weight = blocks_25_mlp_2_weight_to_fp16, x = input_261_cast_fp16)[name = tensor("op_7109_cast_fp16")]; tensor inputs_105_cast_fp16 = add(x = inputs_103_cast_fp16, y = var_7109_cast_fp16)[name = tensor("inputs_105_cast_fp16")]; tensor var_7118 = const()[name = tensor("op_7118"), val = tensor(1)]; tensor input_263_axes_0 = const()[name = tensor("input_263_axes_0"), val = tensor([1])]; tensor input_263_gamma_0_to_fp16 = const()[name = tensor("input_263_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037844224)))]; tensor input_263_beta_0_to_fp16 = const()[name = tensor("input_263_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037846848)))]; tensor var_7134_to_fp16 = const()[name = tensor("op_7134_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_263_cast_fp16 = layer_norm(axes = input_263_axes_0, beta = input_263_beta_0_to_fp16, epsilon = var_7134_to_fp16, gamma = input_263_gamma_0_to_fp16, x = inputs_105_cast_fp16)[name = tensor("input_263_cast_fp16")]; tensor q_53_pad_type_0 = const()[name = tensor("q_53_pad_type_0"), val = tensor("valid")]; tensor q_53_strides_0 = const()[name = tensor("q_53_strides_0"), val = tensor([1, 1])]; tensor q_53_pad_0 = const()[name = tensor("q_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_53_dilations_0 = const()[name = tensor("q_53_dilations_0"), val = tensor([1, 1])]; tensor q_53_groups_0 = const()[name = tensor("q_53_groups_0"), val = tensor(1)]; tensor var_7169_weight_0_to_fp16 = const()[name = tensor("op_7169_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1037849472)))]; tensor var_7169_bias_0_to_fp16 = const()[name = tensor("op_7169_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1041126336)))]; tensor var_7169_cast_fp16 = conv(bias = var_7169_bias_0_to_fp16, dilations = q_53_dilations_0, groups = q_53_groups_0, pad = q_53_pad_0, pad_type = q_53_pad_type_0, strides = q_53_strides_0, weight = var_7169_weight_0_to_fp16, x = input_263_cast_fp16)[name = tensor("op_7169_cast_fp16")]; tensor k_53_pad_type_0 = const()[name = tensor("k_53_pad_type_0"), val = tensor("valid")]; tensor k_53_strides_0 = const()[name = tensor("k_53_strides_0"), val = tensor([1, 1])]; tensor k_53_pad_0 = const()[name = tensor("k_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_53_dilations_0 = const()[name = tensor("k_53_dilations_0"), val = tensor([1, 1])]; tensor k_53_groups_0 = const()[name = tensor("k_53_groups_0"), val = tensor(1)]; tensor blocks_26_attn_key_weight_to_fp16 = const()[name = tensor("blocks_26_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1041128960)))]; tensor k_53_cast_fp16 = conv(dilations = k_53_dilations_0, groups = k_53_groups_0, pad = k_53_pad_0, pad_type = k_53_pad_type_0, strides = k_53_strides_0, weight = blocks_26_attn_key_weight_to_fp16, x = input_263_cast_fp16)[name = tensor("k_53_cast_fp16")]; tensor var_7167_pad_type_0 = const()[name = tensor("op_7167_pad_type_0"), val = tensor("valid")]; tensor var_7167_strides_0 = const()[name = tensor("op_7167_strides_0"), val = tensor([1, 1])]; tensor var_7167_pad_0 = const()[name = tensor("op_7167_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7167_dilations_0 = const()[name = tensor("op_7167_dilations_0"), val = tensor([1, 1])]; tensor var_7167_groups_0 = const()[name = tensor("op_7167_groups_0"), val = tensor(1)]; tensor blocks_26_attn_value_weight_to_fp16 = const()[name = tensor("blocks_26_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1044405824)))]; tensor blocks_26_attn_value_bias_to_fp16 = const()[name = tensor("blocks_26_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1047682688)))]; tensor var_7167_cast_fp16 = conv(bias = blocks_26_attn_value_bias_to_fp16, dilations = var_7167_dilations_0, groups = var_7167_groups_0, pad = var_7167_pad_0, pad_type = var_7167_pad_type_0, strides = var_7167_strides_0, weight = blocks_26_attn_value_weight_to_fp16, x = input_263_cast_fp16)[name = tensor("op_7167_cast_fp16")]; tensor tile_78 = const()[name = tensor("tile_78"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7170_axis_0 = const()[name = tensor("op_7170_axis_0"), val = tensor(1)]; tensor var_7170_cast_fp16_0, tensor var_7170_cast_fp16_1, tensor var_7170_cast_fp16_2, tensor var_7170_cast_fp16_3, tensor var_7170_cast_fp16_4, tensor var_7170_cast_fp16_5, tensor var_7170_cast_fp16_6, tensor var_7170_cast_fp16_7, tensor var_7170_cast_fp16_8, tensor var_7170_cast_fp16_9, tensor var_7170_cast_fp16_10, tensor var_7170_cast_fp16_11, tensor var_7170_cast_fp16_12, tensor var_7170_cast_fp16_13, tensor var_7170_cast_fp16_14, tensor var_7170_cast_fp16_15, tensor var_7170_cast_fp16_16, tensor var_7170_cast_fp16_17, tensor var_7170_cast_fp16_18, tensor var_7170_cast_fp16_19 = split(axis = var_7170_axis_0, split_sizes = tile_78, x = var_7169_cast_fp16)[name = tensor("op_7170_cast_fp16")]; tensor var_7191_perm_0 = const()[name = tensor("op_7191_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_79 = const()[name = tensor("tile_79"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7192_axis_0 = const()[name = tensor("op_7192_axis_0"), val = tensor(3)]; tensor var_7191_cast_fp16 = transpose(perm = var_7191_perm_0, x = k_53_cast_fp16)[name = tensor("transpose_6")]; tensor var_7192_cast_fp16_0, tensor var_7192_cast_fp16_1, tensor var_7192_cast_fp16_2, tensor var_7192_cast_fp16_3, tensor var_7192_cast_fp16_4, tensor var_7192_cast_fp16_5, tensor var_7192_cast_fp16_6, tensor var_7192_cast_fp16_7, tensor var_7192_cast_fp16_8, tensor var_7192_cast_fp16_9, tensor var_7192_cast_fp16_10, tensor var_7192_cast_fp16_11, tensor var_7192_cast_fp16_12, tensor var_7192_cast_fp16_13, tensor var_7192_cast_fp16_14, tensor var_7192_cast_fp16_15, tensor var_7192_cast_fp16_16, tensor var_7192_cast_fp16_17, tensor var_7192_cast_fp16_18, tensor var_7192_cast_fp16_19 = split(axis = var_7192_axis_0, split_sizes = tile_79, x = var_7191_cast_fp16)[name = tensor("op_7192_cast_fp16")]; tensor tile_80 = const()[name = tensor("tile_80"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7213_axis_0 = const()[name = tensor("op_7213_axis_0"), val = tensor(1)]; tensor var_7213_cast_fp16_0, tensor var_7213_cast_fp16_1, tensor var_7213_cast_fp16_2, tensor var_7213_cast_fp16_3, tensor var_7213_cast_fp16_4, tensor var_7213_cast_fp16_5, tensor var_7213_cast_fp16_6, tensor var_7213_cast_fp16_7, tensor var_7213_cast_fp16_8, tensor var_7213_cast_fp16_9, tensor var_7213_cast_fp16_10, tensor var_7213_cast_fp16_11, tensor var_7213_cast_fp16_12, tensor var_7213_cast_fp16_13, tensor var_7213_cast_fp16_14, tensor var_7213_cast_fp16_15, tensor var_7213_cast_fp16_16, tensor var_7213_cast_fp16_17, tensor var_7213_cast_fp16_18, tensor var_7213_cast_fp16_19 = split(axis = var_7213_axis_0, split_sizes = tile_80, x = var_7167_cast_fp16)[name = tensor("op_7213_cast_fp16")]; tensor aw_1041_equation_0 = const()[name = tensor("aw_1041_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1041_cast_fp16 = einsum(equation = aw_1041_equation_0, values = (var_7192_cast_fp16_0, var_7170_cast_fp16_0))[name = tensor("aw_1041_cast_fp16")]; tensor aw_1043_equation_0 = const()[name = tensor("aw_1043_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1043_cast_fp16 = einsum(equation = aw_1043_equation_0, values = (var_7192_cast_fp16_1, var_7170_cast_fp16_1))[name = tensor("aw_1043_cast_fp16")]; tensor aw_1045_equation_0 = const()[name = tensor("aw_1045_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1045_cast_fp16 = einsum(equation = aw_1045_equation_0, values = (var_7192_cast_fp16_2, var_7170_cast_fp16_2))[name = tensor("aw_1045_cast_fp16")]; tensor aw_1047_equation_0 = const()[name = tensor("aw_1047_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1047_cast_fp16 = einsum(equation = aw_1047_equation_0, values = (var_7192_cast_fp16_3, var_7170_cast_fp16_3))[name = tensor("aw_1047_cast_fp16")]; tensor aw_1049_equation_0 = const()[name = tensor("aw_1049_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1049_cast_fp16 = einsum(equation = aw_1049_equation_0, values = (var_7192_cast_fp16_4, var_7170_cast_fp16_4))[name = tensor("aw_1049_cast_fp16")]; tensor aw_1051_equation_0 = const()[name = tensor("aw_1051_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1051_cast_fp16 = einsum(equation = aw_1051_equation_0, values = (var_7192_cast_fp16_5, var_7170_cast_fp16_5))[name = tensor("aw_1051_cast_fp16")]; tensor aw_1053_equation_0 = const()[name = tensor("aw_1053_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1053_cast_fp16 = einsum(equation = aw_1053_equation_0, values = (var_7192_cast_fp16_6, var_7170_cast_fp16_6))[name = tensor("aw_1053_cast_fp16")]; tensor aw_1055_equation_0 = const()[name = tensor("aw_1055_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1055_cast_fp16 = einsum(equation = aw_1055_equation_0, values = (var_7192_cast_fp16_7, var_7170_cast_fp16_7))[name = tensor("aw_1055_cast_fp16")]; tensor aw_1057_equation_0 = const()[name = tensor("aw_1057_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1057_cast_fp16 = einsum(equation = aw_1057_equation_0, values = (var_7192_cast_fp16_8, var_7170_cast_fp16_8))[name = tensor("aw_1057_cast_fp16")]; tensor aw_1059_equation_0 = const()[name = tensor("aw_1059_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1059_cast_fp16 = einsum(equation = aw_1059_equation_0, values = (var_7192_cast_fp16_9, var_7170_cast_fp16_9))[name = tensor("aw_1059_cast_fp16")]; tensor aw_1061_equation_0 = const()[name = tensor("aw_1061_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1061_cast_fp16 = einsum(equation = aw_1061_equation_0, values = (var_7192_cast_fp16_10, var_7170_cast_fp16_10))[name = tensor("aw_1061_cast_fp16")]; tensor aw_1063_equation_0 = const()[name = tensor("aw_1063_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1063_cast_fp16 = einsum(equation = aw_1063_equation_0, values = (var_7192_cast_fp16_11, var_7170_cast_fp16_11))[name = tensor("aw_1063_cast_fp16")]; tensor aw_1065_equation_0 = const()[name = tensor("aw_1065_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1065_cast_fp16 = einsum(equation = aw_1065_equation_0, values = (var_7192_cast_fp16_12, var_7170_cast_fp16_12))[name = tensor("aw_1065_cast_fp16")]; tensor aw_1067_equation_0 = const()[name = tensor("aw_1067_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1067_cast_fp16 = einsum(equation = aw_1067_equation_0, values = (var_7192_cast_fp16_13, var_7170_cast_fp16_13))[name = tensor("aw_1067_cast_fp16")]; tensor aw_1069_equation_0 = const()[name = tensor("aw_1069_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1069_cast_fp16 = einsum(equation = aw_1069_equation_0, values = (var_7192_cast_fp16_14, var_7170_cast_fp16_14))[name = tensor("aw_1069_cast_fp16")]; tensor aw_1071_equation_0 = const()[name = tensor("aw_1071_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1071_cast_fp16 = einsum(equation = aw_1071_equation_0, values = (var_7192_cast_fp16_15, var_7170_cast_fp16_15))[name = tensor("aw_1071_cast_fp16")]; tensor aw_1073_equation_0 = const()[name = tensor("aw_1073_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1073_cast_fp16 = einsum(equation = aw_1073_equation_0, values = (var_7192_cast_fp16_16, var_7170_cast_fp16_16))[name = tensor("aw_1073_cast_fp16")]; tensor aw_1075_equation_0 = const()[name = tensor("aw_1075_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1075_cast_fp16 = einsum(equation = aw_1075_equation_0, values = (var_7192_cast_fp16_17, var_7170_cast_fp16_17))[name = tensor("aw_1075_cast_fp16")]; tensor aw_1077_equation_0 = const()[name = tensor("aw_1077_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1077_cast_fp16 = einsum(equation = aw_1077_equation_0, values = (var_7192_cast_fp16_18, var_7170_cast_fp16_18))[name = tensor("aw_1077_cast_fp16")]; tensor aw_1079_equation_0 = const()[name = tensor("aw_1079_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1079_cast_fp16 = einsum(equation = aw_1079_equation_0, values = (var_7192_cast_fp16_19, var_7170_cast_fp16_19))[name = tensor("aw_1079_cast_fp16")]; tensor var_7274_cast_fp16 = softmax(axis = var_7118, x = aw_1041_cast_fp16)[name = tensor("op_7274_cast_fp16")]; tensor var_7275_cast_fp16 = softmax(axis = var_7118, x = aw_1043_cast_fp16)[name = tensor("op_7275_cast_fp16")]; tensor var_7276_cast_fp16 = softmax(axis = var_7118, x = aw_1045_cast_fp16)[name = tensor("op_7276_cast_fp16")]; tensor var_7277_cast_fp16 = softmax(axis = var_7118, x = aw_1047_cast_fp16)[name = tensor("op_7277_cast_fp16")]; tensor var_7278_cast_fp16 = softmax(axis = var_7118, x = aw_1049_cast_fp16)[name = tensor("op_7278_cast_fp16")]; tensor var_7279_cast_fp16 = softmax(axis = var_7118, x = aw_1051_cast_fp16)[name = tensor("op_7279_cast_fp16")]; tensor var_7280_cast_fp16 = softmax(axis = var_7118, x = aw_1053_cast_fp16)[name = tensor("op_7280_cast_fp16")]; tensor var_7281_cast_fp16 = softmax(axis = var_7118, x = aw_1055_cast_fp16)[name = tensor("op_7281_cast_fp16")]; tensor var_7282_cast_fp16 = softmax(axis = var_7118, x = aw_1057_cast_fp16)[name = tensor("op_7282_cast_fp16")]; tensor var_7283_cast_fp16 = softmax(axis = var_7118, x = aw_1059_cast_fp16)[name = tensor("op_7283_cast_fp16")]; tensor var_7284_cast_fp16 = softmax(axis = var_7118, x = aw_1061_cast_fp16)[name = tensor("op_7284_cast_fp16")]; tensor var_7285_cast_fp16 = softmax(axis = var_7118, x = aw_1063_cast_fp16)[name = tensor("op_7285_cast_fp16")]; tensor var_7286_cast_fp16 = softmax(axis = var_7118, x = aw_1065_cast_fp16)[name = tensor("op_7286_cast_fp16")]; tensor var_7287_cast_fp16 = softmax(axis = var_7118, x = aw_1067_cast_fp16)[name = tensor("op_7287_cast_fp16")]; tensor var_7288_cast_fp16 = softmax(axis = var_7118, x = aw_1069_cast_fp16)[name = tensor("op_7288_cast_fp16")]; tensor var_7289_cast_fp16 = softmax(axis = var_7118, x = aw_1071_cast_fp16)[name = tensor("op_7289_cast_fp16")]; tensor var_7290_cast_fp16 = softmax(axis = var_7118, x = aw_1073_cast_fp16)[name = tensor("op_7290_cast_fp16")]; tensor var_7291_cast_fp16 = softmax(axis = var_7118, x = aw_1075_cast_fp16)[name = tensor("op_7291_cast_fp16")]; tensor var_7292_cast_fp16 = softmax(axis = var_7118, x = aw_1077_cast_fp16)[name = tensor("op_7292_cast_fp16")]; tensor var_7293_cast_fp16 = softmax(axis = var_7118, x = aw_1079_cast_fp16)[name = tensor("op_7293_cast_fp16")]; tensor var_7295_equation_0 = const()[name = tensor("op_7295_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7295_cast_fp16 = einsum(equation = var_7295_equation_0, values = (var_7213_cast_fp16_0, var_7274_cast_fp16))[name = tensor("op_7295_cast_fp16")]; tensor var_7297_equation_0 = const()[name = tensor("op_7297_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7297_cast_fp16 = einsum(equation = var_7297_equation_0, values = (var_7213_cast_fp16_1, var_7275_cast_fp16))[name = tensor("op_7297_cast_fp16")]; tensor var_7299_equation_0 = const()[name = tensor("op_7299_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7299_cast_fp16 = einsum(equation = var_7299_equation_0, values = (var_7213_cast_fp16_2, var_7276_cast_fp16))[name = tensor("op_7299_cast_fp16")]; tensor var_7301_equation_0 = const()[name = tensor("op_7301_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7301_cast_fp16 = einsum(equation = var_7301_equation_0, values = (var_7213_cast_fp16_3, var_7277_cast_fp16))[name = tensor("op_7301_cast_fp16")]; tensor var_7303_equation_0 = const()[name = tensor("op_7303_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7303_cast_fp16 = einsum(equation = var_7303_equation_0, values = (var_7213_cast_fp16_4, var_7278_cast_fp16))[name = tensor("op_7303_cast_fp16")]; tensor var_7305_equation_0 = const()[name = tensor("op_7305_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7305_cast_fp16 = einsum(equation = var_7305_equation_0, values = (var_7213_cast_fp16_5, var_7279_cast_fp16))[name = tensor("op_7305_cast_fp16")]; tensor var_7307_equation_0 = const()[name = tensor("op_7307_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7307_cast_fp16 = einsum(equation = var_7307_equation_0, values = (var_7213_cast_fp16_6, var_7280_cast_fp16))[name = tensor("op_7307_cast_fp16")]; tensor var_7309_equation_0 = const()[name = tensor("op_7309_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7309_cast_fp16 = einsum(equation = var_7309_equation_0, values = (var_7213_cast_fp16_7, var_7281_cast_fp16))[name = tensor("op_7309_cast_fp16")]; tensor var_7311_equation_0 = const()[name = tensor("op_7311_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7311_cast_fp16 = einsum(equation = var_7311_equation_0, values = (var_7213_cast_fp16_8, var_7282_cast_fp16))[name = tensor("op_7311_cast_fp16")]; tensor var_7313_equation_0 = const()[name = tensor("op_7313_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7313_cast_fp16 = einsum(equation = var_7313_equation_0, values = (var_7213_cast_fp16_9, var_7283_cast_fp16))[name = tensor("op_7313_cast_fp16")]; tensor var_7315_equation_0 = const()[name = tensor("op_7315_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7315_cast_fp16 = einsum(equation = var_7315_equation_0, values = (var_7213_cast_fp16_10, var_7284_cast_fp16))[name = tensor("op_7315_cast_fp16")]; tensor var_7317_equation_0 = const()[name = tensor("op_7317_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7317_cast_fp16 = einsum(equation = var_7317_equation_0, values = (var_7213_cast_fp16_11, var_7285_cast_fp16))[name = tensor("op_7317_cast_fp16")]; tensor var_7319_equation_0 = const()[name = tensor("op_7319_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7319_cast_fp16 = einsum(equation = var_7319_equation_0, values = (var_7213_cast_fp16_12, var_7286_cast_fp16))[name = tensor("op_7319_cast_fp16")]; tensor var_7321_equation_0 = const()[name = tensor("op_7321_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7321_cast_fp16 = einsum(equation = var_7321_equation_0, values = (var_7213_cast_fp16_13, var_7287_cast_fp16))[name = tensor("op_7321_cast_fp16")]; tensor var_7323_equation_0 = const()[name = tensor("op_7323_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7323_cast_fp16 = einsum(equation = var_7323_equation_0, values = (var_7213_cast_fp16_14, var_7288_cast_fp16))[name = tensor("op_7323_cast_fp16")]; tensor var_7325_equation_0 = const()[name = tensor("op_7325_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7325_cast_fp16 = einsum(equation = var_7325_equation_0, values = (var_7213_cast_fp16_15, var_7289_cast_fp16))[name = tensor("op_7325_cast_fp16")]; tensor var_7327_equation_0 = const()[name = tensor("op_7327_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7327_cast_fp16 = einsum(equation = var_7327_equation_0, values = (var_7213_cast_fp16_16, var_7290_cast_fp16))[name = tensor("op_7327_cast_fp16")]; tensor var_7329_equation_0 = const()[name = tensor("op_7329_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7329_cast_fp16 = einsum(equation = var_7329_equation_0, values = (var_7213_cast_fp16_17, var_7291_cast_fp16))[name = tensor("op_7329_cast_fp16")]; tensor var_7331_equation_0 = const()[name = tensor("op_7331_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7331_cast_fp16 = einsum(equation = var_7331_equation_0, values = (var_7213_cast_fp16_18, var_7292_cast_fp16))[name = tensor("op_7331_cast_fp16")]; tensor var_7333_equation_0 = const()[name = tensor("op_7333_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7333_cast_fp16 = einsum(equation = var_7333_equation_0, values = (var_7213_cast_fp16_19, var_7293_cast_fp16))[name = tensor("op_7333_cast_fp16")]; tensor input_265_interleave_0 = const()[name = tensor("input_265_interleave_0"), val = tensor(false)]; tensor input_265_cast_fp16 = concat(axis = var_7118, interleave = input_265_interleave_0, values = (var_7295_cast_fp16, var_7297_cast_fp16, var_7299_cast_fp16, var_7301_cast_fp16, var_7303_cast_fp16, var_7305_cast_fp16, var_7307_cast_fp16, var_7309_cast_fp16, var_7311_cast_fp16, var_7313_cast_fp16, var_7315_cast_fp16, var_7317_cast_fp16, var_7319_cast_fp16, var_7321_cast_fp16, var_7323_cast_fp16, var_7325_cast_fp16, var_7327_cast_fp16, var_7329_cast_fp16, var_7331_cast_fp16, var_7333_cast_fp16))[name = tensor("input_265_cast_fp16")]; tensor var_7342_pad_type_0 = const()[name = tensor("op_7342_pad_type_0"), val = tensor("valid")]; tensor var_7342_strides_0 = const()[name = tensor("op_7342_strides_0"), val = tensor([1, 1])]; tensor var_7342_pad_0 = const()[name = tensor("op_7342_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7342_dilations_0 = const()[name = tensor("op_7342_dilations_0"), val = tensor([1, 1])]; tensor var_7342_groups_0 = const()[name = tensor("op_7342_groups_0"), val = tensor(1)]; tensor blocks_26_attn_out_weight_to_fp16 = const()[name = tensor("blocks_26_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1047685312)))]; tensor blocks_26_attn_out_bias_to_fp16 = const()[name = tensor("blocks_26_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050962176)))]; tensor var_7342_cast_fp16 = conv(bias = blocks_26_attn_out_bias_to_fp16, dilations = var_7342_dilations_0, groups = var_7342_groups_0, pad = var_7342_pad_0, pad_type = var_7342_pad_type_0, strides = var_7342_strides_0, weight = blocks_26_attn_out_weight_to_fp16, x = input_265_cast_fp16)[name = tensor("op_7342_cast_fp16")]; tensor inputs_107_cast_fp16 = add(x = inputs_105_cast_fp16, y = var_7342_cast_fp16)[name = tensor("inputs_107_cast_fp16")]; tensor input_267_axes_0 = const()[name = tensor("input_267_axes_0"), val = tensor([1])]; tensor input_267_gamma_0_to_fp16 = const()[name = tensor("input_267_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050964800)))]; tensor input_267_beta_0_to_fp16 = const()[name = tensor("input_267_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050967424)))]; tensor var_7352_to_fp16 = const()[name = tensor("op_7352_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_267_cast_fp16 = layer_norm(axes = input_267_axes_0, beta = input_267_beta_0_to_fp16, epsilon = var_7352_to_fp16, gamma = input_267_gamma_0_to_fp16, x = inputs_107_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor input_269_pad_type_0 = const()[name = tensor("input_269_pad_type_0"), val = tensor("valid")]; tensor input_269_strides_0 = const()[name = tensor("input_269_strides_0"), val = tensor([1, 1])]; tensor input_269_pad_0 = const()[name = tensor("input_269_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_269_dilations_0 = const()[name = tensor("input_269_dilations_0"), val = tensor([1, 1])]; tensor input_269_groups_0 = const()[name = tensor("input_269_groups_0"), val = tensor(1)]; tensor blocks_26_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_26_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1050970048)))]; tensor blocks_26_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_26_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1064077312)))]; tensor input_269_cast_fp16 = conv(bias = blocks_26_mlp_0_bias_to_fp16, dilations = input_269_dilations_0, groups = input_269_groups_0, pad = input_269_pad_0, pad_type = input_269_pad_type_0, strides = input_269_strides_0, weight = blocks_26_mlp_0_weight_to_fp16, x = input_267_cast_fp16)[name = tensor("input_269_cast_fp16")]; tensor input_271_mode_0 = const()[name = tensor("input_271_mode_0"), val = tensor("EXACT")]; tensor input_271_cast_fp16 = gelu(mode = input_271_mode_0, x = input_269_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor var_7378_pad_type_0 = const()[name = tensor("op_7378_pad_type_0"), val = tensor("valid")]; tensor var_7378_strides_0 = const()[name = tensor("op_7378_strides_0"), val = tensor([1, 1])]; tensor var_7378_pad_0 = const()[name = tensor("op_7378_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7378_dilations_0 = const()[name = tensor("op_7378_dilations_0"), val = tensor([1, 1])]; tensor var_7378_groups_0 = const()[name = tensor("op_7378_groups_0"), val = tensor(1)]; tensor blocks_26_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_26_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1064087616)))]; tensor blocks_26_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_26_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077194880)))]; tensor var_7378_cast_fp16 = conv(bias = blocks_26_mlp_2_bias_to_fp16, dilations = var_7378_dilations_0, groups = var_7378_groups_0, pad = var_7378_pad_0, pad_type = var_7378_pad_type_0, strides = var_7378_strides_0, weight = blocks_26_mlp_2_weight_to_fp16, x = input_271_cast_fp16)[name = tensor("op_7378_cast_fp16")]; tensor inputs_109_cast_fp16 = add(x = inputs_107_cast_fp16, y = var_7378_cast_fp16)[name = tensor("inputs_109_cast_fp16")]; tensor var_7387 = const()[name = tensor("op_7387"), val = tensor(1)]; tensor input_273_axes_0 = const()[name = tensor("input_273_axes_0"), val = tensor([1])]; tensor input_273_gamma_0_to_fp16 = const()[name = tensor("input_273_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077197504)))]; tensor input_273_beta_0_to_fp16 = const()[name = tensor("input_273_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077200128)))]; tensor var_7403_to_fp16 = const()[name = tensor("op_7403_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_273_cast_fp16 = layer_norm(axes = input_273_axes_0, beta = input_273_beta_0_to_fp16, epsilon = var_7403_to_fp16, gamma = input_273_gamma_0_to_fp16, x = inputs_109_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor q_55_pad_type_0 = const()[name = tensor("q_55_pad_type_0"), val = tensor("valid")]; tensor q_55_strides_0 = const()[name = tensor("q_55_strides_0"), val = tensor([1, 1])]; tensor q_55_pad_0 = const()[name = tensor("q_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_55_dilations_0 = const()[name = tensor("q_55_dilations_0"), val = tensor([1, 1])]; tensor q_55_groups_0 = const()[name = tensor("q_55_groups_0"), val = tensor(1)]; tensor var_7438_weight_0_to_fp16 = const()[name = tensor("op_7438_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1077202752)))]; tensor var_7438_bias_0_to_fp16 = const()[name = tensor("op_7438_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1080479616)))]; tensor var_7438_cast_fp16 = conv(bias = var_7438_bias_0_to_fp16, dilations = q_55_dilations_0, groups = q_55_groups_0, pad = q_55_pad_0, pad_type = q_55_pad_type_0, strides = q_55_strides_0, weight = var_7438_weight_0_to_fp16, x = input_273_cast_fp16)[name = tensor("op_7438_cast_fp16")]; tensor k_55_pad_type_0 = const()[name = tensor("k_55_pad_type_0"), val = tensor("valid")]; tensor k_55_strides_0 = const()[name = tensor("k_55_strides_0"), val = tensor([1, 1])]; tensor k_55_pad_0 = const()[name = tensor("k_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_55_dilations_0 = const()[name = tensor("k_55_dilations_0"), val = tensor([1, 1])]; tensor k_55_groups_0 = const()[name = tensor("k_55_groups_0"), val = tensor(1)]; tensor blocks_27_attn_key_weight_to_fp16 = const()[name = tensor("blocks_27_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1080482240)))]; tensor k_55_cast_fp16 = conv(dilations = k_55_dilations_0, groups = k_55_groups_0, pad = k_55_pad_0, pad_type = k_55_pad_type_0, strides = k_55_strides_0, weight = blocks_27_attn_key_weight_to_fp16, x = input_273_cast_fp16)[name = tensor("k_55_cast_fp16")]; tensor var_7436_pad_type_0 = const()[name = tensor("op_7436_pad_type_0"), val = tensor("valid")]; tensor var_7436_strides_0 = const()[name = tensor("op_7436_strides_0"), val = tensor([1, 1])]; tensor var_7436_pad_0 = const()[name = tensor("op_7436_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7436_dilations_0 = const()[name = tensor("op_7436_dilations_0"), val = tensor([1, 1])]; tensor var_7436_groups_0 = const()[name = tensor("op_7436_groups_0"), val = tensor(1)]; tensor blocks_27_attn_value_weight_to_fp16 = const()[name = tensor("blocks_27_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1083759104)))]; tensor blocks_27_attn_value_bias_to_fp16 = const()[name = tensor("blocks_27_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1087035968)))]; tensor var_7436_cast_fp16 = conv(bias = blocks_27_attn_value_bias_to_fp16, dilations = var_7436_dilations_0, groups = var_7436_groups_0, pad = var_7436_pad_0, pad_type = var_7436_pad_type_0, strides = var_7436_strides_0, weight = blocks_27_attn_value_weight_to_fp16, x = input_273_cast_fp16)[name = tensor("op_7436_cast_fp16")]; tensor tile_81 = const()[name = tensor("tile_81"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7439_axis_0 = const()[name = tensor("op_7439_axis_0"), val = tensor(1)]; tensor var_7439_cast_fp16_0, tensor var_7439_cast_fp16_1, tensor var_7439_cast_fp16_2, tensor var_7439_cast_fp16_3, tensor var_7439_cast_fp16_4, tensor var_7439_cast_fp16_5, tensor var_7439_cast_fp16_6, tensor var_7439_cast_fp16_7, tensor var_7439_cast_fp16_8, tensor var_7439_cast_fp16_9, tensor var_7439_cast_fp16_10, tensor var_7439_cast_fp16_11, tensor var_7439_cast_fp16_12, tensor var_7439_cast_fp16_13, tensor var_7439_cast_fp16_14, tensor var_7439_cast_fp16_15, tensor var_7439_cast_fp16_16, tensor var_7439_cast_fp16_17, tensor var_7439_cast_fp16_18, tensor var_7439_cast_fp16_19 = split(axis = var_7439_axis_0, split_sizes = tile_81, x = var_7438_cast_fp16)[name = tensor("op_7439_cast_fp16")]; tensor var_7460_perm_0 = const()[name = tensor("op_7460_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_82 = const()[name = tensor("tile_82"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7461_axis_0 = const()[name = tensor("op_7461_axis_0"), val = tensor(3)]; tensor var_7460_cast_fp16 = transpose(perm = var_7460_perm_0, x = k_55_cast_fp16)[name = tensor("transpose_5")]; tensor var_7461_cast_fp16_0, tensor var_7461_cast_fp16_1, tensor var_7461_cast_fp16_2, tensor var_7461_cast_fp16_3, tensor var_7461_cast_fp16_4, tensor var_7461_cast_fp16_5, tensor var_7461_cast_fp16_6, tensor var_7461_cast_fp16_7, tensor var_7461_cast_fp16_8, tensor var_7461_cast_fp16_9, tensor var_7461_cast_fp16_10, tensor var_7461_cast_fp16_11, tensor var_7461_cast_fp16_12, tensor var_7461_cast_fp16_13, tensor var_7461_cast_fp16_14, tensor var_7461_cast_fp16_15, tensor var_7461_cast_fp16_16, tensor var_7461_cast_fp16_17, tensor var_7461_cast_fp16_18, tensor var_7461_cast_fp16_19 = split(axis = var_7461_axis_0, split_sizes = tile_82, x = var_7460_cast_fp16)[name = tensor("op_7461_cast_fp16")]; tensor tile_83 = const()[name = tensor("tile_83"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7482_axis_0 = const()[name = tensor("op_7482_axis_0"), val = tensor(1)]; tensor var_7482_cast_fp16_0, tensor var_7482_cast_fp16_1, tensor var_7482_cast_fp16_2, tensor var_7482_cast_fp16_3, tensor var_7482_cast_fp16_4, tensor var_7482_cast_fp16_5, tensor var_7482_cast_fp16_6, tensor var_7482_cast_fp16_7, tensor var_7482_cast_fp16_8, tensor var_7482_cast_fp16_9, tensor var_7482_cast_fp16_10, tensor var_7482_cast_fp16_11, tensor var_7482_cast_fp16_12, tensor var_7482_cast_fp16_13, tensor var_7482_cast_fp16_14, tensor var_7482_cast_fp16_15, tensor var_7482_cast_fp16_16, tensor var_7482_cast_fp16_17, tensor var_7482_cast_fp16_18, tensor var_7482_cast_fp16_19 = split(axis = var_7482_axis_0, split_sizes = tile_83, x = var_7436_cast_fp16)[name = tensor("op_7482_cast_fp16")]; tensor aw_1081_equation_0 = const()[name = tensor("aw_1081_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1081_cast_fp16 = einsum(equation = aw_1081_equation_0, values = (var_7461_cast_fp16_0, var_7439_cast_fp16_0))[name = tensor("aw_1081_cast_fp16")]; tensor aw_1083_equation_0 = const()[name = tensor("aw_1083_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1083_cast_fp16 = einsum(equation = aw_1083_equation_0, values = (var_7461_cast_fp16_1, var_7439_cast_fp16_1))[name = tensor("aw_1083_cast_fp16")]; tensor aw_1085_equation_0 = const()[name = tensor("aw_1085_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1085_cast_fp16 = einsum(equation = aw_1085_equation_0, values = (var_7461_cast_fp16_2, var_7439_cast_fp16_2))[name = tensor("aw_1085_cast_fp16")]; tensor aw_1087_equation_0 = const()[name = tensor("aw_1087_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1087_cast_fp16 = einsum(equation = aw_1087_equation_0, values = (var_7461_cast_fp16_3, var_7439_cast_fp16_3))[name = tensor("aw_1087_cast_fp16")]; tensor aw_1089_equation_0 = const()[name = tensor("aw_1089_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1089_cast_fp16 = einsum(equation = aw_1089_equation_0, values = (var_7461_cast_fp16_4, var_7439_cast_fp16_4))[name = tensor("aw_1089_cast_fp16")]; tensor aw_1091_equation_0 = const()[name = tensor("aw_1091_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1091_cast_fp16 = einsum(equation = aw_1091_equation_0, values = (var_7461_cast_fp16_5, var_7439_cast_fp16_5))[name = tensor("aw_1091_cast_fp16")]; tensor aw_1093_equation_0 = const()[name = tensor("aw_1093_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1093_cast_fp16 = einsum(equation = aw_1093_equation_0, values = (var_7461_cast_fp16_6, var_7439_cast_fp16_6))[name = tensor("aw_1093_cast_fp16")]; tensor aw_1095_equation_0 = const()[name = tensor("aw_1095_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1095_cast_fp16 = einsum(equation = aw_1095_equation_0, values = (var_7461_cast_fp16_7, var_7439_cast_fp16_7))[name = tensor("aw_1095_cast_fp16")]; tensor aw_1097_equation_0 = const()[name = tensor("aw_1097_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1097_cast_fp16 = einsum(equation = aw_1097_equation_0, values = (var_7461_cast_fp16_8, var_7439_cast_fp16_8))[name = tensor("aw_1097_cast_fp16")]; tensor aw_1099_equation_0 = const()[name = tensor("aw_1099_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1099_cast_fp16 = einsum(equation = aw_1099_equation_0, values = (var_7461_cast_fp16_9, var_7439_cast_fp16_9))[name = tensor("aw_1099_cast_fp16")]; tensor aw_1101_equation_0 = const()[name = tensor("aw_1101_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1101_cast_fp16 = einsum(equation = aw_1101_equation_0, values = (var_7461_cast_fp16_10, var_7439_cast_fp16_10))[name = tensor("aw_1101_cast_fp16")]; tensor aw_1103_equation_0 = const()[name = tensor("aw_1103_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1103_cast_fp16 = einsum(equation = aw_1103_equation_0, values = (var_7461_cast_fp16_11, var_7439_cast_fp16_11))[name = tensor("aw_1103_cast_fp16")]; tensor aw_1105_equation_0 = const()[name = tensor("aw_1105_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1105_cast_fp16 = einsum(equation = aw_1105_equation_0, values = (var_7461_cast_fp16_12, var_7439_cast_fp16_12))[name = tensor("aw_1105_cast_fp16")]; tensor aw_1107_equation_0 = const()[name = tensor("aw_1107_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1107_cast_fp16 = einsum(equation = aw_1107_equation_0, values = (var_7461_cast_fp16_13, var_7439_cast_fp16_13))[name = tensor("aw_1107_cast_fp16")]; tensor aw_1109_equation_0 = const()[name = tensor("aw_1109_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1109_cast_fp16 = einsum(equation = aw_1109_equation_0, values = (var_7461_cast_fp16_14, var_7439_cast_fp16_14))[name = tensor("aw_1109_cast_fp16")]; tensor aw_1111_equation_0 = const()[name = tensor("aw_1111_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1111_cast_fp16 = einsum(equation = aw_1111_equation_0, values = (var_7461_cast_fp16_15, var_7439_cast_fp16_15))[name = tensor("aw_1111_cast_fp16")]; tensor aw_1113_equation_0 = const()[name = tensor("aw_1113_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1113_cast_fp16 = einsum(equation = aw_1113_equation_0, values = (var_7461_cast_fp16_16, var_7439_cast_fp16_16))[name = tensor("aw_1113_cast_fp16")]; tensor aw_1115_equation_0 = const()[name = tensor("aw_1115_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1115_cast_fp16 = einsum(equation = aw_1115_equation_0, values = (var_7461_cast_fp16_17, var_7439_cast_fp16_17))[name = tensor("aw_1115_cast_fp16")]; tensor aw_1117_equation_0 = const()[name = tensor("aw_1117_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1117_cast_fp16 = einsum(equation = aw_1117_equation_0, values = (var_7461_cast_fp16_18, var_7439_cast_fp16_18))[name = tensor("aw_1117_cast_fp16")]; tensor aw_1119_equation_0 = const()[name = tensor("aw_1119_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1119_cast_fp16 = einsum(equation = aw_1119_equation_0, values = (var_7461_cast_fp16_19, var_7439_cast_fp16_19))[name = tensor("aw_1119_cast_fp16")]; tensor var_7543_cast_fp16 = softmax(axis = var_7387, x = aw_1081_cast_fp16)[name = tensor("op_7543_cast_fp16")]; tensor var_7544_cast_fp16 = softmax(axis = var_7387, x = aw_1083_cast_fp16)[name = tensor("op_7544_cast_fp16")]; tensor var_7545_cast_fp16 = softmax(axis = var_7387, x = aw_1085_cast_fp16)[name = tensor("op_7545_cast_fp16")]; tensor var_7546_cast_fp16 = softmax(axis = var_7387, x = aw_1087_cast_fp16)[name = tensor("op_7546_cast_fp16")]; tensor var_7547_cast_fp16 = softmax(axis = var_7387, x = aw_1089_cast_fp16)[name = tensor("op_7547_cast_fp16")]; tensor var_7548_cast_fp16 = softmax(axis = var_7387, x = aw_1091_cast_fp16)[name = tensor("op_7548_cast_fp16")]; tensor var_7549_cast_fp16 = softmax(axis = var_7387, x = aw_1093_cast_fp16)[name = tensor("op_7549_cast_fp16")]; tensor var_7550_cast_fp16 = softmax(axis = var_7387, x = aw_1095_cast_fp16)[name = tensor("op_7550_cast_fp16")]; tensor var_7551_cast_fp16 = softmax(axis = var_7387, x = aw_1097_cast_fp16)[name = tensor("op_7551_cast_fp16")]; tensor var_7552_cast_fp16 = softmax(axis = var_7387, x = aw_1099_cast_fp16)[name = tensor("op_7552_cast_fp16")]; tensor var_7553_cast_fp16 = softmax(axis = var_7387, x = aw_1101_cast_fp16)[name = tensor("op_7553_cast_fp16")]; tensor var_7554_cast_fp16 = softmax(axis = var_7387, x = aw_1103_cast_fp16)[name = tensor("op_7554_cast_fp16")]; tensor var_7555_cast_fp16 = softmax(axis = var_7387, x = aw_1105_cast_fp16)[name = tensor("op_7555_cast_fp16")]; tensor var_7556_cast_fp16 = softmax(axis = var_7387, x = aw_1107_cast_fp16)[name = tensor("op_7556_cast_fp16")]; tensor var_7557_cast_fp16 = softmax(axis = var_7387, x = aw_1109_cast_fp16)[name = tensor("op_7557_cast_fp16")]; tensor var_7558_cast_fp16 = softmax(axis = var_7387, x = aw_1111_cast_fp16)[name = tensor("op_7558_cast_fp16")]; tensor var_7559_cast_fp16 = softmax(axis = var_7387, x = aw_1113_cast_fp16)[name = tensor("op_7559_cast_fp16")]; tensor var_7560_cast_fp16 = softmax(axis = var_7387, x = aw_1115_cast_fp16)[name = tensor("op_7560_cast_fp16")]; tensor var_7561_cast_fp16 = softmax(axis = var_7387, x = aw_1117_cast_fp16)[name = tensor("op_7561_cast_fp16")]; tensor var_7562_cast_fp16 = softmax(axis = var_7387, x = aw_1119_cast_fp16)[name = tensor("op_7562_cast_fp16")]; tensor var_7564_equation_0 = const()[name = tensor("op_7564_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7564_cast_fp16 = einsum(equation = var_7564_equation_0, values = (var_7482_cast_fp16_0, var_7543_cast_fp16))[name = tensor("op_7564_cast_fp16")]; tensor var_7566_equation_0 = const()[name = tensor("op_7566_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7566_cast_fp16 = einsum(equation = var_7566_equation_0, values = (var_7482_cast_fp16_1, var_7544_cast_fp16))[name = tensor("op_7566_cast_fp16")]; tensor var_7568_equation_0 = const()[name = tensor("op_7568_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7568_cast_fp16 = einsum(equation = var_7568_equation_0, values = (var_7482_cast_fp16_2, var_7545_cast_fp16))[name = tensor("op_7568_cast_fp16")]; tensor var_7570_equation_0 = const()[name = tensor("op_7570_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7570_cast_fp16 = einsum(equation = var_7570_equation_0, values = (var_7482_cast_fp16_3, var_7546_cast_fp16))[name = tensor("op_7570_cast_fp16")]; tensor var_7572_equation_0 = const()[name = tensor("op_7572_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7572_cast_fp16 = einsum(equation = var_7572_equation_0, values = (var_7482_cast_fp16_4, var_7547_cast_fp16))[name = tensor("op_7572_cast_fp16")]; tensor var_7574_equation_0 = const()[name = tensor("op_7574_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7574_cast_fp16 = einsum(equation = var_7574_equation_0, values = (var_7482_cast_fp16_5, var_7548_cast_fp16))[name = tensor("op_7574_cast_fp16")]; tensor var_7576_equation_0 = const()[name = tensor("op_7576_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7576_cast_fp16 = einsum(equation = var_7576_equation_0, values = (var_7482_cast_fp16_6, var_7549_cast_fp16))[name = tensor("op_7576_cast_fp16")]; tensor var_7578_equation_0 = const()[name = tensor("op_7578_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7578_cast_fp16 = einsum(equation = var_7578_equation_0, values = (var_7482_cast_fp16_7, var_7550_cast_fp16))[name = tensor("op_7578_cast_fp16")]; tensor var_7580_equation_0 = const()[name = tensor("op_7580_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7580_cast_fp16 = einsum(equation = var_7580_equation_0, values = (var_7482_cast_fp16_8, var_7551_cast_fp16))[name = tensor("op_7580_cast_fp16")]; tensor var_7582_equation_0 = const()[name = tensor("op_7582_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7582_cast_fp16 = einsum(equation = var_7582_equation_0, values = (var_7482_cast_fp16_9, var_7552_cast_fp16))[name = tensor("op_7582_cast_fp16")]; tensor var_7584_equation_0 = const()[name = tensor("op_7584_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7584_cast_fp16 = einsum(equation = var_7584_equation_0, values = (var_7482_cast_fp16_10, var_7553_cast_fp16))[name = tensor("op_7584_cast_fp16")]; tensor var_7586_equation_0 = const()[name = tensor("op_7586_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7586_cast_fp16 = einsum(equation = var_7586_equation_0, values = (var_7482_cast_fp16_11, var_7554_cast_fp16))[name = tensor("op_7586_cast_fp16")]; tensor var_7588_equation_0 = const()[name = tensor("op_7588_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7588_cast_fp16 = einsum(equation = var_7588_equation_0, values = (var_7482_cast_fp16_12, var_7555_cast_fp16))[name = tensor("op_7588_cast_fp16")]; tensor var_7590_equation_0 = const()[name = tensor("op_7590_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7590_cast_fp16 = einsum(equation = var_7590_equation_0, values = (var_7482_cast_fp16_13, var_7556_cast_fp16))[name = tensor("op_7590_cast_fp16")]; tensor var_7592_equation_0 = const()[name = tensor("op_7592_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7592_cast_fp16 = einsum(equation = var_7592_equation_0, values = (var_7482_cast_fp16_14, var_7557_cast_fp16))[name = tensor("op_7592_cast_fp16")]; tensor var_7594_equation_0 = const()[name = tensor("op_7594_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7594_cast_fp16 = einsum(equation = var_7594_equation_0, values = (var_7482_cast_fp16_15, var_7558_cast_fp16))[name = tensor("op_7594_cast_fp16")]; tensor var_7596_equation_0 = const()[name = tensor("op_7596_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7596_cast_fp16 = einsum(equation = var_7596_equation_0, values = (var_7482_cast_fp16_16, var_7559_cast_fp16))[name = tensor("op_7596_cast_fp16")]; tensor var_7598_equation_0 = const()[name = tensor("op_7598_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7598_cast_fp16 = einsum(equation = var_7598_equation_0, values = (var_7482_cast_fp16_17, var_7560_cast_fp16))[name = tensor("op_7598_cast_fp16")]; tensor var_7600_equation_0 = const()[name = tensor("op_7600_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7600_cast_fp16 = einsum(equation = var_7600_equation_0, values = (var_7482_cast_fp16_18, var_7561_cast_fp16))[name = tensor("op_7600_cast_fp16")]; tensor var_7602_equation_0 = const()[name = tensor("op_7602_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7602_cast_fp16 = einsum(equation = var_7602_equation_0, values = (var_7482_cast_fp16_19, var_7562_cast_fp16))[name = tensor("op_7602_cast_fp16")]; tensor input_275_interleave_0 = const()[name = tensor("input_275_interleave_0"), val = tensor(false)]; tensor input_275_cast_fp16 = concat(axis = var_7387, interleave = input_275_interleave_0, values = (var_7564_cast_fp16, var_7566_cast_fp16, var_7568_cast_fp16, var_7570_cast_fp16, var_7572_cast_fp16, var_7574_cast_fp16, var_7576_cast_fp16, var_7578_cast_fp16, var_7580_cast_fp16, var_7582_cast_fp16, var_7584_cast_fp16, var_7586_cast_fp16, var_7588_cast_fp16, var_7590_cast_fp16, var_7592_cast_fp16, var_7594_cast_fp16, var_7596_cast_fp16, var_7598_cast_fp16, var_7600_cast_fp16, var_7602_cast_fp16))[name = tensor("input_275_cast_fp16")]; tensor var_7611_pad_type_0 = const()[name = tensor("op_7611_pad_type_0"), val = tensor("valid")]; tensor var_7611_strides_0 = const()[name = tensor("op_7611_strides_0"), val = tensor([1, 1])]; tensor var_7611_pad_0 = const()[name = tensor("op_7611_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7611_dilations_0 = const()[name = tensor("op_7611_dilations_0"), val = tensor([1, 1])]; tensor var_7611_groups_0 = const()[name = tensor("op_7611_groups_0"), val = tensor(1)]; tensor blocks_27_attn_out_weight_to_fp16 = const()[name = tensor("blocks_27_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1087038592)))]; tensor blocks_27_attn_out_bias_to_fp16 = const()[name = tensor("blocks_27_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090315456)))]; tensor var_7611_cast_fp16 = conv(bias = blocks_27_attn_out_bias_to_fp16, dilations = var_7611_dilations_0, groups = var_7611_groups_0, pad = var_7611_pad_0, pad_type = var_7611_pad_type_0, strides = var_7611_strides_0, weight = blocks_27_attn_out_weight_to_fp16, x = input_275_cast_fp16)[name = tensor("op_7611_cast_fp16")]; tensor inputs_111_cast_fp16 = add(x = inputs_109_cast_fp16, y = var_7611_cast_fp16)[name = tensor("inputs_111_cast_fp16")]; tensor input_277_axes_0 = const()[name = tensor("input_277_axes_0"), val = tensor([1])]; tensor input_277_gamma_0_to_fp16 = const()[name = tensor("input_277_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090318080)))]; tensor input_277_beta_0_to_fp16 = const()[name = tensor("input_277_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090320704)))]; tensor var_7621_to_fp16 = const()[name = tensor("op_7621_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_277_cast_fp16 = layer_norm(axes = input_277_axes_0, beta = input_277_beta_0_to_fp16, epsilon = var_7621_to_fp16, gamma = input_277_gamma_0_to_fp16, x = inputs_111_cast_fp16)[name = tensor("input_277_cast_fp16")]; tensor input_279_pad_type_0 = const()[name = tensor("input_279_pad_type_0"), val = tensor("valid")]; tensor input_279_strides_0 = const()[name = tensor("input_279_strides_0"), val = tensor([1, 1])]; tensor input_279_pad_0 = const()[name = tensor("input_279_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_279_dilations_0 = const()[name = tensor("input_279_dilations_0"), val = tensor([1, 1])]; tensor input_279_groups_0 = const()[name = tensor("input_279_groups_0"), val = tensor(1)]; tensor blocks_27_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_27_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090323328)))]; tensor blocks_27_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_27_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1103430592)))]; tensor input_279_cast_fp16 = conv(bias = blocks_27_mlp_0_bias_to_fp16, dilations = input_279_dilations_0, groups = input_279_groups_0, pad = input_279_pad_0, pad_type = input_279_pad_type_0, strides = input_279_strides_0, weight = blocks_27_mlp_0_weight_to_fp16, x = input_277_cast_fp16)[name = tensor("input_279_cast_fp16")]; tensor input_281_mode_0 = const()[name = tensor("input_281_mode_0"), val = tensor("EXACT")]; tensor input_281_cast_fp16 = gelu(mode = input_281_mode_0, x = input_279_cast_fp16)[name = tensor("input_281_cast_fp16")]; tensor var_7647_pad_type_0 = const()[name = tensor("op_7647_pad_type_0"), val = tensor("valid")]; tensor var_7647_strides_0 = const()[name = tensor("op_7647_strides_0"), val = tensor([1, 1])]; tensor var_7647_pad_0 = const()[name = tensor("op_7647_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7647_dilations_0 = const()[name = tensor("op_7647_dilations_0"), val = tensor([1, 1])]; tensor var_7647_groups_0 = const()[name = tensor("op_7647_groups_0"), val = tensor(1)]; tensor blocks_27_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_27_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1103440896)))]; tensor blocks_27_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_27_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116548160)))]; tensor var_7647_cast_fp16 = conv(bias = blocks_27_mlp_2_bias_to_fp16, dilations = var_7647_dilations_0, groups = var_7647_groups_0, pad = var_7647_pad_0, pad_type = var_7647_pad_type_0, strides = var_7647_strides_0, weight = blocks_27_mlp_2_weight_to_fp16, x = input_281_cast_fp16)[name = tensor("op_7647_cast_fp16")]; tensor inputs_113_cast_fp16 = add(x = inputs_111_cast_fp16, y = var_7647_cast_fp16)[name = tensor("inputs_113_cast_fp16")]; tensor var_7656 = const()[name = tensor("op_7656"), val = tensor(1)]; tensor input_283_axes_0 = const()[name = tensor("input_283_axes_0"), val = tensor([1])]; tensor input_283_gamma_0_to_fp16 = const()[name = tensor("input_283_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116550784)))]; tensor input_283_beta_0_to_fp16 = const()[name = tensor("input_283_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116553408)))]; tensor var_7672_to_fp16 = const()[name = tensor("op_7672_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_283_cast_fp16 = layer_norm(axes = input_283_axes_0, beta = input_283_beta_0_to_fp16, epsilon = var_7672_to_fp16, gamma = input_283_gamma_0_to_fp16, x = inputs_113_cast_fp16)[name = tensor("input_283_cast_fp16")]; tensor q_57_pad_type_0 = const()[name = tensor("q_57_pad_type_0"), val = tensor("valid")]; tensor q_57_strides_0 = const()[name = tensor("q_57_strides_0"), val = tensor([1, 1])]; tensor q_57_pad_0 = const()[name = tensor("q_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_57_dilations_0 = const()[name = tensor("q_57_dilations_0"), val = tensor([1, 1])]; tensor q_57_groups_0 = const()[name = tensor("q_57_groups_0"), val = tensor(1)]; tensor var_7707_weight_0_to_fp16 = const()[name = tensor("op_7707_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1116556032)))]; tensor var_7707_bias_0_to_fp16 = const()[name = tensor("op_7707_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1119832896)))]; tensor var_7707_cast_fp16 = conv(bias = var_7707_bias_0_to_fp16, dilations = q_57_dilations_0, groups = q_57_groups_0, pad = q_57_pad_0, pad_type = q_57_pad_type_0, strides = q_57_strides_0, weight = var_7707_weight_0_to_fp16, x = input_283_cast_fp16)[name = tensor("op_7707_cast_fp16")]; tensor k_57_pad_type_0 = const()[name = tensor("k_57_pad_type_0"), val = tensor("valid")]; tensor k_57_strides_0 = const()[name = tensor("k_57_strides_0"), val = tensor([1, 1])]; tensor k_57_pad_0 = const()[name = tensor("k_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_57_dilations_0 = const()[name = tensor("k_57_dilations_0"), val = tensor([1, 1])]; tensor k_57_groups_0 = const()[name = tensor("k_57_groups_0"), val = tensor(1)]; tensor blocks_28_attn_key_weight_to_fp16 = const()[name = tensor("blocks_28_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1119835520)))]; tensor k_57_cast_fp16 = conv(dilations = k_57_dilations_0, groups = k_57_groups_0, pad = k_57_pad_0, pad_type = k_57_pad_type_0, strides = k_57_strides_0, weight = blocks_28_attn_key_weight_to_fp16, x = input_283_cast_fp16)[name = tensor("k_57_cast_fp16")]; tensor var_7705_pad_type_0 = const()[name = tensor("op_7705_pad_type_0"), val = tensor("valid")]; tensor var_7705_strides_0 = const()[name = tensor("op_7705_strides_0"), val = tensor([1, 1])]; tensor var_7705_pad_0 = const()[name = tensor("op_7705_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7705_dilations_0 = const()[name = tensor("op_7705_dilations_0"), val = tensor([1, 1])]; tensor var_7705_groups_0 = const()[name = tensor("op_7705_groups_0"), val = tensor(1)]; tensor blocks_28_attn_value_weight_to_fp16 = const()[name = tensor("blocks_28_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1123112384)))]; tensor blocks_28_attn_value_bias_to_fp16 = const()[name = tensor("blocks_28_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126389248)))]; tensor var_7705_cast_fp16 = conv(bias = blocks_28_attn_value_bias_to_fp16, dilations = var_7705_dilations_0, groups = var_7705_groups_0, pad = var_7705_pad_0, pad_type = var_7705_pad_type_0, strides = var_7705_strides_0, weight = blocks_28_attn_value_weight_to_fp16, x = input_283_cast_fp16)[name = tensor("op_7705_cast_fp16")]; tensor tile_84 = const()[name = tensor("tile_84"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7708_axis_0 = const()[name = tensor("op_7708_axis_0"), val = tensor(1)]; tensor var_7708_cast_fp16_0, tensor var_7708_cast_fp16_1, tensor var_7708_cast_fp16_2, tensor var_7708_cast_fp16_3, tensor var_7708_cast_fp16_4, tensor var_7708_cast_fp16_5, tensor var_7708_cast_fp16_6, tensor var_7708_cast_fp16_7, tensor var_7708_cast_fp16_8, tensor var_7708_cast_fp16_9, tensor var_7708_cast_fp16_10, tensor var_7708_cast_fp16_11, tensor var_7708_cast_fp16_12, tensor var_7708_cast_fp16_13, tensor var_7708_cast_fp16_14, tensor var_7708_cast_fp16_15, tensor var_7708_cast_fp16_16, tensor var_7708_cast_fp16_17, tensor var_7708_cast_fp16_18, tensor var_7708_cast_fp16_19 = split(axis = var_7708_axis_0, split_sizes = tile_84, x = var_7707_cast_fp16)[name = tensor("op_7708_cast_fp16")]; tensor var_7729_perm_0 = const()[name = tensor("op_7729_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_85 = const()[name = tensor("tile_85"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7730_axis_0 = const()[name = tensor("op_7730_axis_0"), val = tensor(3)]; tensor var_7729_cast_fp16 = transpose(perm = var_7729_perm_0, x = k_57_cast_fp16)[name = tensor("transpose_4")]; tensor var_7730_cast_fp16_0, tensor var_7730_cast_fp16_1, tensor var_7730_cast_fp16_2, tensor var_7730_cast_fp16_3, tensor var_7730_cast_fp16_4, tensor var_7730_cast_fp16_5, tensor var_7730_cast_fp16_6, tensor var_7730_cast_fp16_7, tensor var_7730_cast_fp16_8, tensor var_7730_cast_fp16_9, tensor var_7730_cast_fp16_10, tensor var_7730_cast_fp16_11, tensor var_7730_cast_fp16_12, tensor var_7730_cast_fp16_13, tensor var_7730_cast_fp16_14, tensor var_7730_cast_fp16_15, tensor var_7730_cast_fp16_16, tensor var_7730_cast_fp16_17, tensor var_7730_cast_fp16_18, tensor var_7730_cast_fp16_19 = split(axis = var_7730_axis_0, split_sizes = tile_85, x = var_7729_cast_fp16)[name = tensor("op_7730_cast_fp16")]; tensor tile_86 = const()[name = tensor("tile_86"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7751_axis_0 = const()[name = tensor("op_7751_axis_0"), val = tensor(1)]; tensor var_7751_cast_fp16_0, tensor var_7751_cast_fp16_1, tensor var_7751_cast_fp16_2, tensor var_7751_cast_fp16_3, tensor var_7751_cast_fp16_4, tensor var_7751_cast_fp16_5, tensor var_7751_cast_fp16_6, tensor var_7751_cast_fp16_7, tensor var_7751_cast_fp16_8, tensor var_7751_cast_fp16_9, tensor var_7751_cast_fp16_10, tensor var_7751_cast_fp16_11, tensor var_7751_cast_fp16_12, tensor var_7751_cast_fp16_13, tensor var_7751_cast_fp16_14, tensor var_7751_cast_fp16_15, tensor var_7751_cast_fp16_16, tensor var_7751_cast_fp16_17, tensor var_7751_cast_fp16_18, tensor var_7751_cast_fp16_19 = split(axis = var_7751_axis_0, split_sizes = tile_86, x = var_7705_cast_fp16)[name = tensor("op_7751_cast_fp16")]; tensor aw_1121_equation_0 = const()[name = tensor("aw_1121_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1121_cast_fp16 = einsum(equation = aw_1121_equation_0, values = (var_7730_cast_fp16_0, var_7708_cast_fp16_0))[name = tensor("aw_1121_cast_fp16")]; tensor aw_1123_equation_0 = const()[name = tensor("aw_1123_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1123_cast_fp16 = einsum(equation = aw_1123_equation_0, values = (var_7730_cast_fp16_1, var_7708_cast_fp16_1))[name = tensor("aw_1123_cast_fp16")]; tensor aw_1125_equation_0 = const()[name = tensor("aw_1125_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1125_cast_fp16 = einsum(equation = aw_1125_equation_0, values = (var_7730_cast_fp16_2, var_7708_cast_fp16_2))[name = tensor("aw_1125_cast_fp16")]; tensor aw_1127_equation_0 = const()[name = tensor("aw_1127_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1127_cast_fp16 = einsum(equation = aw_1127_equation_0, values = (var_7730_cast_fp16_3, var_7708_cast_fp16_3))[name = tensor("aw_1127_cast_fp16")]; tensor aw_1129_equation_0 = const()[name = tensor("aw_1129_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1129_cast_fp16 = einsum(equation = aw_1129_equation_0, values = (var_7730_cast_fp16_4, var_7708_cast_fp16_4))[name = tensor("aw_1129_cast_fp16")]; tensor aw_1131_equation_0 = const()[name = tensor("aw_1131_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1131_cast_fp16 = einsum(equation = aw_1131_equation_0, values = (var_7730_cast_fp16_5, var_7708_cast_fp16_5))[name = tensor("aw_1131_cast_fp16")]; tensor aw_1133_equation_0 = const()[name = tensor("aw_1133_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1133_cast_fp16 = einsum(equation = aw_1133_equation_0, values = (var_7730_cast_fp16_6, var_7708_cast_fp16_6))[name = tensor("aw_1133_cast_fp16")]; tensor aw_1135_equation_0 = const()[name = tensor("aw_1135_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1135_cast_fp16 = einsum(equation = aw_1135_equation_0, values = (var_7730_cast_fp16_7, var_7708_cast_fp16_7))[name = tensor("aw_1135_cast_fp16")]; tensor aw_1137_equation_0 = const()[name = tensor("aw_1137_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1137_cast_fp16 = einsum(equation = aw_1137_equation_0, values = (var_7730_cast_fp16_8, var_7708_cast_fp16_8))[name = tensor("aw_1137_cast_fp16")]; tensor aw_1139_equation_0 = const()[name = tensor("aw_1139_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1139_cast_fp16 = einsum(equation = aw_1139_equation_0, values = (var_7730_cast_fp16_9, var_7708_cast_fp16_9))[name = tensor("aw_1139_cast_fp16")]; tensor aw_1141_equation_0 = const()[name = tensor("aw_1141_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1141_cast_fp16 = einsum(equation = aw_1141_equation_0, values = (var_7730_cast_fp16_10, var_7708_cast_fp16_10))[name = tensor("aw_1141_cast_fp16")]; tensor aw_1143_equation_0 = const()[name = tensor("aw_1143_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1143_cast_fp16 = einsum(equation = aw_1143_equation_0, values = (var_7730_cast_fp16_11, var_7708_cast_fp16_11))[name = tensor("aw_1143_cast_fp16")]; tensor aw_1145_equation_0 = const()[name = tensor("aw_1145_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1145_cast_fp16 = einsum(equation = aw_1145_equation_0, values = (var_7730_cast_fp16_12, var_7708_cast_fp16_12))[name = tensor("aw_1145_cast_fp16")]; tensor aw_1147_equation_0 = const()[name = tensor("aw_1147_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1147_cast_fp16 = einsum(equation = aw_1147_equation_0, values = (var_7730_cast_fp16_13, var_7708_cast_fp16_13))[name = tensor("aw_1147_cast_fp16")]; tensor aw_1149_equation_0 = const()[name = tensor("aw_1149_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1149_cast_fp16 = einsum(equation = aw_1149_equation_0, values = (var_7730_cast_fp16_14, var_7708_cast_fp16_14))[name = tensor("aw_1149_cast_fp16")]; tensor aw_1151_equation_0 = const()[name = tensor("aw_1151_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1151_cast_fp16 = einsum(equation = aw_1151_equation_0, values = (var_7730_cast_fp16_15, var_7708_cast_fp16_15))[name = tensor("aw_1151_cast_fp16")]; tensor aw_1153_equation_0 = const()[name = tensor("aw_1153_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1153_cast_fp16 = einsum(equation = aw_1153_equation_0, values = (var_7730_cast_fp16_16, var_7708_cast_fp16_16))[name = tensor("aw_1153_cast_fp16")]; tensor aw_1155_equation_0 = const()[name = tensor("aw_1155_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1155_cast_fp16 = einsum(equation = aw_1155_equation_0, values = (var_7730_cast_fp16_17, var_7708_cast_fp16_17))[name = tensor("aw_1155_cast_fp16")]; tensor aw_1157_equation_0 = const()[name = tensor("aw_1157_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1157_cast_fp16 = einsum(equation = aw_1157_equation_0, values = (var_7730_cast_fp16_18, var_7708_cast_fp16_18))[name = tensor("aw_1157_cast_fp16")]; tensor aw_1159_equation_0 = const()[name = tensor("aw_1159_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1159_cast_fp16 = einsum(equation = aw_1159_equation_0, values = (var_7730_cast_fp16_19, var_7708_cast_fp16_19))[name = tensor("aw_1159_cast_fp16")]; tensor var_7812_cast_fp16 = softmax(axis = var_7656, x = aw_1121_cast_fp16)[name = tensor("op_7812_cast_fp16")]; tensor var_7813_cast_fp16 = softmax(axis = var_7656, x = aw_1123_cast_fp16)[name = tensor("op_7813_cast_fp16")]; tensor var_7814_cast_fp16 = softmax(axis = var_7656, x = aw_1125_cast_fp16)[name = tensor("op_7814_cast_fp16")]; tensor var_7815_cast_fp16 = softmax(axis = var_7656, x = aw_1127_cast_fp16)[name = tensor("op_7815_cast_fp16")]; tensor var_7816_cast_fp16 = softmax(axis = var_7656, x = aw_1129_cast_fp16)[name = tensor("op_7816_cast_fp16")]; tensor var_7817_cast_fp16 = softmax(axis = var_7656, x = aw_1131_cast_fp16)[name = tensor("op_7817_cast_fp16")]; tensor var_7818_cast_fp16 = softmax(axis = var_7656, x = aw_1133_cast_fp16)[name = tensor("op_7818_cast_fp16")]; tensor var_7819_cast_fp16 = softmax(axis = var_7656, x = aw_1135_cast_fp16)[name = tensor("op_7819_cast_fp16")]; tensor var_7820_cast_fp16 = softmax(axis = var_7656, x = aw_1137_cast_fp16)[name = tensor("op_7820_cast_fp16")]; tensor var_7821_cast_fp16 = softmax(axis = var_7656, x = aw_1139_cast_fp16)[name = tensor("op_7821_cast_fp16")]; tensor var_7822_cast_fp16 = softmax(axis = var_7656, x = aw_1141_cast_fp16)[name = tensor("op_7822_cast_fp16")]; tensor var_7823_cast_fp16 = softmax(axis = var_7656, x = aw_1143_cast_fp16)[name = tensor("op_7823_cast_fp16")]; tensor var_7824_cast_fp16 = softmax(axis = var_7656, x = aw_1145_cast_fp16)[name = tensor("op_7824_cast_fp16")]; tensor var_7825_cast_fp16 = softmax(axis = var_7656, x = aw_1147_cast_fp16)[name = tensor("op_7825_cast_fp16")]; tensor var_7826_cast_fp16 = softmax(axis = var_7656, x = aw_1149_cast_fp16)[name = tensor("op_7826_cast_fp16")]; tensor var_7827_cast_fp16 = softmax(axis = var_7656, x = aw_1151_cast_fp16)[name = tensor("op_7827_cast_fp16")]; tensor var_7828_cast_fp16 = softmax(axis = var_7656, x = aw_1153_cast_fp16)[name = tensor("op_7828_cast_fp16")]; tensor var_7829_cast_fp16 = softmax(axis = var_7656, x = aw_1155_cast_fp16)[name = tensor("op_7829_cast_fp16")]; tensor var_7830_cast_fp16 = softmax(axis = var_7656, x = aw_1157_cast_fp16)[name = tensor("op_7830_cast_fp16")]; tensor var_7831_cast_fp16 = softmax(axis = var_7656, x = aw_1159_cast_fp16)[name = tensor("op_7831_cast_fp16")]; tensor var_7833_equation_0 = const()[name = tensor("op_7833_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7833_cast_fp16 = einsum(equation = var_7833_equation_0, values = (var_7751_cast_fp16_0, var_7812_cast_fp16))[name = tensor("op_7833_cast_fp16")]; tensor var_7835_equation_0 = const()[name = tensor("op_7835_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7835_cast_fp16 = einsum(equation = var_7835_equation_0, values = (var_7751_cast_fp16_1, var_7813_cast_fp16))[name = tensor("op_7835_cast_fp16")]; tensor var_7837_equation_0 = const()[name = tensor("op_7837_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7837_cast_fp16 = einsum(equation = var_7837_equation_0, values = (var_7751_cast_fp16_2, var_7814_cast_fp16))[name = tensor("op_7837_cast_fp16")]; tensor var_7839_equation_0 = const()[name = tensor("op_7839_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7839_cast_fp16 = einsum(equation = var_7839_equation_0, values = (var_7751_cast_fp16_3, var_7815_cast_fp16))[name = tensor("op_7839_cast_fp16")]; tensor var_7841_equation_0 = const()[name = tensor("op_7841_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7841_cast_fp16 = einsum(equation = var_7841_equation_0, values = (var_7751_cast_fp16_4, var_7816_cast_fp16))[name = tensor("op_7841_cast_fp16")]; tensor var_7843_equation_0 = const()[name = tensor("op_7843_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7843_cast_fp16 = einsum(equation = var_7843_equation_0, values = (var_7751_cast_fp16_5, var_7817_cast_fp16))[name = tensor("op_7843_cast_fp16")]; tensor var_7845_equation_0 = const()[name = tensor("op_7845_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7845_cast_fp16 = einsum(equation = var_7845_equation_0, values = (var_7751_cast_fp16_6, var_7818_cast_fp16))[name = tensor("op_7845_cast_fp16")]; tensor var_7847_equation_0 = const()[name = tensor("op_7847_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7847_cast_fp16 = einsum(equation = var_7847_equation_0, values = (var_7751_cast_fp16_7, var_7819_cast_fp16))[name = tensor("op_7847_cast_fp16")]; tensor var_7849_equation_0 = const()[name = tensor("op_7849_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7849_cast_fp16 = einsum(equation = var_7849_equation_0, values = (var_7751_cast_fp16_8, var_7820_cast_fp16))[name = tensor("op_7849_cast_fp16")]; tensor var_7851_equation_0 = const()[name = tensor("op_7851_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7851_cast_fp16 = einsum(equation = var_7851_equation_0, values = (var_7751_cast_fp16_9, var_7821_cast_fp16))[name = tensor("op_7851_cast_fp16")]; tensor var_7853_equation_0 = const()[name = tensor("op_7853_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7853_cast_fp16 = einsum(equation = var_7853_equation_0, values = (var_7751_cast_fp16_10, var_7822_cast_fp16))[name = tensor("op_7853_cast_fp16")]; tensor var_7855_equation_0 = const()[name = tensor("op_7855_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7855_cast_fp16 = einsum(equation = var_7855_equation_0, values = (var_7751_cast_fp16_11, var_7823_cast_fp16))[name = tensor("op_7855_cast_fp16")]; tensor var_7857_equation_0 = const()[name = tensor("op_7857_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7857_cast_fp16 = einsum(equation = var_7857_equation_0, values = (var_7751_cast_fp16_12, var_7824_cast_fp16))[name = tensor("op_7857_cast_fp16")]; tensor var_7859_equation_0 = const()[name = tensor("op_7859_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7859_cast_fp16 = einsum(equation = var_7859_equation_0, values = (var_7751_cast_fp16_13, var_7825_cast_fp16))[name = tensor("op_7859_cast_fp16")]; tensor var_7861_equation_0 = const()[name = tensor("op_7861_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7861_cast_fp16 = einsum(equation = var_7861_equation_0, values = (var_7751_cast_fp16_14, var_7826_cast_fp16))[name = tensor("op_7861_cast_fp16")]; tensor var_7863_equation_0 = const()[name = tensor("op_7863_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7863_cast_fp16 = einsum(equation = var_7863_equation_0, values = (var_7751_cast_fp16_15, var_7827_cast_fp16))[name = tensor("op_7863_cast_fp16")]; tensor var_7865_equation_0 = const()[name = tensor("op_7865_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7865_cast_fp16 = einsum(equation = var_7865_equation_0, values = (var_7751_cast_fp16_16, var_7828_cast_fp16))[name = tensor("op_7865_cast_fp16")]; tensor var_7867_equation_0 = const()[name = tensor("op_7867_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7867_cast_fp16 = einsum(equation = var_7867_equation_0, values = (var_7751_cast_fp16_17, var_7829_cast_fp16))[name = tensor("op_7867_cast_fp16")]; tensor var_7869_equation_0 = const()[name = tensor("op_7869_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7869_cast_fp16 = einsum(equation = var_7869_equation_0, values = (var_7751_cast_fp16_18, var_7830_cast_fp16))[name = tensor("op_7869_cast_fp16")]; tensor var_7871_equation_0 = const()[name = tensor("op_7871_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_7871_cast_fp16 = einsum(equation = var_7871_equation_0, values = (var_7751_cast_fp16_19, var_7831_cast_fp16))[name = tensor("op_7871_cast_fp16")]; tensor input_285_interleave_0 = const()[name = tensor("input_285_interleave_0"), val = tensor(false)]; tensor input_285_cast_fp16 = concat(axis = var_7656, interleave = input_285_interleave_0, values = (var_7833_cast_fp16, var_7835_cast_fp16, var_7837_cast_fp16, var_7839_cast_fp16, var_7841_cast_fp16, var_7843_cast_fp16, var_7845_cast_fp16, var_7847_cast_fp16, var_7849_cast_fp16, var_7851_cast_fp16, var_7853_cast_fp16, var_7855_cast_fp16, var_7857_cast_fp16, var_7859_cast_fp16, var_7861_cast_fp16, var_7863_cast_fp16, var_7865_cast_fp16, var_7867_cast_fp16, var_7869_cast_fp16, var_7871_cast_fp16))[name = tensor("input_285_cast_fp16")]; tensor var_7880_pad_type_0 = const()[name = tensor("op_7880_pad_type_0"), val = tensor("valid")]; tensor var_7880_strides_0 = const()[name = tensor("op_7880_strides_0"), val = tensor([1, 1])]; tensor var_7880_pad_0 = const()[name = tensor("op_7880_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7880_dilations_0 = const()[name = tensor("op_7880_dilations_0"), val = tensor([1, 1])]; tensor var_7880_groups_0 = const()[name = tensor("op_7880_groups_0"), val = tensor(1)]; tensor blocks_28_attn_out_weight_to_fp16 = const()[name = tensor("blocks_28_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126391872)))]; tensor blocks_28_attn_out_bias_to_fp16 = const()[name = tensor("blocks_28_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129668736)))]; tensor var_7880_cast_fp16 = conv(bias = blocks_28_attn_out_bias_to_fp16, dilations = var_7880_dilations_0, groups = var_7880_groups_0, pad = var_7880_pad_0, pad_type = var_7880_pad_type_0, strides = var_7880_strides_0, weight = blocks_28_attn_out_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("op_7880_cast_fp16")]; tensor inputs_115_cast_fp16 = add(x = inputs_113_cast_fp16, y = var_7880_cast_fp16)[name = tensor("inputs_115_cast_fp16")]; tensor input_287_axes_0 = const()[name = tensor("input_287_axes_0"), val = tensor([1])]; tensor input_287_gamma_0_to_fp16 = const()[name = tensor("input_287_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129671360)))]; tensor input_287_beta_0_to_fp16 = const()[name = tensor("input_287_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129673984)))]; tensor var_7890_to_fp16 = const()[name = tensor("op_7890_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_287_cast_fp16 = layer_norm(axes = input_287_axes_0, beta = input_287_beta_0_to_fp16, epsilon = var_7890_to_fp16, gamma = input_287_gamma_0_to_fp16, x = inputs_115_cast_fp16)[name = tensor("input_287_cast_fp16")]; tensor input_289_pad_type_0 = const()[name = tensor("input_289_pad_type_0"), val = tensor("valid")]; tensor input_289_strides_0 = const()[name = tensor("input_289_strides_0"), val = tensor([1, 1])]; tensor input_289_pad_0 = const()[name = tensor("input_289_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_289_dilations_0 = const()[name = tensor("input_289_dilations_0"), val = tensor([1, 1])]; tensor input_289_groups_0 = const()[name = tensor("input_289_groups_0"), val = tensor(1)]; tensor blocks_28_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_28_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129676608)))]; tensor blocks_28_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_28_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142783872)))]; tensor input_289_cast_fp16 = conv(bias = blocks_28_mlp_0_bias_to_fp16, dilations = input_289_dilations_0, groups = input_289_groups_0, pad = input_289_pad_0, pad_type = input_289_pad_type_0, strides = input_289_strides_0, weight = blocks_28_mlp_0_weight_to_fp16, x = input_287_cast_fp16)[name = tensor("input_289_cast_fp16")]; tensor input_291_mode_0 = const()[name = tensor("input_291_mode_0"), val = tensor("EXACT")]; tensor input_291_cast_fp16 = gelu(mode = input_291_mode_0, x = input_289_cast_fp16)[name = tensor("input_291_cast_fp16")]; tensor var_7916_pad_type_0 = const()[name = tensor("op_7916_pad_type_0"), val = tensor("valid")]; tensor var_7916_strides_0 = const()[name = tensor("op_7916_strides_0"), val = tensor([1, 1])]; tensor var_7916_pad_0 = const()[name = tensor("op_7916_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7916_dilations_0 = const()[name = tensor("op_7916_dilations_0"), val = tensor([1, 1])]; tensor var_7916_groups_0 = const()[name = tensor("op_7916_groups_0"), val = tensor(1)]; tensor blocks_28_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_28_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142794176)))]; tensor blocks_28_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_28_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155901440)))]; tensor var_7916_cast_fp16 = conv(bias = blocks_28_mlp_2_bias_to_fp16, dilations = var_7916_dilations_0, groups = var_7916_groups_0, pad = var_7916_pad_0, pad_type = var_7916_pad_type_0, strides = var_7916_strides_0, weight = blocks_28_mlp_2_weight_to_fp16, x = input_291_cast_fp16)[name = tensor("op_7916_cast_fp16")]; tensor inputs_117_cast_fp16 = add(x = inputs_115_cast_fp16, y = var_7916_cast_fp16)[name = tensor("inputs_117_cast_fp16")]; tensor var_7925 = const()[name = tensor("op_7925"), val = tensor(1)]; tensor input_293_axes_0 = const()[name = tensor("input_293_axes_0"), val = tensor([1])]; tensor input_293_gamma_0_to_fp16 = const()[name = tensor("input_293_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155904064)))]; tensor input_293_beta_0_to_fp16 = const()[name = tensor("input_293_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155906688)))]; tensor var_7941_to_fp16 = const()[name = tensor("op_7941_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_293_cast_fp16 = layer_norm(axes = input_293_axes_0, beta = input_293_beta_0_to_fp16, epsilon = var_7941_to_fp16, gamma = input_293_gamma_0_to_fp16, x = inputs_117_cast_fp16)[name = tensor("input_293_cast_fp16")]; tensor q_59_pad_type_0 = const()[name = tensor("q_59_pad_type_0"), val = tensor("valid")]; tensor q_59_strides_0 = const()[name = tensor("q_59_strides_0"), val = tensor([1, 1])]; tensor q_59_pad_0 = const()[name = tensor("q_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_59_dilations_0 = const()[name = tensor("q_59_dilations_0"), val = tensor([1, 1])]; tensor q_59_groups_0 = const()[name = tensor("q_59_groups_0"), val = tensor(1)]; tensor var_7976_weight_0_to_fp16 = const()[name = tensor("op_7976_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1155909312)))]; tensor var_7976_bias_0_to_fp16 = const()[name = tensor("op_7976_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1159186176)))]; tensor var_7976_cast_fp16 = conv(bias = var_7976_bias_0_to_fp16, dilations = q_59_dilations_0, groups = q_59_groups_0, pad = q_59_pad_0, pad_type = q_59_pad_type_0, strides = q_59_strides_0, weight = var_7976_weight_0_to_fp16, x = input_293_cast_fp16)[name = tensor("op_7976_cast_fp16")]; tensor k_59_pad_type_0 = const()[name = tensor("k_59_pad_type_0"), val = tensor("valid")]; tensor k_59_strides_0 = const()[name = tensor("k_59_strides_0"), val = tensor([1, 1])]; tensor k_59_pad_0 = const()[name = tensor("k_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_59_dilations_0 = const()[name = tensor("k_59_dilations_0"), val = tensor([1, 1])]; tensor k_59_groups_0 = const()[name = tensor("k_59_groups_0"), val = tensor(1)]; tensor blocks_29_attn_key_weight_to_fp16 = const()[name = tensor("blocks_29_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1159188800)))]; tensor k_59_cast_fp16 = conv(dilations = k_59_dilations_0, groups = k_59_groups_0, pad = k_59_pad_0, pad_type = k_59_pad_type_0, strides = k_59_strides_0, weight = blocks_29_attn_key_weight_to_fp16, x = input_293_cast_fp16)[name = tensor("k_59_cast_fp16")]; tensor var_7974_pad_type_0 = const()[name = tensor("op_7974_pad_type_0"), val = tensor("valid")]; tensor var_7974_strides_0 = const()[name = tensor("op_7974_strides_0"), val = tensor([1, 1])]; tensor var_7974_pad_0 = const()[name = tensor("op_7974_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_7974_dilations_0 = const()[name = tensor("op_7974_dilations_0"), val = tensor([1, 1])]; tensor var_7974_groups_0 = const()[name = tensor("op_7974_groups_0"), val = tensor(1)]; tensor blocks_29_attn_value_weight_to_fp16 = const()[name = tensor("blocks_29_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1162465664)))]; tensor blocks_29_attn_value_bias_to_fp16 = const()[name = tensor("blocks_29_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1165742528)))]; tensor var_7974_cast_fp16 = conv(bias = blocks_29_attn_value_bias_to_fp16, dilations = var_7974_dilations_0, groups = var_7974_groups_0, pad = var_7974_pad_0, pad_type = var_7974_pad_type_0, strides = var_7974_strides_0, weight = blocks_29_attn_value_weight_to_fp16, x = input_293_cast_fp16)[name = tensor("op_7974_cast_fp16")]; tensor tile_87 = const()[name = tensor("tile_87"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7977_axis_0 = const()[name = tensor("op_7977_axis_0"), val = tensor(1)]; tensor var_7977_cast_fp16_0, tensor var_7977_cast_fp16_1, tensor var_7977_cast_fp16_2, tensor var_7977_cast_fp16_3, tensor var_7977_cast_fp16_4, tensor var_7977_cast_fp16_5, tensor var_7977_cast_fp16_6, tensor var_7977_cast_fp16_7, tensor var_7977_cast_fp16_8, tensor var_7977_cast_fp16_9, tensor var_7977_cast_fp16_10, tensor var_7977_cast_fp16_11, tensor var_7977_cast_fp16_12, tensor var_7977_cast_fp16_13, tensor var_7977_cast_fp16_14, tensor var_7977_cast_fp16_15, tensor var_7977_cast_fp16_16, tensor var_7977_cast_fp16_17, tensor var_7977_cast_fp16_18, tensor var_7977_cast_fp16_19 = split(axis = var_7977_axis_0, split_sizes = tile_87, x = var_7976_cast_fp16)[name = tensor("op_7977_cast_fp16")]; tensor var_7998_perm_0 = const()[name = tensor("op_7998_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_88 = const()[name = tensor("tile_88"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_7999_axis_0 = const()[name = tensor("op_7999_axis_0"), val = tensor(3)]; tensor var_7998_cast_fp16 = transpose(perm = var_7998_perm_0, x = k_59_cast_fp16)[name = tensor("transpose_3")]; tensor var_7999_cast_fp16_0, tensor var_7999_cast_fp16_1, tensor var_7999_cast_fp16_2, tensor var_7999_cast_fp16_3, tensor var_7999_cast_fp16_4, tensor var_7999_cast_fp16_5, tensor var_7999_cast_fp16_6, tensor var_7999_cast_fp16_7, tensor var_7999_cast_fp16_8, tensor var_7999_cast_fp16_9, tensor var_7999_cast_fp16_10, tensor var_7999_cast_fp16_11, tensor var_7999_cast_fp16_12, tensor var_7999_cast_fp16_13, tensor var_7999_cast_fp16_14, tensor var_7999_cast_fp16_15, tensor var_7999_cast_fp16_16, tensor var_7999_cast_fp16_17, tensor var_7999_cast_fp16_18, tensor var_7999_cast_fp16_19 = split(axis = var_7999_axis_0, split_sizes = tile_88, x = var_7998_cast_fp16)[name = tensor("op_7999_cast_fp16")]; tensor tile_89 = const()[name = tensor("tile_89"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8020_axis_0 = const()[name = tensor("op_8020_axis_0"), val = tensor(1)]; tensor var_8020_cast_fp16_0, tensor var_8020_cast_fp16_1, tensor var_8020_cast_fp16_2, tensor var_8020_cast_fp16_3, tensor var_8020_cast_fp16_4, tensor var_8020_cast_fp16_5, tensor var_8020_cast_fp16_6, tensor var_8020_cast_fp16_7, tensor var_8020_cast_fp16_8, tensor var_8020_cast_fp16_9, tensor var_8020_cast_fp16_10, tensor var_8020_cast_fp16_11, tensor var_8020_cast_fp16_12, tensor var_8020_cast_fp16_13, tensor var_8020_cast_fp16_14, tensor var_8020_cast_fp16_15, tensor var_8020_cast_fp16_16, tensor var_8020_cast_fp16_17, tensor var_8020_cast_fp16_18, tensor var_8020_cast_fp16_19 = split(axis = var_8020_axis_0, split_sizes = tile_89, x = var_7974_cast_fp16)[name = tensor("op_8020_cast_fp16")]; tensor aw_1161_equation_0 = const()[name = tensor("aw_1161_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1161_cast_fp16 = einsum(equation = aw_1161_equation_0, values = (var_7999_cast_fp16_0, var_7977_cast_fp16_0))[name = tensor("aw_1161_cast_fp16")]; tensor aw_1163_equation_0 = const()[name = tensor("aw_1163_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1163_cast_fp16 = einsum(equation = aw_1163_equation_0, values = (var_7999_cast_fp16_1, var_7977_cast_fp16_1))[name = tensor("aw_1163_cast_fp16")]; tensor aw_1165_equation_0 = const()[name = tensor("aw_1165_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1165_cast_fp16 = einsum(equation = aw_1165_equation_0, values = (var_7999_cast_fp16_2, var_7977_cast_fp16_2))[name = tensor("aw_1165_cast_fp16")]; tensor aw_1167_equation_0 = const()[name = tensor("aw_1167_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1167_cast_fp16 = einsum(equation = aw_1167_equation_0, values = (var_7999_cast_fp16_3, var_7977_cast_fp16_3))[name = tensor("aw_1167_cast_fp16")]; tensor aw_1169_equation_0 = const()[name = tensor("aw_1169_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1169_cast_fp16 = einsum(equation = aw_1169_equation_0, values = (var_7999_cast_fp16_4, var_7977_cast_fp16_4))[name = tensor("aw_1169_cast_fp16")]; tensor aw_1171_equation_0 = const()[name = tensor("aw_1171_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1171_cast_fp16 = einsum(equation = aw_1171_equation_0, values = (var_7999_cast_fp16_5, var_7977_cast_fp16_5))[name = tensor("aw_1171_cast_fp16")]; tensor aw_1173_equation_0 = const()[name = tensor("aw_1173_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1173_cast_fp16 = einsum(equation = aw_1173_equation_0, values = (var_7999_cast_fp16_6, var_7977_cast_fp16_6))[name = tensor("aw_1173_cast_fp16")]; tensor aw_1175_equation_0 = const()[name = tensor("aw_1175_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1175_cast_fp16 = einsum(equation = aw_1175_equation_0, values = (var_7999_cast_fp16_7, var_7977_cast_fp16_7))[name = tensor("aw_1175_cast_fp16")]; tensor aw_1177_equation_0 = const()[name = tensor("aw_1177_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1177_cast_fp16 = einsum(equation = aw_1177_equation_0, values = (var_7999_cast_fp16_8, var_7977_cast_fp16_8))[name = tensor("aw_1177_cast_fp16")]; tensor aw_1179_equation_0 = const()[name = tensor("aw_1179_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1179_cast_fp16 = einsum(equation = aw_1179_equation_0, values = (var_7999_cast_fp16_9, var_7977_cast_fp16_9))[name = tensor("aw_1179_cast_fp16")]; tensor aw_1181_equation_0 = const()[name = tensor("aw_1181_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1181_cast_fp16 = einsum(equation = aw_1181_equation_0, values = (var_7999_cast_fp16_10, var_7977_cast_fp16_10))[name = tensor("aw_1181_cast_fp16")]; tensor aw_1183_equation_0 = const()[name = tensor("aw_1183_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1183_cast_fp16 = einsum(equation = aw_1183_equation_0, values = (var_7999_cast_fp16_11, var_7977_cast_fp16_11))[name = tensor("aw_1183_cast_fp16")]; tensor aw_1185_equation_0 = const()[name = tensor("aw_1185_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1185_cast_fp16 = einsum(equation = aw_1185_equation_0, values = (var_7999_cast_fp16_12, var_7977_cast_fp16_12))[name = tensor("aw_1185_cast_fp16")]; tensor aw_1187_equation_0 = const()[name = tensor("aw_1187_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1187_cast_fp16 = einsum(equation = aw_1187_equation_0, values = (var_7999_cast_fp16_13, var_7977_cast_fp16_13))[name = tensor("aw_1187_cast_fp16")]; tensor aw_1189_equation_0 = const()[name = tensor("aw_1189_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1189_cast_fp16 = einsum(equation = aw_1189_equation_0, values = (var_7999_cast_fp16_14, var_7977_cast_fp16_14))[name = tensor("aw_1189_cast_fp16")]; tensor aw_1191_equation_0 = const()[name = tensor("aw_1191_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1191_cast_fp16 = einsum(equation = aw_1191_equation_0, values = (var_7999_cast_fp16_15, var_7977_cast_fp16_15))[name = tensor("aw_1191_cast_fp16")]; tensor aw_1193_equation_0 = const()[name = tensor("aw_1193_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1193_cast_fp16 = einsum(equation = aw_1193_equation_0, values = (var_7999_cast_fp16_16, var_7977_cast_fp16_16))[name = tensor("aw_1193_cast_fp16")]; tensor aw_1195_equation_0 = const()[name = tensor("aw_1195_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1195_cast_fp16 = einsum(equation = aw_1195_equation_0, values = (var_7999_cast_fp16_17, var_7977_cast_fp16_17))[name = tensor("aw_1195_cast_fp16")]; tensor aw_1197_equation_0 = const()[name = tensor("aw_1197_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1197_cast_fp16 = einsum(equation = aw_1197_equation_0, values = (var_7999_cast_fp16_18, var_7977_cast_fp16_18))[name = tensor("aw_1197_cast_fp16")]; tensor aw_1199_equation_0 = const()[name = tensor("aw_1199_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1199_cast_fp16 = einsum(equation = aw_1199_equation_0, values = (var_7999_cast_fp16_19, var_7977_cast_fp16_19))[name = tensor("aw_1199_cast_fp16")]; tensor var_8081_cast_fp16 = softmax(axis = var_7925, x = aw_1161_cast_fp16)[name = tensor("op_8081_cast_fp16")]; tensor var_8082_cast_fp16 = softmax(axis = var_7925, x = aw_1163_cast_fp16)[name = tensor("op_8082_cast_fp16")]; tensor var_8083_cast_fp16 = softmax(axis = var_7925, x = aw_1165_cast_fp16)[name = tensor("op_8083_cast_fp16")]; tensor var_8084_cast_fp16 = softmax(axis = var_7925, x = aw_1167_cast_fp16)[name = tensor("op_8084_cast_fp16")]; tensor var_8085_cast_fp16 = softmax(axis = var_7925, x = aw_1169_cast_fp16)[name = tensor("op_8085_cast_fp16")]; tensor var_8086_cast_fp16 = softmax(axis = var_7925, x = aw_1171_cast_fp16)[name = tensor("op_8086_cast_fp16")]; tensor var_8087_cast_fp16 = softmax(axis = var_7925, x = aw_1173_cast_fp16)[name = tensor("op_8087_cast_fp16")]; tensor var_8088_cast_fp16 = softmax(axis = var_7925, x = aw_1175_cast_fp16)[name = tensor("op_8088_cast_fp16")]; tensor var_8089_cast_fp16 = softmax(axis = var_7925, x = aw_1177_cast_fp16)[name = tensor("op_8089_cast_fp16")]; tensor var_8090_cast_fp16 = softmax(axis = var_7925, x = aw_1179_cast_fp16)[name = tensor("op_8090_cast_fp16")]; tensor var_8091_cast_fp16 = softmax(axis = var_7925, x = aw_1181_cast_fp16)[name = tensor("op_8091_cast_fp16")]; tensor var_8092_cast_fp16 = softmax(axis = var_7925, x = aw_1183_cast_fp16)[name = tensor("op_8092_cast_fp16")]; tensor var_8093_cast_fp16 = softmax(axis = var_7925, x = aw_1185_cast_fp16)[name = tensor("op_8093_cast_fp16")]; tensor var_8094_cast_fp16 = softmax(axis = var_7925, x = aw_1187_cast_fp16)[name = tensor("op_8094_cast_fp16")]; tensor var_8095_cast_fp16 = softmax(axis = var_7925, x = aw_1189_cast_fp16)[name = tensor("op_8095_cast_fp16")]; tensor var_8096_cast_fp16 = softmax(axis = var_7925, x = aw_1191_cast_fp16)[name = tensor("op_8096_cast_fp16")]; tensor var_8097_cast_fp16 = softmax(axis = var_7925, x = aw_1193_cast_fp16)[name = tensor("op_8097_cast_fp16")]; tensor var_8098_cast_fp16 = softmax(axis = var_7925, x = aw_1195_cast_fp16)[name = tensor("op_8098_cast_fp16")]; tensor var_8099_cast_fp16 = softmax(axis = var_7925, x = aw_1197_cast_fp16)[name = tensor("op_8099_cast_fp16")]; tensor var_8100_cast_fp16 = softmax(axis = var_7925, x = aw_1199_cast_fp16)[name = tensor("op_8100_cast_fp16")]; tensor var_8102_equation_0 = const()[name = tensor("op_8102_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8102_cast_fp16 = einsum(equation = var_8102_equation_0, values = (var_8020_cast_fp16_0, var_8081_cast_fp16))[name = tensor("op_8102_cast_fp16")]; tensor var_8104_equation_0 = const()[name = tensor("op_8104_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8104_cast_fp16 = einsum(equation = var_8104_equation_0, values = (var_8020_cast_fp16_1, var_8082_cast_fp16))[name = tensor("op_8104_cast_fp16")]; tensor var_8106_equation_0 = const()[name = tensor("op_8106_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8106_cast_fp16 = einsum(equation = var_8106_equation_0, values = (var_8020_cast_fp16_2, var_8083_cast_fp16))[name = tensor("op_8106_cast_fp16")]; tensor var_8108_equation_0 = const()[name = tensor("op_8108_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8108_cast_fp16 = einsum(equation = var_8108_equation_0, values = (var_8020_cast_fp16_3, var_8084_cast_fp16))[name = tensor("op_8108_cast_fp16")]; tensor var_8110_equation_0 = const()[name = tensor("op_8110_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8110_cast_fp16 = einsum(equation = var_8110_equation_0, values = (var_8020_cast_fp16_4, var_8085_cast_fp16))[name = tensor("op_8110_cast_fp16")]; tensor var_8112_equation_0 = const()[name = tensor("op_8112_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8112_cast_fp16 = einsum(equation = var_8112_equation_0, values = (var_8020_cast_fp16_5, var_8086_cast_fp16))[name = tensor("op_8112_cast_fp16")]; tensor var_8114_equation_0 = const()[name = tensor("op_8114_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8114_cast_fp16 = einsum(equation = var_8114_equation_0, values = (var_8020_cast_fp16_6, var_8087_cast_fp16))[name = tensor("op_8114_cast_fp16")]; tensor var_8116_equation_0 = const()[name = tensor("op_8116_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8116_cast_fp16 = einsum(equation = var_8116_equation_0, values = (var_8020_cast_fp16_7, var_8088_cast_fp16))[name = tensor("op_8116_cast_fp16")]; tensor var_8118_equation_0 = const()[name = tensor("op_8118_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8118_cast_fp16 = einsum(equation = var_8118_equation_0, values = (var_8020_cast_fp16_8, var_8089_cast_fp16))[name = tensor("op_8118_cast_fp16")]; tensor var_8120_equation_0 = const()[name = tensor("op_8120_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8120_cast_fp16 = einsum(equation = var_8120_equation_0, values = (var_8020_cast_fp16_9, var_8090_cast_fp16))[name = tensor("op_8120_cast_fp16")]; tensor var_8122_equation_0 = const()[name = tensor("op_8122_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8122_cast_fp16 = einsum(equation = var_8122_equation_0, values = (var_8020_cast_fp16_10, var_8091_cast_fp16))[name = tensor("op_8122_cast_fp16")]; tensor var_8124_equation_0 = const()[name = tensor("op_8124_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8124_cast_fp16 = einsum(equation = var_8124_equation_0, values = (var_8020_cast_fp16_11, var_8092_cast_fp16))[name = tensor("op_8124_cast_fp16")]; tensor var_8126_equation_0 = const()[name = tensor("op_8126_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8126_cast_fp16 = einsum(equation = var_8126_equation_0, values = (var_8020_cast_fp16_12, var_8093_cast_fp16))[name = tensor("op_8126_cast_fp16")]; tensor var_8128_equation_0 = const()[name = tensor("op_8128_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8128_cast_fp16 = einsum(equation = var_8128_equation_0, values = (var_8020_cast_fp16_13, var_8094_cast_fp16))[name = tensor("op_8128_cast_fp16")]; tensor var_8130_equation_0 = const()[name = tensor("op_8130_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8130_cast_fp16 = einsum(equation = var_8130_equation_0, values = (var_8020_cast_fp16_14, var_8095_cast_fp16))[name = tensor("op_8130_cast_fp16")]; tensor var_8132_equation_0 = const()[name = tensor("op_8132_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8132_cast_fp16 = einsum(equation = var_8132_equation_0, values = (var_8020_cast_fp16_15, var_8096_cast_fp16))[name = tensor("op_8132_cast_fp16")]; tensor var_8134_equation_0 = const()[name = tensor("op_8134_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8134_cast_fp16 = einsum(equation = var_8134_equation_0, values = (var_8020_cast_fp16_16, var_8097_cast_fp16))[name = tensor("op_8134_cast_fp16")]; tensor var_8136_equation_0 = const()[name = tensor("op_8136_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8136_cast_fp16 = einsum(equation = var_8136_equation_0, values = (var_8020_cast_fp16_17, var_8098_cast_fp16))[name = tensor("op_8136_cast_fp16")]; tensor var_8138_equation_0 = const()[name = tensor("op_8138_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8138_cast_fp16 = einsum(equation = var_8138_equation_0, values = (var_8020_cast_fp16_18, var_8099_cast_fp16))[name = tensor("op_8138_cast_fp16")]; tensor var_8140_equation_0 = const()[name = tensor("op_8140_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8140_cast_fp16 = einsum(equation = var_8140_equation_0, values = (var_8020_cast_fp16_19, var_8100_cast_fp16))[name = tensor("op_8140_cast_fp16")]; tensor input_295_interleave_0 = const()[name = tensor("input_295_interleave_0"), val = tensor(false)]; tensor input_295_cast_fp16 = concat(axis = var_7925, interleave = input_295_interleave_0, values = (var_8102_cast_fp16, var_8104_cast_fp16, var_8106_cast_fp16, var_8108_cast_fp16, var_8110_cast_fp16, var_8112_cast_fp16, var_8114_cast_fp16, var_8116_cast_fp16, var_8118_cast_fp16, var_8120_cast_fp16, var_8122_cast_fp16, var_8124_cast_fp16, var_8126_cast_fp16, var_8128_cast_fp16, var_8130_cast_fp16, var_8132_cast_fp16, var_8134_cast_fp16, var_8136_cast_fp16, var_8138_cast_fp16, var_8140_cast_fp16))[name = tensor("input_295_cast_fp16")]; tensor var_8149_pad_type_0 = const()[name = tensor("op_8149_pad_type_0"), val = tensor("valid")]; tensor var_8149_strides_0 = const()[name = tensor("op_8149_strides_0"), val = tensor([1, 1])]; tensor var_8149_pad_0 = const()[name = tensor("op_8149_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8149_dilations_0 = const()[name = tensor("op_8149_dilations_0"), val = tensor([1, 1])]; tensor var_8149_groups_0 = const()[name = tensor("op_8149_groups_0"), val = tensor(1)]; tensor blocks_29_attn_out_weight_to_fp16 = const()[name = tensor("blocks_29_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1165745152)))]; tensor blocks_29_attn_out_bias_to_fp16 = const()[name = tensor("blocks_29_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169022016)))]; tensor var_8149_cast_fp16 = conv(bias = blocks_29_attn_out_bias_to_fp16, dilations = var_8149_dilations_0, groups = var_8149_groups_0, pad = var_8149_pad_0, pad_type = var_8149_pad_type_0, strides = var_8149_strides_0, weight = blocks_29_attn_out_weight_to_fp16, x = input_295_cast_fp16)[name = tensor("op_8149_cast_fp16")]; tensor inputs_119_cast_fp16 = add(x = inputs_117_cast_fp16, y = var_8149_cast_fp16)[name = tensor("inputs_119_cast_fp16")]; tensor input_297_axes_0 = const()[name = tensor("input_297_axes_0"), val = tensor([1])]; tensor input_297_gamma_0_to_fp16 = const()[name = tensor("input_297_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169024640)))]; tensor input_297_beta_0_to_fp16 = const()[name = tensor("input_297_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169027264)))]; tensor var_8159_to_fp16 = const()[name = tensor("op_8159_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_297_cast_fp16 = layer_norm(axes = input_297_axes_0, beta = input_297_beta_0_to_fp16, epsilon = var_8159_to_fp16, gamma = input_297_gamma_0_to_fp16, x = inputs_119_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor input_299_pad_type_0 = const()[name = tensor("input_299_pad_type_0"), val = tensor("valid")]; tensor input_299_strides_0 = const()[name = tensor("input_299_strides_0"), val = tensor([1, 1])]; tensor input_299_pad_0 = const()[name = tensor("input_299_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_299_dilations_0 = const()[name = tensor("input_299_dilations_0"), val = tensor([1, 1])]; tensor input_299_groups_0 = const()[name = tensor("input_299_groups_0"), val = tensor(1)]; tensor blocks_29_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_29_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1169029888)))]; tensor blocks_29_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_29_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1182137152)))]; tensor input_299_cast_fp16 = conv(bias = blocks_29_mlp_0_bias_to_fp16, dilations = input_299_dilations_0, groups = input_299_groups_0, pad = input_299_pad_0, pad_type = input_299_pad_type_0, strides = input_299_strides_0, weight = blocks_29_mlp_0_weight_to_fp16, x = input_297_cast_fp16)[name = tensor("input_299_cast_fp16")]; tensor input_301_mode_0 = const()[name = tensor("input_301_mode_0"), val = tensor("EXACT")]; tensor input_301_cast_fp16 = gelu(mode = input_301_mode_0, x = input_299_cast_fp16)[name = tensor("input_301_cast_fp16")]; tensor var_8185_pad_type_0 = const()[name = tensor("op_8185_pad_type_0"), val = tensor("valid")]; tensor var_8185_strides_0 = const()[name = tensor("op_8185_strides_0"), val = tensor([1, 1])]; tensor var_8185_pad_0 = const()[name = tensor("op_8185_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8185_dilations_0 = const()[name = tensor("op_8185_dilations_0"), val = tensor([1, 1])]; tensor var_8185_groups_0 = const()[name = tensor("op_8185_groups_0"), val = tensor(1)]; tensor blocks_29_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_29_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1182147456)))]; tensor blocks_29_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_29_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195254720)))]; tensor var_8185_cast_fp16 = conv(bias = blocks_29_mlp_2_bias_to_fp16, dilations = var_8185_dilations_0, groups = var_8185_groups_0, pad = var_8185_pad_0, pad_type = var_8185_pad_type_0, strides = var_8185_strides_0, weight = blocks_29_mlp_2_weight_to_fp16, x = input_301_cast_fp16)[name = tensor("op_8185_cast_fp16")]; tensor inputs_121_cast_fp16 = add(x = inputs_119_cast_fp16, y = var_8185_cast_fp16)[name = tensor("inputs_121_cast_fp16")]; tensor var_8194 = const()[name = tensor("op_8194"), val = tensor(1)]; tensor input_303_axes_0 = const()[name = tensor("input_303_axes_0"), val = tensor([1])]; tensor input_303_gamma_0_to_fp16 = const()[name = tensor("input_303_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195257344)))]; tensor input_303_beta_0_to_fp16 = const()[name = tensor("input_303_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195259968)))]; tensor var_8210_to_fp16 = const()[name = tensor("op_8210_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_303_cast_fp16 = layer_norm(axes = input_303_axes_0, beta = input_303_beta_0_to_fp16, epsilon = var_8210_to_fp16, gamma = input_303_gamma_0_to_fp16, x = inputs_121_cast_fp16)[name = tensor("input_303_cast_fp16")]; tensor q_61_pad_type_0 = const()[name = tensor("q_61_pad_type_0"), val = tensor("valid")]; tensor q_61_strides_0 = const()[name = tensor("q_61_strides_0"), val = tensor([1, 1])]; tensor q_61_pad_0 = const()[name = tensor("q_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_61_dilations_0 = const()[name = tensor("q_61_dilations_0"), val = tensor([1, 1])]; tensor q_61_groups_0 = const()[name = tensor("q_61_groups_0"), val = tensor(1)]; tensor var_8245_weight_0_to_fp16 = const()[name = tensor("op_8245_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1195262592)))]; tensor var_8245_bias_0_to_fp16 = const()[name = tensor("op_8245_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1198539456)))]; tensor var_8245_cast_fp16 = conv(bias = var_8245_bias_0_to_fp16, dilations = q_61_dilations_0, groups = q_61_groups_0, pad = q_61_pad_0, pad_type = q_61_pad_type_0, strides = q_61_strides_0, weight = var_8245_weight_0_to_fp16, x = input_303_cast_fp16)[name = tensor("op_8245_cast_fp16")]; tensor k_61_pad_type_0 = const()[name = tensor("k_61_pad_type_0"), val = tensor("valid")]; tensor k_61_strides_0 = const()[name = tensor("k_61_strides_0"), val = tensor([1, 1])]; tensor k_61_pad_0 = const()[name = tensor("k_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_61_dilations_0 = const()[name = tensor("k_61_dilations_0"), val = tensor([1, 1])]; tensor k_61_groups_0 = const()[name = tensor("k_61_groups_0"), val = tensor(1)]; tensor blocks_30_attn_key_weight_to_fp16 = const()[name = tensor("blocks_30_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1198542080)))]; tensor k_61_cast_fp16 = conv(dilations = k_61_dilations_0, groups = k_61_groups_0, pad = k_61_pad_0, pad_type = k_61_pad_type_0, strides = k_61_strides_0, weight = blocks_30_attn_key_weight_to_fp16, x = input_303_cast_fp16)[name = tensor("k_61_cast_fp16")]; tensor var_8243_pad_type_0 = const()[name = tensor("op_8243_pad_type_0"), val = tensor("valid")]; tensor var_8243_strides_0 = const()[name = tensor("op_8243_strides_0"), val = tensor([1, 1])]; tensor var_8243_pad_0 = const()[name = tensor("op_8243_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8243_dilations_0 = const()[name = tensor("op_8243_dilations_0"), val = tensor([1, 1])]; tensor var_8243_groups_0 = const()[name = tensor("op_8243_groups_0"), val = tensor(1)]; tensor blocks_30_attn_value_weight_to_fp16 = const()[name = tensor("blocks_30_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1201818944)))]; tensor blocks_30_attn_value_bias_to_fp16 = const()[name = tensor("blocks_30_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1205095808)))]; tensor var_8243_cast_fp16 = conv(bias = blocks_30_attn_value_bias_to_fp16, dilations = var_8243_dilations_0, groups = var_8243_groups_0, pad = var_8243_pad_0, pad_type = var_8243_pad_type_0, strides = var_8243_strides_0, weight = blocks_30_attn_value_weight_to_fp16, x = input_303_cast_fp16)[name = tensor("op_8243_cast_fp16")]; tensor tile_90 = const()[name = tensor("tile_90"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8246_axis_0 = const()[name = tensor("op_8246_axis_0"), val = tensor(1)]; tensor var_8246_cast_fp16_0, tensor var_8246_cast_fp16_1, tensor var_8246_cast_fp16_2, tensor var_8246_cast_fp16_3, tensor var_8246_cast_fp16_4, tensor var_8246_cast_fp16_5, tensor var_8246_cast_fp16_6, tensor var_8246_cast_fp16_7, tensor var_8246_cast_fp16_8, tensor var_8246_cast_fp16_9, tensor var_8246_cast_fp16_10, tensor var_8246_cast_fp16_11, tensor var_8246_cast_fp16_12, tensor var_8246_cast_fp16_13, tensor var_8246_cast_fp16_14, tensor var_8246_cast_fp16_15, tensor var_8246_cast_fp16_16, tensor var_8246_cast_fp16_17, tensor var_8246_cast_fp16_18, tensor var_8246_cast_fp16_19 = split(axis = var_8246_axis_0, split_sizes = tile_90, x = var_8245_cast_fp16)[name = tensor("op_8246_cast_fp16")]; tensor var_8267_perm_0 = const()[name = tensor("op_8267_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_91 = const()[name = tensor("tile_91"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8268_axis_0 = const()[name = tensor("op_8268_axis_0"), val = tensor(3)]; tensor var_8267_cast_fp16 = transpose(perm = var_8267_perm_0, x = k_61_cast_fp16)[name = tensor("transpose_2")]; tensor var_8268_cast_fp16_0, tensor var_8268_cast_fp16_1, tensor var_8268_cast_fp16_2, tensor var_8268_cast_fp16_3, tensor var_8268_cast_fp16_4, tensor var_8268_cast_fp16_5, tensor var_8268_cast_fp16_6, tensor var_8268_cast_fp16_7, tensor var_8268_cast_fp16_8, tensor var_8268_cast_fp16_9, tensor var_8268_cast_fp16_10, tensor var_8268_cast_fp16_11, tensor var_8268_cast_fp16_12, tensor var_8268_cast_fp16_13, tensor var_8268_cast_fp16_14, tensor var_8268_cast_fp16_15, tensor var_8268_cast_fp16_16, tensor var_8268_cast_fp16_17, tensor var_8268_cast_fp16_18, tensor var_8268_cast_fp16_19 = split(axis = var_8268_axis_0, split_sizes = tile_91, x = var_8267_cast_fp16)[name = tensor("op_8268_cast_fp16")]; tensor tile_92 = const()[name = tensor("tile_92"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8289_axis_0 = const()[name = tensor("op_8289_axis_0"), val = tensor(1)]; tensor var_8289_cast_fp16_0, tensor var_8289_cast_fp16_1, tensor var_8289_cast_fp16_2, tensor var_8289_cast_fp16_3, tensor var_8289_cast_fp16_4, tensor var_8289_cast_fp16_5, tensor var_8289_cast_fp16_6, tensor var_8289_cast_fp16_7, tensor var_8289_cast_fp16_8, tensor var_8289_cast_fp16_9, tensor var_8289_cast_fp16_10, tensor var_8289_cast_fp16_11, tensor var_8289_cast_fp16_12, tensor var_8289_cast_fp16_13, tensor var_8289_cast_fp16_14, tensor var_8289_cast_fp16_15, tensor var_8289_cast_fp16_16, tensor var_8289_cast_fp16_17, tensor var_8289_cast_fp16_18, tensor var_8289_cast_fp16_19 = split(axis = var_8289_axis_0, split_sizes = tile_92, x = var_8243_cast_fp16)[name = tensor("op_8289_cast_fp16")]; tensor aw_1201_equation_0 = const()[name = tensor("aw_1201_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1201_cast_fp16 = einsum(equation = aw_1201_equation_0, values = (var_8268_cast_fp16_0, var_8246_cast_fp16_0))[name = tensor("aw_1201_cast_fp16")]; tensor aw_1203_equation_0 = const()[name = tensor("aw_1203_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1203_cast_fp16 = einsum(equation = aw_1203_equation_0, values = (var_8268_cast_fp16_1, var_8246_cast_fp16_1))[name = tensor("aw_1203_cast_fp16")]; tensor aw_1205_equation_0 = const()[name = tensor("aw_1205_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1205_cast_fp16 = einsum(equation = aw_1205_equation_0, values = (var_8268_cast_fp16_2, var_8246_cast_fp16_2))[name = tensor("aw_1205_cast_fp16")]; tensor aw_1207_equation_0 = const()[name = tensor("aw_1207_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1207_cast_fp16 = einsum(equation = aw_1207_equation_0, values = (var_8268_cast_fp16_3, var_8246_cast_fp16_3))[name = tensor("aw_1207_cast_fp16")]; tensor aw_1209_equation_0 = const()[name = tensor("aw_1209_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1209_cast_fp16 = einsum(equation = aw_1209_equation_0, values = (var_8268_cast_fp16_4, var_8246_cast_fp16_4))[name = tensor("aw_1209_cast_fp16")]; tensor aw_1211_equation_0 = const()[name = tensor("aw_1211_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1211_cast_fp16 = einsum(equation = aw_1211_equation_0, values = (var_8268_cast_fp16_5, var_8246_cast_fp16_5))[name = tensor("aw_1211_cast_fp16")]; tensor aw_1213_equation_0 = const()[name = tensor("aw_1213_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1213_cast_fp16 = einsum(equation = aw_1213_equation_0, values = (var_8268_cast_fp16_6, var_8246_cast_fp16_6))[name = tensor("aw_1213_cast_fp16")]; tensor aw_1215_equation_0 = const()[name = tensor("aw_1215_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1215_cast_fp16 = einsum(equation = aw_1215_equation_0, values = (var_8268_cast_fp16_7, var_8246_cast_fp16_7))[name = tensor("aw_1215_cast_fp16")]; tensor aw_1217_equation_0 = const()[name = tensor("aw_1217_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1217_cast_fp16 = einsum(equation = aw_1217_equation_0, values = (var_8268_cast_fp16_8, var_8246_cast_fp16_8))[name = tensor("aw_1217_cast_fp16")]; tensor aw_1219_equation_0 = const()[name = tensor("aw_1219_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1219_cast_fp16 = einsum(equation = aw_1219_equation_0, values = (var_8268_cast_fp16_9, var_8246_cast_fp16_9))[name = tensor("aw_1219_cast_fp16")]; tensor aw_1221_equation_0 = const()[name = tensor("aw_1221_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1221_cast_fp16 = einsum(equation = aw_1221_equation_0, values = (var_8268_cast_fp16_10, var_8246_cast_fp16_10))[name = tensor("aw_1221_cast_fp16")]; tensor aw_1223_equation_0 = const()[name = tensor("aw_1223_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1223_cast_fp16 = einsum(equation = aw_1223_equation_0, values = (var_8268_cast_fp16_11, var_8246_cast_fp16_11))[name = tensor("aw_1223_cast_fp16")]; tensor aw_1225_equation_0 = const()[name = tensor("aw_1225_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1225_cast_fp16 = einsum(equation = aw_1225_equation_0, values = (var_8268_cast_fp16_12, var_8246_cast_fp16_12))[name = tensor("aw_1225_cast_fp16")]; tensor aw_1227_equation_0 = const()[name = tensor("aw_1227_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1227_cast_fp16 = einsum(equation = aw_1227_equation_0, values = (var_8268_cast_fp16_13, var_8246_cast_fp16_13))[name = tensor("aw_1227_cast_fp16")]; tensor aw_1229_equation_0 = const()[name = tensor("aw_1229_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1229_cast_fp16 = einsum(equation = aw_1229_equation_0, values = (var_8268_cast_fp16_14, var_8246_cast_fp16_14))[name = tensor("aw_1229_cast_fp16")]; tensor aw_1231_equation_0 = const()[name = tensor("aw_1231_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1231_cast_fp16 = einsum(equation = aw_1231_equation_0, values = (var_8268_cast_fp16_15, var_8246_cast_fp16_15))[name = tensor("aw_1231_cast_fp16")]; tensor aw_1233_equation_0 = const()[name = tensor("aw_1233_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1233_cast_fp16 = einsum(equation = aw_1233_equation_0, values = (var_8268_cast_fp16_16, var_8246_cast_fp16_16))[name = tensor("aw_1233_cast_fp16")]; tensor aw_1235_equation_0 = const()[name = tensor("aw_1235_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1235_cast_fp16 = einsum(equation = aw_1235_equation_0, values = (var_8268_cast_fp16_17, var_8246_cast_fp16_17))[name = tensor("aw_1235_cast_fp16")]; tensor aw_1237_equation_0 = const()[name = tensor("aw_1237_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1237_cast_fp16 = einsum(equation = aw_1237_equation_0, values = (var_8268_cast_fp16_18, var_8246_cast_fp16_18))[name = tensor("aw_1237_cast_fp16")]; tensor aw_1239_equation_0 = const()[name = tensor("aw_1239_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1239_cast_fp16 = einsum(equation = aw_1239_equation_0, values = (var_8268_cast_fp16_19, var_8246_cast_fp16_19))[name = tensor("aw_1239_cast_fp16")]; tensor var_8350_cast_fp16 = softmax(axis = var_8194, x = aw_1201_cast_fp16)[name = tensor("op_8350_cast_fp16")]; tensor var_8351_cast_fp16 = softmax(axis = var_8194, x = aw_1203_cast_fp16)[name = tensor("op_8351_cast_fp16")]; tensor var_8352_cast_fp16 = softmax(axis = var_8194, x = aw_1205_cast_fp16)[name = tensor("op_8352_cast_fp16")]; tensor var_8353_cast_fp16 = softmax(axis = var_8194, x = aw_1207_cast_fp16)[name = tensor("op_8353_cast_fp16")]; tensor var_8354_cast_fp16 = softmax(axis = var_8194, x = aw_1209_cast_fp16)[name = tensor("op_8354_cast_fp16")]; tensor var_8355_cast_fp16 = softmax(axis = var_8194, x = aw_1211_cast_fp16)[name = tensor("op_8355_cast_fp16")]; tensor var_8356_cast_fp16 = softmax(axis = var_8194, x = aw_1213_cast_fp16)[name = tensor("op_8356_cast_fp16")]; tensor var_8357_cast_fp16 = softmax(axis = var_8194, x = aw_1215_cast_fp16)[name = tensor("op_8357_cast_fp16")]; tensor var_8358_cast_fp16 = softmax(axis = var_8194, x = aw_1217_cast_fp16)[name = tensor("op_8358_cast_fp16")]; tensor var_8359_cast_fp16 = softmax(axis = var_8194, x = aw_1219_cast_fp16)[name = tensor("op_8359_cast_fp16")]; tensor var_8360_cast_fp16 = softmax(axis = var_8194, x = aw_1221_cast_fp16)[name = tensor("op_8360_cast_fp16")]; tensor var_8361_cast_fp16 = softmax(axis = var_8194, x = aw_1223_cast_fp16)[name = tensor("op_8361_cast_fp16")]; tensor var_8362_cast_fp16 = softmax(axis = var_8194, x = aw_1225_cast_fp16)[name = tensor("op_8362_cast_fp16")]; tensor var_8363_cast_fp16 = softmax(axis = var_8194, x = aw_1227_cast_fp16)[name = tensor("op_8363_cast_fp16")]; tensor var_8364_cast_fp16 = softmax(axis = var_8194, x = aw_1229_cast_fp16)[name = tensor("op_8364_cast_fp16")]; tensor var_8365_cast_fp16 = softmax(axis = var_8194, x = aw_1231_cast_fp16)[name = tensor("op_8365_cast_fp16")]; tensor var_8366_cast_fp16 = softmax(axis = var_8194, x = aw_1233_cast_fp16)[name = tensor("op_8366_cast_fp16")]; tensor var_8367_cast_fp16 = softmax(axis = var_8194, x = aw_1235_cast_fp16)[name = tensor("op_8367_cast_fp16")]; tensor var_8368_cast_fp16 = softmax(axis = var_8194, x = aw_1237_cast_fp16)[name = tensor("op_8368_cast_fp16")]; tensor var_8369_cast_fp16 = softmax(axis = var_8194, x = aw_1239_cast_fp16)[name = tensor("op_8369_cast_fp16")]; tensor var_8371_equation_0 = const()[name = tensor("op_8371_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8371_cast_fp16 = einsum(equation = var_8371_equation_0, values = (var_8289_cast_fp16_0, var_8350_cast_fp16))[name = tensor("op_8371_cast_fp16")]; tensor var_8373_equation_0 = const()[name = tensor("op_8373_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8373_cast_fp16 = einsum(equation = var_8373_equation_0, values = (var_8289_cast_fp16_1, var_8351_cast_fp16))[name = tensor("op_8373_cast_fp16")]; tensor var_8375_equation_0 = const()[name = tensor("op_8375_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8375_cast_fp16 = einsum(equation = var_8375_equation_0, values = (var_8289_cast_fp16_2, var_8352_cast_fp16))[name = tensor("op_8375_cast_fp16")]; tensor var_8377_equation_0 = const()[name = tensor("op_8377_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8377_cast_fp16 = einsum(equation = var_8377_equation_0, values = (var_8289_cast_fp16_3, var_8353_cast_fp16))[name = tensor("op_8377_cast_fp16")]; tensor var_8379_equation_0 = const()[name = tensor("op_8379_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8379_cast_fp16 = einsum(equation = var_8379_equation_0, values = (var_8289_cast_fp16_4, var_8354_cast_fp16))[name = tensor("op_8379_cast_fp16")]; tensor var_8381_equation_0 = const()[name = tensor("op_8381_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8381_cast_fp16 = einsum(equation = var_8381_equation_0, values = (var_8289_cast_fp16_5, var_8355_cast_fp16))[name = tensor("op_8381_cast_fp16")]; tensor var_8383_equation_0 = const()[name = tensor("op_8383_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8383_cast_fp16 = einsum(equation = var_8383_equation_0, values = (var_8289_cast_fp16_6, var_8356_cast_fp16))[name = tensor("op_8383_cast_fp16")]; tensor var_8385_equation_0 = const()[name = tensor("op_8385_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8385_cast_fp16 = einsum(equation = var_8385_equation_0, values = (var_8289_cast_fp16_7, var_8357_cast_fp16))[name = tensor("op_8385_cast_fp16")]; tensor var_8387_equation_0 = const()[name = tensor("op_8387_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8387_cast_fp16 = einsum(equation = var_8387_equation_0, values = (var_8289_cast_fp16_8, var_8358_cast_fp16))[name = tensor("op_8387_cast_fp16")]; tensor var_8389_equation_0 = const()[name = tensor("op_8389_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8389_cast_fp16 = einsum(equation = var_8389_equation_0, values = (var_8289_cast_fp16_9, var_8359_cast_fp16))[name = tensor("op_8389_cast_fp16")]; tensor var_8391_equation_0 = const()[name = tensor("op_8391_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8391_cast_fp16 = einsum(equation = var_8391_equation_0, values = (var_8289_cast_fp16_10, var_8360_cast_fp16))[name = tensor("op_8391_cast_fp16")]; tensor var_8393_equation_0 = const()[name = tensor("op_8393_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8393_cast_fp16 = einsum(equation = var_8393_equation_0, values = (var_8289_cast_fp16_11, var_8361_cast_fp16))[name = tensor("op_8393_cast_fp16")]; tensor var_8395_equation_0 = const()[name = tensor("op_8395_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8395_cast_fp16 = einsum(equation = var_8395_equation_0, values = (var_8289_cast_fp16_12, var_8362_cast_fp16))[name = tensor("op_8395_cast_fp16")]; tensor var_8397_equation_0 = const()[name = tensor("op_8397_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8397_cast_fp16 = einsum(equation = var_8397_equation_0, values = (var_8289_cast_fp16_13, var_8363_cast_fp16))[name = tensor("op_8397_cast_fp16")]; tensor var_8399_equation_0 = const()[name = tensor("op_8399_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8399_cast_fp16 = einsum(equation = var_8399_equation_0, values = (var_8289_cast_fp16_14, var_8364_cast_fp16))[name = tensor("op_8399_cast_fp16")]; tensor var_8401_equation_0 = const()[name = tensor("op_8401_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8401_cast_fp16 = einsum(equation = var_8401_equation_0, values = (var_8289_cast_fp16_15, var_8365_cast_fp16))[name = tensor("op_8401_cast_fp16")]; tensor var_8403_equation_0 = const()[name = tensor("op_8403_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8403_cast_fp16 = einsum(equation = var_8403_equation_0, values = (var_8289_cast_fp16_16, var_8366_cast_fp16))[name = tensor("op_8403_cast_fp16")]; tensor var_8405_equation_0 = const()[name = tensor("op_8405_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8405_cast_fp16 = einsum(equation = var_8405_equation_0, values = (var_8289_cast_fp16_17, var_8367_cast_fp16))[name = tensor("op_8405_cast_fp16")]; tensor var_8407_equation_0 = const()[name = tensor("op_8407_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8407_cast_fp16 = einsum(equation = var_8407_equation_0, values = (var_8289_cast_fp16_18, var_8368_cast_fp16))[name = tensor("op_8407_cast_fp16")]; tensor var_8409_equation_0 = const()[name = tensor("op_8409_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8409_cast_fp16 = einsum(equation = var_8409_equation_0, values = (var_8289_cast_fp16_19, var_8369_cast_fp16))[name = tensor("op_8409_cast_fp16")]; tensor input_305_interleave_0 = const()[name = tensor("input_305_interleave_0"), val = tensor(false)]; tensor input_305_cast_fp16 = concat(axis = var_8194, interleave = input_305_interleave_0, values = (var_8371_cast_fp16, var_8373_cast_fp16, var_8375_cast_fp16, var_8377_cast_fp16, var_8379_cast_fp16, var_8381_cast_fp16, var_8383_cast_fp16, var_8385_cast_fp16, var_8387_cast_fp16, var_8389_cast_fp16, var_8391_cast_fp16, var_8393_cast_fp16, var_8395_cast_fp16, var_8397_cast_fp16, var_8399_cast_fp16, var_8401_cast_fp16, var_8403_cast_fp16, var_8405_cast_fp16, var_8407_cast_fp16, var_8409_cast_fp16))[name = tensor("input_305_cast_fp16")]; tensor var_8418_pad_type_0 = const()[name = tensor("op_8418_pad_type_0"), val = tensor("valid")]; tensor var_8418_strides_0 = const()[name = tensor("op_8418_strides_0"), val = tensor([1, 1])]; tensor var_8418_pad_0 = const()[name = tensor("op_8418_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8418_dilations_0 = const()[name = tensor("op_8418_dilations_0"), val = tensor([1, 1])]; tensor var_8418_groups_0 = const()[name = tensor("op_8418_groups_0"), val = tensor(1)]; tensor blocks_30_attn_out_weight_to_fp16 = const()[name = tensor("blocks_30_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1205098432)))]; tensor blocks_30_attn_out_bias_to_fp16 = const()[name = tensor("blocks_30_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208375296)))]; tensor var_8418_cast_fp16 = conv(bias = blocks_30_attn_out_bias_to_fp16, dilations = var_8418_dilations_0, groups = var_8418_groups_0, pad = var_8418_pad_0, pad_type = var_8418_pad_type_0, strides = var_8418_strides_0, weight = blocks_30_attn_out_weight_to_fp16, x = input_305_cast_fp16)[name = tensor("op_8418_cast_fp16")]; tensor inputs_123_cast_fp16 = add(x = inputs_121_cast_fp16, y = var_8418_cast_fp16)[name = tensor("inputs_123_cast_fp16")]; tensor input_307_axes_0 = const()[name = tensor("input_307_axes_0"), val = tensor([1])]; tensor input_307_gamma_0_to_fp16 = const()[name = tensor("input_307_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208377920)))]; tensor input_307_beta_0_to_fp16 = const()[name = tensor("input_307_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208380544)))]; tensor var_8428_to_fp16 = const()[name = tensor("op_8428_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_307_cast_fp16 = layer_norm(axes = input_307_axes_0, beta = input_307_beta_0_to_fp16, epsilon = var_8428_to_fp16, gamma = input_307_gamma_0_to_fp16, x = inputs_123_cast_fp16)[name = tensor("input_307_cast_fp16")]; tensor input_309_pad_type_0 = const()[name = tensor("input_309_pad_type_0"), val = tensor("valid")]; tensor input_309_strides_0 = const()[name = tensor("input_309_strides_0"), val = tensor([1, 1])]; tensor input_309_pad_0 = const()[name = tensor("input_309_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_309_dilations_0 = const()[name = tensor("input_309_dilations_0"), val = tensor([1, 1])]; tensor input_309_groups_0 = const()[name = tensor("input_309_groups_0"), val = tensor(1)]; tensor blocks_30_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_30_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1208383168)))]; tensor blocks_30_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_30_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1221490432)))]; tensor input_309_cast_fp16 = conv(bias = blocks_30_mlp_0_bias_to_fp16, dilations = input_309_dilations_0, groups = input_309_groups_0, pad = input_309_pad_0, pad_type = input_309_pad_type_0, strides = input_309_strides_0, weight = blocks_30_mlp_0_weight_to_fp16, x = input_307_cast_fp16)[name = tensor("input_309_cast_fp16")]; tensor input_311_mode_0 = const()[name = tensor("input_311_mode_0"), val = tensor("EXACT")]; tensor input_311_cast_fp16 = gelu(mode = input_311_mode_0, x = input_309_cast_fp16)[name = tensor("input_311_cast_fp16")]; tensor var_8454_pad_type_0 = const()[name = tensor("op_8454_pad_type_0"), val = tensor("valid")]; tensor var_8454_strides_0 = const()[name = tensor("op_8454_strides_0"), val = tensor([1, 1])]; tensor var_8454_pad_0 = const()[name = tensor("op_8454_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8454_dilations_0 = const()[name = tensor("op_8454_dilations_0"), val = tensor([1, 1])]; tensor var_8454_groups_0 = const()[name = tensor("op_8454_groups_0"), val = tensor(1)]; tensor blocks_30_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_30_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1221500736)))]; tensor blocks_30_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_30_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234608000)))]; tensor var_8454_cast_fp16 = conv(bias = blocks_30_mlp_2_bias_to_fp16, dilations = var_8454_dilations_0, groups = var_8454_groups_0, pad = var_8454_pad_0, pad_type = var_8454_pad_type_0, strides = var_8454_strides_0, weight = blocks_30_mlp_2_weight_to_fp16, x = input_311_cast_fp16)[name = tensor("op_8454_cast_fp16")]; tensor inputs_125_cast_fp16 = add(x = inputs_123_cast_fp16, y = var_8454_cast_fp16)[name = tensor("inputs_125_cast_fp16")]; tensor var_8463 = const()[name = tensor("op_8463"), val = tensor(1)]; tensor input_313_axes_0 = const()[name = tensor("input_313_axes_0"), val = tensor([1])]; tensor input_313_gamma_0_to_fp16 = const()[name = tensor("input_313_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234610624)))]; tensor input_313_beta_0_to_fp16 = const()[name = tensor("input_313_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234613248)))]; tensor var_8479_to_fp16 = const()[name = tensor("op_8479_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_313_cast_fp16 = layer_norm(axes = input_313_axes_0, beta = input_313_beta_0_to_fp16, epsilon = var_8479_to_fp16, gamma = input_313_gamma_0_to_fp16, x = inputs_125_cast_fp16)[name = tensor("input_313_cast_fp16")]; tensor q_pad_type_0 = const()[name = tensor("q_pad_type_0"), val = tensor("valid")]; tensor q_strides_0 = const()[name = tensor("q_strides_0"), val = tensor([1, 1])]; tensor q_pad_0 = const()[name = tensor("q_pad_0"), val = tensor([0, 0, 0, 0])]; tensor q_dilations_0 = const()[name = tensor("q_dilations_0"), val = tensor([1, 1])]; tensor q_groups_0 = const()[name = tensor("q_groups_0"), val = tensor(1)]; tensor var_8514_weight_0_to_fp16 = const()[name = tensor("op_8514_weight_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1234615872)))]; tensor var_8514_bias_0_to_fp16 = const()[name = tensor("op_8514_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1237892736)))]; tensor var_8514_cast_fp16 = conv(bias = var_8514_bias_0_to_fp16, dilations = q_dilations_0, groups = q_groups_0, pad = q_pad_0, pad_type = q_pad_type_0, strides = q_strides_0, weight = var_8514_weight_0_to_fp16, x = input_313_cast_fp16)[name = tensor("op_8514_cast_fp16")]; tensor k_pad_type_0 = const()[name = tensor("k_pad_type_0"), val = tensor("valid")]; tensor k_strides_0 = const()[name = tensor("k_strides_0"), val = tensor([1, 1])]; tensor k_pad_0 = const()[name = tensor("k_pad_0"), val = tensor([0, 0, 0, 0])]; tensor k_dilations_0 = const()[name = tensor("k_dilations_0"), val = tensor([1, 1])]; tensor k_groups_0 = const()[name = tensor("k_groups_0"), val = tensor(1)]; tensor blocks_31_attn_key_weight_to_fp16 = const()[name = tensor("blocks_31_attn_key_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1237895360)))]; tensor k_cast_fp16 = conv(dilations = k_dilations_0, groups = k_groups_0, pad = k_pad_0, pad_type = k_pad_type_0, strides = k_strides_0, weight = blocks_31_attn_key_weight_to_fp16, x = input_313_cast_fp16)[name = tensor("k_cast_fp16")]; tensor var_8512_pad_type_0 = const()[name = tensor("op_8512_pad_type_0"), val = tensor("valid")]; tensor var_8512_strides_0 = const()[name = tensor("op_8512_strides_0"), val = tensor([1, 1])]; tensor var_8512_pad_0 = const()[name = tensor("op_8512_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8512_dilations_0 = const()[name = tensor("op_8512_dilations_0"), val = tensor([1, 1])]; tensor var_8512_groups_0 = const()[name = tensor("op_8512_groups_0"), val = tensor(1)]; tensor blocks_31_attn_value_weight_to_fp16 = const()[name = tensor("blocks_31_attn_value_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1241172224)))]; tensor blocks_31_attn_value_bias_to_fp16 = const()[name = tensor("blocks_31_attn_value_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1244449088)))]; tensor var_8512_cast_fp16 = conv(bias = blocks_31_attn_value_bias_to_fp16, dilations = var_8512_dilations_0, groups = var_8512_groups_0, pad = var_8512_pad_0, pad_type = var_8512_pad_type_0, strides = var_8512_strides_0, weight = blocks_31_attn_value_weight_to_fp16, x = input_313_cast_fp16)[name = tensor("op_8512_cast_fp16")]; tensor tile_93 = const()[name = tensor("tile_93"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8515_axis_0 = const()[name = tensor("op_8515_axis_0"), val = tensor(1)]; tensor var_8515_cast_fp16_0, tensor var_8515_cast_fp16_1, tensor var_8515_cast_fp16_2, tensor var_8515_cast_fp16_3, tensor var_8515_cast_fp16_4, tensor var_8515_cast_fp16_5, tensor var_8515_cast_fp16_6, tensor var_8515_cast_fp16_7, tensor var_8515_cast_fp16_8, tensor var_8515_cast_fp16_9, tensor var_8515_cast_fp16_10, tensor var_8515_cast_fp16_11, tensor var_8515_cast_fp16_12, tensor var_8515_cast_fp16_13, tensor var_8515_cast_fp16_14, tensor var_8515_cast_fp16_15, tensor var_8515_cast_fp16_16, tensor var_8515_cast_fp16_17, tensor var_8515_cast_fp16_18, tensor var_8515_cast_fp16_19 = split(axis = var_8515_axis_0, split_sizes = tile_93, x = var_8514_cast_fp16)[name = tensor("op_8515_cast_fp16")]; tensor var_8536_perm_0 = const()[name = tensor("op_8536_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_94 = const()[name = tensor("tile_94"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8537_axis_0 = const()[name = tensor("op_8537_axis_0"), val = tensor(3)]; tensor var_8536_cast_fp16 = transpose(perm = var_8536_perm_0, x = k_cast_fp16)[name = tensor("transpose_1")]; tensor var_8537_cast_fp16_0, tensor var_8537_cast_fp16_1, tensor var_8537_cast_fp16_2, tensor var_8537_cast_fp16_3, tensor var_8537_cast_fp16_4, tensor var_8537_cast_fp16_5, tensor var_8537_cast_fp16_6, tensor var_8537_cast_fp16_7, tensor var_8537_cast_fp16_8, tensor var_8537_cast_fp16_9, tensor var_8537_cast_fp16_10, tensor var_8537_cast_fp16_11, tensor var_8537_cast_fp16_12, tensor var_8537_cast_fp16_13, tensor var_8537_cast_fp16_14, tensor var_8537_cast_fp16_15, tensor var_8537_cast_fp16_16, tensor var_8537_cast_fp16_17, tensor var_8537_cast_fp16_18, tensor var_8537_cast_fp16_19 = split(axis = var_8537_axis_0, split_sizes = tile_94, x = var_8536_cast_fp16)[name = tensor("op_8537_cast_fp16")]; tensor tile_95 = const()[name = tensor("tile_95"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64])]; tensor var_8558_axis_0 = const()[name = tensor("op_8558_axis_0"), val = tensor(1)]; tensor var_8558_cast_fp16_0, tensor var_8558_cast_fp16_1, tensor var_8558_cast_fp16_2, tensor var_8558_cast_fp16_3, tensor var_8558_cast_fp16_4, tensor var_8558_cast_fp16_5, tensor var_8558_cast_fp16_6, tensor var_8558_cast_fp16_7, tensor var_8558_cast_fp16_8, tensor var_8558_cast_fp16_9, tensor var_8558_cast_fp16_10, tensor var_8558_cast_fp16_11, tensor var_8558_cast_fp16_12, tensor var_8558_cast_fp16_13, tensor var_8558_cast_fp16_14, tensor var_8558_cast_fp16_15, tensor var_8558_cast_fp16_16, tensor var_8558_cast_fp16_17, tensor var_8558_cast_fp16_18, tensor var_8558_cast_fp16_19 = split(axis = var_8558_axis_0, split_sizes = tile_95, x = var_8512_cast_fp16)[name = tensor("op_8558_cast_fp16")]; tensor aw_1241_equation_0 = const()[name = tensor("aw_1241_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1241_cast_fp16 = einsum(equation = aw_1241_equation_0, values = (var_8537_cast_fp16_0, var_8515_cast_fp16_0))[name = tensor("aw_1241_cast_fp16")]; tensor aw_1243_equation_0 = const()[name = tensor("aw_1243_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1243_cast_fp16 = einsum(equation = aw_1243_equation_0, values = (var_8537_cast_fp16_1, var_8515_cast_fp16_1))[name = tensor("aw_1243_cast_fp16")]; tensor aw_1245_equation_0 = const()[name = tensor("aw_1245_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1245_cast_fp16 = einsum(equation = aw_1245_equation_0, values = (var_8537_cast_fp16_2, var_8515_cast_fp16_2))[name = tensor("aw_1245_cast_fp16")]; tensor aw_1247_equation_0 = const()[name = tensor("aw_1247_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1247_cast_fp16 = einsum(equation = aw_1247_equation_0, values = (var_8537_cast_fp16_3, var_8515_cast_fp16_3))[name = tensor("aw_1247_cast_fp16")]; tensor aw_1249_equation_0 = const()[name = tensor("aw_1249_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1249_cast_fp16 = einsum(equation = aw_1249_equation_0, values = (var_8537_cast_fp16_4, var_8515_cast_fp16_4))[name = tensor("aw_1249_cast_fp16")]; tensor aw_1251_equation_0 = const()[name = tensor("aw_1251_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1251_cast_fp16 = einsum(equation = aw_1251_equation_0, values = (var_8537_cast_fp16_5, var_8515_cast_fp16_5))[name = tensor("aw_1251_cast_fp16")]; tensor aw_1253_equation_0 = const()[name = tensor("aw_1253_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1253_cast_fp16 = einsum(equation = aw_1253_equation_0, values = (var_8537_cast_fp16_6, var_8515_cast_fp16_6))[name = tensor("aw_1253_cast_fp16")]; tensor aw_1255_equation_0 = const()[name = tensor("aw_1255_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1255_cast_fp16 = einsum(equation = aw_1255_equation_0, values = (var_8537_cast_fp16_7, var_8515_cast_fp16_7))[name = tensor("aw_1255_cast_fp16")]; tensor aw_1257_equation_0 = const()[name = tensor("aw_1257_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1257_cast_fp16 = einsum(equation = aw_1257_equation_0, values = (var_8537_cast_fp16_8, var_8515_cast_fp16_8))[name = tensor("aw_1257_cast_fp16")]; tensor aw_1259_equation_0 = const()[name = tensor("aw_1259_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1259_cast_fp16 = einsum(equation = aw_1259_equation_0, values = (var_8537_cast_fp16_9, var_8515_cast_fp16_9))[name = tensor("aw_1259_cast_fp16")]; tensor aw_1261_equation_0 = const()[name = tensor("aw_1261_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1261_cast_fp16 = einsum(equation = aw_1261_equation_0, values = (var_8537_cast_fp16_10, var_8515_cast_fp16_10))[name = tensor("aw_1261_cast_fp16")]; tensor aw_1263_equation_0 = const()[name = tensor("aw_1263_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1263_cast_fp16 = einsum(equation = aw_1263_equation_0, values = (var_8537_cast_fp16_11, var_8515_cast_fp16_11))[name = tensor("aw_1263_cast_fp16")]; tensor aw_1265_equation_0 = const()[name = tensor("aw_1265_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1265_cast_fp16 = einsum(equation = aw_1265_equation_0, values = (var_8537_cast_fp16_12, var_8515_cast_fp16_12))[name = tensor("aw_1265_cast_fp16")]; tensor aw_1267_equation_0 = const()[name = tensor("aw_1267_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1267_cast_fp16 = einsum(equation = aw_1267_equation_0, values = (var_8537_cast_fp16_13, var_8515_cast_fp16_13))[name = tensor("aw_1267_cast_fp16")]; tensor aw_1269_equation_0 = const()[name = tensor("aw_1269_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1269_cast_fp16 = einsum(equation = aw_1269_equation_0, values = (var_8537_cast_fp16_14, var_8515_cast_fp16_14))[name = tensor("aw_1269_cast_fp16")]; tensor aw_1271_equation_0 = const()[name = tensor("aw_1271_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1271_cast_fp16 = einsum(equation = aw_1271_equation_0, values = (var_8537_cast_fp16_15, var_8515_cast_fp16_15))[name = tensor("aw_1271_cast_fp16")]; tensor aw_1273_equation_0 = const()[name = tensor("aw_1273_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1273_cast_fp16 = einsum(equation = aw_1273_equation_0, values = (var_8537_cast_fp16_16, var_8515_cast_fp16_16))[name = tensor("aw_1273_cast_fp16")]; tensor aw_1275_equation_0 = const()[name = tensor("aw_1275_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1275_cast_fp16 = einsum(equation = aw_1275_equation_0, values = (var_8537_cast_fp16_17, var_8515_cast_fp16_17))[name = tensor("aw_1275_cast_fp16")]; tensor aw_1277_equation_0 = const()[name = tensor("aw_1277_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_1277_cast_fp16 = einsum(equation = aw_1277_equation_0, values = (var_8537_cast_fp16_18, var_8515_cast_fp16_18))[name = tensor("aw_1277_cast_fp16")]; tensor aw_equation_0 = const()[name = tensor("aw_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor aw_cast_fp16 = einsum(equation = aw_equation_0, values = (var_8537_cast_fp16_19, var_8515_cast_fp16_19))[name = tensor("aw_cast_fp16")]; tensor var_8619_cast_fp16 = softmax(axis = var_8463, x = aw_1241_cast_fp16)[name = tensor("op_8619_cast_fp16")]; tensor var_8620_cast_fp16 = softmax(axis = var_8463, x = aw_1243_cast_fp16)[name = tensor("op_8620_cast_fp16")]; tensor var_8621_cast_fp16 = softmax(axis = var_8463, x = aw_1245_cast_fp16)[name = tensor("op_8621_cast_fp16")]; tensor var_8622_cast_fp16 = softmax(axis = var_8463, x = aw_1247_cast_fp16)[name = tensor("op_8622_cast_fp16")]; tensor var_8623_cast_fp16 = softmax(axis = var_8463, x = aw_1249_cast_fp16)[name = tensor("op_8623_cast_fp16")]; tensor var_8624_cast_fp16 = softmax(axis = var_8463, x = aw_1251_cast_fp16)[name = tensor("op_8624_cast_fp16")]; tensor var_8625_cast_fp16 = softmax(axis = var_8463, x = aw_1253_cast_fp16)[name = tensor("op_8625_cast_fp16")]; tensor var_8626_cast_fp16 = softmax(axis = var_8463, x = aw_1255_cast_fp16)[name = tensor("op_8626_cast_fp16")]; tensor var_8627_cast_fp16 = softmax(axis = var_8463, x = aw_1257_cast_fp16)[name = tensor("op_8627_cast_fp16")]; tensor var_8628_cast_fp16 = softmax(axis = var_8463, x = aw_1259_cast_fp16)[name = tensor("op_8628_cast_fp16")]; tensor var_8629_cast_fp16 = softmax(axis = var_8463, x = aw_1261_cast_fp16)[name = tensor("op_8629_cast_fp16")]; tensor var_8630_cast_fp16 = softmax(axis = var_8463, x = aw_1263_cast_fp16)[name = tensor("op_8630_cast_fp16")]; tensor var_8631_cast_fp16 = softmax(axis = var_8463, x = aw_1265_cast_fp16)[name = tensor("op_8631_cast_fp16")]; tensor var_8632_cast_fp16 = softmax(axis = var_8463, x = aw_1267_cast_fp16)[name = tensor("op_8632_cast_fp16")]; tensor var_8633_cast_fp16 = softmax(axis = var_8463, x = aw_1269_cast_fp16)[name = tensor("op_8633_cast_fp16")]; tensor var_8634_cast_fp16 = softmax(axis = var_8463, x = aw_1271_cast_fp16)[name = tensor("op_8634_cast_fp16")]; tensor var_8635_cast_fp16 = softmax(axis = var_8463, x = aw_1273_cast_fp16)[name = tensor("op_8635_cast_fp16")]; tensor var_8636_cast_fp16 = softmax(axis = var_8463, x = aw_1275_cast_fp16)[name = tensor("op_8636_cast_fp16")]; tensor var_8637_cast_fp16 = softmax(axis = var_8463, x = aw_1277_cast_fp16)[name = tensor("op_8637_cast_fp16")]; tensor var_8638_cast_fp16 = softmax(axis = var_8463, x = aw_cast_fp16)[name = tensor("op_8638_cast_fp16")]; tensor var_8640_equation_0 = const()[name = tensor("op_8640_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8640_cast_fp16 = einsum(equation = var_8640_equation_0, values = (var_8558_cast_fp16_0, var_8619_cast_fp16))[name = tensor("op_8640_cast_fp16")]; tensor var_8642_equation_0 = const()[name = tensor("op_8642_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8642_cast_fp16 = einsum(equation = var_8642_equation_0, values = (var_8558_cast_fp16_1, var_8620_cast_fp16))[name = tensor("op_8642_cast_fp16")]; tensor var_8644_equation_0 = const()[name = tensor("op_8644_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8644_cast_fp16 = einsum(equation = var_8644_equation_0, values = (var_8558_cast_fp16_2, var_8621_cast_fp16))[name = tensor("op_8644_cast_fp16")]; tensor var_8646_equation_0 = const()[name = tensor("op_8646_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8646_cast_fp16 = einsum(equation = var_8646_equation_0, values = (var_8558_cast_fp16_3, var_8622_cast_fp16))[name = tensor("op_8646_cast_fp16")]; tensor var_8648_equation_0 = const()[name = tensor("op_8648_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8648_cast_fp16 = einsum(equation = var_8648_equation_0, values = (var_8558_cast_fp16_4, var_8623_cast_fp16))[name = tensor("op_8648_cast_fp16")]; tensor var_8650_equation_0 = const()[name = tensor("op_8650_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8650_cast_fp16 = einsum(equation = var_8650_equation_0, values = (var_8558_cast_fp16_5, var_8624_cast_fp16))[name = tensor("op_8650_cast_fp16")]; tensor var_8652_equation_0 = const()[name = tensor("op_8652_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8652_cast_fp16 = einsum(equation = var_8652_equation_0, values = (var_8558_cast_fp16_6, var_8625_cast_fp16))[name = tensor("op_8652_cast_fp16")]; tensor var_8654_equation_0 = const()[name = tensor("op_8654_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8654_cast_fp16 = einsum(equation = var_8654_equation_0, values = (var_8558_cast_fp16_7, var_8626_cast_fp16))[name = tensor("op_8654_cast_fp16")]; tensor var_8656_equation_0 = const()[name = tensor("op_8656_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8656_cast_fp16 = einsum(equation = var_8656_equation_0, values = (var_8558_cast_fp16_8, var_8627_cast_fp16))[name = tensor("op_8656_cast_fp16")]; tensor var_8658_equation_0 = const()[name = tensor("op_8658_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8658_cast_fp16 = einsum(equation = var_8658_equation_0, values = (var_8558_cast_fp16_9, var_8628_cast_fp16))[name = tensor("op_8658_cast_fp16")]; tensor var_8660_equation_0 = const()[name = tensor("op_8660_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8660_cast_fp16 = einsum(equation = var_8660_equation_0, values = (var_8558_cast_fp16_10, var_8629_cast_fp16))[name = tensor("op_8660_cast_fp16")]; tensor var_8662_equation_0 = const()[name = tensor("op_8662_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8662_cast_fp16 = einsum(equation = var_8662_equation_0, values = (var_8558_cast_fp16_11, var_8630_cast_fp16))[name = tensor("op_8662_cast_fp16")]; tensor var_8664_equation_0 = const()[name = tensor("op_8664_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8664_cast_fp16 = einsum(equation = var_8664_equation_0, values = (var_8558_cast_fp16_12, var_8631_cast_fp16))[name = tensor("op_8664_cast_fp16")]; tensor var_8666_equation_0 = const()[name = tensor("op_8666_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8666_cast_fp16 = einsum(equation = var_8666_equation_0, values = (var_8558_cast_fp16_13, var_8632_cast_fp16))[name = tensor("op_8666_cast_fp16")]; tensor var_8668_equation_0 = const()[name = tensor("op_8668_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8668_cast_fp16 = einsum(equation = var_8668_equation_0, values = (var_8558_cast_fp16_14, var_8633_cast_fp16))[name = tensor("op_8668_cast_fp16")]; tensor var_8670_equation_0 = const()[name = tensor("op_8670_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8670_cast_fp16 = einsum(equation = var_8670_equation_0, values = (var_8558_cast_fp16_15, var_8634_cast_fp16))[name = tensor("op_8670_cast_fp16")]; tensor var_8672_equation_0 = const()[name = tensor("op_8672_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8672_cast_fp16 = einsum(equation = var_8672_equation_0, values = (var_8558_cast_fp16_16, var_8635_cast_fp16))[name = tensor("op_8672_cast_fp16")]; tensor var_8674_equation_0 = const()[name = tensor("op_8674_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8674_cast_fp16 = einsum(equation = var_8674_equation_0, values = (var_8558_cast_fp16_17, var_8636_cast_fp16))[name = tensor("op_8674_cast_fp16")]; tensor var_8676_equation_0 = const()[name = tensor("op_8676_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8676_cast_fp16 = einsum(equation = var_8676_equation_0, values = (var_8558_cast_fp16_18, var_8637_cast_fp16))[name = tensor("op_8676_cast_fp16")]; tensor var_8678_equation_0 = const()[name = tensor("op_8678_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_8678_cast_fp16 = einsum(equation = var_8678_equation_0, values = (var_8558_cast_fp16_19, var_8638_cast_fp16))[name = tensor("op_8678_cast_fp16")]; tensor input_315_interleave_0 = const()[name = tensor("input_315_interleave_0"), val = tensor(false)]; tensor input_315_cast_fp16 = concat(axis = var_8463, interleave = input_315_interleave_0, values = (var_8640_cast_fp16, var_8642_cast_fp16, var_8644_cast_fp16, var_8646_cast_fp16, var_8648_cast_fp16, var_8650_cast_fp16, var_8652_cast_fp16, var_8654_cast_fp16, var_8656_cast_fp16, var_8658_cast_fp16, var_8660_cast_fp16, var_8662_cast_fp16, var_8664_cast_fp16, var_8666_cast_fp16, var_8668_cast_fp16, var_8670_cast_fp16, var_8672_cast_fp16, var_8674_cast_fp16, var_8676_cast_fp16, var_8678_cast_fp16))[name = tensor("input_315_cast_fp16")]; tensor var_8687_pad_type_0 = const()[name = tensor("op_8687_pad_type_0"), val = tensor("valid")]; tensor var_8687_strides_0 = const()[name = tensor("op_8687_strides_0"), val = tensor([1, 1])]; tensor var_8687_pad_0 = const()[name = tensor("op_8687_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8687_dilations_0 = const()[name = tensor("op_8687_dilations_0"), val = tensor([1, 1])]; tensor var_8687_groups_0 = const()[name = tensor("op_8687_groups_0"), val = tensor(1)]; tensor blocks_31_attn_out_weight_to_fp16 = const()[name = tensor("blocks_31_attn_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1244451712)))]; tensor blocks_31_attn_out_bias_to_fp16 = const()[name = tensor("blocks_31_attn_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247728576)))]; tensor var_8687_cast_fp16 = conv(bias = blocks_31_attn_out_bias_to_fp16, dilations = var_8687_dilations_0, groups = var_8687_groups_0, pad = var_8687_pad_0, pad_type = var_8687_pad_type_0, strides = var_8687_strides_0, weight = blocks_31_attn_out_weight_to_fp16, x = input_315_cast_fp16)[name = tensor("op_8687_cast_fp16")]; tensor inputs_127_cast_fp16 = add(x = inputs_125_cast_fp16, y = var_8687_cast_fp16)[name = tensor("inputs_127_cast_fp16")]; tensor input_317_axes_0 = const()[name = tensor("input_317_axes_0"), val = tensor([1])]; tensor input_317_gamma_0_to_fp16 = const()[name = tensor("input_317_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247731200)))]; tensor input_317_beta_0_to_fp16 = const()[name = tensor("input_317_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247733824)))]; tensor var_8697_to_fp16 = const()[name = tensor("op_8697_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_317_cast_fp16 = layer_norm(axes = input_317_axes_0, beta = input_317_beta_0_to_fp16, epsilon = var_8697_to_fp16, gamma = input_317_gamma_0_to_fp16, x = inputs_127_cast_fp16)[name = tensor("input_317_cast_fp16")]; tensor input_319_pad_type_0 = const()[name = tensor("input_319_pad_type_0"), val = tensor("valid")]; tensor input_319_strides_0 = const()[name = tensor("input_319_strides_0"), val = tensor([1, 1])]; tensor input_319_pad_0 = const()[name = tensor("input_319_pad_0"), val = tensor([0, 0, 0, 0])]; tensor input_319_dilations_0 = const()[name = tensor("input_319_dilations_0"), val = tensor([1, 1])]; tensor input_319_groups_0 = const()[name = tensor("input_319_groups_0"), val = tensor(1)]; tensor blocks_31_mlp_0_weight_to_fp16 = const()[name = tensor("blocks_31_mlp_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1247736448)))]; tensor blocks_31_mlp_0_bias_to_fp16 = const()[name = tensor("blocks_31_mlp_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1260843712)))]; tensor input_319_cast_fp16 = conv(bias = blocks_31_mlp_0_bias_to_fp16, dilations = input_319_dilations_0, groups = input_319_groups_0, pad = input_319_pad_0, pad_type = input_319_pad_type_0, strides = input_319_strides_0, weight = blocks_31_mlp_0_weight_to_fp16, x = input_317_cast_fp16)[name = tensor("input_319_cast_fp16")]; tensor input_mode_0 = const()[name = tensor("input_mode_0"), val = tensor("EXACT")]; tensor input_cast_fp16 = gelu(mode = input_mode_0, x = input_319_cast_fp16)[name = tensor("input_cast_fp16")]; tensor var_8723_pad_type_0 = const()[name = tensor("op_8723_pad_type_0"), val = tensor("valid")]; tensor var_8723_strides_0 = const()[name = tensor("op_8723_strides_0"), val = tensor([1, 1])]; tensor var_8723_pad_0 = const()[name = tensor("op_8723_pad_0"), val = tensor([0, 0, 0, 0])]; tensor var_8723_dilations_0 = const()[name = tensor("op_8723_dilations_0"), val = tensor([1, 1])]; tensor var_8723_groups_0 = const()[name = tensor("op_8723_groups_0"), val = tensor(1)]; tensor blocks_31_mlp_2_weight_to_fp16 = const()[name = tensor("blocks_31_mlp_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1260854016)))]; tensor blocks_31_mlp_2_bias_to_fp16 = const()[name = tensor("blocks_31_mlp_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273961280)))]; tensor var_8723_cast_fp16 = conv(bias = blocks_31_mlp_2_bias_to_fp16, dilations = var_8723_dilations_0, groups = var_8723_groups_0, pad = var_8723_pad_0, pad_type = var_8723_pad_type_0, strides = var_8723_strides_0, weight = blocks_31_mlp_2_weight_to_fp16, x = input_cast_fp16)[name = tensor("op_8723_cast_fp16")]; tensor inputs_cast_fp16 = add(x = inputs_127_cast_fp16, y = var_8723_cast_fp16)[name = tensor("inputs_cast_fp16")]; tensor x_axes_0 = const()[name = tensor("x_axes_0"), val = tensor([1])]; tensor x_gamma_0_to_fp16 = const()[name = tensor("x_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273963904)))]; tensor x_beta_0_to_fp16 = const()[name = tensor("x_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1273966528)))]; tensor var_8737_to_fp16 = const()[name = tensor("op_8737_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_cast_fp16 = layer_norm(axes = x_axes_0, beta = x_beta_0_to_fp16, epsilon = var_8737_to_fp16, gamma = x_gamma_0_to_fp16, x = inputs_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_8748_axes_0 = const()[name = tensor("op_8748_axes_0"), val = tensor([2])]; tensor var_8748_cast_fp16 = squeeze(axes = var_8748_axes_0, x = x_cast_fp16)[name = tensor("op_8748_cast_fp16")]; tensor var_8751_perm_0 = const()[name = tensor("op_8751_perm_0"), val = tensor([0, 2, 1])]; tensor var_8751_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_8751_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; tensor var_8751_cast_fp16 = transpose(perm = var_8751_perm_0, x = var_8748_cast_fp16)[name = tensor("transpose_0")]; tensor output = cast(dtype = var_8751_cast_fp16_to_fp32_dtype_0, x = var_8751_cast_fp16)[name = tensor("cast_130")]; } -> (output); }