program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3304.5.2"}, {"coremlc-version", "3304.6.2"}, {"coremltools-component-torch", "2.3.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "7.2"}})] { func main(tensor logmel_data) { tensor var_72 = const()[name = tensor("op_72"), val = tensor(1)]; tensor var_80 = const()[name = tensor("op_80"), val = tensor([1])]; tensor var_82 = const()[name = tensor("op_82"), val = tensor([1])]; tensor var_84_pad_type_0 = const()[name = tensor("op_84_pad_type_0"), val = tensor("custom")]; tensor var_84_pad_0 = const()[name = tensor("op_84_pad_0"), val = tensor([1, 1])]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614528)))]; tensor var_84_cast_fp16 = conv(bias = bias_3_to_fp16, dilations = var_82, groups = var_72, pad = var_84_pad_0, pad_type = var_84_pad_type_0, strides = var_80, weight = weight_3_to_fp16, x = logmel_data)[name = tensor("op_84_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_84_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_89 = const()[name = tensor("op_89"), val = tensor(1)]; tensor var_98 = const()[name = tensor("op_98"), val = tensor([2])]; tensor var_100 = const()[name = tensor("op_100"), val = tensor([1])]; tensor var_102_pad_type_0 = const()[name = tensor("op_102_pad_type_0"), val = tensor("custom")]; tensor var_102_pad_0 = const()[name = tensor("op_102_pad_0"), val = tensor([1, 1])]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(617152)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10447616)))]; tensor var_102_cast_fp16 = conv(bias = bias_7_to_fp16, dilations = var_100, groups = var_89, pad = var_102_pad_0, pad_type = var_102_pad_type_0, strides = var_98, weight = weight_7_to_fp16, x = input_1_cast_fp16)[name = tensor("op_102_cast_fp16")]; tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_102_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_108 = const()[name = tensor("op_108"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10450240)))]; tensor transpose_320 = transpose(perm = var_108, x = x_3_cast_fp16)[name = tensor("transpose_320")]; tensor var_111_cast_fp16 = add(x = transpose_320, y = positional_embedding_to_fp16)[name = tensor("op_111_cast_fp16")]; tensor var_124 = const()[name = tensor("op_124"), val = tensor(-1)]; tensor var_140_axes_0 = const()[name = tensor("op_140_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14290304)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14292928)))]; tensor var_130_to_fp16 = const()[name = tensor("op_130_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_140_cast_fp16 = layer_norm(axes = var_140_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_130_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_111_cast_fp16)[name = tensor("op_140_cast_fp16")]; tensor var_151_to_fp16 = const()[name = tensor("op_151_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14295552)))]; tensor var_152_to_fp16 = const()[name = tensor("op_152_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17572416)))]; tensor linear_0_cast_fp16 = linear(bias = var_152_to_fp16, weight = var_151_to_fp16, x = var_140_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_155_to_fp16 = const()[name = tensor("op_155_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17575040)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20851904)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_155_to_fp16, x = var_140_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor var_159_to_fp16 = const()[name = tensor("op_159_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20854528)))]; tensor var_160_to_fp16 = const()[name = tensor("op_160_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24131392)))]; tensor linear_2_cast_fp16 = linear(bias = var_160_to_fp16, weight = var_159_to_fp16, x = var_140_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_168 = const()[name = tensor("op_168"), val = tensor([1, 1500, 20, -1])]; tensor var_169_cast_fp16 = reshape(shape = var_168, x = linear_0_cast_fp16)[name = tensor("op_169_cast_fp16")]; tensor const_224_to_fp16 = const()[name = tensor("const_224_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast_fp16 = mul(x = var_169_cast_fp16, y = const_224_to_fp16)[name = tensor("q_3_cast_fp16")]; tensor var_175 = const()[name = tensor("op_175"), val = tensor([1, 1500, 20, -1])]; tensor var_176_cast_fp16 = reshape(shape = var_175, x = linear_1_cast_fp16)[name = tensor("op_176_cast_fp16")]; tensor const_225_to_fp16 = const()[name = tensor("const_225_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast_fp16 = mul(x = var_176_cast_fp16, y = const_225_to_fp16)[name = tensor("k_3_cast_fp16")]; tensor var_182 = const()[name = tensor("op_182"), val = tensor([1, 1500, 20, -1])]; tensor var_183_cast_fp16 = reshape(shape = var_182, x = linear_2_cast_fp16)[name = tensor("op_183_cast_fp16")]; tensor var_184 = const()[name = tensor("op_184"), val = tensor([0, 2, 1, 3])]; tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; tensor transpose_128_perm_0 = const()[name = tensor("transpose_128_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_129_perm_0 = const()[name = tensor("transpose_129_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_317 = transpose(perm = transpose_129_perm_0, x = k_3_cast_fp16)[name = tensor("transpose_317")]; tensor transpose_318 = transpose(perm = transpose_128_perm_0, x = q_3_cast_fp16)[name = tensor("transpose_318")]; tensor qk_1_cast_fp16 = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_318, y = transpose_317)[name = tensor("qk_1_cast_fp16")]; tensor var_188_cast_fp16 = softmax(axis = var_124, x = qk_1_cast_fp16)[name = tensor("op_188_cast_fp16")]; tensor var_190_transpose_x_0 = const()[name = tensor("op_190_transpose_x_0"), val = tensor(false)]; tensor var_190_transpose_y_0 = const()[name = tensor("op_190_transpose_y_0"), val = tensor(false)]; tensor transpose_319 = transpose(perm = var_184, x = var_183_cast_fp16)[name = tensor("transpose_319")]; tensor var_190_cast_fp16 = matmul(transpose_x = var_190_transpose_x_0, transpose_y = var_190_transpose_y_0, x = var_188_cast_fp16, y = transpose_319)[name = tensor("op_190_cast_fp16")]; tensor var_191 = const()[name = tensor("op_191"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 1280])]; tensor transpose_316 = transpose(perm = var_191, x = var_190_cast_fp16)[name = tensor("transpose_316")]; tensor x_11_cast_fp16 = reshape(shape = concat_0, x = transpose_316)[name = tensor("x_11_cast_fp16")]; tensor var_196_to_fp16 = const()[name = tensor("op_196_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24134016)))]; tensor var_197_to_fp16 = const()[name = tensor("op_197_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27410880)))]; tensor linear_3_cast_fp16 = linear(bias = var_197_to_fp16, weight = var_196_to_fp16, x = x_11_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor x_13_cast_fp16 = add(x = var_111_cast_fp16, y = linear_3_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor var_204_axes_0 = const()[name = tensor("op_204_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27413504)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27416128)))]; tensor var_204_cast_fp16 = layer_norm(axes = var_204_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_130_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast_fp16)[name = tensor("op_204_cast_fp16")]; tensor var_213_to_fp16 = const()[name = tensor("op_213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(27418752)))]; tensor var_214_to_fp16 = const()[name = tensor("op_214_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34136256)))]; tensor linear_4_cast_fp16 = linear(bias = var_214_to_fp16, weight = var_213_to_fp16, x = var_204_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; tensor x_17_cast_fp16 = gelu(mode = x_17_mode_0, x = linear_4_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor var_219_to_fp16 = const()[name = tensor("op_219_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34141568)))]; tensor var_220_to_fp16 = const()[name = tensor("op_220_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40859072)))]; tensor linear_5_cast_fp16 = linear(bias = var_220_to_fp16, weight = var_219_to_fp16, x = x_17_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor x_19_cast_fp16 = add(x = x_13_cast_fp16, y = linear_5_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor var_230 = const()[name = tensor("op_230"), val = tensor(-1)]; tensor var_246_axes_0 = const()[name = tensor("op_246_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40861696)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40864320)))]; tensor var_236_to_fp16 = const()[name = tensor("op_236_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_246_cast_fp16 = layer_norm(axes = var_246_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_236_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast_fp16)[name = tensor("op_246_cast_fp16")]; tensor var_257_to_fp16 = const()[name = tensor("op_257_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40866944)))]; tensor var_258_to_fp16 = const()[name = tensor("op_258_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44143808)))]; tensor linear_6_cast_fp16 = linear(bias = var_258_to_fp16, weight = var_257_to_fp16, x = var_246_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor var_261_to_fp16 = const()[name = tensor("op_261_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(44146432)))]; tensor linear_7_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_261_to_fp16, x = var_246_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor var_265_to_fp16 = const()[name = tensor("op_265_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47423296)))]; tensor var_266_to_fp16 = const()[name = tensor("op_266_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50700160)))]; tensor linear_8_cast_fp16 = linear(bias = var_266_to_fp16, weight = var_265_to_fp16, x = var_246_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor var_274 = const()[name = tensor("op_274"), val = tensor([1, 1500, 20, -1])]; tensor var_275_cast_fp16 = reshape(shape = var_274, x = linear_6_cast_fp16)[name = tensor("op_275_cast_fp16")]; tensor const_226_to_fp16 = const()[name = tensor("const_226_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast_fp16 = mul(x = var_275_cast_fp16, y = const_226_to_fp16)[name = tensor("q_7_cast_fp16")]; tensor var_281 = const()[name = tensor("op_281"), val = tensor([1, 1500, 20, -1])]; tensor var_282_cast_fp16 = reshape(shape = var_281, x = linear_7_cast_fp16)[name = tensor("op_282_cast_fp16")]; tensor const_227_to_fp16 = const()[name = tensor("const_227_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast_fp16 = mul(x = var_282_cast_fp16, y = const_227_to_fp16)[name = tensor("k_7_cast_fp16")]; tensor var_288 = const()[name = tensor("op_288"), val = tensor([1, 1500, 20, -1])]; tensor var_289_cast_fp16 = reshape(shape = var_288, x = linear_8_cast_fp16)[name = tensor("op_289_cast_fp16")]; tensor var_290 = const()[name = tensor("op_290"), val = tensor([0, 2, 1, 3])]; tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; tensor transpose_130_perm_0 = const()[name = tensor("transpose_130_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_131_perm_0 = const()[name = tensor("transpose_131_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_313 = transpose(perm = transpose_131_perm_0, x = k_7_cast_fp16)[name = tensor("transpose_313")]; tensor transpose_314 = transpose(perm = transpose_130_perm_0, x = q_7_cast_fp16)[name = tensor("transpose_314")]; tensor qk_3_cast_fp16 = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_314, y = transpose_313)[name = tensor("qk_3_cast_fp16")]; tensor var_294_cast_fp16 = softmax(axis = var_230, x = qk_3_cast_fp16)[name = tensor("op_294_cast_fp16")]; tensor var_296_transpose_x_0 = const()[name = tensor("op_296_transpose_x_0"), val = tensor(false)]; tensor var_296_transpose_y_0 = const()[name = tensor("op_296_transpose_y_0"), val = tensor(false)]; tensor transpose_315 = transpose(perm = var_290, x = var_289_cast_fp16)[name = tensor("transpose_315")]; tensor var_296_cast_fp16 = matmul(transpose_x = var_296_transpose_x_0, transpose_y = var_296_transpose_y_0, x = var_294_cast_fp16, y = transpose_315)[name = tensor("op_296_cast_fp16")]; tensor var_297 = const()[name = tensor("op_297"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 1280])]; tensor transpose_312 = transpose(perm = var_297, x = var_296_cast_fp16)[name = tensor("transpose_312")]; tensor x_23_cast_fp16 = reshape(shape = concat_1, x = transpose_312)[name = tensor("x_23_cast_fp16")]; tensor var_302_to_fp16 = const()[name = tensor("op_302_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50702784)))]; tensor var_303_to_fp16 = const()[name = tensor("op_303_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53979648)))]; tensor linear_9_cast_fp16 = linear(bias = var_303_to_fp16, weight = var_302_to_fp16, x = x_23_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor x_25_cast_fp16 = add(x = x_19_cast_fp16, y = linear_9_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor var_310_axes_0 = const()[name = tensor("op_310_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53982272)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53984896)))]; tensor var_310_cast_fp16 = layer_norm(axes = var_310_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_236_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast_fp16)[name = tensor("op_310_cast_fp16")]; tensor var_319_to_fp16 = const()[name = tensor("op_319_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53987520)))]; tensor var_320_to_fp16 = const()[name = tensor("op_320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59721984)))]; tensor linear_10_cast_fp16 = linear(bias = var_320_to_fp16, weight = var_319_to_fp16, x = var_310_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; tensor x_29_cast_fp16 = gelu(mode = x_29_mode_0, x = linear_10_cast_fp16)[name = tensor("x_29_cast_fp16")]; tensor var_325_to_fp16 = const()[name = tensor("op_325_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(59726528)))]; tensor var_326_to_fp16 = const()[name = tensor("op_326_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65460992)))]; tensor linear_11_cast_fp16 = linear(bias = var_326_to_fp16, weight = var_325_to_fp16, x = x_29_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor x_31_cast_fp16 = add(x = x_25_cast_fp16, y = linear_11_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor var_336 = const()[name = tensor("op_336"), val = tensor(-1)]; tensor var_352_axes_0 = const()[name = tensor("op_352_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65463616)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65466240)))]; tensor var_342_to_fp16 = const()[name = tensor("op_342_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_352_cast_fp16 = layer_norm(axes = var_352_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_342_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast_fp16)[name = tensor("op_352_cast_fp16")]; tensor var_363_to_fp16 = const()[name = tensor("op_363_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65468864)))]; tensor var_364_to_fp16 = const()[name = tensor("op_364_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68745728)))]; tensor linear_12_cast_fp16 = linear(bias = var_364_to_fp16, weight = var_363_to_fp16, x = var_352_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_367_to_fp16 = const()[name = tensor("op_367_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68748352)))]; tensor linear_13_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_367_to_fp16, x = var_352_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_371_to_fp16 = const()[name = tensor("op_371_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(72025216)))]; tensor var_372_to_fp16 = const()[name = tensor("op_372_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75302080)))]; tensor linear_14_cast_fp16 = linear(bias = var_372_to_fp16, weight = var_371_to_fp16, x = var_352_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_380 = const()[name = tensor("op_380"), val = tensor([1, 1500, 20, -1])]; tensor var_381_cast_fp16 = reshape(shape = var_380, x = linear_12_cast_fp16)[name = tensor("op_381_cast_fp16")]; tensor const_228_to_fp16 = const()[name = tensor("const_228_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast_fp16 = mul(x = var_381_cast_fp16, y = const_228_to_fp16)[name = tensor("q_11_cast_fp16")]; tensor var_387 = const()[name = tensor("op_387"), val = tensor([1, 1500, 20, -1])]; tensor var_388_cast_fp16 = reshape(shape = var_387, x = linear_13_cast_fp16)[name = tensor("op_388_cast_fp16")]; tensor const_229_to_fp16 = const()[name = tensor("const_229_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast_fp16 = mul(x = var_388_cast_fp16, y = const_229_to_fp16)[name = tensor("k_11_cast_fp16")]; tensor var_394 = const()[name = tensor("op_394"), val = tensor([1, 1500, 20, -1])]; tensor var_395_cast_fp16 = reshape(shape = var_394, x = linear_14_cast_fp16)[name = tensor("op_395_cast_fp16")]; tensor var_396 = const()[name = tensor("op_396"), val = tensor([0, 2, 1, 3])]; tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; tensor transpose_132_perm_0 = const()[name = tensor("transpose_132_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_133_perm_0 = const()[name = tensor("transpose_133_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_309 = transpose(perm = transpose_133_perm_0, x = k_11_cast_fp16)[name = tensor("transpose_309")]; tensor transpose_310 = transpose(perm = transpose_132_perm_0, x = q_11_cast_fp16)[name = tensor("transpose_310")]; tensor qk_5_cast_fp16 = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_310, y = transpose_309)[name = tensor("qk_5_cast_fp16")]; tensor var_400_cast_fp16 = softmax(axis = var_336, x = qk_5_cast_fp16)[name = tensor("op_400_cast_fp16")]; tensor var_402_transpose_x_0 = const()[name = tensor("op_402_transpose_x_0"), val = tensor(false)]; tensor var_402_transpose_y_0 = const()[name = tensor("op_402_transpose_y_0"), val = tensor(false)]; tensor transpose_311 = transpose(perm = var_396, x = var_395_cast_fp16)[name = tensor("transpose_311")]; tensor var_402_cast_fp16 = matmul(transpose_x = var_402_transpose_x_0, transpose_y = var_402_transpose_y_0, x = var_400_cast_fp16, y = transpose_311)[name = tensor("op_402_cast_fp16")]; tensor var_403 = const()[name = tensor("op_403"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 1280])]; tensor transpose_308 = transpose(perm = var_403, x = var_402_cast_fp16)[name = tensor("transpose_308")]; tensor x_35_cast_fp16 = reshape(shape = concat_2, x = transpose_308)[name = tensor("x_35_cast_fp16")]; tensor var_408_to_fp16 = const()[name = tensor("op_408_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75304704)))]; tensor var_409_to_fp16 = const()[name = tensor("op_409_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78581568)))]; tensor linear_15_cast_fp16 = linear(bias = var_409_to_fp16, weight = var_408_to_fp16, x = x_35_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor x_37_cast_fp16 = add(x = x_31_cast_fp16, y = linear_15_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor var_416_axes_0 = const()[name = tensor("op_416_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78584192)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78586816)))]; tensor var_416_cast_fp16 = layer_norm(axes = var_416_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_342_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast_fp16)[name = tensor("op_416_cast_fp16")]; tensor var_425_to_fp16 = const()[name = tensor("op_425_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78589440)))]; tensor var_426_to_fp16 = const()[name = tensor("op_426_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83832384)))]; tensor linear_16_cast_fp16 = linear(bias = var_426_to_fp16, weight = var_425_to_fp16, x = var_416_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; tensor x_41_cast_fp16 = gelu(mode = x_41_mode_0, x = linear_16_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor var_431_to_fp16 = const()[name = tensor("op_431_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(83836544)))]; tensor var_432_to_fp16 = const()[name = tensor("op_432_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89079488)))]; tensor linear_17_cast_fp16 = linear(bias = var_432_to_fp16, weight = var_431_to_fp16, x = x_41_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor x_43_cast_fp16 = add(x = x_37_cast_fp16, y = linear_17_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor var_442 = const()[name = tensor("op_442"), val = tensor(-1)]; tensor var_458_axes_0 = const()[name = tensor("op_458_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89082112)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89084736)))]; tensor var_448_to_fp16 = const()[name = tensor("op_448_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_458_cast_fp16 = layer_norm(axes = var_458_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_448_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast_fp16)[name = tensor("op_458_cast_fp16")]; tensor var_469_to_fp16 = const()[name = tensor("op_469_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89087360)))]; tensor var_470_to_fp16 = const()[name = tensor("op_470_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92364224)))]; tensor linear_18_cast_fp16 = linear(bias = var_470_to_fp16, weight = var_469_to_fp16, x = var_458_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_473_to_fp16 = const()[name = tensor("op_473_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92366848)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_473_to_fp16, x = var_458_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor var_477_to_fp16 = const()[name = tensor("op_477_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(95643712)))]; tensor var_478_to_fp16 = const()[name = tensor("op_478_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(98920576)))]; tensor linear_20_cast_fp16 = linear(bias = var_478_to_fp16, weight = var_477_to_fp16, x = var_458_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_486 = const()[name = tensor("op_486"), val = tensor([1, 1500, 20, -1])]; tensor var_487_cast_fp16 = reshape(shape = var_486, x = linear_18_cast_fp16)[name = tensor("op_487_cast_fp16")]; tensor const_230_to_fp16 = const()[name = tensor("const_230_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast_fp16 = mul(x = var_487_cast_fp16, y = const_230_to_fp16)[name = tensor("q_15_cast_fp16")]; tensor var_493 = const()[name = tensor("op_493"), val = tensor([1, 1500, 20, -1])]; tensor var_494_cast_fp16 = reshape(shape = var_493, x = linear_19_cast_fp16)[name = tensor("op_494_cast_fp16")]; tensor const_231_to_fp16 = const()[name = tensor("const_231_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast_fp16 = mul(x = var_494_cast_fp16, y = const_231_to_fp16)[name = tensor("k_15_cast_fp16")]; tensor var_500 = const()[name = tensor("op_500"), val = tensor([1, 1500, 20, -1])]; tensor var_501_cast_fp16 = reshape(shape = var_500, x = linear_20_cast_fp16)[name = tensor("op_501_cast_fp16")]; tensor var_502 = const()[name = tensor("op_502"), val = tensor([0, 2, 1, 3])]; tensor qk_7_transpose_x_0 = const()[name = tensor("qk_7_transpose_x_0"), val = tensor(false)]; tensor qk_7_transpose_y_0 = const()[name = tensor("qk_7_transpose_y_0"), val = tensor(false)]; tensor transpose_134_perm_0 = const()[name = tensor("transpose_134_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_135_perm_0 = const()[name = tensor("transpose_135_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_305 = transpose(perm = transpose_135_perm_0, x = k_15_cast_fp16)[name = tensor("transpose_305")]; tensor transpose_306 = transpose(perm = transpose_134_perm_0, x = q_15_cast_fp16)[name = tensor("transpose_306")]; tensor qk_7_cast_fp16 = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_306, y = transpose_305)[name = tensor("qk_7_cast_fp16")]; tensor var_506_cast_fp16 = softmax(axis = var_442, x = qk_7_cast_fp16)[name = tensor("op_506_cast_fp16")]; tensor var_508_transpose_x_0 = const()[name = tensor("op_508_transpose_x_0"), val = tensor(false)]; tensor var_508_transpose_y_0 = const()[name = tensor("op_508_transpose_y_0"), val = tensor(false)]; tensor transpose_307 = transpose(perm = var_502, x = var_501_cast_fp16)[name = tensor("transpose_307")]; tensor var_508_cast_fp16 = matmul(transpose_x = var_508_transpose_x_0, transpose_y = var_508_transpose_y_0, x = var_506_cast_fp16, y = transpose_307)[name = tensor("op_508_cast_fp16")]; tensor var_509 = const()[name = tensor("op_509"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 1280])]; tensor transpose_304 = transpose(perm = var_509, x = var_508_cast_fp16)[name = tensor("transpose_304")]; tensor x_47_cast_fp16 = reshape(shape = concat_3, x = transpose_304)[name = tensor("x_47_cast_fp16")]; tensor var_514_to_fp16 = const()[name = tensor("op_514_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(98923200)))]; tensor var_515_to_fp16 = const()[name = tensor("op_515_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102200064)))]; tensor linear_21_cast_fp16 = linear(bias = var_515_to_fp16, weight = var_514_to_fp16, x = x_47_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor x_49_cast_fp16 = add(x = x_43_cast_fp16, y = linear_21_cast_fp16)[name = tensor("x_49_cast_fp16")]; tensor var_522_axes_0 = const()[name = tensor("op_522_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102202688)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102205312)))]; tensor var_522_cast_fp16 = layer_norm(axes = var_522_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_448_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast_fp16)[name = tensor("op_522_cast_fp16")]; tensor var_531_to_fp16 = const()[name = tensor("op_531_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102207936)))]; tensor var_532_to_fp16 = const()[name = tensor("op_532_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106877440)))]; tensor linear_22_cast_fp16 = linear(bias = var_532_to_fp16, weight = var_531_to_fp16, x = var_522_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; tensor x_53_cast_fp16 = gelu(mode = x_53_mode_0, x = linear_22_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor var_537_to_fp16 = const()[name = tensor("op_537_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(106881152)))]; tensor var_538_to_fp16 = const()[name = tensor("op_538_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(111550656)))]; tensor linear_23_cast_fp16 = linear(bias = var_538_to_fp16, weight = var_537_to_fp16, x = x_53_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor x_55_cast_fp16 = add(x = x_49_cast_fp16, y = linear_23_cast_fp16)[name = tensor("x_55_cast_fp16")]; tensor var_548 = const()[name = tensor("op_548"), val = tensor(-1)]; tensor var_564_axes_0 = const()[name = tensor("op_564_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(111553280)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(111555904)))]; tensor var_554_to_fp16 = const()[name = tensor("op_554_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_564_cast_fp16 = layer_norm(axes = var_564_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_554_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast_fp16)[name = tensor("op_564_cast_fp16")]; tensor var_575_to_fp16 = const()[name = tensor("op_575_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(111558528)))]; tensor var_576_to_fp16 = const()[name = tensor("op_576_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114835392)))]; tensor linear_24_cast_fp16 = linear(bias = var_576_to_fp16, weight = var_575_to_fp16, x = var_564_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor var_579_to_fp16 = const()[name = tensor("op_579_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114838016)))]; tensor linear_25_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_579_to_fp16, x = var_564_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor var_583_to_fp16 = const()[name = tensor("op_583_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118114880)))]; tensor var_584_to_fp16 = const()[name = tensor("op_584_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121391744)))]; tensor linear_26_cast_fp16 = linear(bias = var_584_to_fp16, weight = var_583_to_fp16, x = var_564_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor var_592 = const()[name = tensor("op_592"), val = tensor([1, 1500, 20, -1])]; tensor var_593_cast_fp16 = reshape(shape = var_592, x = linear_24_cast_fp16)[name = tensor("op_593_cast_fp16")]; tensor const_232_to_fp16 = const()[name = tensor("const_232_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast_fp16 = mul(x = var_593_cast_fp16, y = const_232_to_fp16)[name = tensor("q_19_cast_fp16")]; tensor var_599 = const()[name = tensor("op_599"), val = tensor([1, 1500, 20, -1])]; tensor var_600_cast_fp16 = reshape(shape = var_599, x = linear_25_cast_fp16)[name = tensor("op_600_cast_fp16")]; tensor const_233_to_fp16 = const()[name = tensor("const_233_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast_fp16 = mul(x = var_600_cast_fp16, y = const_233_to_fp16)[name = tensor("k_19_cast_fp16")]; tensor var_606 = const()[name = tensor("op_606"), val = tensor([1, 1500, 20, -1])]; tensor var_607_cast_fp16 = reshape(shape = var_606, x = linear_26_cast_fp16)[name = tensor("op_607_cast_fp16")]; tensor var_608 = const()[name = tensor("op_608"), val = tensor([0, 2, 1, 3])]; tensor qk_9_transpose_x_0 = const()[name = tensor("qk_9_transpose_x_0"), val = tensor(false)]; tensor qk_9_transpose_y_0 = const()[name = tensor("qk_9_transpose_y_0"), val = tensor(false)]; tensor transpose_136_perm_0 = const()[name = tensor("transpose_136_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_137_perm_0 = const()[name = tensor("transpose_137_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_301 = transpose(perm = transpose_137_perm_0, x = k_19_cast_fp16)[name = tensor("transpose_301")]; tensor transpose_302 = transpose(perm = transpose_136_perm_0, x = q_19_cast_fp16)[name = tensor("transpose_302")]; tensor qk_9_cast_fp16 = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_302, y = transpose_301)[name = tensor("qk_9_cast_fp16")]; tensor var_612_cast_fp16 = softmax(axis = var_548, x = qk_9_cast_fp16)[name = tensor("op_612_cast_fp16")]; tensor var_614_transpose_x_0 = const()[name = tensor("op_614_transpose_x_0"), val = tensor(false)]; tensor var_614_transpose_y_0 = const()[name = tensor("op_614_transpose_y_0"), val = tensor(false)]; tensor transpose_303 = transpose(perm = var_608, x = var_607_cast_fp16)[name = tensor("transpose_303")]; tensor var_614_cast_fp16 = matmul(transpose_x = var_614_transpose_x_0, transpose_y = var_614_transpose_y_0, x = var_612_cast_fp16, y = transpose_303)[name = tensor("op_614_cast_fp16")]; tensor var_615 = const()[name = tensor("op_615"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 1500, 1280])]; tensor transpose_300 = transpose(perm = var_615, x = var_614_cast_fp16)[name = tensor("transpose_300")]; tensor x_59_cast_fp16 = reshape(shape = concat_4, x = transpose_300)[name = tensor("x_59_cast_fp16")]; tensor var_620_to_fp16 = const()[name = tensor("op_620_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(121394368)))]; tensor var_621_to_fp16 = const()[name = tensor("op_621_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124671232)))]; tensor linear_27_cast_fp16 = linear(bias = var_621_to_fp16, weight = var_620_to_fp16, x = x_59_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor x_61_cast_fp16 = add(x = x_55_cast_fp16, y = linear_27_cast_fp16)[name = tensor("x_61_cast_fp16")]; tensor var_628_axes_0 = const()[name = tensor("op_628_axes_0"), val = tensor([-1])]; tensor blocks_4_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124673856)))]; tensor blocks_4_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124676480)))]; tensor var_628_cast_fp16 = layer_norm(axes = var_628_axes_0, beta = blocks_4_mlp_ln_bias_to_fp16, epsilon = var_554_to_fp16, gamma = blocks_4_mlp_ln_weight_to_fp16, x = x_61_cast_fp16)[name = tensor("op_628_cast_fp16")]; tensor var_637_to_fp16 = const()[name = tensor("op_637_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(124679104)))]; tensor var_638_to_fp16 = const()[name = tensor("op_638_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(130167808)))]; tensor linear_28_cast_fp16 = linear(bias = var_638_to_fp16, weight = var_637_to_fp16, x = var_628_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor x_65_mode_0 = const()[name = tensor("x_65_mode_0"), val = tensor("EXACT")]; tensor x_65_cast_fp16 = gelu(mode = x_65_mode_0, x = linear_28_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor var_643_to_fp16 = const()[name = tensor("op_643_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(130172160)))]; tensor var_644_to_fp16 = const()[name = tensor("op_644_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135660864)))]; tensor linear_29_cast_fp16 = linear(bias = var_644_to_fp16, weight = var_643_to_fp16, x = x_65_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor x_67_cast_fp16 = add(x = x_61_cast_fp16, y = linear_29_cast_fp16)[name = tensor("x_67_cast_fp16")]; tensor var_654 = const()[name = tensor("op_654"), val = tensor(-1)]; tensor var_670_axes_0 = const()[name = tensor("op_670_axes_0"), val = tensor([-1])]; tensor blocks_5_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_5_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135663488)))]; tensor blocks_5_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_5_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135666112)))]; tensor var_660_to_fp16 = const()[name = tensor("op_660_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_670_cast_fp16 = layer_norm(axes = var_670_axes_0, beta = blocks_5_attn_ln_bias_to_fp16, epsilon = var_660_to_fp16, gamma = blocks_5_attn_ln_weight_to_fp16, x = x_67_cast_fp16)[name = tensor("op_670_cast_fp16")]; tensor var_681_to_fp16 = const()[name = tensor("op_681_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135668736)))]; tensor var_682_to_fp16 = const()[name = tensor("op_682_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138945600)))]; tensor linear_30_cast_fp16 = linear(bias = var_682_to_fp16, weight = var_681_to_fp16, x = var_670_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_685_to_fp16 = const()[name = tensor("op_685_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(138948224)))]; tensor linear_31_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_685_to_fp16, x = var_670_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor var_689_to_fp16 = const()[name = tensor("op_689_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142225088)))]; tensor var_690_to_fp16 = const()[name = tensor("op_690_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145501952)))]; tensor linear_32_cast_fp16 = linear(bias = var_690_to_fp16, weight = var_689_to_fp16, x = var_670_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_698 = const()[name = tensor("op_698"), val = tensor([1, 1500, 20, -1])]; tensor var_699_cast_fp16 = reshape(shape = var_698, x = linear_30_cast_fp16)[name = tensor("op_699_cast_fp16")]; tensor const_234_to_fp16 = const()[name = tensor("const_234_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_23_cast_fp16 = mul(x = var_699_cast_fp16, y = const_234_to_fp16)[name = tensor("q_23_cast_fp16")]; tensor var_705 = const()[name = tensor("op_705"), val = tensor([1, 1500, 20, -1])]; tensor var_706_cast_fp16 = reshape(shape = var_705, x = linear_31_cast_fp16)[name = tensor("op_706_cast_fp16")]; tensor const_235_to_fp16 = const()[name = tensor("const_235_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_23_cast_fp16 = mul(x = var_706_cast_fp16, y = const_235_to_fp16)[name = tensor("k_23_cast_fp16")]; tensor var_712 = const()[name = tensor("op_712"), val = tensor([1, 1500, 20, -1])]; tensor var_713_cast_fp16 = reshape(shape = var_712, x = linear_32_cast_fp16)[name = tensor("op_713_cast_fp16")]; tensor var_714 = const()[name = tensor("op_714"), val = tensor([0, 2, 1, 3])]; tensor qk_11_transpose_x_0 = const()[name = tensor("qk_11_transpose_x_0"), val = tensor(false)]; tensor qk_11_transpose_y_0 = const()[name = tensor("qk_11_transpose_y_0"), val = tensor(false)]; tensor transpose_138_perm_0 = const()[name = tensor("transpose_138_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_139_perm_0 = const()[name = tensor("transpose_139_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_297 = transpose(perm = transpose_139_perm_0, x = k_23_cast_fp16)[name = tensor("transpose_297")]; tensor transpose_298 = transpose(perm = transpose_138_perm_0, x = q_23_cast_fp16)[name = tensor("transpose_298")]; tensor qk_11_cast_fp16 = matmul(transpose_x = qk_11_transpose_x_0, transpose_y = qk_11_transpose_y_0, x = transpose_298, y = transpose_297)[name = tensor("qk_11_cast_fp16")]; tensor var_718_cast_fp16 = softmax(axis = var_654, x = qk_11_cast_fp16)[name = tensor("op_718_cast_fp16")]; tensor var_720_transpose_x_0 = const()[name = tensor("op_720_transpose_x_0"), val = tensor(false)]; tensor var_720_transpose_y_0 = const()[name = tensor("op_720_transpose_y_0"), val = tensor(false)]; tensor transpose_299 = transpose(perm = var_714, x = var_713_cast_fp16)[name = tensor("transpose_299")]; tensor var_720_cast_fp16 = matmul(transpose_x = var_720_transpose_x_0, transpose_y = var_720_transpose_y_0, x = var_718_cast_fp16, y = transpose_299)[name = tensor("op_720_cast_fp16")]; tensor var_721 = const()[name = tensor("op_721"), val = tensor([0, 2, 1, 3])]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([1, 1500, 1280])]; tensor transpose_296 = transpose(perm = var_721, x = var_720_cast_fp16)[name = tensor("transpose_296")]; tensor x_71_cast_fp16 = reshape(shape = concat_5, x = transpose_296)[name = tensor("x_71_cast_fp16")]; tensor var_726_to_fp16 = const()[name = tensor("op_726_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145504576)))]; tensor var_727_to_fp16 = const()[name = tensor("op_727_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148781440)))]; tensor linear_33_cast_fp16 = linear(bias = var_727_to_fp16, weight = var_726_to_fp16, x = x_71_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor x_73_cast_fp16 = add(x = x_67_cast_fp16, y = linear_33_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor var_734_axes_0 = const()[name = tensor("op_734_axes_0"), val = tensor([-1])]; tensor blocks_5_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148784064)))]; tensor blocks_5_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148786688)))]; tensor var_734_cast_fp16 = layer_norm(axes = var_734_axes_0, beta = blocks_5_mlp_ln_bias_to_fp16, epsilon = var_660_to_fp16, gamma = blocks_5_mlp_ln_weight_to_fp16, x = x_73_cast_fp16)[name = tensor("op_734_cast_fp16")]; tensor var_743_to_fp16 = const()[name = tensor("op_743_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148789312)))]; tensor var_744_to_fp16 = const()[name = tensor("op_744_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154278016)))]; tensor linear_34_cast_fp16 = linear(bias = var_744_to_fp16, weight = var_743_to_fp16, x = var_734_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor x_77_mode_0 = const()[name = tensor("x_77_mode_0"), val = tensor("EXACT")]; tensor x_77_cast_fp16 = gelu(mode = x_77_mode_0, x = linear_34_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor var_749_to_fp16 = const()[name = tensor("op_749_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(154282368)))]; tensor var_750_to_fp16 = const()[name = tensor("op_750_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159771072)))]; tensor linear_35_cast_fp16 = linear(bias = var_750_to_fp16, weight = var_749_to_fp16, x = x_77_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor x_79_cast_fp16 = add(x = x_73_cast_fp16, y = linear_35_cast_fp16)[name = tensor("x_79_cast_fp16")]; tensor var_760 = const()[name = tensor("op_760"), val = tensor(-1)]; tensor var_776_axes_0 = const()[name = tensor("op_776_axes_0"), val = tensor([-1])]; tensor blocks_6_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_6_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159773696)))]; tensor blocks_6_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_6_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159776320)))]; tensor var_766_to_fp16 = const()[name = tensor("op_766_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_776_cast_fp16 = layer_norm(axes = var_776_axes_0, beta = blocks_6_attn_ln_bias_to_fp16, epsilon = var_766_to_fp16, gamma = blocks_6_attn_ln_weight_to_fp16, x = x_79_cast_fp16)[name = tensor("op_776_cast_fp16")]; tensor var_787_to_fp16 = const()[name = tensor("op_787_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159778944)))]; tensor var_788_to_fp16 = const()[name = tensor("op_788_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163055808)))]; tensor linear_36_cast_fp16 = linear(bias = var_788_to_fp16, weight = var_787_to_fp16, x = var_776_cast_fp16)[name = tensor("linear_36_cast_fp16")]; tensor var_791_to_fp16 = const()[name = tensor("op_791_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163058432)))]; tensor linear_37_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_791_to_fp16, x = var_776_cast_fp16)[name = tensor("linear_37_cast_fp16")]; tensor var_795_to_fp16 = const()[name = tensor("op_795_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166335296)))]; tensor var_796_to_fp16 = const()[name = tensor("op_796_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169612160)))]; tensor linear_38_cast_fp16 = linear(bias = var_796_to_fp16, weight = var_795_to_fp16, x = var_776_cast_fp16)[name = tensor("linear_38_cast_fp16")]; tensor var_804 = const()[name = tensor("op_804"), val = tensor([1, 1500, 20, -1])]; tensor var_805_cast_fp16 = reshape(shape = var_804, x = linear_36_cast_fp16)[name = tensor("op_805_cast_fp16")]; tensor const_236_to_fp16 = const()[name = tensor("const_236_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_27_cast_fp16 = mul(x = var_805_cast_fp16, y = const_236_to_fp16)[name = tensor("q_27_cast_fp16")]; tensor var_811 = const()[name = tensor("op_811"), val = tensor([1, 1500, 20, -1])]; tensor var_812_cast_fp16 = reshape(shape = var_811, x = linear_37_cast_fp16)[name = tensor("op_812_cast_fp16")]; tensor const_237_to_fp16 = const()[name = tensor("const_237_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_27_cast_fp16 = mul(x = var_812_cast_fp16, y = const_237_to_fp16)[name = tensor("k_27_cast_fp16")]; tensor var_818 = const()[name = tensor("op_818"), val = tensor([1, 1500, 20, -1])]; tensor var_819_cast_fp16 = reshape(shape = var_818, x = linear_38_cast_fp16)[name = tensor("op_819_cast_fp16")]; tensor var_820 = const()[name = tensor("op_820"), val = tensor([0, 2, 1, 3])]; tensor qk_13_transpose_x_0 = const()[name = tensor("qk_13_transpose_x_0"), val = tensor(false)]; tensor qk_13_transpose_y_0 = const()[name = tensor("qk_13_transpose_y_0"), val = tensor(false)]; tensor transpose_140_perm_0 = const()[name = tensor("transpose_140_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_141_perm_0 = const()[name = tensor("transpose_141_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_293 = transpose(perm = transpose_141_perm_0, x = k_27_cast_fp16)[name = tensor("transpose_293")]; tensor transpose_294 = transpose(perm = transpose_140_perm_0, x = q_27_cast_fp16)[name = tensor("transpose_294")]; tensor qk_13_cast_fp16 = matmul(transpose_x = qk_13_transpose_x_0, transpose_y = qk_13_transpose_y_0, x = transpose_294, y = transpose_293)[name = tensor("qk_13_cast_fp16")]; tensor var_824_cast_fp16 = softmax(axis = var_760, x = qk_13_cast_fp16)[name = tensor("op_824_cast_fp16")]; tensor var_826_transpose_x_0 = const()[name = tensor("op_826_transpose_x_0"), val = tensor(false)]; tensor var_826_transpose_y_0 = const()[name = tensor("op_826_transpose_y_0"), val = tensor(false)]; tensor transpose_295 = transpose(perm = var_820, x = var_819_cast_fp16)[name = tensor("transpose_295")]; tensor var_826_cast_fp16 = matmul(transpose_x = var_826_transpose_x_0, transpose_y = var_826_transpose_y_0, x = var_824_cast_fp16, y = transpose_295)[name = tensor("op_826_cast_fp16")]; tensor var_827 = const()[name = tensor("op_827"), val = tensor([0, 2, 1, 3])]; tensor concat_6 = const()[name = tensor("concat_6"), val = tensor([1, 1500, 1280])]; tensor transpose_292 = transpose(perm = var_827, x = var_826_cast_fp16)[name = tensor("transpose_292")]; tensor x_83_cast_fp16 = reshape(shape = concat_6, x = transpose_292)[name = tensor("x_83_cast_fp16")]; tensor var_832_to_fp16 = const()[name = tensor("op_832_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169614784)))]; tensor var_833_to_fp16 = const()[name = tensor("op_833_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172891648)))]; tensor linear_39_cast_fp16 = linear(bias = var_833_to_fp16, weight = var_832_to_fp16, x = x_83_cast_fp16)[name = tensor("linear_39_cast_fp16")]; tensor x_85_cast_fp16 = add(x = x_79_cast_fp16, y = linear_39_cast_fp16)[name = tensor("x_85_cast_fp16")]; tensor var_840_axes_0 = const()[name = tensor("op_840_axes_0"), val = tensor([-1])]; tensor blocks_6_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_6_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172894272)))]; tensor blocks_6_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_6_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172896896)))]; tensor var_840_cast_fp16 = layer_norm(axes = var_840_axes_0, beta = blocks_6_mlp_ln_bias_to_fp16, epsilon = var_766_to_fp16, gamma = blocks_6_mlp_ln_weight_to_fp16, x = x_85_cast_fp16)[name = tensor("op_840_cast_fp16")]; tensor var_849_to_fp16 = const()[name = tensor("op_849_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172899520)))]; tensor var_850_to_fp16 = const()[name = tensor("op_850_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178306304)))]; tensor linear_40_cast_fp16 = linear(bias = var_850_to_fp16, weight = var_849_to_fp16, x = var_840_cast_fp16)[name = tensor("linear_40_cast_fp16")]; tensor x_89_mode_0 = const()[name = tensor("x_89_mode_0"), val = tensor("EXACT")]; tensor x_89_cast_fp16 = gelu(mode = x_89_mode_0, x = linear_40_cast_fp16)[name = tensor("x_89_cast_fp16")]; tensor var_855_to_fp16 = const()[name = tensor("op_855_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178310592)))]; tensor var_856_to_fp16 = const()[name = tensor("op_856_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183717376)))]; tensor linear_41_cast_fp16 = linear(bias = var_856_to_fp16, weight = var_855_to_fp16, x = x_89_cast_fp16)[name = tensor("linear_41_cast_fp16")]; tensor x_91_cast_fp16 = add(x = x_85_cast_fp16, y = linear_41_cast_fp16)[name = tensor("x_91_cast_fp16")]; tensor var_866 = const()[name = tensor("op_866"), val = tensor(-1)]; tensor var_882_axes_0 = const()[name = tensor("op_882_axes_0"), val = tensor([-1])]; tensor blocks_7_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_7_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183720000)))]; tensor blocks_7_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_7_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183722624)))]; tensor var_872_to_fp16 = const()[name = tensor("op_872_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_882_cast_fp16 = layer_norm(axes = var_882_axes_0, beta = blocks_7_attn_ln_bias_to_fp16, epsilon = var_872_to_fp16, gamma = blocks_7_attn_ln_weight_to_fp16, x = x_91_cast_fp16)[name = tensor("op_882_cast_fp16")]; tensor var_893_to_fp16 = const()[name = tensor("op_893_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183725248)))]; tensor var_894_to_fp16 = const()[name = tensor("op_894_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(187002112)))]; tensor linear_42_cast_fp16 = linear(bias = var_894_to_fp16, weight = var_893_to_fp16, x = var_882_cast_fp16)[name = tensor("linear_42_cast_fp16")]; tensor var_897_to_fp16 = const()[name = tensor("op_897_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(187004736)))]; tensor linear_43_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_897_to_fp16, x = var_882_cast_fp16)[name = tensor("linear_43_cast_fp16")]; tensor var_901_to_fp16 = const()[name = tensor("op_901_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190281600)))]; tensor var_902_to_fp16 = const()[name = tensor("op_902_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193558464)))]; tensor linear_44_cast_fp16 = linear(bias = var_902_to_fp16, weight = var_901_to_fp16, x = var_882_cast_fp16)[name = tensor("linear_44_cast_fp16")]; tensor var_910 = const()[name = tensor("op_910"), val = tensor([1, 1500, 20, -1])]; tensor var_911_cast_fp16 = reshape(shape = var_910, x = linear_42_cast_fp16)[name = tensor("op_911_cast_fp16")]; tensor const_238_to_fp16 = const()[name = tensor("const_238_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_31_cast_fp16 = mul(x = var_911_cast_fp16, y = const_238_to_fp16)[name = tensor("q_31_cast_fp16")]; tensor var_917 = const()[name = tensor("op_917"), val = tensor([1, 1500, 20, -1])]; tensor var_918_cast_fp16 = reshape(shape = var_917, x = linear_43_cast_fp16)[name = tensor("op_918_cast_fp16")]; tensor const_239_to_fp16 = const()[name = tensor("const_239_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_31_cast_fp16 = mul(x = var_918_cast_fp16, y = const_239_to_fp16)[name = tensor("k_31_cast_fp16")]; tensor var_924 = const()[name = tensor("op_924"), val = tensor([1, 1500, 20, -1])]; tensor var_925_cast_fp16 = reshape(shape = var_924, x = linear_44_cast_fp16)[name = tensor("op_925_cast_fp16")]; tensor var_926 = const()[name = tensor("op_926"), val = tensor([0, 2, 1, 3])]; tensor qk_15_transpose_x_0 = const()[name = tensor("qk_15_transpose_x_0"), val = tensor(false)]; tensor qk_15_transpose_y_0 = const()[name = tensor("qk_15_transpose_y_0"), val = tensor(false)]; tensor transpose_142_perm_0 = const()[name = tensor("transpose_142_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_143_perm_0 = const()[name = tensor("transpose_143_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_289 = transpose(perm = transpose_143_perm_0, x = k_31_cast_fp16)[name = tensor("transpose_289")]; tensor transpose_290 = transpose(perm = transpose_142_perm_0, x = q_31_cast_fp16)[name = tensor("transpose_290")]; tensor qk_15_cast_fp16 = matmul(transpose_x = qk_15_transpose_x_0, transpose_y = qk_15_transpose_y_0, x = transpose_290, y = transpose_289)[name = tensor("qk_15_cast_fp16")]; tensor var_930_cast_fp16 = softmax(axis = var_866, x = qk_15_cast_fp16)[name = tensor("op_930_cast_fp16")]; tensor var_932_transpose_x_0 = const()[name = tensor("op_932_transpose_x_0"), val = tensor(false)]; tensor var_932_transpose_y_0 = const()[name = tensor("op_932_transpose_y_0"), val = tensor(false)]; tensor transpose_291 = transpose(perm = var_926, x = var_925_cast_fp16)[name = tensor("transpose_291")]; tensor var_932_cast_fp16 = matmul(transpose_x = var_932_transpose_x_0, transpose_y = var_932_transpose_y_0, x = var_930_cast_fp16, y = transpose_291)[name = tensor("op_932_cast_fp16")]; tensor var_933 = const()[name = tensor("op_933"), val = tensor([0, 2, 1, 3])]; tensor concat_7 = const()[name = tensor("concat_7"), val = tensor([1, 1500, 1280])]; tensor transpose_288 = transpose(perm = var_933, x = var_932_cast_fp16)[name = tensor("transpose_288")]; tensor x_95_cast_fp16 = reshape(shape = concat_7, x = transpose_288)[name = tensor("x_95_cast_fp16")]; tensor var_938_to_fp16 = const()[name = tensor("op_938_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(193561088)))]; tensor var_939_to_fp16 = const()[name = tensor("op_939_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196837952)))]; tensor linear_45_cast_fp16 = linear(bias = var_939_to_fp16, weight = var_938_to_fp16, x = x_95_cast_fp16)[name = tensor("linear_45_cast_fp16")]; tensor x_97_cast_fp16 = add(x = x_91_cast_fp16, y = linear_45_cast_fp16)[name = tensor("x_97_cast_fp16")]; tensor var_946_axes_0 = const()[name = tensor("op_946_axes_0"), val = tensor([-1])]; tensor blocks_7_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_7_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196840576)))]; tensor blocks_7_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_7_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196843200)))]; tensor var_946_cast_fp16 = layer_norm(axes = var_946_axes_0, beta = blocks_7_mlp_ln_bias_to_fp16, epsilon = var_872_to_fp16, gamma = blocks_7_mlp_ln_weight_to_fp16, x = x_97_cast_fp16)[name = tensor("op_946_cast_fp16")]; tensor var_955_to_fp16 = const()[name = tensor("op_955_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196845824)))]; tensor var_956_to_fp16 = const()[name = tensor("op_956_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202252608)))]; tensor linear_46_cast_fp16 = linear(bias = var_956_to_fp16, weight = var_955_to_fp16, x = var_946_cast_fp16)[name = tensor("linear_46_cast_fp16")]; tensor x_101_mode_0 = const()[name = tensor("x_101_mode_0"), val = tensor("EXACT")]; tensor x_101_cast_fp16 = gelu(mode = x_101_mode_0, x = linear_46_cast_fp16)[name = tensor("x_101_cast_fp16")]; tensor var_961_to_fp16 = const()[name = tensor("op_961_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202256896)))]; tensor var_962_to_fp16 = const()[name = tensor("op_962_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207663680)))]; tensor linear_47_cast_fp16 = linear(bias = var_962_to_fp16, weight = var_961_to_fp16, x = x_101_cast_fp16)[name = tensor("linear_47_cast_fp16")]; tensor x_103_cast_fp16 = add(x = x_97_cast_fp16, y = linear_47_cast_fp16)[name = tensor("x_103_cast_fp16")]; tensor var_972 = const()[name = tensor("op_972"), val = tensor(-1)]; tensor var_988_axes_0 = const()[name = tensor("op_988_axes_0"), val = tensor([-1])]; tensor blocks_8_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_8_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207666304)))]; tensor blocks_8_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_8_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207668928)))]; tensor var_978_to_fp16 = const()[name = tensor("op_978_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_988_cast_fp16 = layer_norm(axes = var_988_axes_0, beta = blocks_8_attn_ln_bias_to_fp16, epsilon = var_978_to_fp16, gamma = blocks_8_attn_ln_weight_to_fp16, x = x_103_cast_fp16)[name = tensor("op_988_cast_fp16")]; tensor var_999_to_fp16 = const()[name = tensor("op_999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207671552)))]; tensor var_1000_to_fp16 = const()[name = tensor("op_1000_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(210948416)))]; tensor linear_48_cast_fp16 = linear(bias = var_1000_to_fp16, weight = var_999_to_fp16, x = var_988_cast_fp16)[name = tensor("linear_48_cast_fp16")]; tensor var_1003_to_fp16 = const()[name = tensor("op_1003_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(210951040)))]; tensor linear_49_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1003_to_fp16, x = var_988_cast_fp16)[name = tensor("linear_49_cast_fp16")]; tensor var_1007_to_fp16 = const()[name = tensor("op_1007_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214227904)))]; tensor var_1008_to_fp16 = const()[name = tensor("op_1008_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217504768)))]; tensor linear_50_cast_fp16 = linear(bias = var_1008_to_fp16, weight = var_1007_to_fp16, x = var_988_cast_fp16)[name = tensor("linear_50_cast_fp16")]; tensor var_1016 = const()[name = tensor("op_1016"), val = tensor([1, 1500, 20, -1])]; tensor var_1017_cast_fp16 = reshape(shape = var_1016, x = linear_48_cast_fp16)[name = tensor("op_1017_cast_fp16")]; tensor const_240_to_fp16 = const()[name = tensor("const_240_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_35_cast_fp16 = mul(x = var_1017_cast_fp16, y = const_240_to_fp16)[name = tensor("q_35_cast_fp16")]; tensor var_1023 = const()[name = tensor("op_1023"), val = tensor([1, 1500, 20, -1])]; tensor var_1024_cast_fp16 = reshape(shape = var_1023, x = linear_49_cast_fp16)[name = tensor("op_1024_cast_fp16")]; tensor const_241_to_fp16 = const()[name = tensor("const_241_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_35_cast_fp16 = mul(x = var_1024_cast_fp16, y = const_241_to_fp16)[name = tensor("k_35_cast_fp16")]; tensor var_1030 = const()[name = tensor("op_1030"), val = tensor([1, 1500, 20, -1])]; tensor var_1031_cast_fp16 = reshape(shape = var_1030, x = linear_50_cast_fp16)[name = tensor("op_1031_cast_fp16")]; tensor var_1032 = const()[name = tensor("op_1032"), val = tensor([0, 2, 1, 3])]; tensor qk_17_transpose_x_0 = const()[name = tensor("qk_17_transpose_x_0"), val = tensor(false)]; tensor qk_17_transpose_y_0 = const()[name = tensor("qk_17_transpose_y_0"), val = tensor(false)]; tensor transpose_144_perm_0 = const()[name = tensor("transpose_144_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_145_perm_0 = const()[name = tensor("transpose_145_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_285 = transpose(perm = transpose_145_perm_0, x = k_35_cast_fp16)[name = tensor("transpose_285")]; tensor transpose_286 = transpose(perm = transpose_144_perm_0, x = q_35_cast_fp16)[name = tensor("transpose_286")]; tensor qk_17_cast_fp16 = matmul(transpose_x = qk_17_transpose_x_0, transpose_y = qk_17_transpose_y_0, x = transpose_286, y = transpose_285)[name = tensor("qk_17_cast_fp16")]; tensor var_1036_cast_fp16 = softmax(axis = var_972, x = qk_17_cast_fp16)[name = tensor("op_1036_cast_fp16")]; tensor var_1038_transpose_x_0 = const()[name = tensor("op_1038_transpose_x_0"), val = tensor(false)]; tensor var_1038_transpose_y_0 = const()[name = tensor("op_1038_transpose_y_0"), val = tensor(false)]; tensor transpose_287 = transpose(perm = var_1032, x = var_1031_cast_fp16)[name = tensor("transpose_287")]; tensor var_1038_cast_fp16 = matmul(transpose_x = var_1038_transpose_x_0, transpose_y = var_1038_transpose_y_0, x = var_1036_cast_fp16, y = transpose_287)[name = tensor("op_1038_cast_fp16")]; tensor var_1039 = const()[name = tensor("op_1039"), val = tensor([0, 2, 1, 3])]; tensor concat_8 = const()[name = tensor("concat_8"), val = tensor([1, 1500, 1280])]; tensor transpose_284 = transpose(perm = var_1039, x = var_1038_cast_fp16)[name = tensor("transpose_284")]; tensor x_107_cast_fp16 = reshape(shape = concat_8, x = transpose_284)[name = tensor("x_107_cast_fp16")]; tensor var_1044_to_fp16 = const()[name = tensor("op_1044_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217507392)))]; tensor var_1045_to_fp16 = const()[name = tensor("op_1045_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220784256)))]; tensor linear_51_cast_fp16 = linear(bias = var_1045_to_fp16, weight = var_1044_to_fp16, x = x_107_cast_fp16)[name = tensor("linear_51_cast_fp16")]; tensor x_109_cast_fp16 = add(x = x_103_cast_fp16, y = linear_51_cast_fp16)[name = tensor("x_109_cast_fp16")]; tensor var_1052_axes_0 = const()[name = tensor("op_1052_axes_0"), val = tensor([-1])]; tensor blocks_8_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_8_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220786880)))]; tensor blocks_8_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_8_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220789504)))]; tensor var_1052_cast_fp16 = layer_norm(axes = var_1052_axes_0, beta = blocks_8_mlp_ln_bias_to_fp16, epsilon = var_978_to_fp16, gamma = blocks_8_mlp_ln_weight_to_fp16, x = x_109_cast_fp16)[name = tensor("op_1052_cast_fp16")]; tensor var_1061_to_fp16 = const()[name = tensor("op_1061_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220792128)))]; tensor var_1062_to_fp16 = const()[name = tensor("op_1062_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(226690432)))]; tensor linear_52_cast_fp16 = linear(bias = var_1062_to_fp16, weight = var_1061_to_fp16, x = var_1052_cast_fp16)[name = tensor("linear_52_cast_fp16")]; tensor x_113_mode_0 = const()[name = tensor("x_113_mode_0"), val = tensor("EXACT")]; tensor x_113_cast_fp16 = gelu(mode = x_113_mode_0, x = linear_52_cast_fp16)[name = tensor("x_113_cast_fp16")]; tensor var_1067_to_fp16 = const()[name = tensor("op_1067_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(226695104)))]; tensor var_1068_to_fp16 = const()[name = tensor("op_1068_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232593408)))]; tensor linear_53_cast_fp16 = linear(bias = var_1068_to_fp16, weight = var_1067_to_fp16, x = x_113_cast_fp16)[name = tensor("linear_53_cast_fp16")]; tensor x_115_cast_fp16 = add(x = x_109_cast_fp16, y = linear_53_cast_fp16)[name = tensor("x_115_cast_fp16")]; tensor var_1078 = const()[name = tensor("op_1078"), val = tensor(-1)]; tensor var_1094_axes_0 = const()[name = tensor("op_1094_axes_0"), val = tensor([-1])]; tensor blocks_9_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_9_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232596032)))]; tensor blocks_9_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_9_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232598656)))]; tensor var_1084_to_fp16 = const()[name = tensor("op_1084_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1094_cast_fp16 = layer_norm(axes = var_1094_axes_0, beta = blocks_9_attn_ln_bias_to_fp16, epsilon = var_1084_to_fp16, gamma = blocks_9_attn_ln_weight_to_fp16, x = x_115_cast_fp16)[name = tensor("op_1094_cast_fp16")]; tensor var_1105_to_fp16 = const()[name = tensor("op_1105_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(232601280)))]; tensor var_1106_to_fp16 = const()[name = tensor("op_1106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235878144)))]; tensor linear_54_cast_fp16 = linear(bias = var_1106_to_fp16, weight = var_1105_to_fp16, x = var_1094_cast_fp16)[name = tensor("linear_54_cast_fp16")]; tensor var_1109_to_fp16 = const()[name = tensor("op_1109_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235880768)))]; tensor linear_55_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1109_to_fp16, x = var_1094_cast_fp16)[name = tensor("linear_55_cast_fp16")]; tensor var_1113_to_fp16 = const()[name = tensor("op_1113_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239157632)))]; tensor var_1114_to_fp16 = const()[name = tensor("op_1114_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242434496)))]; tensor linear_56_cast_fp16 = linear(bias = var_1114_to_fp16, weight = var_1113_to_fp16, x = var_1094_cast_fp16)[name = tensor("linear_56_cast_fp16")]; tensor var_1122 = const()[name = tensor("op_1122"), val = tensor([1, 1500, 20, -1])]; tensor var_1123_cast_fp16 = reshape(shape = var_1122, x = linear_54_cast_fp16)[name = tensor("op_1123_cast_fp16")]; tensor const_242_to_fp16 = const()[name = tensor("const_242_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_39_cast_fp16 = mul(x = var_1123_cast_fp16, y = const_242_to_fp16)[name = tensor("q_39_cast_fp16")]; tensor var_1129 = const()[name = tensor("op_1129"), val = tensor([1, 1500, 20, -1])]; tensor var_1130_cast_fp16 = reshape(shape = var_1129, x = linear_55_cast_fp16)[name = tensor("op_1130_cast_fp16")]; tensor const_243_to_fp16 = const()[name = tensor("const_243_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_39_cast_fp16 = mul(x = var_1130_cast_fp16, y = const_243_to_fp16)[name = tensor("k_39_cast_fp16")]; tensor var_1136 = const()[name = tensor("op_1136"), val = tensor([1, 1500, 20, -1])]; tensor var_1137_cast_fp16 = reshape(shape = var_1136, x = linear_56_cast_fp16)[name = tensor("op_1137_cast_fp16")]; tensor var_1138 = const()[name = tensor("op_1138"), val = tensor([0, 2, 1, 3])]; tensor qk_19_transpose_x_0 = const()[name = tensor("qk_19_transpose_x_0"), val = tensor(false)]; tensor qk_19_transpose_y_0 = const()[name = tensor("qk_19_transpose_y_0"), val = tensor(false)]; tensor transpose_146_perm_0 = const()[name = tensor("transpose_146_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_147_perm_0 = const()[name = tensor("transpose_147_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_281 = transpose(perm = transpose_147_perm_0, x = k_39_cast_fp16)[name = tensor("transpose_281")]; tensor transpose_282 = transpose(perm = transpose_146_perm_0, x = q_39_cast_fp16)[name = tensor("transpose_282")]; tensor qk_19_cast_fp16 = matmul(transpose_x = qk_19_transpose_x_0, transpose_y = qk_19_transpose_y_0, x = transpose_282, y = transpose_281)[name = tensor("qk_19_cast_fp16")]; tensor var_1142_cast_fp16 = softmax(axis = var_1078, x = qk_19_cast_fp16)[name = tensor("op_1142_cast_fp16")]; tensor var_1144_transpose_x_0 = const()[name = tensor("op_1144_transpose_x_0"), val = tensor(false)]; tensor var_1144_transpose_y_0 = const()[name = tensor("op_1144_transpose_y_0"), val = tensor(false)]; tensor transpose_283 = transpose(perm = var_1138, x = var_1137_cast_fp16)[name = tensor("transpose_283")]; tensor var_1144_cast_fp16 = matmul(transpose_x = var_1144_transpose_x_0, transpose_y = var_1144_transpose_y_0, x = var_1142_cast_fp16, y = transpose_283)[name = tensor("op_1144_cast_fp16")]; tensor var_1145 = const()[name = tensor("op_1145"), val = tensor([0, 2, 1, 3])]; tensor concat_9 = const()[name = tensor("concat_9"), val = tensor([1, 1500, 1280])]; tensor transpose_280 = transpose(perm = var_1145, x = var_1144_cast_fp16)[name = tensor("transpose_280")]; tensor x_119_cast_fp16 = reshape(shape = concat_9, x = transpose_280)[name = tensor("x_119_cast_fp16")]; tensor var_1150_to_fp16 = const()[name = tensor("op_1150_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242437120)))]; tensor var_1151_to_fp16 = const()[name = tensor("op_1151_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245713984)))]; tensor linear_57_cast_fp16 = linear(bias = var_1151_to_fp16, weight = var_1150_to_fp16, x = x_119_cast_fp16)[name = tensor("linear_57_cast_fp16")]; tensor x_121_cast_fp16 = add(x = x_115_cast_fp16, y = linear_57_cast_fp16)[name = tensor("x_121_cast_fp16")]; tensor var_1158_axes_0 = const()[name = tensor("op_1158_axes_0"), val = tensor([-1])]; tensor blocks_9_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_9_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245716608)))]; tensor blocks_9_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_9_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245719232)))]; tensor var_1158_cast_fp16 = layer_norm(axes = var_1158_axes_0, beta = blocks_9_mlp_ln_bias_to_fp16, epsilon = var_1084_to_fp16, gamma = blocks_9_mlp_ln_weight_to_fp16, x = x_121_cast_fp16)[name = tensor("op_1158_cast_fp16")]; tensor var_1167_to_fp16 = const()[name = tensor("op_1167_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245721856)))]; tensor var_1168_to_fp16 = const()[name = tensor("op_1168_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252439360)))]; tensor linear_58_cast_fp16 = linear(bias = var_1168_to_fp16, weight = var_1167_to_fp16, x = var_1158_cast_fp16)[name = tensor("linear_58_cast_fp16")]; tensor x_125_mode_0 = const()[name = tensor("x_125_mode_0"), val = tensor("EXACT")]; tensor x_125_cast_fp16 = gelu(mode = x_125_mode_0, x = linear_58_cast_fp16)[name = tensor("x_125_cast_fp16")]; tensor var_1173_to_fp16 = const()[name = tensor("op_1173_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252444672)))]; tensor var_1174_to_fp16 = const()[name = tensor("op_1174_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259162176)))]; tensor linear_59_cast_fp16 = linear(bias = var_1174_to_fp16, weight = var_1173_to_fp16, x = x_125_cast_fp16)[name = tensor("linear_59_cast_fp16")]; tensor x_127_cast_fp16 = add(x = x_121_cast_fp16, y = linear_59_cast_fp16)[name = tensor("x_127_cast_fp16")]; tensor var_1184 = const()[name = tensor("op_1184"), val = tensor(-1)]; tensor var_1200_axes_0 = const()[name = tensor("op_1200_axes_0"), val = tensor([-1])]; tensor blocks_10_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_10_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259164800)))]; tensor blocks_10_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_10_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259167424)))]; tensor var_1190_to_fp16 = const()[name = tensor("op_1190_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1200_cast_fp16 = layer_norm(axes = var_1200_axes_0, beta = blocks_10_attn_ln_bias_to_fp16, epsilon = var_1190_to_fp16, gamma = blocks_10_attn_ln_weight_to_fp16, x = x_127_cast_fp16)[name = tensor("op_1200_cast_fp16")]; tensor var_1211_to_fp16 = const()[name = tensor("op_1211_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259170048)))]; tensor var_1212_to_fp16 = const()[name = tensor("op_1212_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(262446912)))]; tensor linear_60_cast_fp16 = linear(bias = var_1212_to_fp16, weight = var_1211_to_fp16, x = var_1200_cast_fp16)[name = tensor("linear_60_cast_fp16")]; tensor var_1215_to_fp16 = const()[name = tensor("op_1215_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(262449536)))]; tensor linear_61_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1215_to_fp16, x = var_1200_cast_fp16)[name = tensor("linear_61_cast_fp16")]; tensor var_1219_to_fp16 = const()[name = tensor("op_1219_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265726400)))]; tensor var_1220_to_fp16 = const()[name = tensor("op_1220_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(269003264)))]; tensor linear_62_cast_fp16 = linear(bias = var_1220_to_fp16, weight = var_1219_to_fp16, x = var_1200_cast_fp16)[name = tensor("linear_62_cast_fp16")]; tensor var_1228 = const()[name = tensor("op_1228"), val = tensor([1, 1500, 20, -1])]; tensor var_1229_cast_fp16 = reshape(shape = var_1228, x = linear_60_cast_fp16)[name = tensor("op_1229_cast_fp16")]; tensor const_244_to_fp16 = const()[name = tensor("const_244_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_43_cast_fp16 = mul(x = var_1229_cast_fp16, y = const_244_to_fp16)[name = tensor("q_43_cast_fp16")]; tensor var_1235 = const()[name = tensor("op_1235"), val = tensor([1, 1500, 20, -1])]; tensor var_1236_cast_fp16 = reshape(shape = var_1235, x = linear_61_cast_fp16)[name = tensor("op_1236_cast_fp16")]; tensor const_245_to_fp16 = const()[name = tensor("const_245_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_43_cast_fp16 = mul(x = var_1236_cast_fp16, y = const_245_to_fp16)[name = tensor("k_43_cast_fp16")]; tensor var_1242 = const()[name = tensor("op_1242"), val = tensor([1, 1500, 20, -1])]; tensor var_1243_cast_fp16 = reshape(shape = var_1242, x = linear_62_cast_fp16)[name = tensor("op_1243_cast_fp16")]; tensor var_1244 = const()[name = tensor("op_1244"), val = tensor([0, 2, 1, 3])]; tensor qk_21_transpose_x_0 = const()[name = tensor("qk_21_transpose_x_0"), val = tensor(false)]; tensor qk_21_transpose_y_0 = const()[name = tensor("qk_21_transpose_y_0"), val = tensor(false)]; tensor transpose_148_perm_0 = const()[name = tensor("transpose_148_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_149_perm_0 = const()[name = tensor("transpose_149_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_277 = transpose(perm = transpose_149_perm_0, x = k_43_cast_fp16)[name = tensor("transpose_277")]; tensor transpose_278 = transpose(perm = transpose_148_perm_0, x = q_43_cast_fp16)[name = tensor("transpose_278")]; tensor qk_21_cast_fp16 = matmul(transpose_x = qk_21_transpose_x_0, transpose_y = qk_21_transpose_y_0, x = transpose_278, y = transpose_277)[name = tensor("qk_21_cast_fp16")]; tensor var_1248_cast_fp16 = softmax(axis = var_1184, x = qk_21_cast_fp16)[name = tensor("op_1248_cast_fp16")]; tensor var_1250_transpose_x_0 = const()[name = tensor("op_1250_transpose_x_0"), val = tensor(false)]; tensor var_1250_transpose_y_0 = const()[name = tensor("op_1250_transpose_y_0"), val = tensor(false)]; tensor transpose_279 = transpose(perm = var_1244, x = var_1243_cast_fp16)[name = tensor("transpose_279")]; tensor var_1250_cast_fp16 = matmul(transpose_x = var_1250_transpose_x_0, transpose_y = var_1250_transpose_y_0, x = var_1248_cast_fp16, y = transpose_279)[name = tensor("op_1250_cast_fp16")]; tensor var_1251 = const()[name = tensor("op_1251"), val = tensor([0, 2, 1, 3])]; tensor concat_10 = const()[name = tensor("concat_10"), val = tensor([1, 1500, 1280])]; tensor transpose_276 = transpose(perm = var_1251, x = var_1250_cast_fp16)[name = tensor("transpose_276")]; tensor x_131_cast_fp16 = reshape(shape = concat_10, x = transpose_276)[name = tensor("x_131_cast_fp16")]; tensor var_1256_to_fp16 = const()[name = tensor("op_1256_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(269005888)))]; tensor var_1257_to_fp16 = const()[name = tensor("op_1257_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272282752)))]; tensor linear_63_cast_fp16 = linear(bias = var_1257_to_fp16, weight = var_1256_to_fp16, x = x_131_cast_fp16)[name = tensor("linear_63_cast_fp16")]; tensor x_133_cast_fp16 = add(x = x_127_cast_fp16, y = linear_63_cast_fp16)[name = tensor("x_133_cast_fp16")]; tensor var_1264_axes_0 = const()[name = tensor("op_1264_axes_0"), val = tensor([-1])]; tensor blocks_10_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_10_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272285376)))]; tensor blocks_10_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_10_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272288000)))]; tensor var_1264_cast_fp16 = layer_norm(axes = var_1264_axes_0, beta = blocks_10_mlp_ln_bias_to_fp16, epsilon = var_1190_to_fp16, gamma = blocks_10_mlp_ln_weight_to_fp16, x = x_133_cast_fp16)[name = tensor("op_1264_cast_fp16")]; tensor var_1273_to_fp16 = const()[name = tensor("op_1273_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272290624)))]; tensor var_1274_to_fp16 = const()[name = tensor("op_1274_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(280155008)))]; tensor linear_64_cast_fp16 = linear(bias = var_1274_to_fp16, weight = var_1273_to_fp16, x = var_1264_cast_fp16)[name = tensor("linear_64_cast_fp16")]; tensor x_137_mode_0 = const()[name = tensor("x_137_mode_0"), val = tensor("EXACT")]; tensor x_137_cast_fp16 = gelu(mode = x_137_mode_0, x = linear_64_cast_fp16)[name = tensor("x_137_cast_fp16")]; tensor var_1279_to_fp16 = const()[name = tensor("op_1279_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(280161216)))]; tensor var_1280_to_fp16 = const()[name = tensor("op_1280_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288025600)))]; tensor linear_65_cast_fp16 = linear(bias = var_1280_to_fp16, weight = var_1279_to_fp16, x = x_137_cast_fp16)[name = tensor("linear_65_cast_fp16")]; tensor x_139_cast_fp16 = add(x = x_133_cast_fp16, y = linear_65_cast_fp16)[name = tensor("x_139_cast_fp16")]; tensor var_1290 = const()[name = tensor("op_1290"), val = tensor(-1)]; tensor var_1306_axes_0 = const()[name = tensor("op_1306_axes_0"), val = tensor([-1])]; tensor blocks_11_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_11_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288028224)))]; tensor blocks_11_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_11_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288030848)))]; tensor var_1296_to_fp16 = const()[name = tensor("op_1296_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1306_cast_fp16 = layer_norm(axes = var_1306_axes_0, beta = blocks_11_attn_ln_bias_to_fp16, epsilon = var_1296_to_fp16, gamma = blocks_11_attn_ln_weight_to_fp16, x = x_139_cast_fp16)[name = tensor("op_1306_cast_fp16")]; tensor var_1317_to_fp16 = const()[name = tensor("op_1317_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288033472)))]; tensor var_1318_to_fp16 = const()[name = tensor("op_1318_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291310336)))]; tensor linear_66_cast_fp16 = linear(bias = var_1318_to_fp16, weight = var_1317_to_fp16, x = var_1306_cast_fp16)[name = tensor("linear_66_cast_fp16")]; tensor var_1321_to_fp16 = const()[name = tensor("op_1321_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291312960)))]; tensor linear_67_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1321_to_fp16, x = var_1306_cast_fp16)[name = tensor("linear_67_cast_fp16")]; tensor var_1325_to_fp16 = const()[name = tensor("op_1325_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294589824)))]; tensor var_1326_to_fp16 = const()[name = tensor("op_1326_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297866688)))]; tensor linear_68_cast_fp16 = linear(bias = var_1326_to_fp16, weight = var_1325_to_fp16, x = var_1306_cast_fp16)[name = tensor("linear_68_cast_fp16")]; tensor var_1334 = const()[name = tensor("op_1334"), val = tensor([1, 1500, 20, -1])]; tensor var_1335_cast_fp16 = reshape(shape = var_1334, x = linear_66_cast_fp16)[name = tensor("op_1335_cast_fp16")]; tensor const_246_to_fp16 = const()[name = tensor("const_246_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_47_cast_fp16 = mul(x = var_1335_cast_fp16, y = const_246_to_fp16)[name = tensor("q_47_cast_fp16")]; tensor var_1341 = const()[name = tensor("op_1341"), val = tensor([1, 1500, 20, -1])]; tensor var_1342_cast_fp16 = reshape(shape = var_1341, x = linear_67_cast_fp16)[name = tensor("op_1342_cast_fp16")]; tensor const_247_to_fp16 = const()[name = tensor("const_247_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_47_cast_fp16 = mul(x = var_1342_cast_fp16, y = const_247_to_fp16)[name = tensor("k_47_cast_fp16")]; tensor var_1348 = const()[name = tensor("op_1348"), val = tensor([1, 1500, 20, -1])]; tensor var_1349_cast_fp16 = reshape(shape = var_1348, x = linear_68_cast_fp16)[name = tensor("op_1349_cast_fp16")]; tensor var_1350 = const()[name = tensor("op_1350"), val = tensor([0, 2, 1, 3])]; tensor qk_23_transpose_x_0 = const()[name = tensor("qk_23_transpose_x_0"), val = tensor(false)]; tensor qk_23_transpose_y_0 = const()[name = tensor("qk_23_transpose_y_0"), val = tensor(false)]; tensor transpose_150_perm_0 = const()[name = tensor("transpose_150_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_151_perm_0 = const()[name = tensor("transpose_151_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_273 = transpose(perm = transpose_151_perm_0, x = k_47_cast_fp16)[name = tensor("transpose_273")]; tensor transpose_274 = transpose(perm = transpose_150_perm_0, x = q_47_cast_fp16)[name = tensor("transpose_274")]; tensor qk_23_cast_fp16 = matmul(transpose_x = qk_23_transpose_x_0, transpose_y = qk_23_transpose_y_0, x = transpose_274, y = transpose_273)[name = tensor("qk_23_cast_fp16")]; tensor var_1354_cast_fp16 = softmax(axis = var_1290, x = qk_23_cast_fp16)[name = tensor("op_1354_cast_fp16")]; tensor var_1356_transpose_x_0 = const()[name = tensor("op_1356_transpose_x_0"), val = tensor(false)]; tensor var_1356_transpose_y_0 = const()[name = tensor("op_1356_transpose_y_0"), val = tensor(false)]; tensor transpose_275 = transpose(perm = var_1350, x = var_1349_cast_fp16)[name = tensor("transpose_275")]; tensor var_1356_cast_fp16 = matmul(transpose_x = var_1356_transpose_x_0, transpose_y = var_1356_transpose_y_0, x = var_1354_cast_fp16, y = transpose_275)[name = tensor("op_1356_cast_fp16")]; tensor var_1357 = const()[name = tensor("op_1357"), val = tensor([0, 2, 1, 3])]; tensor concat_11 = const()[name = tensor("concat_11"), val = tensor([1, 1500, 1280])]; tensor transpose_272 = transpose(perm = var_1357, x = var_1356_cast_fp16)[name = tensor("transpose_272")]; tensor x_143_cast_fp16 = reshape(shape = concat_11, x = transpose_272)[name = tensor("x_143_cast_fp16")]; tensor var_1362_to_fp16 = const()[name = tensor("op_1362_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297869312)))]; tensor var_1363_to_fp16 = const()[name = tensor("op_1363_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(301146176)))]; tensor linear_69_cast_fp16 = linear(bias = var_1363_to_fp16, weight = var_1362_to_fp16, x = x_143_cast_fp16)[name = tensor("linear_69_cast_fp16")]; tensor x_145_cast_fp16 = add(x = x_139_cast_fp16, y = linear_69_cast_fp16)[name = tensor("x_145_cast_fp16")]; tensor var_1370_axes_0 = const()[name = tensor("op_1370_axes_0"), val = tensor([-1])]; tensor blocks_11_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_11_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(301148800)))]; tensor blocks_11_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_11_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(301151424)))]; tensor var_1370_cast_fp16 = layer_norm(axes = var_1370_axes_0, beta = blocks_11_mlp_ln_bias_to_fp16, epsilon = var_1296_to_fp16, gamma = blocks_11_mlp_ln_weight_to_fp16, x = x_145_cast_fp16)[name = tensor("op_1370_cast_fp16")]; tensor var_1379_to_fp16 = const()[name = tensor("op_1379_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(301154048)))]; tensor var_1380_to_fp16 = const()[name = tensor("op_1380_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(308772672)))]; tensor linear_70_cast_fp16 = linear(bias = var_1380_to_fp16, weight = var_1379_to_fp16, x = var_1370_cast_fp16)[name = tensor("linear_70_cast_fp16")]; tensor x_149_mode_0 = const()[name = tensor("x_149_mode_0"), val = tensor("EXACT")]; tensor x_149_cast_fp16 = gelu(mode = x_149_mode_0, x = linear_70_cast_fp16)[name = tensor("x_149_cast_fp16")]; tensor var_1385_to_fp16 = const()[name = tensor("op_1385_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(308778688)))]; tensor var_1386_to_fp16 = const()[name = tensor("op_1386_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316397312)))]; tensor linear_71_cast_fp16 = linear(bias = var_1386_to_fp16, weight = var_1385_to_fp16, x = x_149_cast_fp16)[name = tensor("linear_71_cast_fp16")]; tensor x_151_cast_fp16 = add(x = x_145_cast_fp16, y = linear_71_cast_fp16)[name = tensor("x_151_cast_fp16")]; tensor var_1396 = const()[name = tensor("op_1396"), val = tensor(-1)]; tensor var_1412_axes_0 = const()[name = tensor("op_1412_axes_0"), val = tensor([-1])]; tensor blocks_12_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_12_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316399936)))]; tensor blocks_12_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_12_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316402560)))]; tensor var_1402_to_fp16 = const()[name = tensor("op_1402_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1412_cast_fp16 = layer_norm(axes = var_1412_axes_0, beta = blocks_12_attn_ln_bias_to_fp16, epsilon = var_1402_to_fp16, gamma = blocks_12_attn_ln_weight_to_fp16, x = x_151_cast_fp16)[name = tensor("op_1412_cast_fp16")]; tensor var_1423_to_fp16 = const()[name = tensor("op_1423_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316405184)))]; tensor var_1424_to_fp16 = const()[name = tensor("op_1424_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319682048)))]; tensor linear_72_cast_fp16 = linear(bias = var_1424_to_fp16, weight = var_1423_to_fp16, x = var_1412_cast_fp16)[name = tensor("linear_72_cast_fp16")]; tensor var_1427_to_fp16 = const()[name = tensor("op_1427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319684672)))]; tensor linear_73_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1427_to_fp16, x = var_1412_cast_fp16)[name = tensor("linear_73_cast_fp16")]; tensor var_1431_to_fp16 = const()[name = tensor("op_1431_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322961536)))]; tensor var_1432_to_fp16 = const()[name = tensor("op_1432_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326238400)))]; tensor linear_74_cast_fp16 = linear(bias = var_1432_to_fp16, weight = var_1431_to_fp16, x = var_1412_cast_fp16)[name = tensor("linear_74_cast_fp16")]; tensor var_1440 = const()[name = tensor("op_1440"), val = tensor([1, 1500, 20, -1])]; tensor var_1441_cast_fp16 = reshape(shape = var_1440, x = linear_72_cast_fp16)[name = tensor("op_1441_cast_fp16")]; tensor const_248_to_fp16 = const()[name = tensor("const_248_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_51_cast_fp16 = mul(x = var_1441_cast_fp16, y = const_248_to_fp16)[name = tensor("q_51_cast_fp16")]; tensor var_1447 = const()[name = tensor("op_1447"), val = tensor([1, 1500, 20, -1])]; tensor var_1448_cast_fp16 = reshape(shape = var_1447, x = linear_73_cast_fp16)[name = tensor("op_1448_cast_fp16")]; tensor const_249_to_fp16 = const()[name = tensor("const_249_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_51_cast_fp16 = mul(x = var_1448_cast_fp16, y = const_249_to_fp16)[name = tensor("k_51_cast_fp16")]; tensor var_1454 = const()[name = tensor("op_1454"), val = tensor([1, 1500, 20, -1])]; tensor var_1455_cast_fp16 = reshape(shape = var_1454, x = linear_74_cast_fp16)[name = tensor("op_1455_cast_fp16")]; tensor var_1456 = const()[name = tensor("op_1456"), val = tensor([0, 2, 1, 3])]; tensor qk_25_transpose_x_0 = const()[name = tensor("qk_25_transpose_x_0"), val = tensor(false)]; tensor qk_25_transpose_y_0 = const()[name = tensor("qk_25_transpose_y_0"), val = tensor(false)]; tensor transpose_152_perm_0 = const()[name = tensor("transpose_152_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_153_perm_0 = const()[name = tensor("transpose_153_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_269 = transpose(perm = transpose_153_perm_0, x = k_51_cast_fp16)[name = tensor("transpose_269")]; tensor transpose_270 = transpose(perm = transpose_152_perm_0, x = q_51_cast_fp16)[name = tensor("transpose_270")]; tensor qk_25_cast_fp16 = matmul(transpose_x = qk_25_transpose_x_0, transpose_y = qk_25_transpose_y_0, x = transpose_270, y = transpose_269)[name = tensor("qk_25_cast_fp16")]; tensor var_1460_cast_fp16 = softmax(axis = var_1396, x = qk_25_cast_fp16)[name = tensor("op_1460_cast_fp16")]; tensor var_1462_transpose_x_0 = const()[name = tensor("op_1462_transpose_x_0"), val = tensor(false)]; tensor var_1462_transpose_y_0 = const()[name = tensor("op_1462_transpose_y_0"), val = tensor(false)]; tensor transpose_271 = transpose(perm = var_1456, x = var_1455_cast_fp16)[name = tensor("transpose_271")]; tensor var_1462_cast_fp16 = matmul(transpose_x = var_1462_transpose_x_0, transpose_y = var_1462_transpose_y_0, x = var_1460_cast_fp16, y = transpose_271)[name = tensor("op_1462_cast_fp16")]; tensor var_1463 = const()[name = tensor("op_1463"), val = tensor([0, 2, 1, 3])]; tensor concat_12 = const()[name = tensor("concat_12"), val = tensor([1, 1500, 1280])]; tensor transpose_268 = transpose(perm = var_1463, x = var_1462_cast_fp16)[name = tensor("transpose_268")]; tensor x_155_cast_fp16 = reshape(shape = concat_12, x = transpose_268)[name = tensor("x_155_cast_fp16")]; tensor var_1468_to_fp16 = const()[name = tensor("op_1468_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(326241024)))]; tensor var_1469_to_fp16 = const()[name = tensor("op_1469_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329517888)))]; tensor linear_75_cast_fp16 = linear(bias = var_1469_to_fp16, weight = var_1468_to_fp16, x = x_155_cast_fp16)[name = tensor("linear_75_cast_fp16")]; tensor x_157_cast_fp16 = add(x = x_151_cast_fp16, y = linear_75_cast_fp16)[name = tensor("x_157_cast_fp16")]; tensor var_1476_axes_0 = const()[name = tensor("op_1476_axes_0"), val = tensor([-1])]; tensor blocks_12_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_12_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329520512)))]; tensor blocks_12_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_12_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329523136)))]; tensor var_1476_cast_fp16 = layer_norm(axes = var_1476_axes_0, beta = blocks_12_mlp_ln_bias_to_fp16, epsilon = var_1402_to_fp16, gamma = blocks_12_mlp_ln_weight_to_fp16, x = x_157_cast_fp16)[name = tensor("op_1476_cast_fp16")]; tensor var_1485_to_fp16 = const()[name = tensor("op_1485_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329525760)))]; tensor var_1486_to_fp16 = const()[name = tensor("op_1486_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339028544)))]; tensor linear_76_cast_fp16 = linear(bias = var_1486_to_fp16, weight = var_1485_to_fp16, x = var_1476_cast_fp16)[name = tensor("linear_76_cast_fp16")]; tensor x_161_mode_0 = const()[name = tensor("x_161_mode_0"), val = tensor("EXACT")]; tensor x_161_cast_fp16 = gelu(mode = x_161_mode_0, x = linear_76_cast_fp16)[name = tensor("x_161_cast_fp16")]; tensor var_1491_to_fp16 = const()[name = tensor("op_1491_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339036032)))]; tensor var_1492_to_fp16 = const()[name = tensor("op_1492_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348538816)))]; tensor linear_77_cast_fp16 = linear(bias = var_1492_to_fp16, weight = var_1491_to_fp16, x = x_161_cast_fp16)[name = tensor("linear_77_cast_fp16")]; tensor x_163_cast_fp16 = add(x = x_157_cast_fp16, y = linear_77_cast_fp16)[name = tensor("x_163_cast_fp16")]; tensor var_1502 = const()[name = tensor("op_1502"), val = tensor(-1)]; tensor var_1518_axes_0 = const()[name = tensor("op_1518_axes_0"), val = tensor([-1])]; tensor blocks_13_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_13_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348541440)))]; tensor blocks_13_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_13_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348544064)))]; tensor var_1508_to_fp16 = const()[name = tensor("op_1508_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1518_cast_fp16 = layer_norm(axes = var_1518_axes_0, beta = blocks_13_attn_ln_bias_to_fp16, epsilon = var_1508_to_fp16, gamma = blocks_13_attn_ln_weight_to_fp16, x = x_163_cast_fp16)[name = tensor("op_1518_cast_fp16")]; tensor var_1529_to_fp16 = const()[name = tensor("op_1529_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(348546688)))]; tensor var_1530_to_fp16 = const()[name = tensor("op_1530_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351823552)))]; tensor linear_78_cast_fp16 = linear(bias = var_1530_to_fp16, weight = var_1529_to_fp16, x = var_1518_cast_fp16)[name = tensor("linear_78_cast_fp16")]; tensor var_1533_to_fp16 = const()[name = tensor("op_1533_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(351826176)))]; tensor linear_79_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1533_to_fp16, x = var_1518_cast_fp16)[name = tensor("linear_79_cast_fp16")]; tensor var_1537_to_fp16 = const()[name = tensor("op_1537_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355103040)))]; tensor var_1538_to_fp16 = const()[name = tensor("op_1538_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(358379904)))]; tensor linear_80_cast_fp16 = linear(bias = var_1538_to_fp16, weight = var_1537_to_fp16, x = var_1518_cast_fp16)[name = tensor("linear_80_cast_fp16")]; tensor var_1546 = const()[name = tensor("op_1546"), val = tensor([1, 1500, 20, -1])]; tensor var_1547_cast_fp16 = reshape(shape = var_1546, x = linear_78_cast_fp16)[name = tensor("op_1547_cast_fp16")]; tensor const_250_to_fp16 = const()[name = tensor("const_250_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_55_cast_fp16 = mul(x = var_1547_cast_fp16, y = const_250_to_fp16)[name = tensor("q_55_cast_fp16")]; tensor var_1553 = const()[name = tensor("op_1553"), val = tensor([1, 1500, 20, -1])]; tensor var_1554_cast_fp16 = reshape(shape = var_1553, x = linear_79_cast_fp16)[name = tensor("op_1554_cast_fp16")]; tensor const_251_to_fp16 = const()[name = tensor("const_251_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_55_cast_fp16 = mul(x = var_1554_cast_fp16, y = const_251_to_fp16)[name = tensor("k_55_cast_fp16")]; tensor var_1560 = const()[name = tensor("op_1560"), val = tensor([1, 1500, 20, -1])]; tensor var_1561_cast_fp16 = reshape(shape = var_1560, x = linear_80_cast_fp16)[name = tensor("op_1561_cast_fp16")]; tensor var_1562 = const()[name = tensor("op_1562"), val = tensor([0, 2, 1, 3])]; tensor qk_27_transpose_x_0 = const()[name = tensor("qk_27_transpose_x_0"), val = tensor(false)]; tensor qk_27_transpose_y_0 = const()[name = tensor("qk_27_transpose_y_0"), val = tensor(false)]; tensor transpose_154_perm_0 = const()[name = tensor("transpose_154_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_155_perm_0 = const()[name = tensor("transpose_155_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_265 = transpose(perm = transpose_155_perm_0, x = k_55_cast_fp16)[name = tensor("transpose_265")]; tensor transpose_266 = transpose(perm = transpose_154_perm_0, x = q_55_cast_fp16)[name = tensor("transpose_266")]; tensor qk_27_cast_fp16 = matmul(transpose_x = qk_27_transpose_x_0, transpose_y = qk_27_transpose_y_0, x = transpose_266, y = transpose_265)[name = tensor("qk_27_cast_fp16")]; tensor var_1566_cast_fp16 = softmax(axis = var_1502, x = qk_27_cast_fp16)[name = tensor("op_1566_cast_fp16")]; tensor var_1568_transpose_x_0 = const()[name = tensor("op_1568_transpose_x_0"), val = tensor(false)]; tensor var_1568_transpose_y_0 = const()[name = tensor("op_1568_transpose_y_0"), val = tensor(false)]; tensor transpose_267 = transpose(perm = var_1562, x = var_1561_cast_fp16)[name = tensor("transpose_267")]; tensor var_1568_cast_fp16 = matmul(transpose_x = var_1568_transpose_x_0, transpose_y = var_1568_transpose_y_0, x = var_1566_cast_fp16, y = transpose_267)[name = tensor("op_1568_cast_fp16")]; tensor var_1569 = const()[name = tensor("op_1569"), val = tensor([0, 2, 1, 3])]; tensor concat_13 = const()[name = tensor("concat_13"), val = tensor([1, 1500, 1280])]; tensor transpose_264 = transpose(perm = var_1569, x = var_1568_cast_fp16)[name = tensor("transpose_264")]; tensor x_167_cast_fp16 = reshape(shape = concat_13, x = transpose_264)[name = tensor("x_167_cast_fp16")]; tensor var_1574_to_fp16 = const()[name = tensor("op_1574_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(358382528)))]; tensor var_1575_to_fp16 = const()[name = tensor("op_1575_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361659392)))]; tensor linear_81_cast_fp16 = linear(bias = var_1575_to_fp16, weight = var_1574_to_fp16, x = x_167_cast_fp16)[name = tensor("linear_81_cast_fp16")]; tensor x_169_cast_fp16 = add(x = x_163_cast_fp16, y = linear_81_cast_fp16)[name = tensor("x_169_cast_fp16")]; tensor var_1582_axes_0 = const()[name = tensor("op_1582_axes_0"), val = tensor([-1])]; tensor blocks_13_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_13_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361662016)))]; tensor blocks_13_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_13_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361664640)))]; tensor var_1582_cast_fp16 = layer_norm(axes = var_1582_axes_0, beta = blocks_13_mlp_ln_bias_to_fp16, epsilon = var_1508_to_fp16, gamma = blocks_13_mlp_ln_weight_to_fp16, x = x_169_cast_fp16)[name = tensor("op_1582_cast_fp16")]; tensor var_1591_to_fp16 = const()[name = tensor("op_1591_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361667264)))]; tensor var_1592_to_fp16 = const()[name = tensor("op_1592_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(371579648)))]; tensor linear_82_cast_fp16 = linear(bias = var_1592_to_fp16, weight = var_1591_to_fp16, x = var_1582_cast_fp16)[name = tensor("linear_82_cast_fp16")]; tensor x_173_mode_0 = const()[name = tensor("x_173_mode_0"), val = tensor("EXACT")]; tensor x_173_cast_fp16 = gelu(mode = x_173_mode_0, x = linear_82_cast_fp16)[name = tensor("x_173_cast_fp16")]; tensor var_1597_to_fp16 = const()[name = tensor("op_1597_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(371587456)))]; tensor var_1598_to_fp16 = const()[name = tensor("op_1598_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381499840)))]; tensor linear_83_cast_fp16 = linear(bias = var_1598_to_fp16, weight = var_1597_to_fp16, x = x_173_cast_fp16)[name = tensor("linear_83_cast_fp16")]; tensor x_175_cast_fp16 = add(x = x_169_cast_fp16, y = linear_83_cast_fp16)[name = tensor("x_175_cast_fp16")]; tensor var_1608 = const()[name = tensor("op_1608"), val = tensor(-1)]; tensor var_1624_axes_0 = const()[name = tensor("op_1624_axes_0"), val = tensor([-1])]; tensor blocks_14_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_14_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381502464)))]; tensor blocks_14_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_14_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381505088)))]; tensor var_1614_to_fp16 = const()[name = tensor("op_1614_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1624_cast_fp16 = layer_norm(axes = var_1624_axes_0, beta = blocks_14_attn_ln_bias_to_fp16, epsilon = var_1614_to_fp16, gamma = blocks_14_attn_ln_weight_to_fp16, x = x_175_cast_fp16)[name = tensor("op_1624_cast_fp16")]; tensor var_1635_to_fp16 = const()[name = tensor("op_1635_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(381507712)))]; tensor var_1636_to_fp16 = const()[name = tensor("op_1636_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(384784576)))]; tensor linear_84_cast_fp16 = linear(bias = var_1636_to_fp16, weight = var_1635_to_fp16, x = var_1624_cast_fp16)[name = tensor("linear_84_cast_fp16")]; tensor var_1639_to_fp16 = const()[name = tensor("op_1639_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(384787200)))]; tensor linear_85_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1639_to_fp16, x = var_1624_cast_fp16)[name = tensor("linear_85_cast_fp16")]; tensor var_1643_to_fp16 = const()[name = tensor("op_1643_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(388064064)))]; tensor var_1644_to_fp16 = const()[name = tensor("op_1644_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391340928)))]; tensor linear_86_cast_fp16 = linear(bias = var_1644_to_fp16, weight = var_1643_to_fp16, x = var_1624_cast_fp16)[name = tensor("linear_86_cast_fp16")]; tensor var_1652 = const()[name = tensor("op_1652"), val = tensor([1, 1500, 20, -1])]; tensor var_1653_cast_fp16 = reshape(shape = var_1652, x = linear_84_cast_fp16)[name = tensor("op_1653_cast_fp16")]; tensor const_252_to_fp16 = const()[name = tensor("const_252_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_59_cast_fp16 = mul(x = var_1653_cast_fp16, y = const_252_to_fp16)[name = tensor("q_59_cast_fp16")]; tensor var_1659 = const()[name = tensor("op_1659"), val = tensor([1, 1500, 20, -1])]; tensor var_1660_cast_fp16 = reshape(shape = var_1659, x = linear_85_cast_fp16)[name = tensor("op_1660_cast_fp16")]; tensor const_253_to_fp16 = const()[name = tensor("const_253_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_59_cast_fp16 = mul(x = var_1660_cast_fp16, y = const_253_to_fp16)[name = tensor("k_59_cast_fp16")]; tensor var_1666 = const()[name = tensor("op_1666"), val = tensor([1, 1500, 20, -1])]; tensor var_1667_cast_fp16 = reshape(shape = var_1666, x = linear_86_cast_fp16)[name = tensor("op_1667_cast_fp16")]; tensor var_1668 = const()[name = tensor("op_1668"), val = tensor([0, 2, 1, 3])]; tensor qk_29_transpose_x_0 = const()[name = tensor("qk_29_transpose_x_0"), val = tensor(false)]; tensor qk_29_transpose_y_0 = const()[name = tensor("qk_29_transpose_y_0"), val = tensor(false)]; tensor transpose_156_perm_0 = const()[name = tensor("transpose_156_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_157_perm_0 = const()[name = tensor("transpose_157_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_261 = transpose(perm = transpose_157_perm_0, x = k_59_cast_fp16)[name = tensor("transpose_261")]; tensor transpose_262 = transpose(perm = transpose_156_perm_0, x = q_59_cast_fp16)[name = tensor("transpose_262")]; tensor qk_29_cast_fp16 = matmul(transpose_x = qk_29_transpose_x_0, transpose_y = qk_29_transpose_y_0, x = transpose_262, y = transpose_261)[name = tensor("qk_29_cast_fp16")]; tensor var_1672_cast_fp16 = softmax(axis = var_1608, x = qk_29_cast_fp16)[name = tensor("op_1672_cast_fp16")]; tensor var_1674_transpose_x_0 = const()[name = tensor("op_1674_transpose_x_0"), val = tensor(false)]; tensor var_1674_transpose_y_0 = const()[name = tensor("op_1674_transpose_y_0"), val = tensor(false)]; tensor transpose_263 = transpose(perm = var_1668, x = var_1667_cast_fp16)[name = tensor("transpose_263")]; tensor var_1674_cast_fp16 = matmul(transpose_x = var_1674_transpose_x_0, transpose_y = var_1674_transpose_y_0, x = var_1672_cast_fp16, y = transpose_263)[name = tensor("op_1674_cast_fp16")]; tensor var_1675 = const()[name = tensor("op_1675"), val = tensor([0, 2, 1, 3])]; tensor concat_14 = const()[name = tensor("concat_14"), val = tensor([1, 1500, 1280])]; tensor transpose_260 = transpose(perm = var_1675, x = var_1674_cast_fp16)[name = tensor("transpose_260")]; tensor x_179_cast_fp16 = reshape(shape = concat_14, x = transpose_260)[name = tensor("x_179_cast_fp16")]; tensor var_1680_to_fp16 = const()[name = tensor("op_1680_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391343552)))]; tensor var_1681_to_fp16 = const()[name = tensor("op_1681_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394620416)))]; tensor linear_87_cast_fp16 = linear(bias = var_1681_to_fp16, weight = var_1680_to_fp16, x = x_179_cast_fp16)[name = tensor("linear_87_cast_fp16")]; tensor x_181_cast_fp16 = add(x = x_175_cast_fp16, y = linear_87_cast_fp16)[name = tensor("x_181_cast_fp16")]; tensor var_1688_axes_0 = const()[name = tensor("op_1688_axes_0"), val = tensor([-1])]; tensor blocks_14_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_14_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394623040)))]; tensor blocks_14_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_14_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394625664)))]; tensor var_1688_cast_fp16 = layer_norm(axes = var_1688_axes_0, beta = blocks_14_mlp_ln_bias_to_fp16, epsilon = var_1614_to_fp16, gamma = blocks_14_mlp_ln_weight_to_fp16, x = x_181_cast_fp16)[name = tensor("op_1688_cast_fp16")]; tensor var_1697_to_fp16 = const()[name = tensor("op_1697_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394628288)))]; tensor var_1698_to_fp16 = const()[name = tensor("op_1698_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(405196032)))]; tensor linear_88_cast_fp16 = linear(bias = var_1698_to_fp16, weight = var_1697_to_fp16, x = var_1688_cast_fp16)[name = tensor("linear_88_cast_fp16")]; tensor x_185_mode_0 = const()[name = tensor("x_185_mode_0"), val = tensor("EXACT")]; tensor x_185_cast_fp16 = gelu(mode = x_185_mode_0, x = linear_88_cast_fp16)[name = tensor("x_185_cast_fp16")]; tensor var_1703_to_fp16 = const()[name = tensor("op_1703_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(405204352)))]; tensor var_1704_to_fp16 = const()[name = tensor("op_1704_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415772096)))]; tensor linear_89_cast_fp16 = linear(bias = var_1704_to_fp16, weight = var_1703_to_fp16, x = x_185_cast_fp16)[name = tensor("linear_89_cast_fp16")]; tensor x_187_cast_fp16 = add(x = x_181_cast_fp16, y = linear_89_cast_fp16)[name = tensor("x_187_cast_fp16")]; tensor var_1714 = const()[name = tensor("op_1714"), val = tensor(-1)]; tensor var_1730_axes_0 = const()[name = tensor("op_1730_axes_0"), val = tensor([-1])]; tensor blocks_15_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_15_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415774720)))]; tensor blocks_15_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_15_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415777344)))]; tensor var_1720_to_fp16 = const()[name = tensor("op_1720_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1730_cast_fp16 = layer_norm(axes = var_1730_axes_0, beta = blocks_15_attn_ln_bias_to_fp16, epsilon = var_1720_to_fp16, gamma = blocks_15_attn_ln_weight_to_fp16, x = x_187_cast_fp16)[name = tensor("op_1730_cast_fp16")]; tensor var_1741_to_fp16 = const()[name = tensor("op_1741_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415779968)))]; tensor var_1742_to_fp16 = const()[name = tensor("op_1742_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419056832)))]; tensor linear_90_cast_fp16 = linear(bias = var_1742_to_fp16, weight = var_1741_to_fp16, x = var_1730_cast_fp16)[name = tensor("linear_90_cast_fp16")]; tensor var_1745_to_fp16 = const()[name = tensor("op_1745_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419059456)))]; tensor linear_91_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1745_to_fp16, x = var_1730_cast_fp16)[name = tensor("linear_91_cast_fp16")]; tensor var_1749_to_fp16 = const()[name = tensor("op_1749_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422336320)))]; tensor var_1750_to_fp16 = const()[name = tensor("op_1750_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(425613184)))]; tensor linear_92_cast_fp16 = linear(bias = var_1750_to_fp16, weight = var_1749_to_fp16, x = var_1730_cast_fp16)[name = tensor("linear_92_cast_fp16")]; tensor var_1758 = const()[name = tensor("op_1758"), val = tensor([1, 1500, 20, -1])]; tensor var_1759_cast_fp16 = reshape(shape = var_1758, x = linear_90_cast_fp16)[name = tensor("op_1759_cast_fp16")]; tensor const_254_to_fp16 = const()[name = tensor("const_254_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_63_cast_fp16 = mul(x = var_1759_cast_fp16, y = const_254_to_fp16)[name = tensor("q_63_cast_fp16")]; tensor var_1765 = const()[name = tensor("op_1765"), val = tensor([1, 1500, 20, -1])]; tensor var_1766_cast_fp16 = reshape(shape = var_1765, x = linear_91_cast_fp16)[name = tensor("op_1766_cast_fp16")]; tensor const_255_to_fp16 = const()[name = tensor("const_255_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_63_cast_fp16 = mul(x = var_1766_cast_fp16, y = const_255_to_fp16)[name = tensor("k_63_cast_fp16")]; tensor var_1772 = const()[name = tensor("op_1772"), val = tensor([1, 1500, 20, -1])]; tensor var_1773_cast_fp16 = reshape(shape = var_1772, x = linear_92_cast_fp16)[name = tensor("op_1773_cast_fp16")]; tensor var_1774 = const()[name = tensor("op_1774"), val = tensor([0, 2, 1, 3])]; tensor qk_31_transpose_x_0 = const()[name = tensor("qk_31_transpose_x_0"), val = tensor(false)]; tensor qk_31_transpose_y_0 = const()[name = tensor("qk_31_transpose_y_0"), val = tensor(false)]; tensor transpose_158_perm_0 = const()[name = tensor("transpose_158_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_159_perm_0 = const()[name = tensor("transpose_159_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_257 = transpose(perm = transpose_159_perm_0, x = k_63_cast_fp16)[name = tensor("transpose_257")]; tensor transpose_258 = transpose(perm = transpose_158_perm_0, x = q_63_cast_fp16)[name = tensor("transpose_258")]; tensor qk_31_cast_fp16 = matmul(transpose_x = qk_31_transpose_x_0, transpose_y = qk_31_transpose_y_0, x = transpose_258, y = transpose_257)[name = tensor("qk_31_cast_fp16")]; tensor var_1778_cast_fp16 = softmax(axis = var_1714, x = qk_31_cast_fp16)[name = tensor("op_1778_cast_fp16")]; tensor var_1780_transpose_x_0 = const()[name = tensor("op_1780_transpose_x_0"), val = tensor(false)]; tensor var_1780_transpose_y_0 = const()[name = tensor("op_1780_transpose_y_0"), val = tensor(false)]; tensor transpose_259 = transpose(perm = var_1774, x = var_1773_cast_fp16)[name = tensor("transpose_259")]; tensor var_1780_cast_fp16 = matmul(transpose_x = var_1780_transpose_x_0, transpose_y = var_1780_transpose_y_0, x = var_1778_cast_fp16, y = transpose_259)[name = tensor("op_1780_cast_fp16")]; tensor var_1781 = const()[name = tensor("op_1781"), val = tensor([0, 2, 1, 3])]; tensor concat_15 = const()[name = tensor("concat_15"), val = tensor([1, 1500, 1280])]; tensor transpose_256 = transpose(perm = var_1781, x = var_1780_cast_fp16)[name = tensor("transpose_256")]; tensor x_191_cast_fp16 = reshape(shape = concat_15, x = transpose_256)[name = tensor("x_191_cast_fp16")]; tensor var_1786_to_fp16 = const()[name = tensor("op_1786_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(425615808)))]; tensor var_1787_to_fp16 = const()[name = tensor("op_1787_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(428892672)))]; tensor linear_93_cast_fp16 = linear(bias = var_1787_to_fp16, weight = var_1786_to_fp16, x = x_191_cast_fp16)[name = tensor("linear_93_cast_fp16")]; tensor x_193_cast_fp16 = add(x = x_187_cast_fp16, y = linear_93_cast_fp16)[name = tensor("x_193_cast_fp16")]; tensor var_1794_axes_0 = const()[name = tensor("op_1794_axes_0"), val = tensor([-1])]; tensor blocks_15_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_15_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(428895296)))]; tensor blocks_15_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_15_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(428897920)))]; tensor var_1794_cast_fp16 = layer_norm(axes = var_1794_axes_0, beta = blocks_15_mlp_ln_bias_to_fp16, epsilon = var_1720_to_fp16, gamma = blocks_15_mlp_ln_weight_to_fp16, x = x_193_cast_fp16)[name = tensor("op_1794_cast_fp16")]; tensor var_1803_to_fp16 = const()[name = tensor("op_1803_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(428900544)))]; tensor var_1804_to_fp16 = const()[name = tensor("op_1804_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440123648)))]; tensor linear_94_cast_fp16 = linear(bias = var_1804_to_fp16, weight = var_1803_to_fp16, x = var_1794_cast_fp16)[name = tensor("linear_94_cast_fp16")]; tensor x_197_mode_0 = const()[name = tensor("x_197_mode_0"), val = tensor("EXACT")]; tensor x_197_cast_fp16 = gelu(mode = x_197_mode_0, x = linear_94_cast_fp16)[name = tensor("x_197_cast_fp16")]; tensor var_1809_to_fp16 = const()[name = tensor("op_1809_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440132480)))]; tensor var_1810_to_fp16 = const()[name = tensor("op_1810_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451355584)))]; tensor linear_95_cast_fp16 = linear(bias = var_1810_to_fp16, weight = var_1809_to_fp16, x = x_197_cast_fp16)[name = tensor("linear_95_cast_fp16")]; tensor x_199_cast_fp16 = add(x = x_193_cast_fp16, y = linear_95_cast_fp16)[name = tensor("x_199_cast_fp16")]; tensor var_1820 = const()[name = tensor("op_1820"), val = tensor(-1)]; tensor var_1836_axes_0 = const()[name = tensor("op_1836_axes_0"), val = tensor([-1])]; tensor blocks_16_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_16_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451358208)))]; tensor blocks_16_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_16_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451360832)))]; tensor var_1826_to_fp16 = const()[name = tensor("op_1826_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1836_cast_fp16 = layer_norm(axes = var_1836_axes_0, beta = blocks_16_attn_ln_bias_to_fp16, epsilon = var_1826_to_fp16, gamma = blocks_16_attn_ln_weight_to_fp16, x = x_199_cast_fp16)[name = tensor("op_1836_cast_fp16")]; tensor var_1847_to_fp16 = const()[name = tensor("op_1847_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451363456)))]; tensor var_1848_to_fp16 = const()[name = tensor("op_1848_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454640320)))]; tensor linear_96_cast_fp16 = linear(bias = var_1848_to_fp16, weight = var_1847_to_fp16, x = var_1836_cast_fp16)[name = tensor("linear_96_cast_fp16")]; tensor var_1851_to_fp16 = const()[name = tensor("op_1851_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454642944)))]; tensor linear_97_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1851_to_fp16, x = var_1836_cast_fp16)[name = tensor("linear_97_cast_fp16")]; tensor var_1855_to_fp16 = const()[name = tensor("op_1855_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(457919808)))]; tensor var_1856_to_fp16 = const()[name = tensor("op_1856_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(461196672)))]; tensor linear_98_cast_fp16 = linear(bias = var_1856_to_fp16, weight = var_1855_to_fp16, x = var_1836_cast_fp16)[name = tensor("linear_98_cast_fp16")]; tensor var_1864 = const()[name = tensor("op_1864"), val = tensor([1, 1500, 20, -1])]; tensor var_1865_cast_fp16 = reshape(shape = var_1864, x = linear_96_cast_fp16)[name = tensor("op_1865_cast_fp16")]; tensor const_256_to_fp16 = const()[name = tensor("const_256_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_67_cast_fp16 = mul(x = var_1865_cast_fp16, y = const_256_to_fp16)[name = tensor("q_67_cast_fp16")]; tensor var_1871 = const()[name = tensor("op_1871"), val = tensor([1, 1500, 20, -1])]; tensor var_1872_cast_fp16 = reshape(shape = var_1871, x = linear_97_cast_fp16)[name = tensor("op_1872_cast_fp16")]; tensor const_257_to_fp16 = const()[name = tensor("const_257_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_67_cast_fp16 = mul(x = var_1872_cast_fp16, y = const_257_to_fp16)[name = tensor("k_67_cast_fp16")]; tensor var_1878 = const()[name = tensor("op_1878"), val = tensor([1, 1500, 20, -1])]; tensor var_1879_cast_fp16 = reshape(shape = var_1878, x = linear_98_cast_fp16)[name = tensor("op_1879_cast_fp16")]; tensor var_1880 = const()[name = tensor("op_1880"), val = tensor([0, 2, 1, 3])]; tensor qk_33_transpose_x_0 = const()[name = tensor("qk_33_transpose_x_0"), val = tensor(false)]; tensor qk_33_transpose_y_0 = const()[name = tensor("qk_33_transpose_y_0"), val = tensor(false)]; tensor transpose_160_perm_0 = const()[name = tensor("transpose_160_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_161_perm_0 = const()[name = tensor("transpose_161_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_253 = transpose(perm = transpose_161_perm_0, x = k_67_cast_fp16)[name = tensor("transpose_253")]; tensor transpose_254 = transpose(perm = transpose_160_perm_0, x = q_67_cast_fp16)[name = tensor("transpose_254")]; tensor qk_33_cast_fp16 = matmul(transpose_x = qk_33_transpose_x_0, transpose_y = qk_33_transpose_y_0, x = transpose_254, y = transpose_253)[name = tensor("qk_33_cast_fp16")]; tensor var_1884_cast_fp16 = softmax(axis = var_1820, x = qk_33_cast_fp16)[name = tensor("op_1884_cast_fp16")]; tensor var_1886_transpose_x_0 = const()[name = tensor("op_1886_transpose_x_0"), val = tensor(false)]; tensor var_1886_transpose_y_0 = const()[name = tensor("op_1886_transpose_y_0"), val = tensor(false)]; tensor transpose_255 = transpose(perm = var_1880, x = var_1879_cast_fp16)[name = tensor("transpose_255")]; tensor var_1886_cast_fp16 = matmul(transpose_x = var_1886_transpose_x_0, transpose_y = var_1886_transpose_y_0, x = var_1884_cast_fp16, y = transpose_255)[name = tensor("op_1886_cast_fp16")]; tensor var_1887 = const()[name = tensor("op_1887"), val = tensor([0, 2, 1, 3])]; tensor concat_16 = const()[name = tensor("concat_16"), val = tensor([1, 1500, 1280])]; tensor transpose_252 = transpose(perm = var_1887, x = var_1886_cast_fp16)[name = tensor("transpose_252")]; tensor x_203_cast_fp16 = reshape(shape = concat_16, x = transpose_252)[name = tensor("x_203_cast_fp16")]; tensor var_1892_to_fp16 = const()[name = tensor("op_1892_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(461199296)))]; tensor var_1893_to_fp16 = const()[name = tensor("op_1893_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464476160)))]; tensor linear_99_cast_fp16 = linear(bias = var_1893_to_fp16, weight = var_1892_to_fp16, x = x_203_cast_fp16)[name = tensor("linear_99_cast_fp16")]; tensor x_205_cast_fp16 = add(x = x_199_cast_fp16, y = linear_99_cast_fp16)[name = tensor("x_205_cast_fp16")]; tensor var_1900_axes_0 = const()[name = tensor("op_1900_axes_0"), val = tensor([-1])]; tensor blocks_16_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_16_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464478784)))]; tensor blocks_16_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_16_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464481408)))]; tensor var_1900_cast_fp16 = layer_norm(axes = var_1900_axes_0, beta = blocks_16_mlp_ln_bias_to_fp16, epsilon = var_1826_to_fp16, gamma = blocks_16_mlp_ln_weight_to_fp16, x = x_205_cast_fp16)[name = tensor("op_1900_cast_fp16")]; tensor var_1909_to_fp16 = const()[name = tensor("op_1909_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(464484032)))]; tensor var_1910_to_fp16 = const()[name = tensor("op_1910_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(476198656)))]; tensor linear_100_cast_fp16 = linear(bias = var_1910_to_fp16, weight = var_1909_to_fp16, x = var_1900_cast_fp16)[name = tensor("linear_100_cast_fp16")]; tensor x_209_mode_0 = const()[name = tensor("x_209_mode_0"), val = tensor("EXACT")]; tensor x_209_cast_fp16 = gelu(mode = x_209_mode_0, x = linear_100_cast_fp16)[name = tensor("x_209_cast_fp16")]; tensor var_1915_to_fp16 = const()[name = tensor("op_1915_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(476207872)))]; tensor var_1916_to_fp16 = const()[name = tensor("op_1916_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487922496)))]; tensor linear_101_cast_fp16 = linear(bias = var_1916_to_fp16, weight = var_1915_to_fp16, x = x_209_cast_fp16)[name = tensor("linear_101_cast_fp16")]; tensor x_211_cast_fp16 = add(x = x_205_cast_fp16, y = linear_101_cast_fp16)[name = tensor("x_211_cast_fp16")]; tensor var_1926 = const()[name = tensor("op_1926"), val = tensor(-1)]; tensor var_1942_axes_0 = const()[name = tensor("op_1942_axes_0"), val = tensor([-1])]; tensor blocks_17_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_17_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487925120)))]; tensor blocks_17_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_17_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487927744)))]; tensor var_1932_to_fp16 = const()[name = tensor("op_1932_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1942_cast_fp16 = layer_norm(axes = var_1942_axes_0, beta = blocks_17_attn_ln_bias_to_fp16, epsilon = var_1932_to_fp16, gamma = blocks_17_attn_ln_weight_to_fp16, x = x_211_cast_fp16)[name = tensor("op_1942_cast_fp16")]; tensor var_1953_to_fp16 = const()[name = tensor("op_1953_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(487930368)))]; tensor var_1954_to_fp16 = const()[name = tensor("op_1954_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(491207232)))]; tensor linear_102_cast_fp16 = linear(bias = var_1954_to_fp16, weight = var_1953_to_fp16, x = var_1942_cast_fp16)[name = tensor("linear_102_cast_fp16")]; tensor var_1957_to_fp16 = const()[name = tensor("op_1957_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(491209856)))]; tensor linear_103_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_1957_to_fp16, x = var_1942_cast_fp16)[name = tensor("linear_103_cast_fp16")]; tensor var_1961_to_fp16 = const()[name = tensor("op_1961_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(494486720)))]; tensor var_1962_to_fp16 = const()[name = tensor("op_1962_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(497763584)))]; tensor linear_104_cast_fp16 = linear(bias = var_1962_to_fp16, weight = var_1961_to_fp16, x = var_1942_cast_fp16)[name = tensor("linear_104_cast_fp16")]; tensor var_1970 = const()[name = tensor("op_1970"), val = tensor([1, 1500, 20, -1])]; tensor var_1971_cast_fp16 = reshape(shape = var_1970, x = linear_102_cast_fp16)[name = tensor("op_1971_cast_fp16")]; tensor const_258_to_fp16 = const()[name = tensor("const_258_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_71_cast_fp16 = mul(x = var_1971_cast_fp16, y = const_258_to_fp16)[name = tensor("q_71_cast_fp16")]; tensor var_1977 = const()[name = tensor("op_1977"), val = tensor([1, 1500, 20, -1])]; tensor var_1978_cast_fp16 = reshape(shape = var_1977, x = linear_103_cast_fp16)[name = tensor("op_1978_cast_fp16")]; tensor const_259_to_fp16 = const()[name = tensor("const_259_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_71_cast_fp16 = mul(x = var_1978_cast_fp16, y = const_259_to_fp16)[name = tensor("k_71_cast_fp16")]; tensor var_1984 = const()[name = tensor("op_1984"), val = tensor([1, 1500, 20, -1])]; tensor var_1985_cast_fp16 = reshape(shape = var_1984, x = linear_104_cast_fp16)[name = tensor("op_1985_cast_fp16")]; tensor var_1986 = const()[name = tensor("op_1986"), val = tensor([0, 2, 1, 3])]; tensor qk_35_transpose_x_0 = const()[name = tensor("qk_35_transpose_x_0"), val = tensor(false)]; tensor qk_35_transpose_y_0 = const()[name = tensor("qk_35_transpose_y_0"), val = tensor(false)]; tensor transpose_162_perm_0 = const()[name = tensor("transpose_162_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_163_perm_0 = const()[name = tensor("transpose_163_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_249 = transpose(perm = transpose_163_perm_0, x = k_71_cast_fp16)[name = tensor("transpose_249")]; tensor transpose_250 = transpose(perm = transpose_162_perm_0, x = q_71_cast_fp16)[name = tensor("transpose_250")]; tensor qk_35_cast_fp16 = matmul(transpose_x = qk_35_transpose_x_0, transpose_y = qk_35_transpose_y_0, x = transpose_250, y = transpose_249)[name = tensor("qk_35_cast_fp16")]; tensor var_1990_cast_fp16 = softmax(axis = var_1926, x = qk_35_cast_fp16)[name = tensor("op_1990_cast_fp16")]; tensor var_1992_transpose_x_0 = const()[name = tensor("op_1992_transpose_x_0"), val = tensor(false)]; tensor var_1992_transpose_y_0 = const()[name = tensor("op_1992_transpose_y_0"), val = tensor(false)]; tensor transpose_251 = transpose(perm = var_1986, x = var_1985_cast_fp16)[name = tensor("transpose_251")]; tensor var_1992_cast_fp16 = matmul(transpose_x = var_1992_transpose_x_0, transpose_y = var_1992_transpose_y_0, x = var_1990_cast_fp16, y = transpose_251)[name = tensor("op_1992_cast_fp16")]; tensor var_1993 = const()[name = tensor("op_1993"), val = tensor([0, 2, 1, 3])]; tensor concat_17 = const()[name = tensor("concat_17"), val = tensor([1, 1500, 1280])]; tensor transpose_248 = transpose(perm = var_1993, x = var_1992_cast_fp16)[name = tensor("transpose_248")]; tensor x_215_cast_fp16 = reshape(shape = concat_17, x = transpose_248)[name = tensor("x_215_cast_fp16")]; tensor var_1998_to_fp16 = const()[name = tensor("op_1998_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(497766208)))]; tensor var_1999_to_fp16 = const()[name = tensor("op_1999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501043072)))]; tensor linear_105_cast_fp16 = linear(bias = var_1999_to_fp16, weight = var_1998_to_fp16, x = x_215_cast_fp16)[name = tensor("linear_105_cast_fp16")]; tensor x_217_cast_fp16 = add(x = x_211_cast_fp16, y = linear_105_cast_fp16)[name = tensor("x_217_cast_fp16")]; tensor var_2006_axes_0 = const()[name = tensor("op_2006_axes_0"), val = tensor([-1])]; tensor blocks_17_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_17_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501045696)))]; tensor blocks_17_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_17_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501048320)))]; tensor var_2006_cast_fp16 = layer_norm(axes = var_2006_axes_0, beta = blocks_17_mlp_ln_bias_to_fp16, epsilon = var_1932_to_fp16, gamma = blocks_17_mlp_ln_weight_to_fp16, x = x_217_cast_fp16)[name = tensor("op_2006_cast_fp16")]; tensor var_2015_to_fp16 = const()[name = tensor("op_2015_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(501050944)))]; tensor var_2016_to_fp16 = const()[name = tensor("op_2016_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513175168)))]; tensor linear_106_cast_fp16 = linear(bias = var_2016_to_fp16, weight = var_2015_to_fp16, x = var_2006_cast_fp16)[name = tensor("linear_106_cast_fp16")]; tensor x_221_mode_0 = const()[name = tensor("x_221_mode_0"), val = tensor("EXACT")]; tensor x_221_cast_fp16 = gelu(mode = x_221_mode_0, x = linear_106_cast_fp16)[name = tensor("x_221_cast_fp16")]; tensor var_2021_to_fp16 = const()[name = tensor("op_2021_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513184704)))]; tensor var_2022_to_fp16 = const()[name = tensor("op_2022_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(525308928)))]; tensor linear_107_cast_fp16 = linear(bias = var_2022_to_fp16, weight = var_2021_to_fp16, x = x_221_cast_fp16)[name = tensor("linear_107_cast_fp16")]; tensor x_223_cast_fp16 = add(x = x_217_cast_fp16, y = linear_107_cast_fp16)[name = tensor("x_223_cast_fp16")]; tensor var_2032 = const()[name = tensor("op_2032"), val = tensor(-1)]; tensor var_2048_axes_0 = const()[name = tensor("op_2048_axes_0"), val = tensor([-1])]; tensor blocks_18_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_18_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(525311552)))]; tensor blocks_18_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_18_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(525314176)))]; tensor var_2038_to_fp16 = const()[name = tensor("op_2038_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2048_cast_fp16 = layer_norm(axes = var_2048_axes_0, beta = blocks_18_attn_ln_bias_to_fp16, epsilon = var_2038_to_fp16, gamma = blocks_18_attn_ln_weight_to_fp16, x = x_223_cast_fp16)[name = tensor("op_2048_cast_fp16")]; tensor var_2059_to_fp16 = const()[name = tensor("op_2059_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(525316800)))]; tensor var_2060_to_fp16 = const()[name = tensor("op_2060_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528593664)))]; tensor linear_108_cast_fp16 = linear(bias = var_2060_to_fp16, weight = var_2059_to_fp16, x = var_2048_cast_fp16)[name = tensor("linear_108_cast_fp16")]; tensor var_2063_to_fp16 = const()[name = tensor("op_2063_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528596288)))]; tensor linear_109_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2063_to_fp16, x = var_2048_cast_fp16)[name = tensor("linear_109_cast_fp16")]; tensor var_2067_to_fp16 = const()[name = tensor("op_2067_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531873152)))]; tensor var_2068_to_fp16 = const()[name = tensor("op_2068_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535150016)))]; tensor linear_110_cast_fp16 = linear(bias = var_2068_to_fp16, weight = var_2067_to_fp16, x = var_2048_cast_fp16)[name = tensor("linear_110_cast_fp16")]; tensor var_2076 = const()[name = tensor("op_2076"), val = tensor([1, 1500, 20, -1])]; tensor var_2077_cast_fp16 = reshape(shape = var_2076, x = linear_108_cast_fp16)[name = tensor("op_2077_cast_fp16")]; tensor const_260_to_fp16 = const()[name = tensor("const_260_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_75_cast_fp16 = mul(x = var_2077_cast_fp16, y = const_260_to_fp16)[name = tensor("q_75_cast_fp16")]; tensor var_2083 = const()[name = tensor("op_2083"), val = tensor([1, 1500, 20, -1])]; tensor var_2084_cast_fp16 = reshape(shape = var_2083, x = linear_109_cast_fp16)[name = tensor("op_2084_cast_fp16")]; tensor const_261_to_fp16 = const()[name = tensor("const_261_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_75_cast_fp16 = mul(x = var_2084_cast_fp16, y = const_261_to_fp16)[name = tensor("k_75_cast_fp16")]; tensor var_2090 = const()[name = tensor("op_2090"), val = tensor([1, 1500, 20, -1])]; tensor var_2091_cast_fp16 = reshape(shape = var_2090, x = linear_110_cast_fp16)[name = tensor("op_2091_cast_fp16")]; tensor var_2092 = const()[name = tensor("op_2092"), val = tensor([0, 2, 1, 3])]; tensor qk_37_transpose_x_0 = const()[name = tensor("qk_37_transpose_x_0"), val = tensor(false)]; tensor qk_37_transpose_y_0 = const()[name = tensor("qk_37_transpose_y_0"), val = tensor(false)]; tensor transpose_164_perm_0 = const()[name = tensor("transpose_164_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_165_perm_0 = const()[name = tensor("transpose_165_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_245 = transpose(perm = transpose_165_perm_0, x = k_75_cast_fp16)[name = tensor("transpose_245")]; tensor transpose_246 = transpose(perm = transpose_164_perm_0, x = q_75_cast_fp16)[name = tensor("transpose_246")]; tensor qk_37_cast_fp16 = matmul(transpose_x = qk_37_transpose_x_0, transpose_y = qk_37_transpose_y_0, x = transpose_246, y = transpose_245)[name = tensor("qk_37_cast_fp16")]; tensor var_2096_cast_fp16 = softmax(axis = var_2032, x = qk_37_cast_fp16)[name = tensor("op_2096_cast_fp16")]; tensor var_2098_transpose_x_0 = const()[name = tensor("op_2098_transpose_x_0"), val = tensor(false)]; tensor var_2098_transpose_y_0 = const()[name = tensor("op_2098_transpose_y_0"), val = tensor(false)]; tensor transpose_247 = transpose(perm = var_2092, x = var_2091_cast_fp16)[name = tensor("transpose_247")]; tensor var_2098_cast_fp16 = matmul(transpose_x = var_2098_transpose_x_0, transpose_y = var_2098_transpose_y_0, x = var_2096_cast_fp16, y = transpose_247)[name = tensor("op_2098_cast_fp16")]; tensor var_2099 = const()[name = tensor("op_2099"), val = tensor([0, 2, 1, 3])]; tensor concat_18 = const()[name = tensor("concat_18"), val = tensor([1, 1500, 1280])]; tensor transpose_244 = transpose(perm = var_2099, x = var_2098_cast_fp16)[name = tensor("transpose_244")]; tensor x_227_cast_fp16 = reshape(shape = concat_18, x = transpose_244)[name = tensor("x_227_cast_fp16")]; tensor var_2104_to_fp16 = const()[name = tensor("op_2104_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535152640)))]; tensor var_2105_to_fp16 = const()[name = tensor("op_2105_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538429504)))]; tensor linear_111_cast_fp16 = linear(bias = var_2105_to_fp16, weight = var_2104_to_fp16, x = x_227_cast_fp16)[name = tensor("linear_111_cast_fp16")]; tensor x_229_cast_fp16 = add(x = x_223_cast_fp16, y = linear_111_cast_fp16)[name = tensor("x_229_cast_fp16")]; tensor var_2112_axes_0 = const()[name = tensor("op_2112_axes_0"), val = tensor([-1])]; tensor blocks_18_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_18_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538432128)))]; tensor blocks_18_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_18_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538434752)))]; tensor var_2112_cast_fp16 = layer_norm(axes = var_2112_axes_0, beta = blocks_18_mlp_ln_bias_to_fp16, epsilon = var_2038_to_fp16, gamma = blocks_18_mlp_ln_weight_to_fp16, x = x_229_cast_fp16)[name = tensor("op_2112_cast_fp16")]; tensor var_2121_to_fp16 = const()[name = tensor("op_2121_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538437376)))]; tensor var_2122_to_fp16 = const()[name = tensor("op_2122_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(550397760)))]; tensor linear_112_cast_fp16 = linear(bias = var_2122_to_fp16, weight = var_2121_to_fp16, x = var_2112_cast_fp16)[name = tensor("linear_112_cast_fp16")]; tensor x_233_mode_0 = const()[name = tensor("x_233_mode_0"), val = tensor("EXACT")]; tensor x_233_cast_fp16 = gelu(mode = x_233_mode_0, x = linear_112_cast_fp16)[name = tensor("x_233_cast_fp16")]; tensor var_2127_to_fp16 = const()[name = tensor("op_2127_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(550407168)))]; tensor var_2128_to_fp16 = const()[name = tensor("op_2128_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(562367552)))]; tensor linear_113_cast_fp16 = linear(bias = var_2128_to_fp16, weight = var_2127_to_fp16, x = x_233_cast_fp16)[name = tensor("linear_113_cast_fp16")]; tensor x_235_cast_fp16 = add(x = x_229_cast_fp16, y = linear_113_cast_fp16)[name = tensor("x_235_cast_fp16")]; tensor var_2138 = const()[name = tensor("op_2138"), val = tensor(-1)]; tensor var_2154_axes_0 = const()[name = tensor("op_2154_axes_0"), val = tensor([-1])]; tensor blocks_19_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_19_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(562370176)))]; tensor blocks_19_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_19_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(562372800)))]; tensor var_2144_to_fp16 = const()[name = tensor("op_2144_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2154_cast_fp16 = layer_norm(axes = var_2154_axes_0, beta = blocks_19_attn_ln_bias_to_fp16, epsilon = var_2144_to_fp16, gamma = blocks_19_attn_ln_weight_to_fp16, x = x_235_cast_fp16)[name = tensor("op_2154_cast_fp16")]; tensor var_2165_to_fp16 = const()[name = tensor("op_2165_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(562375424)))]; tensor var_2166_to_fp16 = const()[name = tensor("op_2166_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565652288)))]; tensor linear_114_cast_fp16 = linear(bias = var_2166_to_fp16, weight = var_2165_to_fp16, x = var_2154_cast_fp16)[name = tensor("linear_114_cast_fp16")]; tensor var_2169_to_fp16 = const()[name = tensor("op_2169_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(565654912)))]; tensor linear_115_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2169_to_fp16, x = var_2154_cast_fp16)[name = tensor("linear_115_cast_fp16")]; tensor var_2173_to_fp16 = const()[name = tensor("op_2173_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568931776)))]; tensor var_2174_to_fp16 = const()[name = tensor("op_2174_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572208640)))]; tensor linear_116_cast_fp16 = linear(bias = var_2174_to_fp16, weight = var_2173_to_fp16, x = var_2154_cast_fp16)[name = tensor("linear_116_cast_fp16")]; tensor var_2182 = const()[name = tensor("op_2182"), val = tensor([1, 1500, 20, -1])]; tensor var_2183_cast_fp16 = reshape(shape = var_2182, x = linear_114_cast_fp16)[name = tensor("op_2183_cast_fp16")]; tensor const_262_to_fp16 = const()[name = tensor("const_262_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_79_cast_fp16 = mul(x = var_2183_cast_fp16, y = const_262_to_fp16)[name = tensor("q_79_cast_fp16")]; tensor var_2189 = const()[name = tensor("op_2189"), val = tensor([1, 1500, 20, -1])]; tensor var_2190_cast_fp16 = reshape(shape = var_2189, x = linear_115_cast_fp16)[name = tensor("op_2190_cast_fp16")]; tensor const_263_to_fp16 = const()[name = tensor("const_263_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_79_cast_fp16 = mul(x = var_2190_cast_fp16, y = const_263_to_fp16)[name = tensor("k_79_cast_fp16")]; tensor var_2196 = const()[name = tensor("op_2196"), val = tensor([1, 1500, 20, -1])]; tensor var_2197_cast_fp16 = reshape(shape = var_2196, x = linear_116_cast_fp16)[name = tensor("op_2197_cast_fp16")]; tensor var_2198 = const()[name = tensor("op_2198"), val = tensor([0, 2, 1, 3])]; tensor qk_39_transpose_x_0 = const()[name = tensor("qk_39_transpose_x_0"), val = tensor(false)]; tensor qk_39_transpose_y_0 = const()[name = tensor("qk_39_transpose_y_0"), val = tensor(false)]; tensor transpose_166_perm_0 = const()[name = tensor("transpose_166_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_167_perm_0 = const()[name = tensor("transpose_167_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_241 = transpose(perm = transpose_167_perm_0, x = k_79_cast_fp16)[name = tensor("transpose_241")]; tensor transpose_242 = transpose(perm = transpose_166_perm_0, x = q_79_cast_fp16)[name = tensor("transpose_242")]; tensor qk_39_cast_fp16 = matmul(transpose_x = qk_39_transpose_x_0, transpose_y = qk_39_transpose_y_0, x = transpose_242, y = transpose_241)[name = tensor("qk_39_cast_fp16")]; tensor var_2202_cast_fp16 = softmax(axis = var_2138, x = qk_39_cast_fp16)[name = tensor("op_2202_cast_fp16")]; tensor var_2204_transpose_x_0 = const()[name = tensor("op_2204_transpose_x_0"), val = tensor(false)]; tensor var_2204_transpose_y_0 = const()[name = tensor("op_2204_transpose_y_0"), val = tensor(false)]; tensor transpose_243 = transpose(perm = var_2198, x = var_2197_cast_fp16)[name = tensor("transpose_243")]; tensor var_2204_cast_fp16 = matmul(transpose_x = var_2204_transpose_x_0, transpose_y = var_2204_transpose_y_0, x = var_2202_cast_fp16, y = transpose_243)[name = tensor("op_2204_cast_fp16")]; tensor var_2205 = const()[name = tensor("op_2205"), val = tensor([0, 2, 1, 3])]; tensor concat_19 = const()[name = tensor("concat_19"), val = tensor([1, 1500, 1280])]; tensor transpose_240 = transpose(perm = var_2205, x = var_2204_cast_fp16)[name = tensor("transpose_240")]; tensor x_239_cast_fp16 = reshape(shape = concat_19, x = transpose_240)[name = tensor("x_239_cast_fp16")]; tensor var_2210_to_fp16 = const()[name = tensor("op_2210_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572211264)))]; tensor var_2211_to_fp16 = const()[name = tensor("op_2211_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575488128)))]; tensor linear_117_cast_fp16 = linear(bias = var_2211_to_fp16, weight = var_2210_to_fp16, x = x_239_cast_fp16)[name = tensor("linear_117_cast_fp16")]; tensor x_241_cast_fp16 = add(x = x_235_cast_fp16, y = linear_117_cast_fp16)[name = tensor("x_241_cast_fp16")]; tensor var_2218_axes_0 = const()[name = tensor("op_2218_axes_0"), val = tensor([-1])]; tensor blocks_19_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_19_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575490752)))]; tensor blocks_19_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_19_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575493376)))]; tensor var_2218_cast_fp16 = layer_norm(axes = var_2218_axes_0, beta = blocks_19_mlp_ln_bias_to_fp16, epsilon = var_2144_to_fp16, gamma = blocks_19_mlp_ln_weight_to_fp16, x = x_241_cast_fp16)[name = tensor("op_2218_cast_fp16")]; tensor var_2227_to_fp16 = const()[name = tensor("op_2227_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575496000)))]; tensor var_2228_to_fp16 = const()[name = tensor("op_2228_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(587784064)))]; tensor linear_118_cast_fp16 = linear(bias = var_2228_to_fp16, weight = var_2227_to_fp16, x = var_2218_cast_fp16)[name = tensor("linear_118_cast_fp16")]; tensor x_245_mode_0 = const()[name = tensor("x_245_mode_0"), val = tensor("EXACT")]; tensor x_245_cast_fp16 = gelu(mode = x_245_mode_0, x = linear_118_cast_fp16)[name = tensor("x_245_cast_fp16")]; tensor var_2233_to_fp16 = const()[name = tensor("op_2233_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(587793728)))]; tensor var_2234_to_fp16 = const()[name = tensor("op_2234_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600081792)))]; tensor linear_119_cast_fp16 = linear(bias = var_2234_to_fp16, weight = var_2233_to_fp16, x = x_245_cast_fp16)[name = tensor("linear_119_cast_fp16")]; tensor x_247_cast_fp16 = add(x = x_241_cast_fp16, y = linear_119_cast_fp16)[name = tensor("x_247_cast_fp16")]; tensor var_2244 = const()[name = tensor("op_2244"), val = tensor(-1)]; tensor var_2260_axes_0 = const()[name = tensor("op_2260_axes_0"), val = tensor([-1])]; tensor blocks_20_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_20_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600084416)))]; tensor blocks_20_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_20_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600087040)))]; tensor var_2250_to_fp16 = const()[name = tensor("op_2250_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2260_cast_fp16 = layer_norm(axes = var_2260_axes_0, beta = blocks_20_attn_ln_bias_to_fp16, epsilon = var_2250_to_fp16, gamma = blocks_20_attn_ln_weight_to_fp16, x = x_247_cast_fp16)[name = tensor("op_2260_cast_fp16")]; tensor var_2271_to_fp16 = const()[name = tensor("op_2271_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600089664)))]; tensor var_2272_to_fp16 = const()[name = tensor("op_2272_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(603366528)))]; tensor linear_120_cast_fp16 = linear(bias = var_2272_to_fp16, weight = var_2271_to_fp16, x = var_2260_cast_fp16)[name = tensor("linear_120_cast_fp16")]; tensor var_2275_to_fp16 = const()[name = tensor("op_2275_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(603369152)))]; tensor linear_121_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2275_to_fp16, x = var_2260_cast_fp16)[name = tensor("linear_121_cast_fp16")]; tensor var_2279_to_fp16 = const()[name = tensor("op_2279_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606646016)))]; tensor var_2280_to_fp16 = const()[name = tensor("op_2280_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609922880)))]; tensor linear_122_cast_fp16 = linear(bias = var_2280_to_fp16, weight = var_2279_to_fp16, x = var_2260_cast_fp16)[name = tensor("linear_122_cast_fp16")]; tensor var_2288 = const()[name = tensor("op_2288"), val = tensor([1, 1500, 20, -1])]; tensor var_2289_cast_fp16 = reshape(shape = var_2288, x = linear_120_cast_fp16)[name = tensor("op_2289_cast_fp16")]; tensor const_264_to_fp16 = const()[name = tensor("const_264_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_83_cast_fp16 = mul(x = var_2289_cast_fp16, y = const_264_to_fp16)[name = tensor("q_83_cast_fp16")]; tensor var_2295 = const()[name = tensor("op_2295"), val = tensor([1, 1500, 20, -1])]; tensor var_2296_cast_fp16 = reshape(shape = var_2295, x = linear_121_cast_fp16)[name = tensor("op_2296_cast_fp16")]; tensor const_265_to_fp16 = const()[name = tensor("const_265_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_83_cast_fp16 = mul(x = var_2296_cast_fp16, y = const_265_to_fp16)[name = tensor("k_83_cast_fp16")]; tensor var_2302 = const()[name = tensor("op_2302"), val = tensor([1, 1500, 20, -1])]; tensor var_2303_cast_fp16 = reshape(shape = var_2302, x = linear_122_cast_fp16)[name = tensor("op_2303_cast_fp16")]; tensor var_2304 = const()[name = tensor("op_2304"), val = tensor([0, 2, 1, 3])]; tensor qk_41_transpose_x_0 = const()[name = tensor("qk_41_transpose_x_0"), val = tensor(false)]; tensor qk_41_transpose_y_0 = const()[name = tensor("qk_41_transpose_y_0"), val = tensor(false)]; tensor transpose_168_perm_0 = const()[name = tensor("transpose_168_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_169_perm_0 = const()[name = tensor("transpose_169_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_237 = transpose(perm = transpose_169_perm_0, x = k_83_cast_fp16)[name = tensor("transpose_237")]; tensor transpose_238 = transpose(perm = transpose_168_perm_0, x = q_83_cast_fp16)[name = tensor("transpose_238")]; tensor qk_41_cast_fp16 = matmul(transpose_x = qk_41_transpose_x_0, transpose_y = qk_41_transpose_y_0, x = transpose_238, y = transpose_237)[name = tensor("qk_41_cast_fp16")]; tensor var_2308_cast_fp16 = softmax(axis = var_2244, x = qk_41_cast_fp16)[name = tensor("op_2308_cast_fp16")]; tensor var_2310_transpose_x_0 = const()[name = tensor("op_2310_transpose_x_0"), val = tensor(false)]; tensor var_2310_transpose_y_0 = const()[name = tensor("op_2310_transpose_y_0"), val = tensor(false)]; tensor transpose_239 = transpose(perm = var_2304, x = var_2303_cast_fp16)[name = tensor("transpose_239")]; tensor var_2310_cast_fp16 = matmul(transpose_x = var_2310_transpose_x_0, transpose_y = var_2310_transpose_y_0, x = var_2308_cast_fp16, y = transpose_239)[name = tensor("op_2310_cast_fp16")]; tensor var_2311 = const()[name = tensor("op_2311"), val = tensor([0, 2, 1, 3])]; tensor concat_20 = const()[name = tensor("concat_20"), val = tensor([1, 1500, 1280])]; tensor transpose_236 = transpose(perm = var_2311, x = var_2310_cast_fp16)[name = tensor("transpose_236")]; tensor x_251_cast_fp16 = reshape(shape = concat_20, x = transpose_236)[name = tensor("x_251_cast_fp16")]; tensor var_2316_to_fp16 = const()[name = tensor("op_2316_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609925504)))]; tensor var_2317_to_fp16 = const()[name = tensor("op_2317_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(613202368)))]; tensor linear_123_cast_fp16 = linear(bias = var_2317_to_fp16, weight = var_2316_to_fp16, x = x_251_cast_fp16)[name = tensor("linear_123_cast_fp16")]; tensor x_253_cast_fp16 = add(x = x_247_cast_fp16, y = linear_123_cast_fp16)[name = tensor("x_253_cast_fp16")]; tensor var_2324_axes_0 = const()[name = tensor("op_2324_axes_0"), val = tensor([-1])]; tensor blocks_20_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_20_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(613204992)))]; tensor blocks_20_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_20_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(613207616)))]; tensor var_2324_cast_fp16 = layer_norm(axes = var_2324_axes_0, beta = blocks_20_mlp_ln_bias_to_fp16, epsilon = var_2250_to_fp16, gamma = blocks_20_mlp_ln_weight_to_fp16, x = x_253_cast_fp16)[name = tensor("op_2324_cast_fp16")]; tensor var_2333_to_fp16 = const()[name = tensor("op_2333_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(613210240)))]; tensor var_2334_to_fp16 = const()[name = tensor("op_2334_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(625662144)))]; tensor linear_124_cast_fp16 = linear(bias = var_2334_to_fp16, weight = var_2333_to_fp16, x = var_2324_cast_fp16)[name = tensor("linear_124_cast_fp16")]; tensor x_257_mode_0 = const()[name = tensor("x_257_mode_0"), val = tensor("EXACT")]; tensor x_257_cast_fp16 = gelu(mode = x_257_mode_0, x = linear_124_cast_fp16)[name = tensor("x_257_cast_fp16")]; tensor var_2339_to_fp16 = const()[name = tensor("op_2339_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(625671936)))]; tensor var_2340_to_fp16 = const()[name = tensor("op_2340_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(638123840)))]; tensor linear_125_cast_fp16 = linear(bias = var_2340_to_fp16, weight = var_2339_to_fp16, x = x_257_cast_fp16)[name = tensor("linear_125_cast_fp16")]; tensor x_259_cast_fp16 = add(x = x_253_cast_fp16, y = linear_125_cast_fp16)[name = tensor("x_259_cast_fp16")]; tensor var_2350 = const()[name = tensor("op_2350"), val = tensor(-1)]; tensor var_2366_axes_0 = const()[name = tensor("op_2366_axes_0"), val = tensor([-1])]; tensor blocks_21_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_21_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(638126464)))]; tensor blocks_21_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_21_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(638129088)))]; tensor var_2356_to_fp16 = const()[name = tensor("op_2356_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2366_cast_fp16 = layer_norm(axes = var_2366_axes_0, beta = blocks_21_attn_ln_bias_to_fp16, epsilon = var_2356_to_fp16, gamma = blocks_21_attn_ln_weight_to_fp16, x = x_259_cast_fp16)[name = tensor("op_2366_cast_fp16")]; tensor var_2377_to_fp16 = const()[name = tensor("op_2377_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(638131712)))]; tensor var_2378_to_fp16 = const()[name = tensor("op_2378_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641408576)))]; tensor linear_126_cast_fp16 = linear(bias = var_2378_to_fp16, weight = var_2377_to_fp16, x = var_2366_cast_fp16)[name = tensor("linear_126_cast_fp16")]; tensor var_2381_to_fp16 = const()[name = tensor("op_2381_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641411200)))]; tensor linear_127_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2381_to_fp16, x = var_2366_cast_fp16)[name = tensor("linear_127_cast_fp16")]; tensor var_2385_to_fp16 = const()[name = tensor("op_2385_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644688064)))]; tensor var_2386_to_fp16 = const()[name = tensor("op_2386_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647964928)))]; tensor linear_128_cast_fp16 = linear(bias = var_2386_to_fp16, weight = var_2385_to_fp16, x = var_2366_cast_fp16)[name = tensor("linear_128_cast_fp16")]; tensor var_2394 = const()[name = tensor("op_2394"), val = tensor([1, 1500, 20, -1])]; tensor var_2395_cast_fp16 = reshape(shape = var_2394, x = linear_126_cast_fp16)[name = tensor("op_2395_cast_fp16")]; tensor const_266_to_fp16 = const()[name = tensor("const_266_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_87_cast_fp16 = mul(x = var_2395_cast_fp16, y = const_266_to_fp16)[name = tensor("q_87_cast_fp16")]; tensor var_2401 = const()[name = tensor("op_2401"), val = tensor([1, 1500, 20, -1])]; tensor var_2402_cast_fp16 = reshape(shape = var_2401, x = linear_127_cast_fp16)[name = tensor("op_2402_cast_fp16")]; tensor const_267_to_fp16 = const()[name = tensor("const_267_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_87_cast_fp16 = mul(x = var_2402_cast_fp16, y = const_267_to_fp16)[name = tensor("k_87_cast_fp16")]; tensor var_2408 = const()[name = tensor("op_2408"), val = tensor([1, 1500, 20, -1])]; tensor var_2409_cast_fp16 = reshape(shape = var_2408, x = linear_128_cast_fp16)[name = tensor("op_2409_cast_fp16")]; tensor var_2410 = const()[name = tensor("op_2410"), val = tensor([0, 2, 1, 3])]; tensor qk_43_transpose_x_0 = const()[name = tensor("qk_43_transpose_x_0"), val = tensor(false)]; tensor qk_43_transpose_y_0 = const()[name = tensor("qk_43_transpose_y_0"), val = tensor(false)]; tensor transpose_170_perm_0 = const()[name = tensor("transpose_170_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_171_perm_0 = const()[name = tensor("transpose_171_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_233 = transpose(perm = transpose_171_perm_0, x = k_87_cast_fp16)[name = tensor("transpose_233")]; tensor transpose_234 = transpose(perm = transpose_170_perm_0, x = q_87_cast_fp16)[name = tensor("transpose_234")]; tensor qk_43_cast_fp16 = matmul(transpose_x = qk_43_transpose_x_0, transpose_y = qk_43_transpose_y_0, x = transpose_234, y = transpose_233)[name = tensor("qk_43_cast_fp16")]; tensor var_2414_cast_fp16 = softmax(axis = var_2350, x = qk_43_cast_fp16)[name = tensor("op_2414_cast_fp16")]; tensor var_2416_transpose_x_0 = const()[name = tensor("op_2416_transpose_x_0"), val = tensor(false)]; tensor var_2416_transpose_y_0 = const()[name = tensor("op_2416_transpose_y_0"), val = tensor(false)]; tensor transpose_235 = transpose(perm = var_2410, x = var_2409_cast_fp16)[name = tensor("transpose_235")]; tensor var_2416_cast_fp16 = matmul(transpose_x = var_2416_transpose_x_0, transpose_y = var_2416_transpose_y_0, x = var_2414_cast_fp16, y = transpose_235)[name = tensor("op_2416_cast_fp16")]; tensor var_2417 = const()[name = tensor("op_2417"), val = tensor([0, 2, 1, 3])]; tensor concat_21 = const()[name = tensor("concat_21"), val = tensor([1, 1500, 1280])]; tensor transpose_232 = transpose(perm = var_2417, x = var_2416_cast_fp16)[name = tensor("transpose_232")]; tensor x_263_cast_fp16 = reshape(shape = concat_21, x = transpose_232)[name = tensor("x_263_cast_fp16")]; tensor var_2422_to_fp16 = const()[name = tensor("op_2422_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647967552)))]; tensor var_2423_to_fp16 = const()[name = tensor("op_2423_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(651244416)))]; tensor linear_129_cast_fp16 = linear(bias = var_2423_to_fp16, weight = var_2422_to_fp16, x = x_263_cast_fp16)[name = tensor("linear_129_cast_fp16")]; tensor x_265_cast_fp16 = add(x = x_259_cast_fp16, y = linear_129_cast_fp16)[name = tensor("x_265_cast_fp16")]; tensor var_2430_axes_0 = const()[name = tensor("op_2430_axes_0"), val = tensor([-1])]; tensor blocks_21_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_21_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(651247040)))]; tensor blocks_21_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_21_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(651249664)))]; tensor var_2430_cast_fp16 = layer_norm(axes = var_2430_axes_0, beta = blocks_21_mlp_ln_bias_to_fp16, epsilon = var_2356_to_fp16, gamma = blocks_21_mlp_ln_weight_to_fp16, x = x_265_cast_fp16)[name = tensor("op_2430_cast_fp16")]; tensor var_2439_to_fp16 = const()[name = tensor("op_2439_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(651252288)))]; tensor var_2440_to_fp16 = const()[name = tensor("op_2440_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(663868032)))]; tensor linear_130_cast_fp16 = linear(bias = var_2440_to_fp16, weight = var_2439_to_fp16, x = var_2430_cast_fp16)[name = tensor("linear_130_cast_fp16")]; tensor x_269_mode_0 = const()[name = tensor("x_269_mode_0"), val = tensor("EXACT")]; tensor x_269_cast_fp16 = gelu(mode = x_269_mode_0, x = linear_130_cast_fp16)[name = tensor("x_269_cast_fp16")]; tensor var_2445_to_fp16 = const()[name = tensor("op_2445_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(663877952)))]; tensor var_2446_to_fp16 = const()[name = tensor("op_2446_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676493696)))]; tensor linear_131_cast_fp16 = linear(bias = var_2446_to_fp16, weight = var_2445_to_fp16, x = x_269_cast_fp16)[name = tensor("linear_131_cast_fp16")]; tensor x_271_cast_fp16 = add(x = x_265_cast_fp16, y = linear_131_cast_fp16)[name = tensor("x_271_cast_fp16")]; tensor var_2456 = const()[name = tensor("op_2456"), val = tensor(-1)]; tensor var_2472_axes_0 = const()[name = tensor("op_2472_axes_0"), val = tensor([-1])]; tensor blocks_22_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_22_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676496320)))]; tensor blocks_22_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_22_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676498944)))]; tensor var_2462_to_fp16 = const()[name = tensor("op_2462_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2472_cast_fp16 = layer_norm(axes = var_2472_axes_0, beta = blocks_22_attn_ln_bias_to_fp16, epsilon = var_2462_to_fp16, gamma = blocks_22_attn_ln_weight_to_fp16, x = x_271_cast_fp16)[name = tensor("op_2472_cast_fp16")]; tensor var_2483_to_fp16 = const()[name = tensor("op_2483_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676501568)))]; tensor var_2484_to_fp16 = const()[name = tensor("op_2484_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(679778432)))]; tensor linear_132_cast_fp16 = linear(bias = var_2484_to_fp16, weight = var_2483_to_fp16, x = var_2472_cast_fp16)[name = tensor("linear_132_cast_fp16")]; tensor var_2487_to_fp16 = const()[name = tensor("op_2487_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(679781056)))]; tensor linear_133_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2487_to_fp16, x = var_2472_cast_fp16)[name = tensor("linear_133_cast_fp16")]; tensor var_2491_to_fp16 = const()[name = tensor("op_2491_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683057920)))]; tensor var_2492_to_fp16 = const()[name = tensor("op_2492_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686334784)))]; tensor linear_134_cast_fp16 = linear(bias = var_2492_to_fp16, weight = var_2491_to_fp16, x = var_2472_cast_fp16)[name = tensor("linear_134_cast_fp16")]; tensor var_2500 = const()[name = tensor("op_2500"), val = tensor([1, 1500, 20, -1])]; tensor var_2501_cast_fp16 = reshape(shape = var_2500, x = linear_132_cast_fp16)[name = tensor("op_2501_cast_fp16")]; tensor const_268_to_fp16 = const()[name = tensor("const_268_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_91_cast_fp16 = mul(x = var_2501_cast_fp16, y = const_268_to_fp16)[name = tensor("q_91_cast_fp16")]; tensor var_2507 = const()[name = tensor("op_2507"), val = tensor([1, 1500, 20, -1])]; tensor var_2508_cast_fp16 = reshape(shape = var_2507, x = linear_133_cast_fp16)[name = tensor("op_2508_cast_fp16")]; tensor const_269_to_fp16 = const()[name = tensor("const_269_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_91_cast_fp16 = mul(x = var_2508_cast_fp16, y = const_269_to_fp16)[name = tensor("k_91_cast_fp16")]; tensor var_2514 = const()[name = tensor("op_2514"), val = tensor([1, 1500, 20, -1])]; tensor var_2515_cast_fp16 = reshape(shape = var_2514, x = linear_134_cast_fp16)[name = tensor("op_2515_cast_fp16")]; tensor var_2516 = const()[name = tensor("op_2516"), val = tensor([0, 2, 1, 3])]; tensor qk_45_transpose_x_0 = const()[name = tensor("qk_45_transpose_x_0"), val = tensor(false)]; tensor qk_45_transpose_y_0 = const()[name = tensor("qk_45_transpose_y_0"), val = tensor(false)]; tensor transpose_172_perm_0 = const()[name = tensor("transpose_172_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_173_perm_0 = const()[name = tensor("transpose_173_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_229 = transpose(perm = transpose_173_perm_0, x = k_91_cast_fp16)[name = tensor("transpose_229")]; tensor transpose_230 = transpose(perm = transpose_172_perm_0, x = q_91_cast_fp16)[name = tensor("transpose_230")]; tensor qk_45_cast_fp16 = matmul(transpose_x = qk_45_transpose_x_0, transpose_y = qk_45_transpose_y_0, x = transpose_230, y = transpose_229)[name = tensor("qk_45_cast_fp16")]; tensor var_2520_cast_fp16 = softmax(axis = var_2456, x = qk_45_cast_fp16)[name = tensor("op_2520_cast_fp16")]; tensor var_2522_transpose_x_0 = const()[name = tensor("op_2522_transpose_x_0"), val = tensor(false)]; tensor var_2522_transpose_y_0 = const()[name = tensor("op_2522_transpose_y_0"), val = tensor(false)]; tensor transpose_231 = transpose(perm = var_2516, x = var_2515_cast_fp16)[name = tensor("transpose_231")]; tensor var_2522_cast_fp16 = matmul(transpose_x = var_2522_transpose_x_0, transpose_y = var_2522_transpose_y_0, x = var_2520_cast_fp16, y = transpose_231)[name = tensor("op_2522_cast_fp16")]; tensor var_2523 = const()[name = tensor("op_2523"), val = tensor([0, 2, 1, 3])]; tensor concat_22 = const()[name = tensor("concat_22"), val = tensor([1, 1500, 1280])]; tensor transpose_228 = transpose(perm = var_2523, x = var_2522_cast_fp16)[name = tensor("transpose_228")]; tensor x_275_cast_fp16 = reshape(shape = concat_22, x = transpose_228)[name = tensor("x_275_cast_fp16")]; tensor var_2528_to_fp16 = const()[name = tensor("op_2528_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(686337408)))]; tensor var_2529_to_fp16 = const()[name = tensor("op_2529_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(689614272)))]; tensor linear_135_cast_fp16 = linear(bias = var_2529_to_fp16, weight = var_2528_to_fp16, x = x_275_cast_fp16)[name = tensor("linear_135_cast_fp16")]; tensor x_277_cast_fp16 = add(x = x_271_cast_fp16, y = linear_135_cast_fp16)[name = tensor("x_277_cast_fp16")]; tensor var_2536_axes_0 = const()[name = tensor("op_2536_axes_0"), val = tensor([-1])]; tensor blocks_22_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_22_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(689616896)))]; tensor blocks_22_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_22_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(689619520)))]; tensor var_2536_cast_fp16 = layer_norm(axes = var_2536_axes_0, beta = blocks_22_mlp_ln_bias_to_fp16, epsilon = var_2462_to_fp16, gamma = blocks_22_mlp_ln_weight_to_fp16, x = x_277_cast_fp16)[name = tensor("op_2536_cast_fp16")]; tensor var_2545_to_fp16 = const()[name = tensor("op_2545_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(689622144)))]; tensor var_2546_to_fp16 = const()[name = tensor("op_2546_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702401728)))]; tensor linear_136_cast_fp16 = linear(bias = var_2546_to_fp16, weight = var_2545_to_fp16, x = var_2536_cast_fp16)[name = tensor("linear_136_cast_fp16")]; tensor x_281_mode_0 = const()[name = tensor("x_281_mode_0"), val = tensor("EXACT")]; tensor x_281_cast_fp16 = gelu(mode = x_281_mode_0, x = linear_136_cast_fp16)[name = tensor("x_281_cast_fp16")]; tensor var_2551_to_fp16 = const()[name = tensor("op_2551_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702411776)))]; tensor var_2552_to_fp16 = const()[name = tensor("op_2552_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715191360)))]; tensor linear_137_cast_fp16 = linear(bias = var_2552_to_fp16, weight = var_2551_to_fp16, x = x_281_cast_fp16)[name = tensor("linear_137_cast_fp16")]; tensor x_283_cast_fp16 = add(x = x_277_cast_fp16, y = linear_137_cast_fp16)[name = tensor("x_283_cast_fp16")]; tensor var_2562 = const()[name = tensor("op_2562"), val = tensor(-1)]; tensor var_2578_axes_0 = const()[name = tensor("op_2578_axes_0"), val = tensor([-1])]; tensor blocks_23_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_23_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715193984)))]; tensor blocks_23_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_23_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715196608)))]; tensor var_2568_to_fp16 = const()[name = tensor("op_2568_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2578_cast_fp16 = layer_norm(axes = var_2578_axes_0, beta = blocks_23_attn_ln_bias_to_fp16, epsilon = var_2568_to_fp16, gamma = blocks_23_attn_ln_weight_to_fp16, x = x_283_cast_fp16)[name = tensor("op_2578_cast_fp16")]; tensor var_2589_to_fp16 = const()[name = tensor("op_2589_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715199232)))]; tensor var_2590_to_fp16 = const()[name = tensor("op_2590_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(718476096)))]; tensor linear_138_cast_fp16 = linear(bias = var_2590_to_fp16, weight = var_2589_to_fp16, x = var_2578_cast_fp16)[name = tensor("linear_138_cast_fp16")]; tensor var_2593_to_fp16 = const()[name = tensor("op_2593_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(718478720)))]; tensor linear_139_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2593_to_fp16, x = var_2578_cast_fp16)[name = tensor("linear_139_cast_fp16")]; tensor var_2597_to_fp16 = const()[name = tensor("op_2597_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(721755584)))]; tensor var_2598_to_fp16 = const()[name = tensor("op_2598_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(725032448)))]; tensor linear_140_cast_fp16 = linear(bias = var_2598_to_fp16, weight = var_2597_to_fp16, x = var_2578_cast_fp16)[name = tensor("linear_140_cast_fp16")]; tensor var_2606 = const()[name = tensor("op_2606"), val = tensor([1, 1500, 20, -1])]; tensor var_2607_cast_fp16 = reshape(shape = var_2606, x = linear_138_cast_fp16)[name = tensor("op_2607_cast_fp16")]; tensor const_270_to_fp16 = const()[name = tensor("const_270_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_95_cast_fp16 = mul(x = var_2607_cast_fp16, y = const_270_to_fp16)[name = tensor("q_95_cast_fp16")]; tensor var_2613 = const()[name = tensor("op_2613"), val = tensor([1, 1500, 20, -1])]; tensor var_2614_cast_fp16 = reshape(shape = var_2613, x = linear_139_cast_fp16)[name = tensor("op_2614_cast_fp16")]; tensor const_271_to_fp16 = const()[name = tensor("const_271_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_95_cast_fp16 = mul(x = var_2614_cast_fp16, y = const_271_to_fp16)[name = tensor("k_95_cast_fp16")]; tensor var_2620 = const()[name = tensor("op_2620"), val = tensor([1, 1500, 20, -1])]; tensor var_2621_cast_fp16 = reshape(shape = var_2620, x = linear_140_cast_fp16)[name = tensor("op_2621_cast_fp16")]; tensor var_2622 = const()[name = tensor("op_2622"), val = tensor([0, 2, 1, 3])]; tensor qk_47_transpose_x_0 = const()[name = tensor("qk_47_transpose_x_0"), val = tensor(false)]; tensor qk_47_transpose_y_0 = const()[name = tensor("qk_47_transpose_y_0"), val = tensor(false)]; tensor transpose_174_perm_0 = const()[name = tensor("transpose_174_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_175_perm_0 = const()[name = tensor("transpose_175_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_225 = transpose(perm = transpose_175_perm_0, x = k_95_cast_fp16)[name = tensor("transpose_225")]; tensor transpose_226 = transpose(perm = transpose_174_perm_0, x = q_95_cast_fp16)[name = tensor("transpose_226")]; tensor qk_47_cast_fp16 = matmul(transpose_x = qk_47_transpose_x_0, transpose_y = qk_47_transpose_y_0, x = transpose_226, y = transpose_225)[name = tensor("qk_47_cast_fp16")]; tensor var_2626_cast_fp16 = softmax(axis = var_2562, x = qk_47_cast_fp16)[name = tensor("op_2626_cast_fp16")]; tensor var_2628_transpose_x_0 = const()[name = tensor("op_2628_transpose_x_0"), val = tensor(false)]; tensor var_2628_transpose_y_0 = const()[name = tensor("op_2628_transpose_y_0"), val = tensor(false)]; tensor transpose_227 = transpose(perm = var_2622, x = var_2621_cast_fp16)[name = tensor("transpose_227")]; tensor var_2628_cast_fp16 = matmul(transpose_x = var_2628_transpose_x_0, transpose_y = var_2628_transpose_y_0, x = var_2626_cast_fp16, y = transpose_227)[name = tensor("op_2628_cast_fp16")]; tensor var_2629 = const()[name = tensor("op_2629"), val = tensor([0, 2, 1, 3])]; tensor concat_23 = const()[name = tensor("concat_23"), val = tensor([1, 1500, 1280])]; tensor transpose_224 = transpose(perm = var_2629, x = var_2628_cast_fp16)[name = tensor("transpose_224")]; tensor x_287_cast_fp16 = reshape(shape = concat_23, x = transpose_224)[name = tensor("x_287_cast_fp16")]; tensor var_2634_to_fp16 = const()[name = tensor("op_2634_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(725035072)))]; tensor var_2635_to_fp16 = const()[name = tensor("op_2635_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728311936)))]; tensor linear_141_cast_fp16 = linear(bias = var_2635_to_fp16, weight = var_2634_to_fp16, x = x_287_cast_fp16)[name = tensor("linear_141_cast_fp16")]; tensor x_289_cast_fp16 = add(x = x_283_cast_fp16, y = linear_141_cast_fp16)[name = tensor("x_289_cast_fp16")]; tensor var_2642_axes_0 = const()[name = tensor("op_2642_axes_0"), val = tensor([-1])]; tensor blocks_23_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_23_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728314560)))]; tensor blocks_23_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_23_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728317184)))]; tensor var_2642_cast_fp16 = layer_norm(axes = var_2642_axes_0, beta = blocks_23_mlp_ln_bias_to_fp16, epsilon = var_2568_to_fp16, gamma = blocks_23_mlp_ln_weight_to_fp16, x = x_289_cast_fp16)[name = tensor("op_2642_cast_fp16")]; tensor var_2651_to_fp16 = const()[name = tensor("op_2651_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(728319808)))]; tensor var_2652_to_fp16 = const()[name = tensor("op_2652_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(741181312)))]; tensor linear_142_cast_fp16 = linear(bias = var_2652_to_fp16, weight = var_2651_to_fp16, x = var_2642_cast_fp16)[name = tensor("linear_142_cast_fp16")]; tensor x_293_mode_0 = const()[name = tensor("x_293_mode_0"), val = tensor("EXACT")]; tensor x_293_cast_fp16 = gelu(mode = x_293_mode_0, x = linear_142_cast_fp16)[name = tensor("x_293_cast_fp16")]; tensor var_2657_to_fp16 = const()[name = tensor("op_2657_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(741191424)))]; tensor var_2658_to_fp16 = const()[name = tensor("op_2658_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754052928)))]; tensor linear_143_cast_fp16 = linear(bias = var_2658_to_fp16, weight = var_2657_to_fp16, x = x_293_cast_fp16)[name = tensor("linear_143_cast_fp16")]; tensor x_295_cast_fp16 = add(x = x_289_cast_fp16, y = linear_143_cast_fp16)[name = tensor("x_295_cast_fp16")]; tensor var_2668 = const()[name = tensor("op_2668"), val = tensor(-1)]; tensor var_2684_axes_0 = const()[name = tensor("op_2684_axes_0"), val = tensor([-1])]; tensor blocks_24_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_24_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754055552)))]; tensor blocks_24_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_24_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754058176)))]; tensor var_2674_to_fp16 = const()[name = tensor("op_2674_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2684_cast_fp16 = layer_norm(axes = var_2684_axes_0, beta = blocks_24_attn_ln_bias_to_fp16, epsilon = var_2674_to_fp16, gamma = blocks_24_attn_ln_weight_to_fp16, x = x_295_cast_fp16)[name = tensor("op_2684_cast_fp16")]; tensor var_2695_to_fp16 = const()[name = tensor("op_2695_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754060800)))]; tensor var_2696_to_fp16 = const()[name = tensor("op_2696_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757337664)))]; tensor linear_144_cast_fp16 = linear(bias = var_2696_to_fp16, weight = var_2695_to_fp16, x = var_2684_cast_fp16)[name = tensor("linear_144_cast_fp16")]; tensor var_2699_to_fp16 = const()[name = tensor("op_2699_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757340288)))]; tensor linear_145_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2699_to_fp16, x = var_2684_cast_fp16)[name = tensor("linear_145_cast_fp16")]; tensor var_2703_to_fp16 = const()[name = tensor("op_2703_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760617152)))]; tensor var_2704_to_fp16 = const()[name = tensor("op_2704_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(763894016)))]; tensor linear_146_cast_fp16 = linear(bias = var_2704_to_fp16, weight = var_2703_to_fp16, x = var_2684_cast_fp16)[name = tensor("linear_146_cast_fp16")]; tensor var_2712 = const()[name = tensor("op_2712"), val = tensor([1, 1500, 20, -1])]; tensor var_2713_cast_fp16 = reshape(shape = var_2712, x = linear_144_cast_fp16)[name = tensor("op_2713_cast_fp16")]; tensor const_272_to_fp16 = const()[name = tensor("const_272_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_99_cast_fp16 = mul(x = var_2713_cast_fp16, y = const_272_to_fp16)[name = tensor("q_99_cast_fp16")]; tensor var_2719 = const()[name = tensor("op_2719"), val = tensor([1, 1500, 20, -1])]; tensor var_2720_cast_fp16 = reshape(shape = var_2719, x = linear_145_cast_fp16)[name = tensor("op_2720_cast_fp16")]; tensor const_273_to_fp16 = const()[name = tensor("const_273_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_99_cast_fp16 = mul(x = var_2720_cast_fp16, y = const_273_to_fp16)[name = tensor("k_99_cast_fp16")]; tensor var_2726 = const()[name = tensor("op_2726"), val = tensor([1, 1500, 20, -1])]; tensor var_2727_cast_fp16 = reshape(shape = var_2726, x = linear_146_cast_fp16)[name = tensor("op_2727_cast_fp16")]; tensor var_2728 = const()[name = tensor("op_2728"), val = tensor([0, 2, 1, 3])]; tensor qk_49_transpose_x_0 = const()[name = tensor("qk_49_transpose_x_0"), val = tensor(false)]; tensor qk_49_transpose_y_0 = const()[name = tensor("qk_49_transpose_y_0"), val = tensor(false)]; tensor transpose_176_perm_0 = const()[name = tensor("transpose_176_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_177_perm_0 = const()[name = tensor("transpose_177_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_221 = transpose(perm = transpose_177_perm_0, x = k_99_cast_fp16)[name = tensor("transpose_221")]; tensor transpose_222 = transpose(perm = transpose_176_perm_0, x = q_99_cast_fp16)[name = tensor("transpose_222")]; tensor qk_49_cast_fp16 = matmul(transpose_x = qk_49_transpose_x_0, transpose_y = qk_49_transpose_y_0, x = transpose_222, y = transpose_221)[name = tensor("qk_49_cast_fp16")]; tensor var_2732_cast_fp16 = softmax(axis = var_2668, x = qk_49_cast_fp16)[name = tensor("op_2732_cast_fp16")]; tensor var_2734_transpose_x_0 = const()[name = tensor("op_2734_transpose_x_0"), val = tensor(false)]; tensor var_2734_transpose_y_0 = const()[name = tensor("op_2734_transpose_y_0"), val = tensor(false)]; tensor transpose_223 = transpose(perm = var_2728, x = var_2727_cast_fp16)[name = tensor("transpose_223")]; tensor var_2734_cast_fp16 = matmul(transpose_x = var_2734_transpose_x_0, transpose_y = var_2734_transpose_y_0, x = var_2732_cast_fp16, y = transpose_223)[name = tensor("op_2734_cast_fp16")]; tensor var_2735 = const()[name = tensor("op_2735"), val = tensor([0, 2, 1, 3])]; tensor concat_24 = const()[name = tensor("concat_24"), val = tensor([1, 1500, 1280])]; tensor transpose_220 = transpose(perm = var_2735, x = var_2734_cast_fp16)[name = tensor("transpose_220")]; tensor x_299_cast_fp16 = reshape(shape = concat_24, x = transpose_220)[name = tensor("x_299_cast_fp16")]; tensor var_2740_to_fp16 = const()[name = tensor("op_2740_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(763896640)))]; tensor var_2741_to_fp16 = const()[name = tensor("op_2741_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(767173504)))]; tensor linear_147_cast_fp16 = linear(bias = var_2741_to_fp16, weight = var_2740_to_fp16, x = x_299_cast_fp16)[name = tensor("linear_147_cast_fp16")]; tensor x_301_cast_fp16 = add(x = x_295_cast_fp16, y = linear_147_cast_fp16)[name = tensor("x_301_cast_fp16")]; tensor var_2748_axes_0 = const()[name = tensor("op_2748_axes_0"), val = tensor([-1])]; tensor blocks_24_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_24_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(767176128)))]; tensor blocks_24_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_24_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(767178752)))]; tensor var_2748_cast_fp16 = layer_norm(axes = var_2748_axes_0, beta = blocks_24_mlp_ln_bias_to_fp16, epsilon = var_2674_to_fp16, gamma = blocks_24_mlp_ln_weight_to_fp16, x = x_301_cast_fp16)[name = tensor("op_2748_cast_fp16")]; tensor var_2757_to_fp16 = const()[name = tensor("op_2757_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(767181376)))]; tensor var_2758_to_fp16 = const()[name = tensor("op_2758_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780042880)))]; tensor linear_148_cast_fp16 = linear(bias = var_2758_to_fp16, weight = var_2757_to_fp16, x = var_2748_cast_fp16)[name = tensor("linear_148_cast_fp16")]; tensor x_305_mode_0 = const()[name = tensor("x_305_mode_0"), val = tensor("EXACT")]; tensor x_305_cast_fp16 = gelu(mode = x_305_mode_0, x = linear_148_cast_fp16)[name = tensor("x_305_cast_fp16")]; tensor var_2763_to_fp16 = const()[name = tensor("op_2763_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780052992)))]; tensor var_2764_to_fp16 = const()[name = tensor("op_2764_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792914496)))]; tensor linear_149_cast_fp16 = linear(bias = var_2764_to_fp16, weight = var_2763_to_fp16, x = x_305_cast_fp16)[name = tensor("linear_149_cast_fp16")]; tensor x_307_cast_fp16 = add(x = x_301_cast_fp16, y = linear_149_cast_fp16)[name = tensor("x_307_cast_fp16")]; tensor var_2774 = const()[name = tensor("op_2774"), val = tensor(-1)]; tensor var_2790_axes_0 = const()[name = tensor("op_2790_axes_0"), val = tensor([-1])]; tensor blocks_25_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_25_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792917120)))]; tensor blocks_25_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_25_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792919744)))]; tensor var_2780_to_fp16 = const()[name = tensor("op_2780_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2790_cast_fp16 = layer_norm(axes = var_2790_axes_0, beta = blocks_25_attn_ln_bias_to_fp16, epsilon = var_2780_to_fp16, gamma = blocks_25_attn_ln_weight_to_fp16, x = x_307_cast_fp16)[name = tensor("op_2790_cast_fp16")]; tensor var_2801_to_fp16 = const()[name = tensor("op_2801_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792922368)))]; tensor var_2802_to_fp16 = const()[name = tensor("op_2802_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(796199232)))]; tensor linear_150_cast_fp16 = linear(bias = var_2802_to_fp16, weight = var_2801_to_fp16, x = var_2790_cast_fp16)[name = tensor("linear_150_cast_fp16")]; tensor var_2805_to_fp16 = const()[name = tensor("op_2805_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(796201856)))]; tensor linear_151_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2805_to_fp16, x = var_2790_cast_fp16)[name = tensor("linear_151_cast_fp16")]; tensor var_2809_to_fp16 = const()[name = tensor("op_2809_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(799478720)))]; tensor var_2810_to_fp16 = const()[name = tensor("op_2810_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(802755584)))]; tensor linear_152_cast_fp16 = linear(bias = var_2810_to_fp16, weight = var_2809_to_fp16, x = var_2790_cast_fp16)[name = tensor("linear_152_cast_fp16")]; tensor var_2818 = const()[name = tensor("op_2818"), val = tensor([1, 1500, 20, -1])]; tensor var_2819_cast_fp16 = reshape(shape = var_2818, x = linear_150_cast_fp16)[name = tensor("op_2819_cast_fp16")]; tensor const_274_to_fp16 = const()[name = tensor("const_274_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_103_cast_fp16 = mul(x = var_2819_cast_fp16, y = const_274_to_fp16)[name = tensor("q_103_cast_fp16")]; tensor var_2825 = const()[name = tensor("op_2825"), val = tensor([1, 1500, 20, -1])]; tensor var_2826_cast_fp16 = reshape(shape = var_2825, x = linear_151_cast_fp16)[name = tensor("op_2826_cast_fp16")]; tensor const_275_to_fp16 = const()[name = tensor("const_275_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_103_cast_fp16 = mul(x = var_2826_cast_fp16, y = const_275_to_fp16)[name = tensor("k_103_cast_fp16")]; tensor var_2832 = const()[name = tensor("op_2832"), val = tensor([1, 1500, 20, -1])]; tensor var_2833_cast_fp16 = reshape(shape = var_2832, x = linear_152_cast_fp16)[name = tensor("op_2833_cast_fp16")]; tensor var_2834 = const()[name = tensor("op_2834"), val = tensor([0, 2, 1, 3])]; tensor qk_51_transpose_x_0 = const()[name = tensor("qk_51_transpose_x_0"), val = tensor(false)]; tensor qk_51_transpose_y_0 = const()[name = tensor("qk_51_transpose_y_0"), val = tensor(false)]; tensor transpose_178_perm_0 = const()[name = tensor("transpose_178_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_179_perm_0 = const()[name = tensor("transpose_179_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_217 = transpose(perm = transpose_179_perm_0, x = k_103_cast_fp16)[name = tensor("transpose_217")]; tensor transpose_218 = transpose(perm = transpose_178_perm_0, x = q_103_cast_fp16)[name = tensor("transpose_218")]; tensor qk_51_cast_fp16 = matmul(transpose_x = qk_51_transpose_x_0, transpose_y = qk_51_transpose_y_0, x = transpose_218, y = transpose_217)[name = tensor("qk_51_cast_fp16")]; tensor var_2838_cast_fp16 = softmax(axis = var_2774, x = qk_51_cast_fp16)[name = tensor("op_2838_cast_fp16")]; tensor var_2840_transpose_x_0 = const()[name = tensor("op_2840_transpose_x_0"), val = tensor(false)]; tensor var_2840_transpose_y_0 = const()[name = tensor("op_2840_transpose_y_0"), val = tensor(false)]; tensor transpose_219 = transpose(perm = var_2834, x = var_2833_cast_fp16)[name = tensor("transpose_219")]; tensor var_2840_cast_fp16 = matmul(transpose_x = var_2840_transpose_x_0, transpose_y = var_2840_transpose_y_0, x = var_2838_cast_fp16, y = transpose_219)[name = tensor("op_2840_cast_fp16")]; tensor var_2841 = const()[name = tensor("op_2841"), val = tensor([0, 2, 1, 3])]; tensor concat_25 = const()[name = tensor("concat_25"), val = tensor([1, 1500, 1280])]; tensor transpose_216 = transpose(perm = var_2841, x = var_2840_cast_fp16)[name = tensor("transpose_216")]; tensor x_311_cast_fp16 = reshape(shape = concat_25, x = transpose_216)[name = tensor("x_311_cast_fp16")]; tensor var_2846_to_fp16 = const()[name = tensor("op_2846_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(802758208)))]; tensor var_2847_to_fp16 = const()[name = tensor("op_2847_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(806035072)))]; tensor linear_153_cast_fp16 = linear(bias = var_2847_to_fp16, weight = var_2846_to_fp16, x = x_311_cast_fp16)[name = tensor("linear_153_cast_fp16")]; tensor x_313_cast_fp16 = add(x = x_307_cast_fp16, y = linear_153_cast_fp16)[name = tensor("x_313_cast_fp16")]; tensor var_2854_axes_0 = const()[name = tensor("op_2854_axes_0"), val = tensor([-1])]; tensor blocks_25_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_25_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(806037696)))]; tensor blocks_25_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_25_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(806040320)))]; tensor var_2854_cast_fp16 = layer_norm(axes = var_2854_axes_0, beta = blocks_25_mlp_ln_bias_to_fp16, epsilon = var_2780_to_fp16, gamma = blocks_25_mlp_ln_weight_to_fp16, x = x_313_cast_fp16)[name = tensor("op_2854_cast_fp16")]; tensor var_2863_to_fp16 = const()[name = tensor("op_2863_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(806042944)))]; tensor var_2864_to_fp16 = const()[name = tensor("op_2864_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(818822528)))]; tensor linear_154_cast_fp16 = linear(bias = var_2864_to_fp16, weight = var_2863_to_fp16, x = var_2854_cast_fp16)[name = tensor("linear_154_cast_fp16")]; tensor x_317_mode_0 = const()[name = tensor("x_317_mode_0"), val = tensor("EXACT")]; tensor x_317_cast_fp16 = gelu(mode = x_317_mode_0, x = linear_154_cast_fp16)[name = tensor("x_317_cast_fp16")]; tensor var_2869_to_fp16 = const()[name = tensor("op_2869_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(818832576)))]; tensor var_2870_to_fp16 = const()[name = tensor("op_2870_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(831612160)))]; tensor linear_155_cast_fp16 = linear(bias = var_2870_to_fp16, weight = var_2869_to_fp16, x = x_317_cast_fp16)[name = tensor("linear_155_cast_fp16")]; tensor x_319_cast_fp16 = add(x = x_313_cast_fp16, y = linear_155_cast_fp16)[name = tensor("x_319_cast_fp16")]; tensor var_2880 = const()[name = tensor("op_2880"), val = tensor(-1)]; tensor var_2896_axes_0 = const()[name = tensor("op_2896_axes_0"), val = tensor([-1])]; tensor blocks_26_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_26_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(831614784)))]; tensor blocks_26_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_26_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(831617408)))]; tensor var_2886_to_fp16 = const()[name = tensor("op_2886_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2896_cast_fp16 = layer_norm(axes = var_2896_axes_0, beta = blocks_26_attn_ln_bias_to_fp16, epsilon = var_2886_to_fp16, gamma = blocks_26_attn_ln_weight_to_fp16, x = x_319_cast_fp16)[name = tensor("op_2896_cast_fp16")]; tensor var_2907_to_fp16 = const()[name = tensor("op_2907_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(831620032)))]; tensor var_2908_to_fp16 = const()[name = tensor("op_2908_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(834896896)))]; tensor linear_156_cast_fp16 = linear(bias = var_2908_to_fp16, weight = var_2907_to_fp16, x = var_2896_cast_fp16)[name = tensor("linear_156_cast_fp16")]; tensor var_2911_to_fp16 = const()[name = tensor("op_2911_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(834899520)))]; tensor linear_157_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_2911_to_fp16, x = var_2896_cast_fp16)[name = tensor("linear_157_cast_fp16")]; tensor var_2915_to_fp16 = const()[name = tensor("op_2915_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(838176384)))]; tensor var_2916_to_fp16 = const()[name = tensor("op_2916_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841453248)))]; tensor linear_158_cast_fp16 = linear(bias = var_2916_to_fp16, weight = var_2915_to_fp16, x = var_2896_cast_fp16)[name = tensor("linear_158_cast_fp16")]; tensor var_2924 = const()[name = tensor("op_2924"), val = tensor([1, 1500, 20, -1])]; tensor var_2925_cast_fp16 = reshape(shape = var_2924, x = linear_156_cast_fp16)[name = tensor("op_2925_cast_fp16")]; tensor const_276_to_fp16 = const()[name = tensor("const_276_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_107_cast_fp16 = mul(x = var_2925_cast_fp16, y = const_276_to_fp16)[name = tensor("q_107_cast_fp16")]; tensor var_2931 = const()[name = tensor("op_2931"), val = tensor([1, 1500, 20, -1])]; tensor var_2932_cast_fp16 = reshape(shape = var_2931, x = linear_157_cast_fp16)[name = tensor("op_2932_cast_fp16")]; tensor const_277_to_fp16 = const()[name = tensor("const_277_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_107_cast_fp16 = mul(x = var_2932_cast_fp16, y = const_277_to_fp16)[name = tensor("k_107_cast_fp16")]; tensor var_2938 = const()[name = tensor("op_2938"), val = tensor([1, 1500, 20, -1])]; tensor var_2939_cast_fp16 = reshape(shape = var_2938, x = linear_158_cast_fp16)[name = tensor("op_2939_cast_fp16")]; tensor var_2940 = const()[name = tensor("op_2940"), val = tensor([0, 2, 1, 3])]; tensor qk_53_transpose_x_0 = const()[name = tensor("qk_53_transpose_x_0"), val = tensor(false)]; tensor qk_53_transpose_y_0 = const()[name = tensor("qk_53_transpose_y_0"), val = tensor(false)]; tensor transpose_180_perm_0 = const()[name = tensor("transpose_180_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_181_perm_0 = const()[name = tensor("transpose_181_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_213 = transpose(perm = transpose_181_perm_0, x = k_107_cast_fp16)[name = tensor("transpose_213")]; tensor transpose_214 = transpose(perm = transpose_180_perm_0, x = q_107_cast_fp16)[name = tensor("transpose_214")]; tensor qk_53_cast_fp16 = matmul(transpose_x = qk_53_transpose_x_0, transpose_y = qk_53_transpose_y_0, x = transpose_214, y = transpose_213)[name = tensor("qk_53_cast_fp16")]; tensor var_2944_cast_fp16 = softmax(axis = var_2880, x = qk_53_cast_fp16)[name = tensor("op_2944_cast_fp16")]; tensor var_2946_transpose_x_0 = const()[name = tensor("op_2946_transpose_x_0"), val = tensor(false)]; tensor var_2946_transpose_y_0 = const()[name = tensor("op_2946_transpose_y_0"), val = tensor(false)]; tensor transpose_215 = transpose(perm = var_2940, x = var_2939_cast_fp16)[name = tensor("transpose_215")]; tensor var_2946_cast_fp16 = matmul(transpose_x = var_2946_transpose_x_0, transpose_y = var_2946_transpose_y_0, x = var_2944_cast_fp16, y = transpose_215)[name = tensor("op_2946_cast_fp16")]; tensor var_2947 = const()[name = tensor("op_2947"), val = tensor([0, 2, 1, 3])]; tensor concat_26 = const()[name = tensor("concat_26"), val = tensor([1, 1500, 1280])]; tensor transpose_212 = transpose(perm = var_2947, x = var_2946_cast_fp16)[name = tensor("transpose_212")]; tensor x_323_cast_fp16 = reshape(shape = concat_26, x = transpose_212)[name = tensor("x_323_cast_fp16")]; tensor var_2952_to_fp16 = const()[name = tensor("op_2952_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(841455872)))]; tensor var_2953_to_fp16 = const()[name = tensor("op_2953_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844732736)))]; tensor linear_159_cast_fp16 = linear(bias = var_2953_to_fp16, weight = var_2952_to_fp16, x = x_323_cast_fp16)[name = tensor("linear_159_cast_fp16")]; tensor x_325_cast_fp16 = add(x = x_319_cast_fp16, y = linear_159_cast_fp16)[name = tensor("x_325_cast_fp16")]; tensor var_2960_axes_0 = const()[name = tensor("op_2960_axes_0"), val = tensor([-1])]; tensor blocks_26_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_26_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844735360)))]; tensor blocks_26_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_26_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844737984)))]; tensor var_2960_cast_fp16 = layer_norm(axes = var_2960_axes_0, beta = blocks_26_mlp_ln_bias_to_fp16, epsilon = var_2886_to_fp16, gamma = blocks_26_mlp_ln_weight_to_fp16, x = x_325_cast_fp16)[name = tensor("op_2960_cast_fp16")]; tensor var_2969_to_fp16 = const()[name = tensor("op_2969_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(844740608)))]; tensor var_2970_to_fp16 = const()[name = tensor("op_2970_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(857520192)))]; tensor linear_160_cast_fp16 = linear(bias = var_2970_to_fp16, weight = var_2969_to_fp16, x = var_2960_cast_fp16)[name = tensor("linear_160_cast_fp16")]; tensor x_329_mode_0 = const()[name = tensor("x_329_mode_0"), val = tensor("EXACT")]; tensor x_329_cast_fp16 = gelu(mode = x_329_mode_0, x = linear_160_cast_fp16)[name = tensor("x_329_cast_fp16")]; tensor var_2975_to_fp16 = const()[name = tensor("op_2975_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(857530240)))]; tensor var_2976_to_fp16 = const()[name = tensor("op_2976_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(870309824)))]; tensor linear_161_cast_fp16 = linear(bias = var_2976_to_fp16, weight = var_2975_to_fp16, x = x_329_cast_fp16)[name = tensor("linear_161_cast_fp16")]; tensor x_331_cast_fp16 = add(x = x_325_cast_fp16, y = linear_161_cast_fp16)[name = tensor("x_331_cast_fp16")]; tensor var_2986 = const()[name = tensor("op_2986"), val = tensor(-1)]; tensor var_3002_axes_0 = const()[name = tensor("op_3002_axes_0"), val = tensor([-1])]; tensor blocks_27_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_27_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(870312448)))]; tensor blocks_27_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_27_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(870315072)))]; tensor var_2992_to_fp16 = const()[name = tensor("op_2992_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3002_cast_fp16 = layer_norm(axes = var_3002_axes_0, beta = blocks_27_attn_ln_bias_to_fp16, epsilon = var_2992_to_fp16, gamma = blocks_27_attn_ln_weight_to_fp16, x = x_331_cast_fp16)[name = tensor("op_3002_cast_fp16")]; tensor var_3013_to_fp16 = const()[name = tensor("op_3013_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(870317696)))]; tensor var_3014_to_fp16 = const()[name = tensor("op_3014_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(873594560)))]; tensor linear_162_cast_fp16 = linear(bias = var_3014_to_fp16, weight = var_3013_to_fp16, x = var_3002_cast_fp16)[name = tensor("linear_162_cast_fp16")]; tensor var_3017_to_fp16 = const()[name = tensor("op_3017_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(873597184)))]; tensor linear_163_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_3017_to_fp16, x = var_3002_cast_fp16)[name = tensor("linear_163_cast_fp16")]; tensor var_3021_to_fp16 = const()[name = tensor("op_3021_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(876874048)))]; tensor var_3022_to_fp16 = const()[name = tensor("op_3022_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880150912)))]; tensor linear_164_cast_fp16 = linear(bias = var_3022_to_fp16, weight = var_3021_to_fp16, x = var_3002_cast_fp16)[name = tensor("linear_164_cast_fp16")]; tensor var_3030 = const()[name = tensor("op_3030"), val = tensor([1, 1500, 20, -1])]; tensor var_3031_cast_fp16 = reshape(shape = var_3030, x = linear_162_cast_fp16)[name = tensor("op_3031_cast_fp16")]; tensor const_278_to_fp16 = const()[name = tensor("const_278_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_111_cast_fp16 = mul(x = var_3031_cast_fp16, y = const_278_to_fp16)[name = tensor("q_111_cast_fp16")]; tensor var_3037 = const()[name = tensor("op_3037"), val = tensor([1, 1500, 20, -1])]; tensor var_3038_cast_fp16 = reshape(shape = var_3037, x = linear_163_cast_fp16)[name = tensor("op_3038_cast_fp16")]; tensor const_279_to_fp16 = const()[name = tensor("const_279_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_111_cast_fp16 = mul(x = var_3038_cast_fp16, y = const_279_to_fp16)[name = tensor("k_111_cast_fp16")]; tensor var_3044 = const()[name = tensor("op_3044"), val = tensor([1, 1500, 20, -1])]; tensor var_3045_cast_fp16 = reshape(shape = var_3044, x = linear_164_cast_fp16)[name = tensor("op_3045_cast_fp16")]; tensor var_3046 = const()[name = tensor("op_3046"), val = tensor([0, 2, 1, 3])]; tensor qk_55_transpose_x_0 = const()[name = tensor("qk_55_transpose_x_0"), val = tensor(false)]; tensor qk_55_transpose_y_0 = const()[name = tensor("qk_55_transpose_y_0"), val = tensor(false)]; tensor transpose_182_perm_0 = const()[name = tensor("transpose_182_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_183_perm_0 = const()[name = tensor("transpose_183_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_209 = transpose(perm = transpose_183_perm_0, x = k_111_cast_fp16)[name = tensor("transpose_209")]; tensor transpose_210 = transpose(perm = transpose_182_perm_0, x = q_111_cast_fp16)[name = tensor("transpose_210")]; tensor qk_55_cast_fp16 = matmul(transpose_x = qk_55_transpose_x_0, transpose_y = qk_55_transpose_y_0, x = transpose_210, y = transpose_209)[name = tensor("qk_55_cast_fp16")]; tensor var_3050_cast_fp16 = softmax(axis = var_2986, x = qk_55_cast_fp16)[name = tensor("op_3050_cast_fp16")]; tensor var_3052_transpose_x_0 = const()[name = tensor("op_3052_transpose_x_0"), val = tensor(false)]; tensor var_3052_transpose_y_0 = const()[name = tensor("op_3052_transpose_y_0"), val = tensor(false)]; tensor transpose_211 = transpose(perm = var_3046, x = var_3045_cast_fp16)[name = tensor("transpose_211")]; tensor var_3052_cast_fp16 = matmul(transpose_x = var_3052_transpose_x_0, transpose_y = var_3052_transpose_y_0, x = var_3050_cast_fp16, y = transpose_211)[name = tensor("op_3052_cast_fp16")]; tensor var_3053 = const()[name = tensor("op_3053"), val = tensor([0, 2, 1, 3])]; tensor concat_27 = const()[name = tensor("concat_27"), val = tensor([1, 1500, 1280])]; tensor transpose_208 = transpose(perm = var_3053, x = var_3052_cast_fp16)[name = tensor("transpose_208")]; tensor x_335_cast_fp16 = reshape(shape = concat_27, x = transpose_208)[name = tensor("x_335_cast_fp16")]; tensor var_3058_to_fp16 = const()[name = tensor("op_3058_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(880153536)))]; tensor var_3059_to_fp16 = const()[name = tensor("op_3059_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883430400)))]; tensor linear_165_cast_fp16 = linear(bias = var_3059_to_fp16, weight = var_3058_to_fp16, x = x_335_cast_fp16)[name = tensor("linear_165_cast_fp16")]; tensor x_337_cast_fp16 = add(x = x_331_cast_fp16, y = linear_165_cast_fp16)[name = tensor("x_337_cast_fp16")]; tensor var_3066_axes_0 = const()[name = tensor("op_3066_axes_0"), val = tensor([-1])]; tensor blocks_27_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_27_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883433024)))]; tensor blocks_27_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_27_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883435648)))]; tensor var_3066_cast_fp16 = layer_norm(axes = var_3066_axes_0, beta = blocks_27_mlp_ln_bias_to_fp16, epsilon = var_2992_to_fp16, gamma = blocks_27_mlp_ln_weight_to_fp16, x = x_337_cast_fp16)[name = tensor("op_3066_cast_fp16")]; tensor var_3075_to_fp16 = const()[name = tensor("op_3075_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(883438272)))]; tensor var_3076_to_fp16 = const()[name = tensor("op_3076_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(896299776)))]; tensor linear_166_cast_fp16 = linear(bias = var_3076_to_fp16, weight = var_3075_to_fp16, x = var_3066_cast_fp16)[name = tensor("linear_166_cast_fp16")]; tensor x_341_mode_0 = const()[name = tensor("x_341_mode_0"), val = tensor("EXACT")]; tensor x_341_cast_fp16 = gelu(mode = x_341_mode_0, x = linear_166_cast_fp16)[name = tensor("x_341_cast_fp16")]; tensor var_3081_to_fp16 = const()[name = tensor("op_3081_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(896309888)))]; tensor var_3082_to_fp16 = const()[name = tensor("op_3082_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(909171392)))]; tensor linear_167_cast_fp16 = linear(bias = var_3082_to_fp16, weight = var_3081_to_fp16, x = x_341_cast_fp16)[name = tensor("linear_167_cast_fp16")]; tensor x_343_cast_fp16 = add(x = x_337_cast_fp16, y = linear_167_cast_fp16)[name = tensor("x_343_cast_fp16")]; tensor var_3092 = const()[name = tensor("op_3092"), val = tensor(-1)]; tensor var_3108_axes_0 = const()[name = tensor("op_3108_axes_0"), val = tensor([-1])]; tensor blocks_28_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_28_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(909174016)))]; tensor blocks_28_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_28_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(909176640)))]; tensor var_3098_to_fp16 = const()[name = tensor("op_3098_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3108_cast_fp16 = layer_norm(axes = var_3108_axes_0, beta = blocks_28_attn_ln_bias_to_fp16, epsilon = var_3098_to_fp16, gamma = blocks_28_attn_ln_weight_to_fp16, x = x_343_cast_fp16)[name = tensor("op_3108_cast_fp16")]; tensor var_3119_to_fp16 = const()[name = tensor("op_3119_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(909179264)))]; tensor var_3120_to_fp16 = const()[name = tensor("op_3120_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(912456128)))]; tensor linear_168_cast_fp16 = linear(bias = var_3120_to_fp16, weight = var_3119_to_fp16, x = var_3108_cast_fp16)[name = tensor("linear_168_cast_fp16")]; tensor var_3123_to_fp16 = const()[name = tensor("op_3123_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(912458752)))]; tensor linear_169_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_3123_to_fp16, x = var_3108_cast_fp16)[name = tensor("linear_169_cast_fp16")]; tensor var_3127_to_fp16 = const()[name = tensor("op_3127_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(915735616)))]; tensor var_3128_to_fp16 = const()[name = tensor("op_3128_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919012480)))]; tensor linear_170_cast_fp16 = linear(bias = var_3128_to_fp16, weight = var_3127_to_fp16, x = var_3108_cast_fp16)[name = tensor("linear_170_cast_fp16")]; tensor var_3136 = const()[name = tensor("op_3136"), val = tensor([1, 1500, 20, -1])]; tensor var_3137_cast_fp16 = reshape(shape = var_3136, x = linear_168_cast_fp16)[name = tensor("op_3137_cast_fp16")]; tensor const_280_to_fp16 = const()[name = tensor("const_280_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_115_cast_fp16 = mul(x = var_3137_cast_fp16, y = const_280_to_fp16)[name = tensor("q_115_cast_fp16")]; tensor var_3143 = const()[name = tensor("op_3143"), val = tensor([1, 1500, 20, -1])]; tensor var_3144_cast_fp16 = reshape(shape = var_3143, x = linear_169_cast_fp16)[name = tensor("op_3144_cast_fp16")]; tensor const_281_to_fp16 = const()[name = tensor("const_281_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_115_cast_fp16 = mul(x = var_3144_cast_fp16, y = const_281_to_fp16)[name = tensor("k_115_cast_fp16")]; tensor var_3150 = const()[name = tensor("op_3150"), val = tensor([1, 1500, 20, -1])]; tensor var_3151_cast_fp16 = reshape(shape = var_3150, x = linear_170_cast_fp16)[name = tensor("op_3151_cast_fp16")]; tensor var_3152 = const()[name = tensor("op_3152"), val = tensor([0, 2, 1, 3])]; tensor qk_57_transpose_x_0 = const()[name = tensor("qk_57_transpose_x_0"), val = tensor(false)]; tensor qk_57_transpose_y_0 = const()[name = tensor("qk_57_transpose_y_0"), val = tensor(false)]; tensor transpose_184_perm_0 = const()[name = tensor("transpose_184_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_185_perm_0 = const()[name = tensor("transpose_185_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_205 = transpose(perm = transpose_185_perm_0, x = k_115_cast_fp16)[name = tensor("transpose_205")]; tensor transpose_206 = transpose(perm = transpose_184_perm_0, x = q_115_cast_fp16)[name = tensor("transpose_206")]; tensor qk_57_cast_fp16 = matmul(transpose_x = qk_57_transpose_x_0, transpose_y = qk_57_transpose_y_0, x = transpose_206, y = transpose_205)[name = tensor("qk_57_cast_fp16")]; tensor var_3156_cast_fp16 = softmax(axis = var_3092, x = qk_57_cast_fp16)[name = tensor("op_3156_cast_fp16")]; tensor var_3158_transpose_x_0 = const()[name = tensor("op_3158_transpose_x_0"), val = tensor(false)]; tensor var_3158_transpose_y_0 = const()[name = tensor("op_3158_transpose_y_0"), val = tensor(false)]; tensor transpose_207 = transpose(perm = var_3152, x = var_3151_cast_fp16)[name = tensor("transpose_207")]; tensor var_3158_cast_fp16 = matmul(transpose_x = var_3158_transpose_x_0, transpose_y = var_3158_transpose_y_0, x = var_3156_cast_fp16, y = transpose_207)[name = tensor("op_3158_cast_fp16")]; tensor var_3159 = const()[name = tensor("op_3159"), val = tensor([0, 2, 1, 3])]; tensor concat_28 = const()[name = tensor("concat_28"), val = tensor([1, 1500, 1280])]; tensor transpose_204 = transpose(perm = var_3159, x = var_3158_cast_fp16)[name = tensor("transpose_204")]; tensor x_347_cast_fp16 = reshape(shape = concat_28, x = transpose_204)[name = tensor("x_347_cast_fp16")]; tensor var_3164_to_fp16 = const()[name = tensor("op_3164_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(919015104)))]; tensor var_3165_to_fp16 = const()[name = tensor("op_3165_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(922291968)))]; tensor linear_171_cast_fp16 = linear(bias = var_3165_to_fp16, weight = var_3164_to_fp16, x = x_347_cast_fp16)[name = tensor("linear_171_cast_fp16")]; tensor x_349_cast_fp16 = add(x = x_343_cast_fp16, y = linear_171_cast_fp16)[name = tensor("x_349_cast_fp16")]; tensor var_3172_axes_0 = const()[name = tensor("op_3172_axes_0"), val = tensor([-1])]; tensor blocks_28_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_28_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(922294592)))]; tensor blocks_28_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_28_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(922297216)))]; tensor var_3172_cast_fp16 = layer_norm(axes = var_3172_axes_0, beta = blocks_28_mlp_ln_bias_to_fp16, epsilon = var_3098_to_fp16, gamma = blocks_28_mlp_ln_weight_to_fp16, x = x_349_cast_fp16)[name = tensor("op_3172_cast_fp16")]; tensor var_3181_to_fp16 = const()[name = tensor("op_3181_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(922299840)))]; tensor var_3182_to_fp16 = const()[name = tensor("op_3182_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(935243264)))]; tensor linear_172_cast_fp16 = linear(bias = var_3182_to_fp16, weight = var_3181_to_fp16, x = var_3172_cast_fp16)[name = tensor("linear_172_cast_fp16")]; tensor x_353_mode_0 = const()[name = tensor("x_353_mode_0"), val = tensor("EXACT")]; tensor x_353_cast_fp16 = gelu(mode = x_353_mode_0, x = linear_172_cast_fp16)[name = tensor("x_353_cast_fp16")]; tensor var_3187_to_fp16 = const()[name = tensor("op_3187_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(935253440)))]; tensor var_3188_to_fp16 = const()[name = tensor("op_3188_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(948196864)))]; tensor linear_173_cast_fp16 = linear(bias = var_3188_to_fp16, weight = var_3187_to_fp16, x = x_353_cast_fp16)[name = tensor("linear_173_cast_fp16")]; tensor x_355_cast_fp16 = add(x = x_349_cast_fp16, y = linear_173_cast_fp16)[name = tensor("x_355_cast_fp16")]; tensor var_3198 = const()[name = tensor("op_3198"), val = tensor(-1)]; tensor var_3214_axes_0 = const()[name = tensor("op_3214_axes_0"), val = tensor([-1])]; tensor blocks_29_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_29_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(948199488)))]; tensor blocks_29_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_29_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(948202112)))]; tensor var_3204_to_fp16 = const()[name = tensor("op_3204_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3214_cast_fp16 = layer_norm(axes = var_3214_axes_0, beta = blocks_29_attn_ln_bias_to_fp16, epsilon = var_3204_to_fp16, gamma = blocks_29_attn_ln_weight_to_fp16, x = x_355_cast_fp16)[name = tensor("op_3214_cast_fp16")]; tensor var_3225_to_fp16 = const()[name = tensor("op_3225_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(948204736)))]; tensor var_3226_to_fp16 = const()[name = tensor("op_3226_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(951481600)))]; tensor linear_174_cast_fp16 = linear(bias = var_3226_to_fp16, weight = var_3225_to_fp16, x = var_3214_cast_fp16)[name = tensor("linear_174_cast_fp16")]; tensor var_3229_to_fp16 = const()[name = tensor("op_3229_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(951484224)))]; tensor linear_175_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_3229_to_fp16, x = var_3214_cast_fp16)[name = tensor("linear_175_cast_fp16")]; tensor var_3233_to_fp16 = const()[name = tensor("op_3233_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(954761088)))]; tensor var_3234_to_fp16 = const()[name = tensor("op_3234_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(958037952)))]; tensor linear_176_cast_fp16 = linear(bias = var_3234_to_fp16, weight = var_3233_to_fp16, x = var_3214_cast_fp16)[name = tensor("linear_176_cast_fp16")]; tensor var_3242 = const()[name = tensor("op_3242"), val = tensor([1, 1500, 20, -1])]; tensor var_3243_cast_fp16 = reshape(shape = var_3242, x = linear_174_cast_fp16)[name = tensor("op_3243_cast_fp16")]; tensor const_282_to_fp16 = const()[name = tensor("const_282_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_119_cast_fp16 = mul(x = var_3243_cast_fp16, y = const_282_to_fp16)[name = tensor("q_119_cast_fp16")]; tensor var_3249 = const()[name = tensor("op_3249"), val = tensor([1, 1500, 20, -1])]; tensor var_3250_cast_fp16 = reshape(shape = var_3249, x = linear_175_cast_fp16)[name = tensor("op_3250_cast_fp16")]; tensor const_283_to_fp16 = const()[name = tensor("const_283_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_119_cast_fp16 = mul(x = var_3250_cast_fp16, y = const_283_to_fp16)[name = tensor("k_119_cast_fp16")]; tensor var_3256 = const()[name = tensor("op_3256"), val = tensor([1, 1500, 20, -1])]; tensor var_3257_cast_fp16 = reshape(shape = var_3256, x = linear_176_cast_fp16)[name = tensor("op_3257_cast_fp16")]; tensor var_3258 = const()[name = tensor("op_3258"), val = tensor([0, 2, 1, 3])]; tensor qk_59_transpose_x_0 = const()[name = tensor("qk_59_transpose_x_0"), val = tensor(false)]; tensor qk_59_transpose_y_0 = const()[name = tensor("qk_59_transpose_y_0"), val = tensor(false)]; tensor transpose_186_perm_0 = const()[name = tensor("transpose_186_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_187_perm_0 = const()[name = tensor("transpose_187_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_201 = transpose(perm = transpose_187_perm_0, x = k_119_cast_fp16)[name = tensor("transpose_201")]; tensor transpose_202 = transpose(perm = transpose_186_perm_0, x = q_119_cast_fp16)[name = tensor("transpose_202")]; tensor qk_59_cast_fp16 = matmul(transpose_x = qk_59_transpose_x_0, transpose_y = qk_59_transpose_y_0, x = transpose_202, y = transpose_201)[name = tensor("qk_59_cast_fp16")]; tensor var_3262_cast_fp16 = softmax(axis = var_3198, x = qk_59_cast_fp16)[name = tensor("op_3262_cast_fp16")]; tensor var_3264_transpose_x_0 = const()[name = tensor("op_3264_transpose_x_0"), val = tensor(false)]; tensor var_3264_transpose_y_0 = const()[name = tensor("op_3264_transpose_y_0"), val = tensor(false)]; tensor transpose_203 = transpose(perm = var_3258, x = var_3257_cast_fp16)[name = tensor("transpose_203")]; tensor var_3264_cast_fp16 = matmul(transpose_x = var_3264_transpose_x_0, transpose_y = var_3264_transpose_y_0, x = var_3262_cast_fp16, y = transpose_203)[name = tensor("op_3264_cast_fp16")]; tensor var_3265 = const()[name = tensor("op_3265"), val = tensor([0, 2, 1, 3])]; tensor concat_29 = const()[name = tensor("concat_29"), val = tensor([1, 1500, 1280])]; tensor transpose_200 = transpose(perm = var_3265, x = var_3264_cast_fp16)[name = tensor("transpose_200")]; tensor x_359_cast_fp16 = reshape(shape = concat_29, x = transpose_200)[name = tensor("x_359_cast_fp16")]; tensor var_3270_to_fp16 = const()[name = tensor("op_3270_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(958040576)))]; tensor var_3271_to_fp16 = const()[name = tensor("op_3271_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(961317440)))]; tensor linear_177_cast_fp16 = linear(bias = var_3271_to_fp16, weight = var_3270_to_fp16, x = x_359_cast_fp16)[name = tensor("linear_177_cast_fp16")]; tensor x_361_cast_fp16 = add(x = x_355_cast_fp16, y = linear_177_cast_fp16)[name = tensor("x_361_cast_fp16")]; tensor var_3278_axes_0 = const()[name = tensor("op_3278_axes_0"), val = tensor([-1])]; tensor blocks_29_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_29_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(961320064)))]; tensor blocks_29_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_29_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(961322688)))]; tensor var_3278_cast_fp16 = layer_norm(axes = var_3278_axes_0, beta = blocks_29_mlp_ln_bias_to_fp16, epsilon = var_3204_to_fp16, gamma = blocks_29_mlp_ln_weight_to_fp16, x = x_361_cast_fp16)[name = tensor("op_3278_cast_fp16")]; tensor var_3287_to_fp16 = const()[name = tensor("op_3287_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(961325312)))]; tensor var_3288_to_fp16 = const()[name = tensor("op_3288_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(974186816)))]; tensor linear_178_cast_fp16 = linear(bias = var_3288_to_fp16, weight = var_3287_to_fp16, x = var_3278_cast_fp16)[name = tensor("linear_178_cast_fp16")]; tensor x_365_mode_0 = const()[name = tensor("x_365_mode_0"), val = tensor("EXACT")]; tensor x_365_cast_fp16 = gelu(mode = x_365_mode_0, x = linear_178_cast_fp16)[name = tensor("x_365_cast_fp16")]; tensor var_3293_to_fp16 = const()[name = tensor("op_3293_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(974196928)))]; tensor var_3294_to_fp16 = const()[name = tensor("op_3294_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(987058432)))]; tensor linear_179_cast_fp16 = linear(bias = var_3294_to_fp16, weight = var_3293_to_fp16, x = x_365_cast_fp16)[name = tensor("linear_179_cast_fp16")]; tensor x_367_cast_fp16 = add(x = x_361_cast_fp16, y = linear_179_cast_fp16)[name = tensor("x_367_cast_fp16")]; tensor var_3304 = const()[name = tensor("op_3304"), val = tensor(-1)]; tensor var_3320_axes_0 = const()[name = tensor("op_3320_axes_0"), val = tensor([-1])]; tensor blocks_30_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_30_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(987061056)))]; tensor blocks_30_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_30_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(987063680)))]; tensor var_3310_to_fp16 = const()[name = tensor("op_3310_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3320_cast_fp16 = layer_norm(axes = var_3320_axes_0, beta = blocks_30_attn_ln_bias_to_fp16, epsilon = var_3310_to_fp16, gamma = blocks_30_attn_ln_weight_to_fp16, x = x_367_cast_fp16)[name = tensor("op_3320_cast_fp16")]; tensor var_3331_to_fp16 = const()[name = tensor("op_3331_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(987066304)))]; tensor var_3332_to_fp16 = const()[name = tensor("op_3332_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(990343168)))]; tensor linear_180_cast_fp16 = linear(bias = var_3332_to_fp16, weight = var_3331_to_fp16, x = var_3320_cast_fp16)[name = tensor("linear_180_cast_fp16")]; tensor var_3335_to_fp16 = const()[name = tensor("op_3335_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(990345792)))]; tensor linear_181_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_3335_to_fp16, x = var_3320_cast_fp16)[name = tensor("linear_181_cast_fp16")]; tensor var_3339_to_fp16 = const()[name = tensor("op_3339_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(993622656)))]; tensor var_3340_to_fp16 = const()[name = tensor("op_3340_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(996899520)))]; tensor linear_182_cast_fp16 = linear(bias = var_3340_to_fp16, weight = var_3339_to_fp16, x = var_3320_cast_fp16)[name = tensor("linear_182_cast_fp16")]; tensor var_3348 = const()[name = tensor("op_3348"), val = tensor([1, 1500, 20, -1])]; tensor var_3349_cast_fp16 = reshape(shape = var_3348, x = linear_180_cast_fp16)[name = tensor("op_3349_cast_fp16")]; tensor const_284_to_fp16 = const()[name = tensor("const_284_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_123_cast_fp16 = mul(x = var_3349_cast_fp16, y = const_284_to_fp16)[name = tensor("q_123_cast_fp16")]; tensor var_3355 = const()[name = tensor("op_3355"), val = tensor([1, 1500, 20, -1])]; tensor var_3356_cast_fp16 = reshape(shape = var_3355, x = linear_181_cast_fp16)[name = tensor("op_3356_cast_fp16")]; tensor const_285_to_fp16 = const()[name = tensor("const_285_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_123_cast_fp16 = mul(x = var_3356_cast_fp16, y = const_285_to_fp16)[name = tensor("k_123_cast_fp16")]; tensor var_3362 = const()[name = tensor("op_3362"), val = tensor([1, 1500, 20, -1])]; tensor var_3363_cast_fp16 = reshape(shape = var_3362, x = linear_182_cast_fp16)[name = tensor("op_3363_cast_fp16")]; tensor var_3364 = const()[name = tensor("op_3364"), val = tensor([0, 2, 1, 3])]; tensor qk_61_transpose_x_0 = const()[name = tensor("qk_61_transpose_x_0"), val = tensor(false)]; tensor qk_61_transpose_y_0 = const()[name = tensor("qk_61_transpose_y_0"), val = tensor(false)]; tensor transpose_188_perm_0 = const()[name = tensor("transpose_188_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_189_perm_0 = const()[name = tensor("transpose_189_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_197 = transpose(perm = transpose_189_perm_0, x = k_123_cast_fp16)[name = tensor("transpose_197")]; tensor transpose_198 = transpose(perm = transpose_188_perm_0, x = q_123_cast_fp16)[name = tensor("transpose_198")]; tensor qk_61_cast_fp16 = matmul(transpose_x = qk_61_transpose_x_0, transpose_y = qk_61_transpose_y_0, x = transpose_198, y = transpose_197)[name = tensor("qk_61_cast_fp16")]; tensor var_3368_cast_fp16 = softmax(axis = var_3304, x = qk_61_cast_fp16)[name = tensor("op_3368_cast_fp16")]; tensor var_3370_transpose_x_0 = const()[name = tensor("op_3370_transpose_x_0"), val = tensor(false)]; tensor var_3370_transpose_y_0 = const()[name = tensor("op_3370_transpose_y_0"), val = tensor(false)]; tensor transpose_199 = transpose(perm = var_3364, x = var_3363_cast_fp16)[name = tensor("transpose_199")]; tensor var_3370_cast_fp16 = matmul(transpose_x = var_3370_transpose_x_0, transpose_y = var_3370_transpose_y_0, x = var_3368_cast_fp16, y = transpose_199)[name = tensor("op_3370_cast_fp16")]; tensor var_3371 = const()[name = tensor("op_3371"), val = tensor([0, 2, 1, 3])]; tensor concat_30 = const()[name = tensor("concat_30"), val = tensor([1, 1500, 1280])]; tensor transpose_196 = transpose(perm = var_3371, x = var_3370_cast_fp16)[name = tensor("transpose_196")]; tensor x_371_cast_fp16 = reshape(shape = concat_30, x = transpose_196)[name = tensor("x_371_cast_fp16")]; tensor var_3376_to_fp16 = const()[name = tensor("op_3376_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(996902144)))]; tensor var_3377_to_fp16 = const()[name = tensor("op_3377_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1000179008)))]; tensor linear_183_cast_fp16 = linear(bias = var_3377_to_fp16, weight = var_3376_to_fp16, x = x_371_cast_fp16)[name = tensor("linear_183_cast_fp16")]; tensor x_373_cast_fp16 = add(x = x_367_cast_fp16, y = linear_183_cast_fp16)[name = tensor("x_373_cast_fp16")]; tensor var_3384_axes_0 = const()[name = tensor("op_3384_axes_0"), val = tensor([-1])]; tensor blocks_30_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_30_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1000181632)))]; tensor blocks_30_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_30_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1000184256)))]; tensor var_3384_cast_fp16 = layer_norm(axes = var_3384_axes_0, beta = blocks_30_mlp_ln_bias_to_fp16, epsilon = var_3310_to_fp16, gamma = blocks_30_mlp_ln_weight_to_fp16, x = x_373_cast_fp16)[name = tensor("op_3384_cast_fp16")]; tensor var_3393_to_fp16 = const()[name = tensor("op_3393_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1000186880)))]; tensor var_3394_to_fp16 = const()[name = tensor("op_3394_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1012966464)))]; tensor linear_184_cast_fp16 = linear(bias = var_3394_to_fp16, weight = var_3393_to_fp16, x = var_3384_cast_fp16)[name = tensor("linear_184_cast_fp16")]; tensor x_377_mode_0 = const()[name = tensor("x_377_mode_0"), val = tensor("EXACT")]; tensor x_377_cast_fp16 = gelu(mode = x_377_mode_0, x = linear_184_cast_fp16)[name = tensor("x_377_cast_fp16")]; tensor var_3399_to_fp16 = const()[name = tensor("op_3399_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1012976512)))]; tensor var_3400_to_fp16 = const()[name = tensor("op_3400_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1025756096)))]; tensor linear_185_cast_fp16 = linear(bias = var_3400_to_fp16, weight = var_3399_to_fp16, x = x_377_cast_fp16)[name = tensor("linear_185_cast_fp16")]; tensor x_379_cast_fp16 = add(x = x_373_cast_fp16, y = linear_185_cast_fp16)[name = tensor("x_379_cast_fp16")]; tensor var_3410 = const()[name = tensor("op_3410"), val = tensor(-1)]; tensor var_3426_axes_0 = const()[name = tensor("op_3426_axes_0"), val = tensor([-1])]; tensor blocks_31_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_31_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1025758720)))]; tensor blocks_31_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_31_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1025761344)))]; tensor var_3416_to_fp16 = const()[name = tensor("op_3416_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3426_cast_fp16 = layer_norm(axes = var_3426_axes_0, beta = blocks_31_attn_ln_bias_to_fp16, epsilon = var_3416_to_fp16, gamma = blocks_31_attn_ln_weight_to_fp16, x = x_379_cast_fp16)[name = tensor("op_3426_cast_fp16")]; tensor var_3437_to_fp16 = const()[name = tensor("op_3437_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1025763968)))]; tensor var_3438_to_fp16 = const()[name = tensor("op_3438_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1029040832)))]; tensor linear_186_cast_fp16 = linear(bias = var_3438_to_fp16, weight = var_3437_to_fp16, x = var_3426_cast_fp16)[name = tensor("linear_186_cast_fp16")]; tensor var_3441_to_fp16 = const()[name = tensor("op_3441_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1029043456)))]; tensor linear_187_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_3441_to_fp16, x = var_3426_cast_fp16)[name = tensor("linear_187_cast_fp16")]; tensor var_3445_to_fp16 = const()[name = tensor("op_3445_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1032320320)))]; tensor var_3446_to_fp16 = const()[name = tensor("op_3446_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1035597184)))]; tensor linear_188_cast_fp16 = linear(bias = var_3446_to_fp16, weight = var_3445_to_fp16, x = var_3426_cast_fp16)[name = tensor("linear_188_cast_fp16")]; tensor var_3454 = const()[name = tensor("op_3454"), val = tensor([1, 1500, 20, -1])]; tensor var_3455_cast_fp16 = reshape(shape = var_3454, x = linear_186_cast_fp16)[name = tensor("op_3455_cast_fp16")]; tensor const_286_to_fp16 = const()[name = tensor("const_286_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_cast_fp16 = mul(x = var_3455_cast_fp16, y = const_286_to_fp16)[name = tensor("q_cast_fp16")]; tensor var_3461 = const()[name = tensor("op_3461"), val = tensor([1, 1500, 20, -1])]; tensor var_3462_cast_fp16 = reshape(shape = var_3461, x = linear_187_cast_fp16)[name = tensor("op_3462_cast_fp16")]; tensor const_287_to_fp16 = const()[name = tensor("const_287_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_cast_fp16 = mul(x = var_3462_cast_fp16, y = const_287_to_fp16)[name = tensor("k_cast_fp16")]; tensor var_3468 = const()[name = tensor("op_3468"), val = tensor([1, 1500, 20, -1])]; tensor var_3469_cast_fp16 = reshape(shape = var_3468, x = linear_188_cast_fp16)[name = tensor("op_3469_cast_fp16")]; tensor var_3470 = const()[name = tensor("op_3470"), val = tensor([0, 2, 1, 3])]; tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; tensor transpose_190_perm_0 = const()[name = tensor("transpose_190_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_191_perm_0 = const()[name = tensor("transpose_191_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_193 = transpose(perm = transpose_191_perm_0, x = k_cast_fp16)[name = tensor("transpose_193")]; tensor transpose_194 = transpose(perm = transpose_190_perm_0, x = q_cast_fp16)[name = tensor("transpose_194")]; tensor qk_cast_fp16 = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_194, y = transpose_193)[name = tensor("qk_cast_fp16")]; tensor var_3474_cast_fp16 = softmax(axis = var_3410, x = qk_cast_fp16)[name = tensor("op_3474_cast_fp16")]; tensor var_3476_transpose_x_0 = const()[name = tensor("op_3476_transpose_x_0"), val = tensor(false)]; tensor var_3476_transpose_y_0 = const()[name = tensor("op_3476_transpose_y_0"), val = tensor(false)]; tensor transpose_195 = transpose(perm = var_3470, x = var_3469_cast_fp16)[name = tensor("transpose_195")]; tensor var_3476_cast_fp16 = matmul(transpose_x = var_3476_transpose_x_0, transpose_y = var_3476_transpose_y_0, x = var_3474_cast_fp16, y = transpose_195)[name = tensor("op_3476_cast_fp16")]; tensor var_3477 = const()[name = tensor("op_3477"), val = tensor([0, 2, 1, 3])]; tensor concat_31 = const()[name = tensor("concat_31"), val = tensor([1, 1500, 1280])]; tensor transpose_192 = transpose(perm = var_3477, x = var_3476_cast_fp16)[name = tensor("transpose_192")]; tensor x_383_cast_fp16 = reshape(shape = concat_31, x = transpose_192)[name = tensor("x_383_cast_fp16")]; tensor var_3482_to_fp16 = const()[name = tensor("op_3482_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1035599808)))]; tensor var_3483_to_fp16 = const()[name = tensor("op_3483_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1038876672)))]; tensor linear_189_cast_fp16 = linear(bias = var_3483_to_fp16, weight = var_3482_to_fp16, x = x_383_cast_fp16)[name = tensor("linear_189_cast_fp16")]; tensor x_385_cast_fp16 = add(x = x_379_cast_fp16, y = linear_189_cast_fp16)[name = tensor("x_385_cast_fp16")]; tensor var_3490_axes_0 = const()[name = tensor("op_3490_axes_0"), val = tensor([-1])]; tensor blocks_31_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_31_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1038879296)))]; tensor blocks_31_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_31_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1038881920)))]; tensor var_3490_cast_fp16 = layer_norm(axes = var_3490_axes_0, beta = blocks_31_mlp_ln_bias_to_fp16, epsilon = var_3416_to_fp16, gamma = blocks_31_mlp_ln_weight_to_fp16, x = x_385_cast_fp16)[name = tensor("op_3490_cast_fp16")]; tensor var_3499_to_fp16 = const()[name = tensor("op_3499_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1038884544)))]; tensor var_3500_to_fp16 = const()[name = tensor("op_3500_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1051336448)))]; tensor linear_190_cast_fp16 = linear(bias = var_3500_to_fp16, weight = var_3499_to_fp16, x = var_3490_cast_fp16)[name = tensor("linear_190_cast_fp16")]; tensor x_389_mode_0 = const()[name = tensor("x_389_mode_0"), val = tensor("EXACT")]; tensor x_389_cast_fp16 = gelu(mode = x_389_mode_0, x = linear_190_cast_fp16)[name = tensor("x_389_cast_fp16")]; tensor var_3505_to_fp16 = const()[name = tensor("op_3505_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1051346240)))]; tensor var_3506_to_fp16 = const()[name = tensor("op_3506_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1063798144)))]; tensor linear_191_cast_fp16 = linear(bias = var_3506_to_fp16, weight = var_3505_to_fp16, x = x_389_cast_fp16)[name = tensor("linear_191_cast_fp16")]; tensor x_cast_fp16 = add(x = x_385_cast_fp16, y = linear_191_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_3519_axes_0 = const()[name = tensor("op_3519_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1063800768)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1063803392)))]; tensor var_3510_to_fp16 = const()[name = tensor("op_3510_to_fp16"), val = tensor(0x1.5p-17)]; tensor output = layer_norm(axes = var_3519_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_3510_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast_fp16)[name = tensor("op_3519_cast_fp16")]; } -> (output); }