program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3304.5.2"}, {"coremlc-version", "3304.6.2"}, {"coremltools-component-torch", "2.2.2"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "7.2"}})] { func main(tensor logmel_data) { tensor var_20 = const()[name = tensor("op_20"), val = tensor(1)]; tensor var_28 = const()[name = tensor("op_28"), val = tensor([1])]; tensor var_30 = const()[name = tensor("op_30"), val = tensor([1])]; tensor var_32_pad_type_0 = const()[name = tensor("op_32_pad_type_0"), val = tensor("custom")]; tensor var_32_pad_0 = const()[name = tensor("op_32_pad_0"), val = tensor([1, 1])]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245888)))]; tensor var_32_cast_fp16 = conv(bias = bias_3_to_fp16, dilations = var_30, groups = var_20, pad = var_32_pad_0, pad_type = var_32_pad_type_0, strides = var_28, weight = weight_3_to_fp16, x = logmel_data)[name = tensor("op_32_cast_fp16")]; tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_32_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_37 = const()[name = tensor("op_37"), val = tensor(1)]; tensor var_46 = const()[name = tensor("op_46"), val = tensor([2])]; tensor var_48 = const()[name = tensor("op_48"), val = tensor([1])]; tensor var_50_pad_type_0 = const()[name = tensor("op_50_pad_type_0"), val = tensor("custom")]; tensor var_50_pad_0 = const()[name = tensor("op_50_pad_0"), val = tensor([1, 1])]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246976)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1819904)))]; tensor var_50_cast_fp16 = conv(bias = bias_7_to_fp16, dilations = var_48, groups = var_37, pad = var_50_pad_0, pad_type = var_50_pad_type_0, strides = var_46, weight = weight_7_to_fp16, x = input_1_cast_fp16)[name = tensor("op_50_cast_fp16")]; tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_50_cast_fp16)[name = tensor("x_3_cast_fp16")]; tensor var_56 = const()[name = tensor("op_56"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1820992)))]; tensor transpose_60 = transpose(perm = var_56, x = x_3_cast_fp16)[name = tensor("transpose_60")]; tensor var_59_cast_fp16 = add(x = transpose_60, y = positional_embedding_to_fp16)[name = tensor("op_59_cast_fp16")]; tensor var_72 = const()[name = tensor("op_72"), val = tensor(-1)]; tensor var_88_axes_0 = const()[name = tensor("op_88_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3357056)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3358144)))]; tensor var_78_to_fp16 = const()[name = tensor("op_78_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_88_cast_fp16 = layer_norm(axes = var_88_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_78_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_59_cast_fp16)[name = tensor("op_88_cast_fp16")]; tensor var_99_to_fp16 = const()[name = tensor("op_99_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3359232)))]; tensor var_100_to_fp16 = const()[name = tensor("op_100_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3883584)))]; tensor linear_0_cast_fp16 = linear(bias = var_100_to_fp16, weight = var_99_to_fp16, x = var_88_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_103_to_fp16 = const()[name = tensor("op_103_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3884672)))]; tensor linear_1_bias_0_to_fp16 = const()[name = tensor("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4409024)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_103_to_fp16, x = var_88_cast_fp16)[name = tensor("linear_1_cast_fp16")]; tensor var_107_to_fp16 = const()[name = tensor("op_107_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4410112)))]; tensor var_108_to_fp16 = const()[name = tensor("op_108_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4934464)))]; tensor linear_2_cast_fp16 = linear(bias = var_108_to_fp16, weight = var_107_to_fp16, x = var_88_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor var_116 = const()[name = tensor("op_116"), val = tensor([1, 1500, 8, -1])]; tensor var_117_cast_fp16 = reshape(shape = var_116, x = linear_0_cast_fp16)[name = tensor("op_117_cast_fp16")]; tensor const_42_to_fp16 = const()[name = tensor("const_42_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast_fp16 = mul(x = var_117_cast_fp16, y = const_42_to_fp16)[name = tensor("q_3_cast_fp16")]; tensor var_123 = const()[name = tensor("op_123"), val = tensor([1, 1500, 8, -1])]; tensor var_124_cast_fp16 = reshape(shape = var_123, x = linear_1_cast_fp16)[name = tensor("op_124_cast_fp16")]; tensor const_43_to_fp16 = const()[name = tensor("const_43_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast_fp16 = mul(x = var_124_cast_fp16, y = const_43_to_fp16)[name = tensor("k_3_cast_fp16")]; tensor var_130 = const()[name = tensor("op_130"), val = tensor([1, 1500, 8, -1])]; tensor var_131_cast_fp16 = reshape(shape = var_130, x = linear_2_cast_fp16)[name = tensor("op_131_cast_fp16")]; tensor var_132 = const()[name = tensor("op_132"), val = tensor([0, 2, 1, 3])]; tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; tensor transpose_24_perm_0 = const()[name = tensor("transpose_24_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_25_perm_0 = const()[name = tensor("transpose_25_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_57 = transpose(perm = transpose_25_perm_0, x = k_3_cast_fp16)[name = tensor("transpose_57")]; tensor transpose_58 = transpose(perm = transpose_24_perm_0, x = q_3_cast_fp16)[name = tensor("transpose_58")]; tensor qk_1_cast_fp16 = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_58, y = transpose_57)[name = tensor("qk_1_cast_fp16")]; tensor var_136_cast_fp16 = softmax(axis = var_72, x = qk_1_cast_fp16)[name = tensor("op_136_cast_fp16")]; tensor var_138_transpose_x_0 = const()[name = tensor("op_138_transpose_x_0"), val = tensor(false)]; tensor var_138_transpose_y_0 = const()[name = tensor("op_138_transpose_y_0"), val = tensor(false)]; tensor transpose_59 = transpose(perm = var_132, x = var_131_cast_fp16)[name = tensor("transpose_59")]; tensor var_138_cast_fp16 = matmul(transpose_x = var_138_transpose_x_0, transpose_y = var_138_transpose_y_0, x = var_136_cast_fp16, y = transpose_59)[name = tensor("op_138_cast_fp16")]; tensor var_139 = const()[name = tensor("op_139"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 512])]; tensor transpose_56 = transpose(perm = var_139, x = var_138_cast_fp16)[name = tensor("transpose_56")]; tensor x_11_cast_fp16 = reshape(shape = concat_0, x = transpose_56)[name = tensor("x_11_cast_fp16")]; tensor var_144_to_fp16 = const()[name = tensor("op_144_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4935552)))]; tensor var_145_to_fp16 = const()[name = tensor("op_145_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5459904)))]; tensor linear_3_cast_fp16 = linear(bias = var_145_to_fp16, weight = var_144_to_fp16, x = x_11_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor x_13_cast_fp16 = add(x = var_59_cast_fp16, y = linear_3_cast_fp16)[name = tensor("x_13_cast_fp16")]; tensor var_152_axes_0 = const()[name = tensor("op_152_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5460992)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5462080)))]; tensor var_152_cast_fp16 = layer_norm(axes = var_152_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_78_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast_fp16)[name = tensor("op_152_cast_fp16")]; tensor var_161_to_fp16 = const()[name = tensor("op_161_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5463168)))]; tensor var_162_to_fp16 = const()[name = tensor("op_162_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7560384)))]; tensor linear_4_cast_fp16 = linear(bias = var_162_to_fp16, weight = var_161_to_fp16, x = var_152_cast_fp16)[name = tensor("linear_4_cast_fp16")]; tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; tensor x_17_cast_fp16 = gelu(mode = x_17_mode_0, x = linear_4_cast_fp16)[name = tensor("x_17_cast_fp16")]; tensor var_167_to_fp16 = const()[name = tensor("op_167_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7564544)))]; tensor var_168_to_fp16 = const()[name = tensor("op_168_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9661760)))]; tensor linear_5_cast_fp16 = linear(bias = var_168_to_fp16, weight = var_167_to_fp16, x = x_17_cast_fp16)[name = tensor("linear_5_cast_fp16")]; tensor x_19_cast_fp16 = add(x = x_13_cast_fp16, y = linear_5_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor var_178 = const()[name = tensor("op_178"), val = tensor(-1)]; tensor var_194_axes_0 = const()[name = tensor("op_194_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9662848)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9663936)))]; tensor var_184_to_fp16 = const()[name = tensor("op_184_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_194_cast_fp16 = layer_norm(axes = var_194_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_184_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast_fp16)[name = tensor("op_194_cast_fp16")]; tensor var_205_to_fp16 = const()[name = tensor("op_205_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9665024)))]; tensor var_206_to_fp16 = const()[name = tensor("op_206_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10189376)))]; tensor linear_6_cast_fp16 = linear(bias = var_206_to_fp16, weight = var_205_to_fp16, x = var_194_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor var_209_to_fp16 = const()[name = tensor("op_209_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10190464)))]; tensor linear_7_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_209_to_fp16, x = var_194_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor var_213_to_fp16 = const()[name = tensor("op_213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10714816)))]; tensor var_214_to_fp16 = const()[name = tensor("op_214_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11239168)))]; tensor linear_8_cast_fp16 = linear(bias = var_214_to_fp16, weight = var_213_to_fp16, x = var_194_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor var_222 = const()[name = tensor("op_222"), val = tensor([1, 1500, 8, -1])]; tensor var_223_cast_fp16 = reshape(shape = var_222, x = linear_6_cast_fp16)[name = tensor("op_223_cast_fp16")]; tensor const_44_to_fp16 = const()[name = tensor("const_44_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast_fp16 = mul(x = var_223_cast_fp16, y = const_44_to_fp16)[name = tensor("q_7_cast_fp16")]; tensor var_229 = const()[name = tensor("op_229"), val = tensor([1, 1500, 8, -1])]; tensor var_230_cast_fp16 = reshape(shape = var_229, x = linear_7_cast_fp16)[name = tensor("op_230_cast_fp16")]; tensor const_45_to_fp16 = const()[name = tensor("const_45_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast_fp16 = mul(x = var_230_cast_fp16, y = const_45_to_fp16)[name = tensor("k_7_cast_fp16")]; tensor var_236 = const()[name = tensor("op_236"), val = tensor([1, 1500, 8, -1])]; tensor var_237_cast_fp16 = reshape(shape = var_236, x = linear_8_cast_fp16)[name = tensor("op_237_cast_fp16")]; tensor var_238 = const()[name = tensor("op_238"), val = tensor([0, 2, 1, 3])]; tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; tensor transpose_26_perm_0 = const()[name = tensor("transpose_26_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_27_perm_0 = const()[name = tensor("transpose_27_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_53 = transpose(perm = transpose_27_perm_0, x = k_7_cast_fp16)[name = tensor("transpose_53")]; tensor transpose_54 = transpose(perm = transpose_26_perm_0, x = q_7_cast_fp16)[name = tensor("transpose_54")]; tensor qk_3_cast_fp16 = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_54, y = transpose_53)[name = tensor("qk_3_cast_fp16")]; tensor var_242_cast_fp16 = softmax(axis = var_178, x = qk_3_cast_fp16)[name = tensor("op_242_cast_fp16")]; tensor var_244_transpose_x_0 = const()[name = tensor("op_244_transpose_x_0"), val = tensor(false)]; tensor var_244_transpose_y_0 = const()[name = tensor("op_244_transpose_y_0"), val = tensor(false)]; tensor transpose_55 = transpose(perm = var_238, x = var_237_cast_fp16)[name = tensor("transpose_55")]; tensor var_244_cast_fp16 = matmul(transpose_x = var_244_transpose_x_0, transpose_y = var_244_transpose_y_0, x = var_242_cast_fp16, y = transpose_55)[name = tensor("op_244_cast_fp16")]; tensor var_245 = const()[name = tensor("op_245"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 512])]; tensor transpose_52 = transpose(perm = var_245, x = var_244_cast_fp16)[name = tensor("transpose_52")]; tensor x_23_cast_fp16 = reshape(shape = concat_1, x = transpose_52)[name = tensor("x_23_cast_fp16")]; tensor var_250_to_fp16 = const()[name = tensor("op_250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11240256)))]; tensor var_251_to_fp16 = const()[name = tensor("op_251_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11764608)))]; tensor linear_9_cast_fp16 = linear(bias = var_251_to_fp16, weight = var_250_to_fp16, x = x_23_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor x_25_cast_fp16 = add(x = x_19_cast_fp16, y = linear_9_cast_fp16)[name = tensor("x_25_cast_fp16")]; tensor var_258_axes_0 = const()[name = tensor("op_258_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11765696)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11766784)))]; tensor var_258_cast_fp16 = layer_norm(axes = var_258_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_184_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast_fp16)[name = tensor("op_258_cast_fp16")]; tensor var_267_to_fp16 = const()[name = tensor("op_267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11767872)))]; tensor var_268_to_fp16 = const()[name = tensor("op_268_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13865088)))]; tensor linear_10_cast_fp16 = linear(bias = var_268_to_fp16, weight = var_267_to_fp16, x = var_258_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; tensor x_29_cast_fp16 = gelu(mode = x_29_mode_0, x = linear_10_cast_fp16)[name = tensor("x_29_cast_fp16")]; tensor var_273_to_fp16 = const()[name = tensor("op_273_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13869248)))]; tensor var_274_to_fp16 = const()[name = tensor("op_274_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15966464)))]; tensor linear_11_cast_fp16 = linear(bias = var_274_to_fp16, weight = var_273_to_fp16, x = x_29_cast_fp16)[name = tensor("linear_11_cast_fp16")]; tensor x_31_cast_fp16 = add(x = x_25_cast_fp16, y = linear_11_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor var_284 = const()[name = tensor("op_284"), val = tensor(-1)]; tensor var_300_axes_0 = const()[name = tensor("op_300_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15967552)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15968640)))]; tensor var_290_to_fp16 = const()[name = tensor("op_290_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_300_cast_fp16 = layer_norm(axes = var_300_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_290_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast_fp16)[name = tensor("op_300_cast_fp16")]; tensor var_311_to_fp16 = const()[name = tensor("op_311_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15969728)))]; tensor var_312_to_fp16 = const()[name = tensor("op_312_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16494080)))]; tensor linear_12_cast_fp16 = linear(bias = var_312_to_fp16, weight = var_311_to_fp16, x = var_300_cast_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_315_to_fp16 = const()[name = tensor("op_315_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16495168)))]; tensor linear_13_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_315_to_fp16, x = var_300_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor var_319_to_fp16 = const()[name = tensor("op_319_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17019520)))]; tensor var_320_to_fp16 = const()[name = tensor("op_320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17543872)))]; tensor linear_14_cast_fp16 = linear(bias = var_320_to_fp16, weight = var_319_to_fp16, x = var_300_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_328 = const()[name = tensor("op_328"), val = tensor([1, 1500, 8, -1])]; tensor var_329_cast_fp16 = reshape(shape = var_328, x = linear_12_cast_fp16)[name = tensor("op_329_cast_fp16")]; tensor const_46_to_fp16 = const()[name = tensor("const_46_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast_fp16 = mul(x = var_329_cast_fp16, y = const_46_to_fp16)[name = tensor("q_11_cast_fp16")]; tensor var_335 = const()[name = tensor("op_335"), val = tensor([1, 1500, 8, -1])]; tensor var_336_cast_fp16 = reshape(shape = var_335, x = linear_13_cast_fp16)[name = tensor("op_336_cast_fp16")]; tensor const_47_to_fp16 = const()[name = tensor("const_47_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast_fp16 = mul(x = var_336_cast_fp16, y = const_47_to_fp16)[name = tensor("k_11_cast_fp16")]; tensor var_342 = const()[name = tensor("op_342"), val = tensor([1, 1500, 8, -1])]; tensor var_343_cast_fp16 = reshape(shape = var_342, x = linear_14_cast_fp16)[name = tensor("op_343_cast_fp16")]; tensor var_344 = const()[name = tensor("op_344"), val = tensor([0, 2, 1, 3])]; tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; tensor transpose_28_perm_0 = const()[name = tensor("transpose_28_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_29_perm_0 = const()[name = tensor("transpose_29_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_49 = transpose(perm = transpose_29_perm_0, x = k_11_cast_fp16)[name = tensor("transpose_49")]; tensor transpose_50 = transpose(perm = transpose_28_perm_0, x = q_11_cast_fp16)[name = tensor("transpose_50")]; tensor qk_5_cast_fp16 = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_50, y = transpose_49)[name = tensor("qk_5_cast_fp16")]; tensor var_348_cast_fp16 = softmax(axis = var_284, x = qk_5_cast_fp16)[name = tensor("op_348_cast_fp16")]; tensor var_350_transpose_x_0 = const()[name = tensor("op_350_transpose_x_0"), val = tensor(false)]; tensor var_350_transpose_y_0 = const()[name = tensor("op_350_transpose_y_0"), val = tensor(false)]; tensor transpose_51 = transpose(perm = var_344, x = var_343_cast_fp16)[name = tensor("transpose_51")]; tensor var_350_cast_fp16 = matmul(transpose_x = var_350_transpose_x_0, transpose_y = var_350_transpose_y_0, x = var_348_cast_fp16, y = transpose_51)[name = tensor("op_350_cast_fp16")]; tensor var_351 = const()[name = tensor("op_351"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 512])]; tensor transpose_48 = transpose(perm = var_351, x = var_350_cast_fp16)[name = tensor("transpose_48")]; tensor x_35_cast_fp16 = reshape(shape = concat_2, x = transpose_48)[name = tensor("x_35_cast_fp16")]; tensor var_356_to_fp16 = const()[name = tensor("op_356_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17544960)))]; tensor var_357_to_fp16 = const()[name = tensor("op_357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18069312)))]; tensor linear_15_cast_fp16 = linear(bias = var_357_to_fp16, weight = var_356_to_fp16, x = x_35_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor x_37_cast_fp16 = add(x = x_31_cast_fp16, y = linear_15_cast_fp16)[name = tensor("x_37_cast_fp16")]; tensor var_364_axes_0 = const()[name = tensor("op_364_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18070400)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18071488)))]; tensor var_364_cast_fp16 = layer_norm(axes = var_364_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_290_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast_fp16)[name = tensor("op_364_cast_fp16")]; tensor var_373_to_fp16 = const()[name = tensor("op_373_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18072576)))]; tensor var_374_to_fp16 = const()[name = tensor("op_374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20169792)))]; tensor linear_16_cast_fp16 = linear(bias = var_374_to_fp16, weight = var_373_to_fp16, x = var_364_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; tensor x_41_cast_fp16 = gelu(mode = x_41_mode_0, x = linear_16_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor var_379_to_fp16 = const()[name = tensor("op_379_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20173952)))]; tensor var_380_to_fp16 = const()[name = tensor("op_380_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22271168)))]; tensor linear_17_cast_fp16 = linear(bias = var_380_to_fp16, weight = var_379_to_fp16, x = x_41_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor x_43_cast_fp16 = add(x = x_37_cast_fp16, y = linear_17_cast_fp16)[name = tensor("x_43_cast_fp16")]; tensor var_390 = const()[name = tensor("op_390"), val = tensor(-1)]; tensor var_406_axes_0 = const()[name = tensor("op_406_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22272256)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22273344)))]; tensor var_396_to_fp16 = const()[name = tensor("op_396_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_406_cast_fp16 = layer_norm(axes = var_406_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_396_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast_fp16)[name = tensor("op_406_cast_fp16")]; tensor var_417_to_fp16 = const()[name = tensor("op_417_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22274432)))]; tensor var_418_to_fp16 = const()[name = tensor("op_418_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22798784)))]; tensor linear_18_cast_fp16 = linear(bias = var_418_to_fp16, weight = var_417_to_fp16, x = var_406_cast_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_421_to_fp16 = const()[name = tensor("op_421_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22799872)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_421_to_fp16, x = var_406_cast_fp16)[name = tensor("linear_19_cast_fp16")]; tensor var_425_to_fp16 = const()[name = tensor("op_425_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23324224)))]; tensor var_426_to_fp16 = const()[name = tensor("op_426_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23848576)))]; tensor linear_20_cast_fp16 = linear(bias = var_426_to_fp16, weight = var_425_to_fp16, x = var_406_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor var_434 = const()[name = tensor("op_434"), val = tensor([1, 1500, 8, -1])]; tensor var_435_cast_fp16 = reshape(shape = var_434, x = linear_18_cast_fp16)[name = tensor("op_435_cast_fp16")]; tensor const_48_to_fp16 = const()[name = tensor("const_48_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast_fp16 = mul(x = var_435_cast_fp16, y = const_48_to_fp16)[name = tensor("q_15_cast_fp16")]; tensor var_441 = const()[name = tensor("op_441"), val = tensor([1, 1500, 8, -1])]; tensor var_442_cast_fp16 = reshape(shape = var_441, x = linear_19_cast_fp16)[name = tensor("op_442_cast_fp16")]; tensor const_49_to_fp16 = const()[name = tensor("const_49_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast_fp16 = mul(x = var_442_cast_fp16, y = const_49_to_fp16)[name = tensor("k_15_cast_fp16")]; tensor var_448 = const()[name = tensor("op_448"), val = tensor([1, 1500, 8, -1])]; tensor var_449_cast_fp16 = reshape(shape = var_448, x = linear_20_cast_fp16)[name = tensor("op_449_cast_fp16")]; tensor var_450 = const()[name = tensor("op_450"), val = tensor([0, 2, 1, 3])]; tensor qk_7_transpose_x_0 = const()[name = tensor("qk_7_transpose_x_0"), val = tensor(false)]; tensor qk_7_transpose_y_0 = const()[name = tensor("qk_7_transpose_y_0"), val = tensor(false)]; tensor transpose_30_perm_0 = const()[name = tensor("transpose_30_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_31_perm_0 = const()[name = tensor("transpose_31_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_45 = transpose(perm = transpose_31_perm_0, x = k_15_cast_fp16)[name = tensor("transpose_45")]; tensor transpose_46 = transpose(perm = transpose_30_perm_0, x = q_15_cast_fp16)[name = tensor("transpose_46")]; tensor qk_7_cast_fp16 = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_46, y = transpose_45)[name = tensor("qk_7_cast_fp16")]; tensor var_454_cast_fp16 = softmax(axis = var_390, x = qk_7_cast_fp16)[name = tensor("op_454_cast_fp16")]; tensor var_456_transpose_x_0 = const()[name = tensor("op_456_transpose_x_0"), val = tensor(false)]; tensor var_456_transpose_y_0 = const()[name = tensor("op_456_transpose_y_0"), val = tensor(false)]; tensor transpose_47 = transpose(perm = var_450, x = var_449_cast_fp16)[name = tensor("transpose_47")]; tensor var_456_cast_fp16 = matmul(transpose_x = var_456_transpose_x_0, transpose_y = var_456_transpose_y_0, x = var_454_cast_fp16, y = transpose_47)[name = tensor("op_456_cast_fp16")]; tensor var_457 = const()[name = tensor("op_457"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 512])]; tensor transpose_44 = transpose(perm = var_457, x = var_456_cast_fp16)[name = tensor("transpose_44")]; tensor x_47_cast_fp16 = reshape(shape = concat_3, x = transpose_44)[name = tensor("x_47_cast_fp16")]; tensor var_462_to_fp16 = const()[name = tensor("op_462_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23849664)))]; tensor var_463_to_fp16 = const()[name = tensor("op_463_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24374016)))]; tensor linear_21_cast_fp16 = linear(bias = var_463_to_fp16, weight = var_462_to_fp16, x = x_47_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor x_49_cast_fp16 = add(x = x_43_cast_fp16, y = linear_21_cast_fp16)[name = tensor("x_49_cast_fp16")]; tensor var_470_axes_0 = const()[name = tensor("op_470_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24375104)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24376192)))]; tensor var_470_cast_fp16 = layer_norm(axes = var_470_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_396_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast_fp16)[name = tensor("op_470_cast_fp16")]; tensor var_479_to_fp16 = const()[name = tensor("op_479_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24377280)))]; tensor var_480_to_fp16 = const()[name = tensor("op_480_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26474496)))]; tensor linear_22_cast_fp16 = linear(bias = var_480_to_fp16, weight = var_479_to_fp16, x = var_470_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; tensor x_53_cast_fp16 = gelu(mode = x_53_mode_0, x = linear_22_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor var_485_to_fp16 = const()[name = tensor("op_485_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26478656)))]; tensor var_486_to_fp16 = const()[name = tensor("op_486_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28575872)))]; tensor linear_23_cast_fp16 = linear(bias = var_486_to_fp16, weight = var_485_to_fp16, x = x_53_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor x_55_cast_fp16 = add(x = x_49_cast_fp16, y = linear_23_cast_fp16)[name = tensor("x_55_cast_fp16")]; tensor var_496 = const()[name = tensor("op_496"), val = tensor(-1)]; tensor var_512_axes_0 = const()[name = tensor("op_512_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28576960)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28578048)))]; tensor var_502_to_fp16 = const()[name = tensor("op_502_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_512_cast_fp16 = layer_norm(axes = var_512_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_502_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast_fp16)[name = tensor("op_512_cast_fp16")]; tensor var_523_to_fp16 = const()[name = tensor("op_523_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28579136)))]; tensor var_524_to_fp16 = const()[name = tensor("op_524_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29103488)))]; tensor linear_24_cast_fp16 = linear(bias = var_524_to_fp16, weight = var_523_to_fp16, x = var_512_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor var_527_to_fp16 = const()[name = tensor("op_527_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29104576)))]; tensor linear_25_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_527_to_fp16, x = var_512_cast_fp16)[name = tensor("linear_25_cast_fp16")]; tensor var_531_to_fp16 = const()[name = tensor("op_531_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29628928)))]; tensor var_532_to_fp16 = const()[name = tensor("op_532_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30153280)))]; tensor linear_26_cast_fp16 = linear(bias = var_532_to_fp16, weight = var_531_to_fp16, x = var_512_cast_fp16)[name = tensor("linear_26_cast_fp16")]; tensor var_540 = const()[name = tensor("op_540"), val = tensor([1, 1500, 8, -1])]; tensor var_541_cast_fp16 = reshape(shape = var_540, x = linear_24_cast_fp16)[name = tensor("op_541_cast_fp16")]; tensor const_50_to_fp16 = const()[name = tensor("const_50_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast_fp16 = mul(x = var_541_cast_fp16, y = const_50_to_fp16)[name = tensor("q_19_cast_fp16")]; tensor var_547 = const()[name = tensor("op_547"), val = tensor([1, 1500, 8, -1])]; tensor var_548_cast_fp16 = reshape(shape = var_547, x = linear_25_cast_fp16)[name = tensor("op_548_cast_fp16")]; tensor const_51_to_fp16 = const()[name = tensor("const_51_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast_fp16 = mul(x = var_548_cast_fp16, y = const_51_to_fp16)[name = tensor("k_19_cast_fp16")]; tensor var_554 = const()[name = tensor("op_554"), val = tensor([1, 1500, 8, -1])]; tensor var_555_cast_fp16 = reshape(shape = var_554, x = linear_26_cast_fp16)[name = tensor("op_555_cast_fp16")]; tensor var_556 = const()[name = tensor("op_556"), val = tensor([0, 2, 1, 3])]; tensor qk_9_transpose_x_0 = const()[name = tensor("qk_9_transpose_x_0"), val = tensor(false)]; tensor qk_9_transpose_y_0 = const()[name = tensor("qk_9_transpose_y_0"), val = tensor(false)]; tensor transpose_32_perm_0 = const()[name = tensor("transpose_32_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_33_perm_0 = const()[name = tensor("transpose_33_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_41 = transpose(perm = transpose_33_perm_0, x = k_19_cast_fp16)[name = tensor("transpose_41")]; tensor transpose_42 = transpose(perm = transpose_32_perm_0, x = q_19_cast_fp16)[name = tensor("transpose_42")]; tensor qk_9_cast_fp16 = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_42, y = transpose_41)[name = tensor("qk_9_cast_fp16")]; tensor var_560_cast_fp16 = softmax(axis = var_496, x = qk_9_cast_fp16)[name = tensor("op_560_cast_fp16")]; tensor var_562_transpose_x_0 = const()[name = tensor("op_562_transpose_x_0"), val = tensor(false)]; tensor var_562_transpose_y_0 = const()[name = tensor("op_562_transpose_y_0"), val = tensor(false)]; tensor transpose_43 = transpose(perm = var_556, x = var_555_cast_fp16)[name = tensor("transpose_43")]; tensor var_562_cast_fp16 = matmul(transpose_x = var_562_transpose_x_0, transpose_y = var_562_transpose_y_0, x = var_560_cast_fp16, y = transpose_43)[name = tensor("op_562_cast_fp16")]; tensor var_563 = const()[name = tensor("op_563"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 1500, 512])]; tensor transpose_40 = transpose(perm = var_563, x = var_562_cast_fp16)[name = tensor("transpose_40")]; tensor x_59_cast_fp16 = reshape(shape = concat_4, x = transpose_40)[name = tensor("x_59_cast_fp16")]; tensor var_568_to_fp16 = const()[name = tensor("op_568_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30154368)))]; tensor var_569_to_fp16 = const()[name = tensor("op_569_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30678720)))]; tensor linear_27_cast_fp16 = linear(bias = var_569_to_fp16, weight = var_568_to_fp16, x = x_59_cast_fp16)[name = tensor("linear_27_cast_fp16")]; tensor x_61_cast_fp16 = add(x = x_55_cast_fp16, y = linear_27_cast_fp16)[name = tensor("x_61_cast_fp16")]; tensor var_576_axes_0 = const()[name = tensor("op_576_axes_0"), val = tensor([-1])]; tensor blocks_4_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30679808)))]; tensor blocks_4_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30680896)))]; tensor var_576_cast_fp16 = layer_norm(axes = var_576_axes_0, beta = blocks_4_mlp_ln_bias_to_fp16, epsilon = var_502_to_fp16, gamma = blocks_4_mlp_ln_weight_to_fp16, x = x_61_cast_fp16)[name = tensor("op_576_cast_fp16")]; tensor var_585_to_fp16 = const()[name = tensor("op_585_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30681984)))]; tensor var_586_to_fp16 = const()[name = tensor("op_586_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32779200)))]; tensor linear_28_cast_fp16 = linear(bias = var_586_to_fp16, weight = var_585_to_fp16, x = var_576_cast_fp16)[name = tensor("linear_28_cast_fp16")]; tensor x_65_mode_0 = const()[name = tensor("x_65_mode_0"), val = tensor("EXACT")]; tensor x_65_cast_fp16 = gelu(mode = x_65_mode_0, x = linear_28_cast_fp16)[name = tensor("x_65_cast_fp16")]; tensor var_591_to_fp16 = const()[name = tensor("op_591_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32783360)))]; tensor var_592_to_fp16 = const()[name = tensor("op_592_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34880576)))]; tensor linear_29_cast_fp16 = linear(bias = var_592_to_fp16, weight = var_591_to_fp16, x = x_65_cast_fp16)[name = tensor("linear_29_cast_fp16")]; tensor x_67_cast_fp16 = add(x = x_61_cast_fp16, y = linear_29_cast_fp16)[name = tensor("x_67_cast_fp16")]; tensor var_602 = const()[name = tensor("op_602"), val = tensor(-1)]; tensor var_618_axes_0 = const()[name = tensor("op_618_axes_0"), val = tensor([-1])]; tensor blocks_5_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_5_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34881664)))]; tensor blocks_5_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_5_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34882752)))]; tensor var_608_to_fp16 = const()[name = tensor("op_608_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_618_cast_fp16 = layer_norm(axes = var_618_axes_0, beta = blocks_5_attn_ln_bias_to_fp16, epsilon = var_608_to_fp16, gamma = blocks_5_attn_ln_weight_to_fp16, x = x_67_cast_fp16)[name = tensor("op_618_cast_fp16")]; tensor var_629_to_fp16 = const()[name = tensor("op_629_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34883840)))]; tensor var_630_to_fp16 = const()[name = tensor("op_630_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35408192)))]; tensor linear_30_cast_fp16 = linear(bias = var_630_to_fp16, weight = var_629_to_fp16, x = var_618_cast_fp16)[name = tensor("linear_30_cast_fp16")]; tensor var_633_to_fp16 = const()[name = tensor("op_633_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35409280)))]; tensor linear_31_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_633_to_fp16, x = var_618_cast_fp16)[name = tensor("linear_31_cast_fp16")]; tensor var_637_to_fp16 = const()[name = tensor("op_637_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35933632)))]; tensor var_638_to_fp16 = const()[name = tensor("op_638_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36457984)))]; tensor linear_32_cast_fp16 = linear(bias = var_638_to_fp16, weight = var_637_to_fp16, x = var_618_cast_fp16)[name = tensor("linear_32_cast_fp16")]; tensor var_646 = const()[name = tensor("op_646"), val = tensor([1, 1500, 8, -1])]; tensor var_647_cast_fp16 = reshape(shape = var_646, x = linear_30_cast_fp16)[name = tensor("op_647_cast_fp16")]; tensor const_52_to_fp16 = const()[name = tensor("const_52_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_cast_fp16 = mul(x = var_647_cast_fp16, y = const_52_to_fp16)[name = tensor("q_cast_fp16")]; tensor var_653 = const()[name = tensor("op_653"), val = tensor([1, 1500, 8, -1])]; tensor var_654_cast_fp16 = reshape(shape = var_653, x = linear_31_cast_fp16)[name = tensor("op_654_cast_fp16")]; tensor const_53_to_fp16 = const()[name = tensor("const_53_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_cast_fp16 = mul(x = var_654_cast_fp16, y = const_53_to_fp16)[name = tensor("k_cast_fp16")]; tensor var_660 = const()[name = tensor("op_660"), val = tensor([1, 1500, 8, -1])]; tensor var_661_cast_fp16 = reshape(shape = var_660, x = linear_32_cast_fp16)[name = tensor("op_661_cast_fp16")]; tensor var_662 = const()[name = tensor("op_662"), val = tensor([0, 2, 1, 3])]; tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; tensor transpose_34_perm_0 = const()[name = tensor("transpose_34_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_35_perm_0 = const()[name = tensor("transpose_35_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_37 = transpose(perm = transpose_35_perm_0, x = k_cast_fp16)[name = tensor("transpose_37")]; tensor transpose_38 = transpose(perm = transpose_34_perm_0, x = q_cast_fp16)[name = tensor("transpose_38")]; tensor qk_cast_fp16 = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_38, y = transpose_37)[name = tensor("qk_cast_fp16")]; tensor var_666_cast_fp16 = softmax(axis = var_602, x = qk_cast_fp16)[name = tensor("op_666_cast_fp16")]; tensor var_668_transpose_x_0 = const()[name = tensor("op_668_transpose_x_0"), val = tensor(false)]; tensor var_668_transpose_y_0 = const()[name = tensor("op_668_transpose_y_0"), val = tensor(false)]; tensor transpose_39 = transpose(perm = var_662, x = var_661_cast_fp16)[name = tensor("transpose_39")]; tensor var_668_cast_fp16 = matmul(transpose_x = var_668_transpose_x_0, transpose_y = var_668_transpose_y_0, x = var_666_cast_fp16, y = transpose_39)[name = tensor("op_668_cast_fp16")]; tensor var_669 = const()[name = tensor("op_669"), val = tensor([0, 2, 1, 3])]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([1, 1500, 512])]; tensor transpose_36 = transpose(perm = var_669, x = var_668_cast_fp16)[name = tensor("transpose_36")]; tensor x_71_cast_fp16 = reshape(shape = concat_5, x = transpose_36)[name = tensor("x_71_cast_fp16")]; tensor var_674_to_fp16 = const()[name = tensor("op_674_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36459072)))]; tensor var_675_to_fp16 = const()[name = tensor("op_675_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36983424)))]; tensor linear_33_cast_fp16 = linear(bias = var_675_to_fp16, weight = var_674_to_fp16, x = x_71_cast_fp16)[name = tensor("linear_33_cast_fp16")]; tensor x_73_cast_fp16 = add(x = x_67_cast_fp16, y = linear_33_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor var_682_axes_0 = const()[name = tensor("op_682_axes_0"), val = tensor([-1])]; tensor blocks_5_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36984512)))]; tensor blocks_5_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36985600)))]; tensor var_682_cast_fp16 = layer_norm(axes = var_682_axes_0, beta = blocks_5_mlp_ln_bias_to_fp16, epsilon = var_608_to_fp16, gamma = blocks_5_mlp_ln_weight_to_fp16, x = x_73_cast_fp16)[name = tensor("op_682_cast_fp16")]; tensor var_691_to_fp16 = const()[name = tensor("op_691_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36986688)))]; tensor var_692_to_fp16 = const()[name = tensor("op_692_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39083904)))]; tensor linear_34_cast_fp16 = linear(bias = var_692_to_fp16, weight = var_691_to_fp16, x = var_682_cast_fp16)[name = tensor("linear_34_cast_fp16")]; tensor x_77_mode_0 = const()[name = tensor("x_77_mode_0"), val = tensor("EXACT")]; tensor x_77_cast_fp16 = gelu(mode = x_77_mode_0, x = linear_34_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor var_697_to_fp16 = const()[name = tensor("op_697_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39088064)))]; tensor var_698_to_fp16 = const()[name = tensor("op_698_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41185280)))]; tensor linear_35_cast_fp16 = linear(bias = var_698_to_fp16, weight = var_697_to_fp16, x = x_77_cast_fp16)[name = tensor("linear_35_cast_fp16")]; tensor x_cast_fp16 = add(x = x_73_cast_fp16, y = linear_35_cast_fp16)[name = tensor("x_cast_fp16")]; tensor var_711_axes_0 = const()[name = tensor("op_711_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41186368)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41187456)))]; tensor var_702_to_fp16 = const()[name = tensor("op_702_to_fp16"), val = tensor(0x1.5p-17)]; tensor output = layer_norm(axes = var_711_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_702_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast_fp16)[name = tensor("op_711_cast_fp16")]; } -> (output); }