/model/model/Shape:Shape*input:input_5F_ids(1,0)*output:_2F_model_2F_model_2F_Shape_5F_output_5F_0(2) /model/model/Gather:Gather*input:_2F_model_2F_model_2F_Shape_5F_output_5F_0(2);_2F_model_2F_model_2F_Constant_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_Gather_5F_output_5F_0()*axis:0 /model/model/Shape_1:Shape*input:pkv0(1,8,0,128)*output:_2F_model_2F_model_2F_Shape_5F_1_5F_output_5F_0(4) /model/model/Gather_1:Gather*input:_2F_model_2F_model_2F_Shape_5F_1_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_Gather_5F_1_5F_output_5F_0()*axis:0 /model/model/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_Gather_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1) /model/model/Concat:Concat*input:_2F_model_2F_model_2F_Constant_5F_2_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1)*output:_2F_model_2F_model_2F_Concat_5F_output_5F_0(2)*axis:0 /model/model/Reshape:Reshape*input:position_5F_ids(1,0);_2F_model_2F_model_2F_Concat_5F_output_5F_0(2)*output:_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*allowzero:0 /model/model/embed_tokens/Gather:Gather*input:model_2E_model_2E_embed_5F_tokens_2E_weight.bin(float16:32000,4096);input_5F_ids(1,0)*output:_2F_model_2F_model_2F_embed_5F_tokens_2F_Gather_5F_output_5F_0(1,0,4096) /model/model/Add:Add*input:_2F_model_2F_model_2F_Gather_5F_output_5F_0();_2F_model_2F_model_2F_Gather_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_Add_5F_output_5F_0() /model/model/Sub:Sub*input:_2F_model_2F_model_2F_Add_5F_output_5F_0();_2F_model_2F_model_2F_Gather_5F_output_5F_0()*output:_2F_model_2F_model_2F_Sub_5F_output_5F_0() /model/model/Concat_1:Concat*input:_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1);_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1)*output:_2F_model_2F_model_2F_Concat_5F_1_5F_output_5F_0(2)*axis:0 /model/model/ConstantOfShape:ConstantOfShape*input:_2F_model_2F_model_2F_Concat_5F_1_5F_output_5F_0(2)*output:_2F_model_2F_model_2F_ConstantOfShape_5F_output_5F_0(0,0)*value:-3.4028234663852886e+38 /model/model/Shape_3:Shape*input:_2F_model_2F_model_2F_ConstantOfShape_5F_output_5F_0(0,0)*output:_2F_model_2F_model_2F_Shape_5F_3_5F_output_5F_0(2) /model/model/Slice:Slice*input:_2F_model_2F_model_2F_Shape_5F_3_5F_output_5F_0(2);_2F_model_2F_model_2F_Constant_5F_2_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_Slice_5F_output_5F_0(1) /model/model/Squeeze:Squeeze*input:_2F_model_2F_model_2F_Slice_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_Squeeze_5F_output_5F_0() /model/model/Range:Range*input:_2F_model_2F_model_2F_Constant_5F_8_5F_output_5F_0.bin(int64:);_2F_model_2F_model_2F_Squeeze_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_Range_5F_output_5F_0(0) /model/model/Add_1:Add*input:_2F_model_2F_model_2F_Range_5F_output_5F_0(0);_2F_model_2F_model_2F_Constant_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_Add_5F_1_5F_output_5F_0(0) /model/model/Reshape_1:Reshape*input:_2F_model_2F_model_2F_Add_5F_1_5F_output_5F_0(0);14831.bin(int64:2)*output:_2F_model_2F_model_2F_Reshape_5F_1_5F_output_5F_0(0,1)*allowzero:0 /model/model/Less:Less*input:_2F_model_2F_model_2F_Range_5F_output_5F_0(0);_2F_model_2F_model_2F_Reshape_5F_1_5F_output_5F_0(0,1)*output:_2F_model_2F_model_2F_Less_5F_output_5F_0(0,0) /model/model/Where:Where*input:_2F_model_2F_model_2F_Less_5F_output_5F_0(0,0);_2F_model_2F_model_2F_Constant_5F_16_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_ConstantOfShape_5F_output_5F_0(0,0)*output:_2F_model_2F_model_2F_Where_5F_output_5F_0(0,0) /model/model/Unsqueeze_5:Unsqueeze*input:_2F_model_2F_model_2F_Sub_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_Unsqueeze_5F_5_5F_output_5F_0(1) /model/model/Concat_3:Concat*input:_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1);_2F_model_2F_model_2F_Unsqueeze_5F_5_5F_output_5F_0(1)*output:_2F_model_2F_model_2F_Concat_5F_3_5F_output_5F_0(2)*axis:0 /model/model/ConstantOfShape_1:ConstantOfShape*input:_2F_model_2F_model_2F_Concat_5F_3_5F_output_5F_0(2)*output:_2F_model_2F_model_2F_ConstantOfShape_5F_1_5F_output_5F_0(0,0)*value:0.0 /model/model/Concat_4:Concat*input:_2F_model_2F_model_2F_ConstantOfShape_5F_1_5F_output_5F_0(0,0);_2F_model_2F_model_2F_Where_5F_output_5F_0(0,0)*output:_2F_model_2F_model_2F_Concat_5F_4_5F_output_5F_0(0,0)*axis:-1 /model/model/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_Concat_5F_4_5F_output_5F_0(0,0);4708.bin(int64:2)*output:_2F_model_2F_model_2F_Unsqueeze_5F_7_5F_output_5F_0(1,1,0,0) /model/model/Add_2:Add*input:_2F_model_2F_model_2F_Gather_5F_output_5F_0();_2F_model_2F_model_2F_Sub_5F_output_5F_0()*output:_2F_model_2F_model_2F_Add_5F_2_5F_output_5F_0() /model/model/Unsqueeze_10:Unsqueeze*input:_2F_model_2F_model_2F_Add_5F_2_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_Unsqueeze_5F_10_5F_output_5F_0(1) /model/model/Concat_5:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1);_2F_model_2F_model_2F_Unsqueeze_5F_10_5F_output_5F_0(1)*output:_2F_model_2F_model_2F_Concat_5F_5_5F_output_5F_0(4)*axis:0 /model/model/Equal:Equal*input:_2F_model_2F_model_2F_Concat_5F_5_5F_output_5F_0(4);_2F_model_2F_model_2F_Mul_5F_output_5F_0.bin(int64:4)*output:_2F_model_2F_model_2F_Equal_5F_output_5F_0(4) /model/model/Where_1:Where*input:_2F_model_2F_model_2F_Equal_5F_output_5F_0(4);_2F_model_2F_model_2F_ConstantOfShape_5F_2_5F_output_5F_0.bin(int64:4);_2F_model_2F_model_2F_Concat_5F_5_5F_output_5F_0(4)*output:_2F_model_2F_model_2F_Where_5F_1_5F_output_5F_0(4) /model/model/Expand:Expand*input:_2F_model_2F_model_2F_Unsqueeze_5F_7_5F_output_5F_0(1,1,0,0);_2F_model_2F_model_2F_Where_5F_1_5F_output_5F_0(4)*output:_2F_model_2F_model_2F_Expand_5F_output_5F_0(0,0,0,0) /model/model/Shape_6:Shape*input:attention_5F_mask(1,0)*output:_2F_model_2F_model_2F_Shape_5F_6_5F_output_5F_0(2) /model/model/Gather_3:Gather*input:_2F_model_2F_model_2F_Shape_5F_6_5F_output_5F_0(2);_2F_model_2F_model_2F_Constant_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/Unsqueeze_12:Unsqueeze*input:attention_5F_mask(1,0);14833.bin(int64:2)*output:_2F_model_2F_model_2F_Unsqueeze_5F_12_5F_output_5F_0(1,1,1,0) /model/model/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_Gather_5F_3_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/Concat_6:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Unsqueeze_5F_output_5F_0(1);_2F_model_2F_model_2F_Unsqueeze_5F_15_5F_output_5F_0(1)*output:_2F_model_2F_model_2F_Concat_5F_6_5F_output_5F_0(4)*axis:0 /model/model/Equal_1:Equal*input:_2F_model_2F_model_2F_Concat_5F_6_5F_output_5F_0(4);_2F_model_2F_model_2F_Mul_5F_output_5F_0.bin(int64:4)*output:_2F_model_2F_model_2F_Equal_5F_1_5F_output_5F_0(4) /model/model/Where_2:Where*input:_2F_model_2F_model_2F_Equal_5F_1_5F_output_5F_0(4);_2F_model_2F_model_2F_ConstantOfShape_5F_2_5F_output_5F_0.bin(int64:4);_2F_model_2F_model_2F_Concat_5F_6_5F_output_5F_0(4)*output:_2F_model_2F_model_2F_Where_5F_2_5F_output_5F_0(4) /model/model/Expand_1:Expand*input:_2F_model_2F_model_2F_Unsqueeze_5F_12_5F_output_5F_0(1,1,1,0);_2F_model_2F_model_2F_Where_5F_2_5F_output_5F_0(4)*output:_2F_model_2F_model_2F_Expand_5F_1_5F_output_5F_0(0,0,0,0) /model/model/Cast_4:Cast*input:_2F_model_2F_model_2F_Expand_5F_1_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_Cast_5F_4_5F_output_5F_0(0,0,0,0)*to:1 /model/model/Sub_1:Sub*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_Cast_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_Sub_5F_1_5F_output_5F_0(0,0,0,0) /model/model/Cast_5:Cast*input:_2F_model_2F_model_2F_Sub_5F_1_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_Cast_5F_5_5F_output_5F_0(0,0,0,0)*to:9 /model/model/Where_3:Where*input:_2F_model_2F_model_2F_Cast_5F_5_5F_output_5F_0(0,0,0,0);_2F_model_2F_model_2F_Constant_5F_35_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_Sub_5F_1_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_Where_5F_3_5F_output_5F_0(0,0,0,0) /model/model/Cast_8:Cast*input:_2F_model_2F_model_2F_Where_5F_3_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_Cast_5F_8_5F_output_5F_0(0,0,0,0)*to:9 /model/model/Where_4:Where*input:_2F_model_2F_model_2F_Cast_5F_8_5F_output_5F_0(0,0,0,0);_2F_model_2F_model_2F_Constant_5F_35_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_Expand_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0) /model/model/layers.0/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_embed_5F_tokens_2F_Gather_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.0/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.0/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.0/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.0/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.0/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_embed_5F_tokens_2F_Gather_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.0/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_0_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.0/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9693.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.0/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9694.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.0/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9695.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.0/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.0/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.0/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.0/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.0/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.0/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.0/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.0/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.0/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Gather_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.0/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.0/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.0/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.0/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.0/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.0/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.0/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.0/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.0/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.0/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.0/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.0/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.0/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.0/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.0/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.0/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.0/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.0/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.0/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.0/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.0/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.0/self_attn/Concat_5:Concat*input:pkv0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv0(1,8,0,128)*axis:-2 /model/model/layers.0/self_attn/Concat_6:Concat*input:pkv1(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv1(1,8,0,128)*axis:-2 /model/model/layers.0/self_attn/Shape_7:Shape*input:opkv0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Shape_5F_7_5F_output_5F_0(4) /model/model/layers.0/self_attn/Gather_9:Gather*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Shape_5F_7_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_9_5F_output_5F_0()*axis:0 /model/model/layers.0/self_attn/Unsqueeze_12:Unsqueeze*input:opkv0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.0/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_9_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.0/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.0/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.0/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.0/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.0/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.0/self_attn/Shape_12:Shape*input:opkv1(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Shape_5F_12_5F_output_5F_0(4) /model/model/layers.0/self_attn/Gather_13:Gather*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Shape_5F_12_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_13_5F_output_5F_0()*axis:0 /model/model/layers.0/self_attn/Unsqueeze_21:Unsqueeze*input:opkv1(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.0/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Gather_5F_13_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.0/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.0/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.0/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.0/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.0/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.0/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.0/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.0/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.0/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.0/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.0/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.0/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.0/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.0/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9723.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.0/Add:Add*input:_2F_model_2F_model_2F_embed_5F_tokens_2F_Gather_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.0/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.0/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.0/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.0/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.0/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.0/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.0/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_0_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.0/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9724.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.0/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.0/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.0/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9725.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.0/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.0/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9726.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.0/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.1/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.1/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.1/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.1/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.1/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.1/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.1/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_1_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.1/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9727.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.1/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9728.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.1/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9729.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.1/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.1/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.1/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.1/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.1/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.1/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.1/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.1/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.1/self_attn/Shape_3:Shape*input:pkv2(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.1/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.1/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.1/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.1/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.1/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.1/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.1/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.1/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.1/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.1/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.1/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.1/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.1/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.1/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.1/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.1/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.1/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.1/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.1/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.1/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.1/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.1/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.1/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.1/self_attn/Concat_5:Concat*input:pkv2(1,8,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv2(1,8,0,128)*axis:-2 /model/model/layers.1/self_attn/Concat_6:Concat*input:pkv3(1,8,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv3(1,8,0,128)*axis:-2 /model/model/layers.1/self_attn/Shape_8:Shape*input:opkv2(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.1/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.1/self_attn/Unsqueeze_12:Unsqueeze*input:opkv2(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.1/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.1/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.1/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.1/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.1/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.1/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.1/self_attn/Shape_13:Shape*input:opkv3(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.1/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.1/self_attn/Unsqueeze_21:Unsqueeze*input:opkv3(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.1/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.1/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.1/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.1/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.1/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.1/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.1/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.1/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.1/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.1/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.1/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.1/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.1/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.1/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.1/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9757.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.1/Add:Add*input:_2F_model_2F_model_2F_layers_2E_0_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_1_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.1/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.1/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.1/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.1/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.1/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.1/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.1/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_1_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.1/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9758.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.1/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.1/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.1/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9759.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.1/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.1/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9760.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.1/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_1_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.2/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.2/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.2/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.2/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.2/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.2/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.2/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_2_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.2/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9761.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.2/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9762.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.2/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9763.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.2/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.2/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.2/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.2/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.2/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.2/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.2/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.2/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.2/self_attn/Shape_3:Shape*input:pkv4(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.2/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.2/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.2/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.2/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.2/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.2/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.2/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.2/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.2/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.2/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.2/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.2/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.2/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.2/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.2/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.2/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.2/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.2/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.2/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.2/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.2/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.2/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.2/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.2/self_attn/Concat_5:Concat*input:pkv4(1,8,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv4(1,8,0,128)*axis:-2 /model/model/layers.2/self_attn/Concat_6:Concat*input:pkv5(1,8,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv5(1,8,0,128)*axis:-2 /model/model/layers.2/self_attn/Shape_8:Shape*input:opkv4(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.2/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.2/self_attn/Unsqueeze_12:Unsqueeze*input:opkv4(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.2/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.2/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.2/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.2/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.2/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.2/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.2/self_attn/Shape_13:Shape*input:opkv5(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.2/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.2/self_attn/Unsqueeze_21:Unsqueeze*input:opkv5(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.2/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.2/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.2/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.2/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.2/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.2/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.2/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.2/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.2/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.2/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.2/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.2/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.2/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.2/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.2/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9791.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.2/Add:Add*input:_2F_model_2F_model_2F_layers_2E_1_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_2_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.2/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.2/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.2/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.2/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.2/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.2/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.2/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_2_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.2/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9792.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.2/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.2/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.2/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9793.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.2/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.2/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9794.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.2/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_2_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.3/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.3/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.3/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.3/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.3/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.3/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.3/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_3_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.3/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9795.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.3/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9796.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.3/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9797.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.3/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.3/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.3/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.3/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.3/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.3/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.3/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.3/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.3/self_attn/Shape_3:Shape*input:pkv6(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.3/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.3/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.3/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.3/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.3/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.3/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.3/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.3/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.3/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.3/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.3/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.3/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.3/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.3/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.3/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.3/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.3/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.3/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.3/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.3/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.3/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.3/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.3/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.3/self_attn/Concat_5:Concat*input:pkv6(1,8,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv6(1,8,0,128)*axis:-2 /model/model/layers.3/self_attn/Concat_6:Concat*input:pkv7(1,8,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv7(1,8,0,128)*axis:-2 /model/model/layers.3/self_attn/Shape_8:Shape*input:opkv6(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.3/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.3/self_attn/Unsqueeze_12:Unsqueeze*input:opkv6(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.3/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.3/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.3/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.3/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.3/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.3/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.3/self_attn/Shape_13:Shape*input:opkv7(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.3/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.3/self_attn/Unsqueeze_21:Unsqueeze*input:opkv7(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.3/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.3/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.3/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.3/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.3/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.3/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.3/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.3/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.3/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.3/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.3/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.3/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.3/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.3/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.3/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9825.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.3/Add:Add*input:_2F_model_2F_model_2F_layers_2E_2_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_3_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.3/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.3/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.3/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.3/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.3/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.3/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.3/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_3_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.3/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9826.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.3/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.3/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.3/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9827.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.3/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.3/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9828.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.3/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_3_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.4/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.4/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.4/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.4/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.4/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.4/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.4/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_4_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.4/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9829.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.4/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9830.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.4/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9831.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.4/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.4/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.4/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.4/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.4/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.4/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.4/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.4/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.4/self_attn/Shape_3:Shape*input:pkv8(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.4/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.4/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.4/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.4/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.4/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.4/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.4/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.4/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.4/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.4/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.4/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.4/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.4/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.4/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.4/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.4/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.4/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.4/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.4/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.4/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.4/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.4/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.4/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.4/self_attn/Concat_5:Concat*input:pkv8(1,8,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv8(1,8,0,128)*axis:-2 /model/model/layers.4/self_attn/Concat_6:Concat*input:pkv9(1,8,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv9(1,8,0,128)*axis:-2 /model/model/layers.4/self_attn/Shape_8:Shape*input:opkv8(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.4/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.4/self_attn/Unsqueeze_12:Unsqueeze*input:opkv8(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.4/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.4/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.4/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.4/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.4/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.4/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.4/self_attn/Shape_13:Shape*input:opkv9(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.4/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.4/self_attn/Unsqueeze_21:Unsqueeze*input:opkv9(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.4/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.4/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.4/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.4/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.4/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.4/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.4/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.4/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.4/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.4/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.4/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.4/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.4/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.4/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.4/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9859.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.4/Add:Add*input:_2F_model_2F_model_2F_layers_2E_3_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_4_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.4/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.4/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.4/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.4/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.4/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.4/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.4/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_4_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.4/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9860.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.4/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.4/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.4/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9861.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.4/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.4/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9862.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.4/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_4_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.5/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.5/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.5/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.5/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.5/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.5/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.5/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_5_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.5/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9863.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.5/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9864.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.5/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9865.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.5/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.5/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.5/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.5/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.5/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.5/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.5/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.5/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.5/self_attn/Shape_3:Shape*input:pkv10(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.5/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.5/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.5/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.5/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.5/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.5/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.5/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.5/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.5/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.5/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.5/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.5/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.5/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.5/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.5/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.5/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.5/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.5/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.5/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.5/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.5/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.5/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.5/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.5/self_attn/Concat_5:Concat*input:pkv10(1,8,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv10(1,8,0,128)*axis:-2 /model/model/layers.5/self_attn/Concat_6:Concat*input:pkv11(1,8,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv11(1,8,0,128)*axis:-2 /model/model/layers.5/self_attn/Shape_8:Shape*input:opkv10(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.5/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.5/self_attn/Unsqueeze_12:Unsqueeze*input:opkv10(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.5/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.5/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.5/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.5/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.5/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.5/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.5/self_attn/Shape_13:Shape*input:opkv11(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.5/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.5/self_attn/Unsqueeze_21:Unsqueeze*input:opkv11(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.5/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.5/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.5/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.5/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.5/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.5/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.5/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.5/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.5/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.5/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.5/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.5/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.5/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.5/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.5/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9893.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.5/Add:Add*input:_2F_model_2F_model_2F_layers_2E_4_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_5_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.5/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.5/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.5/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.5/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.5/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.5/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.5/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_5_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.5/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9894.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.5/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.5/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.5/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9895.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.5/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.5/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9896.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.5/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_5_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.6/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.6/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.6/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.6/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.6/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.6/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.6/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_6_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.6/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9897.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.6/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9898.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.6/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9899.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.6/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.6/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.6/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.6/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.6/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.6/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.6/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.6/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.6/self_attn/Shape_3:Shape*input:pkv12(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.6/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.6/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.6/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.6/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.6/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.6/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.6/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.6/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.6/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.6/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.6/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.6/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.6/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.6/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.6/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.6/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.6/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.6/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.6/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.6/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.6/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.6/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.6/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.6/self_attn/Concat_5:Concat*input:pkv12(1,8,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv12(1,8,0,128)*axis:-2 /model/model/layers.6/self_attn/Concat_6:Concat*input:pkv13(1,8,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv13(1,8,0,128)*axis:-2 /model/model/layers.6/self_attn/Shape_8:Shape*input:opkv12(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.6/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.6/self_attn/Unsqueeze_12:Unsqueeze*input:opkv12(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.6/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.6/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.6/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.6/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.6/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.6/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.6/self_attn/Shape_13:Shape*input:opkv13(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.6/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.6/self_attn/Unsqueeze_21:Unsqueeze*input:opkv13(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.6/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.6/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.6/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.6/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.6/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.6/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.6/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.6/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.6/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.6/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.6/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.6/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.6/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.6/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.6/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9927.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.6/Add:Add*input:_2F_model_2F_model_2F_layers_2E_5_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_6_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.6/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.6/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.6/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.6/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.6/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.6/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.6/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_6_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.6/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9928.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.6/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.6/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.6/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9929.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.6/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.6/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9930.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.6/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_6_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.7/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.7/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.7/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.7/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.7/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.7/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.7/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_7_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.7/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9931.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.7/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9932.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.7/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9933.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.7/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.7/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.7/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.7/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.7/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.7/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.7/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.7/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.7/self_attn/Shape_3:Shape*input:pkv14(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.7/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.7/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.7/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.7/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.7/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.7/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.7/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.7/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.7/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.7/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.7/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.7/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.7/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.7/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.7/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.7/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.7/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.7/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.7/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.7/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.7/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.7/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.7/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.7/self_attn/Concat_5:Concat*input:pkv14(1,8,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv14(1,8,0,128)*axis:-2 /model/model/layers.7/self_attn/Concat_6:Concat*input:pkv15(1,8,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv15(1,8,0,128)*axis:-2 /model/model/layers.7/self_attn/Shape_8:Shape*input:opkv14(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.7/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.7/self_attn/Unsqueeze_12:Unsqueeze*input:opkv14(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.7/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.7/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.7/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.7/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.7/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.7/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.7/self_attn/Shape_13:Shape*input:opkv15(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.7/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.7/self_attn/Unsqueeze_21:Unsqueeze*input:opkv15(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.7/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.7/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.7/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.7/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.7/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.7/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.7/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.7/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.7/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.7/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.7/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.7/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.7/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.7/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.7/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9961.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.7/Add:Add*input:_2F_model_2F_model_2F_layers_2E_6_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_7_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.7/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.7/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.7/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.7/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.7/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.7/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.7/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_7_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.7/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9962.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.7/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.7/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.7/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9963.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.7/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.7/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9964.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.7/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_7_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.8/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.8/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.8/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.8/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.8/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.8/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.8/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_8_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.8/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9965.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.8/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9966.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.8/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9967.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.8/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.8/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.8/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.8/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.8/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.8/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.8/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.8/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.8/self_attn/Shape_3:Shape*input:pkv16(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.8/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.8/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.8/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.8/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.8/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.8/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.8/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.8/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.8/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.8/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.8/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.8/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.8/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.8/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.8/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.8/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.8/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.8/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.8/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.8/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.8/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.8/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.8/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.8/self_attn/Concat_5:Concat*input:pkv16(1,8,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv16(1,8,0,128)*axis:-2 /model/model/layers.8/self_attn/Concat_6:Concat*input:pkv17(1,8,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv17(1,8,0,128)*axis:-2 /model/model/layers.8/self_attn/Shape_8:Shape*input:opkv16(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.8/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.8/self_attn/Unsqueeze_12:Unsqueeze*input:opkv16(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.8/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.8/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.8/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.8/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.8/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.8/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.8/self_attn/Shape_13:Shape*input:opkv17(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.8/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.8/self_attn/Unsqueeze_21:Unsqueeze*input:opkv17(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.8/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.8/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.8/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.8/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.8/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.8/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.8/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.8/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.8/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.8/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.8/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.8/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.8/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.8/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.8/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9995.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.8/Add:Add*input:_2F_model_2F_model_2F_layers_2E_7_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_8_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.8/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.8/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.8/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.8/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.8/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.8/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.8/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_8_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.8/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9996.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.8/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.8/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.8/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9997.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.8/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.8/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_9998.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.8/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_8_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.9/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.9/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.9/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.9/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.9/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.9/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.9/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_9_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.9/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_9999.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.9/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10000.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.9/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10001.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.9/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.9/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.9/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.9/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.9/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.9/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.9/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.9/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.9/self_attn/Shape_3:Shape*input:pkv18(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.9/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.9/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.9/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.9/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.9/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.9/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.9/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.9/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.9/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.9/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.9/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.9/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.9/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.9/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.9/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.9/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.9/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.9/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.9/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.9/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.9/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.9/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.9/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.9/self_attn/Concat_5:Concat*input:pkv18(1,8,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv18(1,8,0,128)*axis:-2 /model/model/layers.9/self_attn/Concat_6:Concat*input:pkv19(1,8,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv19(1,8,0,128)*axis:-2 /model/model/layers.9/self_attn/Shape_8:Shape*input:opkv18(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.9/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.9/self_attn/Unsqueeze_12:Unsqueeze*input:opkv18(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.9/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.9/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.9/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.9/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.9/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.9/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.9/self_attn/Shape_13:Shape*input:opkv19(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.9/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.9/self_attn/Unsqueeze_21:Unsqueeze*input:opkv19(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.9/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.9/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.9/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.9/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.9/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.9/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.9/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.9/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.9/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.9/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.9/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.9/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.9/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.9/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.9/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10029.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.9/Add:Add*input:_2F_model_2F_model_2F_layers_2E_8_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_9_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.9/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.9/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.9/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.9/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.9/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.9/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.9/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_9_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.9/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10030.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.9/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.9/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.9/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10031.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.9/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.9/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10032.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.9/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_9_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.10/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.10/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.10/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.10/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.10/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.10/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.10/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_10_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.10/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10033.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.10/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10034.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.10/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10035.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.10/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.10/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.10/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.10/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.10/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.10/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.10/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.10/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.10/self_attn/Shape_3:Shape*input:pkv20(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.10/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.10/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.10/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.10/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.10/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.10/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.10/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.10/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.10/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.10/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.10/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.10/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.10/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.10/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.10/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.10/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.10/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.10/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.10/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.10/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.10/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.10/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.10/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.10/self_attn/Concat_5:Concat*input:pkv20(1,8,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv20(1,8,0,128)*axis:-2 /model/model/layers.10/self_attn/Concat_6:Concat*input:pkv21(1,8,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv21(1,8,0,128)*axis:-2 /model/model/layers.10/self_attn/Shape_8:Shape*input:opkv20(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.10/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.10/self_attn/Unsqueeze_12:Unsqueeze*input:opkv20(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.10/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.10/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.10/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.10/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.10/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.10/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.10/self_attn/Shape_13:Shape*input:opkv21(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.10/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.10/self_attn/Unsqueeze_21:Unsqueeze*input:opkv21(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.10/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.10/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.10/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.10/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.10/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.10/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.10/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.10/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.10/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.10/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.10/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.10/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.10/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.10/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.10/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10063.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.10/Add:Add*input:_2F_model_2F_model_2F_layers_2E_9_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_10_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.10/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.10/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.10/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.10/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.10/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.10/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.10/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_10_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.10/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10064.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.10/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.10/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.10/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10065.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.10/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.10/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10066.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.10/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_10_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.11/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.11/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.11/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.11/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.11/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.11/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.11/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_11_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.11/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10067.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.11/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10068.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.11/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10069.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.11/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.11/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.11/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.11/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.11/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.11/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.11/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.11/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.11/self_attn/Shape_3:Shape*input:pkv22(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.11/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.11/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.11/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.11/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.11/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.11/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.11/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.11/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.11/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.11/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.11/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.11/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.11/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.11/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.11/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.11/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.11/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.11/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.11/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.11/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.11/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.11/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.11/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.11/self_attn/Concat_5:Concat*input:pkv22(1,8,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv22(1,8,0,128)*axis:-2 /model/model/layers.11/self_attn/Concat_6:Concat*input:pkv23(1,8,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv23(1,8,0,128)*axis:-2 /model/model/layers.11/self_attn/Shape_8:Shape*input:opkv22(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.11/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.11/self_attn/Unsqueeze_12:Unsqueeze*input:opkv22(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.11/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.11/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.11/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.11/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.11/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.11/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.11/self_attn/Shape_13:Shape*input:opkv23(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.11/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.11/self_attn/Unsqueeze_21:Unsqueeze*input:opkv23(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.11/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.11/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.11/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.11/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.11/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.11/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.11/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.11/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.11/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.11/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.11/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.11/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.11/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.11/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.11/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10097.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.11/Add:Add*input:_2F_model_2F_model_2F_layers_2E_10_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_11_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.11/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.11/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.11/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.11/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.11/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.11/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.11/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_11_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.11/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10098.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.11/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.11/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.11/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10099.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.11/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.11/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10100.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.11/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_11_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.12/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.12/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.12/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.12/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.12/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.12/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.12/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_12_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.12/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10101.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.12/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10102.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.12/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10103.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.12/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.12/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.12/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.12/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.12/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.12/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.12/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.12/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.12/self_attn/Shape_3:Shape*input:pkv24(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.12/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.12/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.12/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.12/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.12/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.12/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.12/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.12/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.12/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.12/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.12/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.12/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.12/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.12/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.12/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.12/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.12/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.12/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.12/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.12/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.12/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.12/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.12/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.12/self_attn/Concat_5:Concat*input:pkv24(1,8,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv24(1,8,0,128)*axis:-2 /model/model/layers.12/self_attn/Concat_6:Concat*input:pkv25(1,8,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv25(1,8,0,128)*axis:-2 /model/model/layers.12/self_attn/Shape_8:Shape*input:opkv24(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.12/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.12/self_attn/Unsqueeze_12:Unsqueeze*input:opkv24(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.12/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.12/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.12/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.12/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.12/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.12/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.12/self_attn/Shape_13:Shape*input:opkv25(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.12/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.12/self_attn/Unsqueeze_21:Unsqueeze*input:opkv25(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.12/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.12/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.12/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.12/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.12/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.12/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.12/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.12/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.12/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.12/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.12/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.12/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.12/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.12/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.12/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10131.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.12/Add:Add*input:_2F_model_2F_model_2F_layers_2E_11_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_12_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.12/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.12/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.12/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.12/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.12/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.12/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.12/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_12_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.12/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10132.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.12/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.12/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.12/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10133.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.12/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.12/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10134.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.12/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_12_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.13/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.13/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.13/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.13/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.13/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.13/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.13/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_13_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.13/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10135.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.13/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10136.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.13/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10137.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.13/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.13/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.13/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.13/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.13/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.13/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.13/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.13/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.13/self_attn/Shape_3:Shape*input:pkv26(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.13/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.13/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.13/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.13/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.13/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.13/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.13/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.13/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.13/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.13/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.13/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.13/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.13/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.13/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.13/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.13/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.13/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.13/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.13/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.13/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.13/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.13/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.13/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.13/self_attn/Concat_5:Concat*input:pkv26(1,8,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv26(1,8,0,128)*axis:-2 /model/model/layers.13/self_attn/Concat_6:Concat*input:pkv27(1,8,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv27(1,8,0,128)*axis:-2 /model/model/layers.13/self_attn/Shape_8:Shape*input:opkv26(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.13/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.13/self_attn/Unsqueeze_12:Unsqueeze*input:opkv26(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.13/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.13/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.13/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.13/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.13/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.13/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.13/self_attn/Shape_13:Shape*input:opkv27(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.13/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.13/self_attn/Unsqueeze_21:Unsqueeze*input:opkv27(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.13/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.13/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.13/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.13/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.13/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.13/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.13/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.13/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.13/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.13/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.13/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.13/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.13/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.13/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.13/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10165.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.13/Add:Add*input:_2F_model_2F_model_2F_layers_2E_12_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_13_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.13/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.13/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.13/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.13/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.13/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.13/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.13/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_13_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.13/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10166.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.13/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.13/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.13/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10167.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.13/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.13/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10168.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.13/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_13_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.14/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.14/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.14/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.14/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.14/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.14/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.14/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_14_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.14/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10169.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.14/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10170.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.14/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10171.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.14/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.14/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.14/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.14/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.14/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.14/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.14/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.14/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.14/self_attn/Shape_3:Shape*input:pkv28(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.14/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.14/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.14/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.14/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.14/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.14/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.14/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.14/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.14/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.14/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.14/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.14/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.14/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.14/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.14/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.14/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.14/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.14/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.14/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.14/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.14/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.14/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.14/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.14/self_attn/Concat_5:Concat*input:pkv28(1,8,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv28(1,8,0,128)*axis:-2 /model/model/layers.14/self_attn/Concat_6:Concat*input:pkv29(1,8,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv29(1,8,0,128)*axis:-2 /model/model/layers.14/self_attn/Shape_8:Shape*input:opkv28(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.14/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.14/self_attn/Unsqueeze_12:Unsqueeze*input:opkv28(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.14/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.14/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.14/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.14/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.14/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.14/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.14/self_attn/Shape_13:Shape*input:opkv29(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.14/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.14/self_attn/Unsqueeze_21:Unsqueeze*input:opkv29(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.14/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.14/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.14/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.14/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.14/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.14/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.14/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.14/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.14/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.14/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.14/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.14/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.14/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.14/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.14/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10199.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.14/Add:Add*input:_2F_model_2F_model_2F_layers_2E_13_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_14_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.14/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.14/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.14/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.14/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.14/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.14/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.14/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_14_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.14/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10200.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.14/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.14/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.14/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10201.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.14/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.14/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10202.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.14/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_14_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.15/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.15/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.15/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.15/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.15/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.15/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.15/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_15_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.15/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10203.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.15/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10204.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.15/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10205.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.15/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.15/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.15/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.15/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.15/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.15/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.15/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.15/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.15/self_attn/Shape_3:Shape*input:pkv30(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.15/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.15/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.15/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.15/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.15/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.15/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.15/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.15/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.15/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.15/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.15/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.15/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.15/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.15/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.15/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.15/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.15/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.15/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.15/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.15/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.15/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.15/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.15/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.15/self_attn/Concat_5:Concat*input:pkv30(1,8,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv30(1,8,0,128)*axis:-2 /model/model/layers.15/self_attn/Concat_6:Concat*input:pkv31(1,8,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv31(1,8,0,128)*axis:-2 /model/model/layers.15/self_attn/Shape_8:Shape*input:opkv30(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.15/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.15/self_attn/Unsqueeze_12:Unsqueeze*input:opkv30(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.15/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.15/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.15/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.15/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.15/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.15/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.15/self_attn/Shape_13:Shape*input:opkv31(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.15/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.15/self_attn/Unsqueeze_21:Unsqueeze*input:opkv31(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.15/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.15/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.15/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.15/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.15/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.15/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.15/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.15/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.15/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.15/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.15/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.15/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.15/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.15/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.15/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10233.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.15/Add:Add*input:_2F_model_2F_model_2F_layers_2E_14_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_15_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.15/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.15/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.15/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.15/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.15/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.15/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.15/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_15_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.15/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10234.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.15/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.15/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.15/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10235.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.15/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.15/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10236.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.15/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_15_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.16/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.16/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.16/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.16/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.16/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.16/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.16/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_16_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.16/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10237.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.16/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10238.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.16/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10239.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.16/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.16/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.16/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.16/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.16/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.16/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.16/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.16/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.16/self_attn/Shape_3:Shape*input:pkv32(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.16/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.16/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.16/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.16/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.16/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.16/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.16/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.16/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.16/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.16/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.16/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.16/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.16/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.16/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.16/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.16/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.16/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.16/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.16/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.16/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.16/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.16/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.16/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.16/self_attn/Concat_5:Concat*input:pkv32(1,8,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv32(1,8,0,128)*axis:-2 /model/model/layers.16/self_attn/Concat_6:Concat*input:pkv33(1,8,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv33(1,8,0,128)*axis:-2 /model/model/layers.16/self_attn/Shape_8:Shape*input:opkv32(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.16/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.16/self_attn/Unsqueeze_12:Unsqueeze*input:opkv32(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.16/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.16/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.16/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.16/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.16/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.16/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.16/self_attn/Shape_13:Shape*input:opkv33(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.16/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.16/self_attn/Unsqueeze_21:Unsqueeze*input:opkv33(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.16/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.16/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.16/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.16/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.16/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.16/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.16/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.16/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.16/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.16/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.16/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.16/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.16/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.16/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.16/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10267.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.16/Add:Add*input:_2F_model_2F_model_2F_layers_2E_15_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_16_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.16/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.16/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.16/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.16/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.16/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.16/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.16/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_16_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.16/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10268.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.16/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.16/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.16/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10269.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.16/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.16/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10270.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.16/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_16_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.17/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.17/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.17/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.17/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.17/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.17/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.17/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_17_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.17/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10271.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.17/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10272.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.17/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10273.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.17/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.17/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.17/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.17/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.17/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.17/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.17/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.17/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.17/self_attn/Shape_3:Shape*input:pkv34(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.17/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.17/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.17/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.17/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.17/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.17/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.17/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.17/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.17/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.17/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.17/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.17/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.17/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.17/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.17/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.17/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.17/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.17/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.17/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.17/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.17/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.17/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.17/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.17/self_attn/Concat_5:Concat*input:pkv34(1,8,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv34(1,8,0,128)*axis:-2 /model/model/layers.17/self_attn/Concat_6:Concat*input:pkv35(1,8,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv35(1,8,0,128)*axis:-2 /model/model/layers.17/self_attn/Shape_8:Shape*input:opkv34(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.17/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.17/self_attn/Unsqueeze_12:Unsqueeze*input:opkv34(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.17/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.17/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.17/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.17/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.17/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.17/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.17/self_attn/Shape_13:Shape*input:opkv35(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.17/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.17/self_attn/Unsqueeze_21:Unsqueeze*input:opkv35(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.17/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.17/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.17/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.17/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.17/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.17/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.17/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.17/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.17/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.17/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.17/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.17/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.17/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.17/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.17/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10301.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.17/Add:Add*input:_2F_model_2F_model_2F_layers_2E_16_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_17_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.17/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.17/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.17/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.17/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.17/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.17/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.17/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_17_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.17/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10302.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.17/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.17/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.17/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10303.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.17/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.17/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10304.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.17/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_17_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.18/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.18/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.18/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.18/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.18/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.18/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.18/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_18_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.18/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10305.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.18/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10306.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.18/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10307.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.18/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.18/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.18/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.18/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.18/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.18/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.18/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.18/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.18/self_attn/Shape_3:Shape*input:pkv36(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.18/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.18/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.18/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.18/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.18/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.18/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.18/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.18/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.18/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.18/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.18/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.18/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.18/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.18/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.18/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.18/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.18/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.18/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.18/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.18/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.18/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.18/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.18/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.18/self_attn/Concat_5:Concat*input:pkv36(1,8,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv36(1,8,0,128)*axis:-2 /model/model/layers.18/self_attn/Concat_6:Concat*input:pkv37(1,8,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv37(1,8,0,128)*axis:-2 /model/model/layers.18/self_attn/Shape_8:Shape*input:opkv36(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.18/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.18/self_attn/Unsqueeze_12:Unsqueeze*input:opkv36(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.18/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.18/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.18/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.18/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.18/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.18/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.18/self_attn/Shape_13:Shape*input:opkv37(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.18/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.18/self_attn/Unsqueeze_21:Unsqueeze*input:opkv37(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.18/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.18/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.18/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.18/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.18/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.18/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.18/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.18/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.18/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.18/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.18/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.18/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.18/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.18/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.18/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10335.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.18/Add:Add*input:_2F_model_2F_model_2F_layers_2E_17_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_18_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.18/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.18/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.18/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.18/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.18/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.18/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.18/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_18_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.18/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10336.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.18/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.18/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.18/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10337.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.18/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.18/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10338.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.18/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_18_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.19/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.19/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.19/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.19/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.19/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.19/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.19/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_19_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.19/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10339.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.19/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10340.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.19/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10341.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.19/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.19/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.19/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.19/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.19/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.19/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.19/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.19/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.19/self_attn/Shape_3:Shape*input:pkv38(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.19/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.19/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.19/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.19/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.19/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.19/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.19/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.19/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.19/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.19/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.19/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.19/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.19/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.19/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.19/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.19/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.19/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.19/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.19/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.19/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.19/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.19/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.19/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.19/self_attn/Concat_5:Concat*input:pkv38(1,8,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv38(1,8,0,128)*axis:-2 /model/model/layers.19/self_attn/Concat_6:Concat*input:pkv39(1,8,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv39(1,8,0,128)*axis:-2 /model/model/layers.19/self_attn/Shape_8:Shape*input:opkv38(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.19/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.19/self_attn/Unsqueeze_12:Unsqueeze*input:opkv38(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.19/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.19/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.19/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.19/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.19/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.19/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.19/self_attn/Shape_13:Shape*input:opkv39(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.19/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.19/self_attn/Unsqueeze_21:Unsqueeze*input:opkv39(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.19/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.19/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.19/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.19/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.19/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.19/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.19/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.19/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.19/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.19/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.19/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.19/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.19/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.19/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.19/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10369.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.19/Add:Add*input:_2F_model_2F_model_2F_layers_2E_18_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_19_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.19/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.19/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.19/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.19/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.19/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.19/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.19/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_19_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.19/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10370.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.19/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.19/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.19/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10371.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.19/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.19/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10372.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.19/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_19_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.20/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.20/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.20/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.20/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.20/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.20/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.20/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_20_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.20/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10373.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.20/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10374.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.20/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10375.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.20/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.20/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.20/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.20/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.20/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.20/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.20/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.20/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.20/self_attn/Shape_3:Shape*input:pkv40(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.20/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.20/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.20/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.20/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.20/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.20/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.20/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.20/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.20/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.20/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.20/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.20/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.20/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.20/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.20/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.20/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.20/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.20/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.20/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.20/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.20/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.20/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.20/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.20/self_attn/Concat_5:Concat*input:pkv40(1,8,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv40(1,8,0,128)*axis:-2 /model/model/layers.20/self_attn/Concat_6:Concat*input:pkv41(1,8,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv41(1,8,0,128)*axis:-2 /model/model/layers.20/self_attn/Shape_8:Shape*input:opkv40(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.20/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.20/self_attn/Unsqueeze_12:Unsqueeze*input:opkv40(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.20/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.20/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.20/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.20/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.20/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.20/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.20/self_attn/Shape_13:Shape*input:opkv41(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.20/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.20/self_attn/Unsqueeze_21:Unsqueeze*input:opkv41(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.20/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.20/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.20/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.20/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.20/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.20/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.20/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.20/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.20/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.20/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.20/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.20/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.20/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.20/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.20/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10403.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.20/Add:Add*input:_2F_model_2F_model_2F_layers_2E_19_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_20_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.20/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.20/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.20/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.20/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.20/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.20/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.20/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_20_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.20/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10404.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.20/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.20/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.20/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10405.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.20/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.20/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10406.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.20/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_20_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.21/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.21/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.21/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.21/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.21/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.21/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.21/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_21_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.21/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10407.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.21/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10408.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.21/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10409.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.21/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.21/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.21/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.21/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.21/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.21/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.21/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.21/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.21/self_attn/Shape_3:Shape*input:pkv42(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.21/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.21/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.21/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.21/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.21/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.21/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.21/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.21/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.21/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.21/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.21/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.21/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.21/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.21/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.21/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.21/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.21/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.21/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.21/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.21/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.21/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.21/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.21/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.21/self_attn/Concat_5:Concat*input:pkv42(1,8,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv42(1,8,0,128)*axis:-2 /model/model/layers.21/self_attn/Concat_6:Concat*input:pkv43(1,8,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv43(1,8,0,128)*axis:-2 /model/model/layers.21/self_attn/Shape_8:Shape*input:opkv42(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.21/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.21/self_attn/Unsqueeze_12:Unsqueeze*input:opkv42(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.21/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.21/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.21/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.21/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.21/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.21/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.21/self_attn/Shape_13:Shape*input:opkv43(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.21/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.21/self_attn/Unsqueeze_21:Unsqueeze*input:opkv43(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.21/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.21/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.21/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.21/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.21/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.21/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.21/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.21/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.21/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.21/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.21/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.21/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.21/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.21/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.21/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10437.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.21/Add:Add*input:_2F_model_2F_model_2F_layers_2E_20_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_21_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.21/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.21/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.21/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.21/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.21/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.21/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.21/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_21_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.21/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10438.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.21/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.21/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.21/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10439.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.21/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.21/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10440.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.21/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_21_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.22/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.22/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.22/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.22/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.22/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.22/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.22/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_22_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.22/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10441.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.22/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10442.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.22/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10443.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.22/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.22/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.22/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.22/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.22/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.22/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.22/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.22/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.22/self_attn/Shape_3:Shape*input:pkv44(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.22/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.22/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.22/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.22/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.22/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.22/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.22/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.22/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.22/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.22/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.22/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.22/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.22/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.22/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.22/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.22/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.22/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.22/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.22/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.22/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.22/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.22/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.22/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.22/self_attn/Concat_5:Concat*input:pkv44(1,8,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv44(1,8,0,128)*axis:-2 /model/model/layers.22/self_attn/Concat_6:Concat*input:pkv45(1,8,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv45(1,8,0,128)*axis:-2 /model/model/layers.22/self_attn/Shape_8:Shape*input:opkv44(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.22/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.22/self_attn/Unsqueeze_12:Unsqueeze*input:opkv44(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.22/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.22/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.22/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.22/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.22/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.22/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.22/self_attn/Shape_13:Shape*input:opkv45(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.22/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.22/self_attn/Unsqueeze_21:Unsqueeze*input:opkv45(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.22/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.22/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.22/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.22/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.22/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.22/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.22/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.22/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.22/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.22/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.22/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.22/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.22/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.22/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.22/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10471.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.22/Add:Add*input:_2F_model_2F_model_2F_layers_2E_21_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_22_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.22/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.22/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.22/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.22/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.22/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.22/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.22/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_22_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.22/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10472.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.22/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.22/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.22/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10473.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.22/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.22/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10474.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.22/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_22_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.23/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.23/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.23/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.23/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.23/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.23/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.23/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_23_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.23/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10475.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.23/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10476.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.23/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10477.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.23/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.23/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.23/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.23/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.23/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.23/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.23/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.23/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.23/self_attn/Shape_3:Shape*input:pkv46(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.23/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.23/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.23/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.23/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.23/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.23/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.23/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.23/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.23/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.23/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.23/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.23/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.23/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.23/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.23/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.23/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.23/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.23/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.23/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.23/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.23/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.23/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.23/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.23/self_attn/Concat_5:Concat*input:pkv46(1,8,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv46(1,8,0,128)*axis:-2 /model/model/layers.23/self_attn/Concat_6:Concat*input:pkv47(1,8,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv47(1,8,0,128)*axis:-2 /model/model/layers.23/self_attn/Shape_8:Shape*input:opkv46(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.23/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.23/self_attn/Unsqueeze_12:Unsqueeze*input:opkv46(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.23/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.23/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.23/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.23/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.23/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.23/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.23/self_attn/Shape_13:Shape*input:opkv47(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.23/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.23/self_attn/Unsqueeze_21:Unsqueeze*input:opkv47(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.23/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.23/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.23/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.23/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.23/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.23/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.23/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.23/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.23/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.23/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.23/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.23/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.23/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.23/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.23/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10505.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.23/Add:Add*input:_2F_model_2F_model_2F_layers_2E_22_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_23_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.23/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.23/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.23/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.23/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.23/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.23/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.23/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_23_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.23/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10506.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.23/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.23/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.23/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10507.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.23/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.23/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10508.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.23/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_23_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.24/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.24/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.24/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.24/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.24/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.24/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.24/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_24_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.24/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10509.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.24/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10510.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.24/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10511.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.24/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.24/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.24/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.24/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.24/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.24/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.24/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.24/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.24/self_attn/Shape_3:Shape*input:pkv48(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.24/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.24/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.24/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.24/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.24/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.24/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.24/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.24/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.24/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.24/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.24/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.24/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.24/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.24/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.24/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.24/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.24/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.24/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.24/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.24/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.24/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.24/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.24/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.24/self_attn/Concat_5:Concat*input:pkv48(1,8,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv48(1,8,0,128)*axis:-2 /model/model/layers.24/self_attn/Concat_6:Concat*input:pkv49(1,8,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv49(1,8,0,128)*axis:-2 /model/model/layers.24/self_attn/Shape_8:Shape*input:opkv48(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.24/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.24/self_attn/Unsqueeze_12:Unsqueeze*input:opkv48(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.24/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.24/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.24/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.24/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.24/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.24/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.24/self_attn/Shape_13:Shape*input:opkv49(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.24/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.24/self_attn/Unsqueeze_21:Unsqueeze*input:opkv49(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.24/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.24/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.24/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.24/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.24/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.24/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.24/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.24/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.24/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.24/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.24/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.24/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.24/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.24/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.24/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10539.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.24/Add:Add*input:_2F_model_2F_model_2F_layers_2E_23_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_24_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.24/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.24/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.24/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.24/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.24/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.24/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.24/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_24_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.24/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10540.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.24/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.24/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.24/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10541.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.24/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.24/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10542.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.24/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_24_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.25/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.25/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.25/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.25/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.25/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.25/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.25/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_25_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.25/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10543.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.25/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10544.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.25/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10545.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.25/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.25/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.25/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.25/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.25/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.25/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.25/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.25/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.25/self_attn/Shape_3:Shape*input:pkv50(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.25/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.25/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.25/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.25/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.25/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.25/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.25/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.25/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.25/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.25/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.25/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.25/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.25/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.25/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.25/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.25/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.25/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.25/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.25/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.25/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.25/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.25/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.25/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.25/self_attn/Concat_5:Concat*input:pkv50(1,8,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv50(1,8,0,128)*axis:-2 /model/model/layers.25/self_attn/Concat_6:Concat*input:pkv51(1,8,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv51(1,8,0,128)*axis:-2 /model/model/layers.25/self_attn/Shape_8:Shape*input:opkv50(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.25/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.25/self_attn/Unsqueeze_12:Unsqueeze*input:opkv50(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.25/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.25/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.25/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.25/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.25/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.25/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.25/self_attn/Shape_13:Shape*input:opkv51(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.25/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.25/self_attn/Unsqueeze_21:Unsqueeze*input:opkv51(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.25/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.25/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.25/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.25/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.25/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.25/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.25/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.25/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.25/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.25/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.25/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.25/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.25/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.25/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.25/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10573.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.25/Add:Add*input:_2F_model_2F_model_2F_layers_2E_24_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_25_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.25/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.25/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.25/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.25/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.25/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.25/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.25/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_25_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.25/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10574.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.25/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.25/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.25/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10575.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.25/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.25/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10576.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.25/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_25_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.26/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.26/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.26/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.26/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.26/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.26/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.26/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_26_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.26/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10577.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.26/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10578.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.26/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10579.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.26/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.26/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.26/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.26/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.26/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.26/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.26/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.26/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.26/self_attn/Shape_3:Shape*input:pkv52(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.26/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.26/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.26/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.26/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.26/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.26/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.26/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.26/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.26/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.26/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.26/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.26/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.26/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.26/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.26/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.26/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.26/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.26/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.26/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.26/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.26/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.26/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.26/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.26/self_attn/Concat_5:Concat*input:pkv52(1,8,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv52(1,8,0,128)*axis:-2 /model/model/layers.26/self_attn/Concat_6:Concat*input:pkv53(1,8,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv53(1,8,0,128)*axis:-2 /model/model/layers.26/self_attn/Shape_8:Shape*input:opkv52(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.26/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.26/self_attn/Unsqueeze_12:Unsqueeze*input:opkv52(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.26/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.26/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.26/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.26/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.26/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.26/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.26/self_attn/Shape_13:Shape*input:opkv53(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.26/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.26/self_attn/Unsqueeze_21:Unsqueeze*input:opkv53(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.26/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.26/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.26/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.26/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.26/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.26/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.26/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.26/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.26/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.26/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.26/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.26/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.26/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.26/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.26/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10607.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.26/Add:Add*input:_2F_model_2F_model_2F_layers_2E_25_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_26_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.26/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.26/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.26/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.26/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.26/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.26/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.26/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_26_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.26/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10608.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.26/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.26/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.26/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10609.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.26/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.26/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10610.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.26/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_26_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.27/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.27/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.27/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.27/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.27/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.27/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.27/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_27_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.27/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10611.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.27/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10612.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.27/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10613.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.27/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.27/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.27/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.27/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.27/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.27/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.27/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.27/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.27/self_attn/Shape_3:Shape*input:pkv54(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.27/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.27/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.27/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.27/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.27/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.27/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.27/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.27/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.27/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.27/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.27/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.27/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.27/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.27/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.27/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.27/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.27/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.27/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.27/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.27/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.27/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.27/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.27/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.27/self_attn/Concat_5:Concat*input:pkv54(1,8,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv54(1,8,0,128)*axis:-2 /model/model/layers.27/self_attn/Concat_6:Concat*input:pkv55(1,8,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv55(1,8,0,128)*axis:-2 /model/model/layers.27/self_attn/Shape_8:Shape*input:opkv54(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.27/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.27/self_attn/Unsqueeze_12:Unsqueeze*input:opkv54(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.27/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.27/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.27/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.27/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.27/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.27/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.27/self_attn/Shape_13:Shape*input:opkv55(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.27/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.27/self_attn/Unsqueeze_21:Unsqueeze*input:opkv55(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.27/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.27/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.27/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.27/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.27/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.27/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.27/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.27/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.27/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.27/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.27/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.27/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.27/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.27/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.27/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10641.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.27/Add:Add*input:_2F_model_2F_model_2F_layers_2E_26_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_27_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.27/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.27/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.27/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.27/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.27/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.27/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.27/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_27_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.27/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10642.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.27/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.27/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.27/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10643.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.27/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.27/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10644.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.27/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_27_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.28/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.28/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.28/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.28/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.28/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.28/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.28/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_28_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.28/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10645.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.28/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10646.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.28/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10647.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.28/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.28/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.28/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.28/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.28/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.28/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.28/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.28/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.28/self_attn/Shape_3:Shape*input:pkv56(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.28/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.28/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.28/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.28/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.28/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.28/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.28/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.28/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.28/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.28/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.28/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.28/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.28/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.28/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.28/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.28/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.28/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.28/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.28/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.28/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.28/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.28/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.28/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.28/self_attn/Concat_5:Concat*input:pkv56(1,8,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv56(1,8,0,128)*axis:-2 /model/model/layers.28/self_attn/Concat_6:Concat*input:pkv57(1,8,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv57(1,8,0,128)*axis:-2 /model/model/layers.28/self_attn/Shape_8:Shape*input:opkv56(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.28/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.28/self_attn/Unsqueeze_12:Unsqueeze*input:opkv56(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.28/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.28/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.28/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.28/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.28/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.28/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.28/self_attn/Shape_13:Shape*input:opkv57(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.28/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.28/self_attn/Unsqueeze_21:Unsqueeze*input:opkv57(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.28/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.28/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.28/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.28/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.28/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.28/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.28/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.28/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.28/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.28/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.28/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.28/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.28/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.28/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.28/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10675.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.28/Add:Add*input:_2F_model_2F_model_2F_layers_2E_27_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_28_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.28/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.28/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.28/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.28/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.28/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.28/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.28/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_28_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.28/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10676.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.28/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.28/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.28/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10677.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.28/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.28/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10678.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.28/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_28_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.29/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.29/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.29/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.29/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.29/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.29/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.29/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_29_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.29/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10679.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.29/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10680.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.29/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10681.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.29/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.29/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.29/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.29/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.29/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.29/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.29/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.29/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.29/self_attn/Shape_3:Shape*input:pkv58(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.29/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.29/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.29/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.29/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.29/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.29/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.29/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.29/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.29/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.29/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.29/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.29/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.29/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.29/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.29/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.29/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.29/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.29/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.29/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.29/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.29/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.29/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.29/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.29/self_attn/Concat_5:Concat*input:pkv58(1,8,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv58(1,8,0,128)*axis:-2 /model/model/layers.29/self_attn/Concat_6:Concat*input:pkv59(1,8,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv59(1,8,0,128)*axis:-2 /model/model/layers.29/self_attn/Shape_8:Shape*input:opkv58(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.29/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.29/self_attn/Unsqueeze_12:Unsqueeze*input:opkv58(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.29/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.29/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.29/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.29/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.29/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.29/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.29/self_attn/Shape_13:Shape*input:opkv59(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.29/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.29/self_attn/Unsqueeze_21:Unsqueeze*input:opkv59(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.29/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.29/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.29/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.29/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.29/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.29/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.29/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.29/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.29/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.29/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.29/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.29/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.29/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.29/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.29/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10709.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.29/Add:Add*input:_2F_model_2F_model_2F_layers_2E_28_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_29_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.29/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.29/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.29/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.29/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.29/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.29/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.29/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_29_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.29/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10710.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.29/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.29/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.29/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10711.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.29/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.29/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10712.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.29/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_29_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.30/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.30/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.30/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.30/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.30/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.30/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.30/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_30_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.30/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10713.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.30/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10714.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.30/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10715.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.30/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.30/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.30/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.30/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.30/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.30/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.30/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.30/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.30/self_attn/Shape_3:Shape*input:pkv60(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.30/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.30/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.30/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.30/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.30/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.30/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.30/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.30/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.30/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.30/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.30/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.30/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.30/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.30/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.30/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.30/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.30/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.30/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.30/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.30/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.30/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.30/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.30/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.30/self_attn/Concat_5:Concat*input:pkv60(1,8,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv60(1,8,0,128)*axis:-2 /model/model/layers.30/self_attn/Concat_6:Concat*input:pkv61(1,8,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv61(1,8,0,128)*axis:-2 /model/model/layers.30/self_attn/Shape_8:Shape*input:opkv60(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.30/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.30/self_attn/Unsqueeze_12:Unsqueeze*input:opkv60(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.30/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.30/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.30/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.30/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.30/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.30/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.30/self_attn/Shape_13:Shape*input:opkv61(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.30/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.30/self_attn/Unsqueeze_21:Unsqueeze*input:opkv61(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.30/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.30/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.30/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.30/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.30/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.30/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.30/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.30/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.30/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.30/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.30/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.30/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.30/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.30/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.30/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10743.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.30/Add:Add*input:_2F_model_2F_model_2F_layers_2E_29_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_30_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.30/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.30/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.30/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.30/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.30/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.30/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.30/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_30_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.30/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10744.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.30/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.30/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.30/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10745.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.30/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.30/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10746.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.30/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_30_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.31/input_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.31/input_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.31/input_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.31/input_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.31/input_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.31/input_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.31/input_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_31_2E_input_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.31/self_attn/q_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10747.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.31/self_attn/k_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10748.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.31/self_attn/v_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_input_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10749.bin(float16:4096,1024)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024) /model/model/layers.31/self_attn/Reshape:Reshape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_q_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096);3745.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*allowzero:0 /model/model/layers.31/self_attn/Transpose:Transpose*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_output_5F_0(1,0,32,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128)*perm:0,2,1,3 /model/model/layers.31/self_attn/Reshape_1:Reshape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_k_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.31/self_attn/Transpose_1:Transpose*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_1_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.31/self_attn/Reshape_2:Reshape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_v_5F_proj_2F_MatMul_5F_output_5F_0(1,0,1024);3747.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*allowzero:0 /model/model/layers.31/self_attn/Transpose_2:Transpose*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_2_5F_output_5F_0(1,0,8,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*perm:0,2,1,3 /model/model/layers.31/self_attn/Shape_2:Shape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4) /model/model/layers.31/self_attn/Gather_2:Gather*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_2_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0()*axis:0 /model/model/layers.31/self_attn/Shape_3:Shape*input:pkv62(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4) /model/model/layers.31/self_attn/Gather_3:Gather*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_3_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*axis:0 /model/model/layers.31/self_attn/Add:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_output_5F_0() /model/model/layers.31/self_attn/rotary_emb/Unsqueeze:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1) /model/model/layers.31/self_attn/rotary_emb/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0() /model/model/layers.31/self_attn/rotary_emb/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_rotary_5F_emb_2F_Constant_5F_5_5F_output_5F_0.bin(float16:32768,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Unsqueeze_5F_output_5F_0(1);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0() /model/model/layers.31/self_attn/Gather_4:Gather*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0()*axis:0 /model/model/layers.31/self_attn/Unsqueeze_6:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_4_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0() /model/model/layers.31/self_attn/Gather_5:Gather*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_rotary_5F_emb_2F_Slice_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_Reshape_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0()*axis:0 /model/model/layers.31/self_attn/Unsqueeze_7:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_5_5F_output_5F_0();_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0() /model/model/layers.31/self_attn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_output_5F_0() /model/model/layers.31/self_attn/Slice:Slice*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64) /model/model/layers.31/self_attn/Slice_1:Slice*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64) /model/model/layers.31/self_attn/Neg:Neg*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_1_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64) /model/model/layers.31/self_attn/Concat_3:Concat*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Neg_5F_output_5F_0(1,32,0,64);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_output_5F_0(1,32,0,64)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128)*axis:-1 /model/model/layers.31/self_attn/Mul_1:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_3_5F_output_5F_0(1,32,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0() /model/model/layers.31/self_attn/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0() /model/model/layers.31/self_attn/Mul_2:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_6_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0() /model/model/layers.31/self_attn/Slice_2:Slice*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64) /model/model/layers.31/self_attn/Slice_3:Slice*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_1_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Unsqueeze_5F_8_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_6_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_13_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64) /model/model/layers.31/self_attn/Neg_1:Neg*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_3_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64) /model/model/layers.31/self_attn/Concat_4:Concat*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Neg_5F_1_5F_output_5F_0(1,8,0,64);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Slice_5F_2_5F_output_5F_0(1,8,0,64)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128)*axis:-1 /model/model/layers.31/self_attn/Mul_3:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_4_5F_output_5F_0(1,8,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_7_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0() /model/model/layers.31/self_attn/Add_2:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Mul_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0() /model/model/layers.31/self_attn/Concat_5:Concat*input:pkv62(1,8,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_2_5F_output_5F_0()*output:opkv62(1,8,0,128)*axis:-2 /model/model/layers.31/self_attn/Concat_6:Concat*input:pkv63(1,8,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_2_5F_output_5F_0(1,8,0,128)*output:opkv63(1,8,0,128)*axis:-2 /model/model/layers.31/self_attn/Shape_8:Shape*input:opkv62(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4) /model/model/layers.31/self_attn/Gather_10:Gather*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_8_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0()*axis:0 /model/model/layers.31/self_attn/Unsqueeze_12:Unsqueeze*input:opkv62(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128) /model/model/layers.31/self_attn/Unsqueeze_15:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_10_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1) /model/model/layers.31/self_attn/Concat_7:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_15_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*axis:0 /model/model/layers.31/self_attn/Equal:Equal*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5) /model/model/layers.31/self_attn/Where:Where*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Equal_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_7_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Where_5F_output_5F_0(5) /model/model/layers.31/self_attn/Expand:Expand*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_12_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Where_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128) /model/model/layers.31/self_attn/Reshape_4:Reshape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Expand_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.31/self_attn/Shape_13:Shape*input:opkv63(1,8,0,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4) /model/model/layers.31/self_attn/Gather_14:Gather*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Shape_5F_13_5F_output_5F_0(4);_2F_model_2F_model_2F_Constant_5F_1_5F_output_5F_0.bin(int64:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0()*axis:0 /model/model/layers.31/self_attn/Unsqueeze_21:Unsqueeze*input:opkv63(1,8,0,128);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_35_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128) /model/model/layers.31/self_attn/Unsqueeze_24:Unsqueeze*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Gather_5F_14_5F_output_5F_0();onnx_3A__3A_Unsqueeze_5F_368.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1) /model/model/layers.31/self_attn/Concat_9:Concat*input:_2F_model_2F_model_2F_Constant_5F_18_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_4_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_38_5F_output_5F_0.bin(int64:1);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_24_5F_output_5F_0(1);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_3_5F_output_5F_0.bin(int64:1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*axis:0 /model/model/layers.31/self_attn/Equal_1:Equal*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Mul_5F_4_5F_output_5F_0.bin(int64:5)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5) /model/model/layers.31/self_attn/Where_1:Where*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Equal_5F_1_5F_output_5F_0(5);_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_ConstantOfShape_5F_output_5F_0.bin(int64:5);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Concat_5F_9_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5) /model/model/layers.31/self_attn/Expand_1:Expand*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Unsqueeze_5F_21_5F_output_5F_0(1,8,1,0,128);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Where_5F_1_5F_output_5F_0(5)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128) /model/model/layers.31/self_attn/Reshape_6:Reshape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Expand_5F_1_5F_output_5F_0(0,8,0,0,128);3751.bin(int64:4)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*allowzero:0 /model/model/layers.31/self_attn/Transpose_3:Transpose*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_4_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*perm:0,1,3,2 /model/model/layers.31/self_attn/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_1_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_3_5F_output_5F_0(1,32,128,0)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_output_5F_0() /model/model/layers.31/self_attn/Div_2:Div*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_0_2F_self_5F_attn_2F_Constant_5F_57_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0() /model/model/layers.31/self_attn/Add_3:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Div_5F_2_5F_output_5F_0();_2F_model_2F_model_2F_Where_5F_4_5F_output_5F_0(0,0,0,0)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0() /model/model/layers.31/self_attn/Softmax:Softmax*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Add_5F_3_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Softmax_5F_output_5F_0()*axis:-1 /model/model/layers.31/self_attn/MatMul_1:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Softmax_5F_output_5F_0();_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_6_5F_output_5F_0(1,32,0,128)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0() /model/model/layers.31/self_attn/Transpose_4:Transpose*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_MatMul_5F_1_5F_output_5F_0()*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0()*perm:0,2,1,3 /model/model/layers.31/self_attn/Reshape_7:Reshape*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Transpose_5F_4_5F_output_5F_0();3755.bin(int64:3)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096)*allowzero:0 /model/model/layers.31/self_attn/o_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_Reshape_5F_7_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10777.bin(float16:4096,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.31/Add:Add*input:_2F_model_2F_model_2F_layers_2E_30_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_31_2F_self_5F_attn_2F_o_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,0,4096) /model/model/layers.31/post_attention_layernorm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/layers.31/post_attention_layernorm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/layers.31/post_attention_layernorm/Add:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1) /model/model/layers.31/post_attention_layernorm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/layers.31/post_attention_layernorm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1) /model/model/layers.31/post_attention_layernorm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/layers.31/post_attention_layernorm/Mul_1:Mul*input:model_2E_model_2E_layers_2E_31_2E_post_5F_attention_5F_layernorm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/model/layers.31/mlp/gate_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10778.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.31/mlp/act_fn/Sigmoid:Sigmoid*input:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336) /model/model/layers.31/mlp/act_fn/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_gate_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_act_5F_fn_2F_Sigmoid_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.31/mlp/up_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_post_5F_attention_5F_layernorm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10779.bin(float16:4096,14336)*output:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336) /model/model/layers.31/mlp/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_act_5F_fn_2F_Mul_5F_output_5F_0(1,0,14336);_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_up_5F_proj_2F_MatMul_5F_output_5F_0(1,0,14336)*output:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336) /model/model/layers.31/mlp/down_proj/MatMul:MatMul*input:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_Mul_5F_output_5F_0(1,0,14336);onnx_3A__3A_MatMul_5F_10780.bin(float16:14336,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096) /model/model/layers.31/Add_1:Add*input:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_31_2F_mlp_2F_down_5F_proj_2F_MatMul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_1_5F_output_5F_0(1,0,4096) /model/model/norm/Pow:Pow*input:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_norm_2F_Pow_5F_output_5F_0(1,0,4096) /model/model/norm/ReduceMean:ReduceMean*input:_2F_model_2F_model_2F_norm_2F_Pow_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_norm_2F_ReduceMean_5F_output_5F_0(1,0,1)*axes:-1;keepdims:1 /model/model/norm/Add:Add*input:_2F_model_2F_model_2F_norm_2F_ReduceMean_5F_output_5F_0(1,0,1);_2F_model_2F_model_2F_layers_2E_0_2F_input_5F_layernorm_2F_Constant_5F_1_5F_output_5F_0.bin(float16:)*output:_2F_model_2F_model_2F_norm_2F_Add_5F_output_5F_0(1,0,1) /model/model/norm/Sqrt:Sqrt*input:_2F_model_2F_model_2F_norm_2F_Add_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_norm_2F_Sqrt_5F_output_5F_0(1,0,1) /model/model/norm/Div:Div*input:_2F_model_2F_model_2F_Constant_5F_34_5F_output_5F_0.bin(float16:);_2F_model_2F_model_2F_norm_2F_Sqrt_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_norm_2F_Div_5F_output_5F_0(1,0,1) /model/model/norm/Mul:Mul*input:_2F_model_2F_model_2F_layers_2E_31_2F_Add_5F_1_5F_output_5F_0(1,0,4096);_2F_model_2F_model_2F_norm_2F_Div_5F_output_5F_0(1,0,1)*output:_2F_model_2F_model_2F_norm_2F_Mul_5F_output_5F_0(1,0,4096) /model/model/norm/Mul_1:Mul*input:model_2E_model_2E_norm_2E_weight.bin(float16:4096);_2F_model_2F_model_2F_norm_2F_Mul_5F_output_5F_0(1,0,4096)*output:_2F_model_2F_model_2F_norm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096) /model/lm_head/MatMul:MatMul*input:_2F_model_2F_model_2F_norm_2F_Mul_5F_1_5F_output_5F_0(1,0,4096);onnx_3A__3A_MatMul_5F_10781.bin(float16:4096,32000)*output:logits(1,0,32000)