diff --git "a/controlnet/RyzenAI/.cache/down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_meta.json" "b/controlnet/RyzenAI/.cache/down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_meta.json" new file mode 100644--- /dev/null +++ "b/controlnet/RyzenAI/.cache/down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_meta.json" @@ -0,0 +1,59360 @@ +{ + "dd_meta_major_version": 1, + "dd_meta_minor_version": 2, + "state_table_updates": [], + "op_list": [ + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5286" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5287" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5349" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5350" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5412" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5413" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5475" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5476" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5538" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5539" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5601" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5602" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5672" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5673" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5752" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5753" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5815" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5816" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5878" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5879" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5942" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5943" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6005" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6006" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6068" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6069" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6132" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6133" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6195" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6196" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6258" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6259" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_0-/conv_in/Conv", + "type": "SDConv", + "in_args": [ + "Transpose_0_out-sample.out0_1_0" + ], + "const_args": [ + "NhwcConv_0_weight_NHWC" + ], + "out_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "4" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "4" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0", + "class_labels_13_12_trans.out_12_1_0" + ], + "const_args": [], + "out_args": [ + "/Add_output_0_13_12.out_12_1_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_0", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0" + ], + "const_args": [ + "GroupNorm_0_wts_7_1_0" + ], + "out_args": [ + "GroupNorm_0.out8_0.out7_1_0" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_0", + "type": "SDSilu", + "in_args": [ + "GroupNorm_0.out8_0.out7_1_0" + ], + "const_args": [ + "Sigmoid_0.weights10_0" + ], + "out_args": [ + "GroupNorm_0_sigmoid_out.8_0.out10_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_0_sigmoid_out.8_0.out10_0" + ], + "const_args": [ + "down_blocks.0.resnets.0.conv1.weight" + ], + "out_args": [ + "/down_blocks.0/resnets.0/conv1/Conv_output_0_0_0.out0_1_1" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/time_embedding/linear_1/Gemm", + "type": "SDGemm", + "in_args": [ + "/time_proj/Concat_1_output_0.out2_3_0" + ], + "const_args": [ + "time_embedding.linear_1.weight_7_0" + ], + "out_args": [ + "/time_embedding/linear_1/Gemm_output_0.out2_3_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/time_embedding/act/Sigmoid", + "type": "SDSilu", + "in_args": [ + "/time_embedding/linear_1/Gemm_output_0.out2_3_0" + ], + "const_args": [ + "/time_embedding/act/Sigmoid.weights10_1" + ], + "out_args": [ + "/time_embedding/act/Sigmoid_output_0.out10_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/time_embedding/linear_2/Gemm", + "type": "SDGemm", + "in_args": [ + "/time_embedding/act/Sigmoid_output_0.out10_1" + ], + "const_args": [ + "time_embedding.linear_2.weight_7_1" + ], + "out_args": [ + "/time_embedding/linear_2/Gemm_output_0.out2_3_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/act_1/Sigmoid", + "type": "SDSilu", + "in_args": [ + "/time_embedding/linear_2/Gemm_output_0.out2_3_1" + ], + "const_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid.weights10_2" + ], + "out_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.0.resnets.0.time_emb_proj.weight_7_2" + ], + "out_args": [ + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0_0_0.out2_0_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.0.resnets.1.time_emb_proj.weight_7_3" + ], + "out_args": [ + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0_0_1.out2_0_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.1.resnets.0.time_emb_proj.weight_7_4" + ], + "out_args": [ + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0_0_2.out2_0_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.1.resnets.1.time_emb_proj.weight_7_5" + ], + "out_args": [ + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0_0_3.out2_0_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.2.resnets.0.time_emb_proj.weight_7_6" + ], + "out_args": [ + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0_0_4.out2_0_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.2.resnets.1.time_emb_proj.weight_7_7" + ], + "out_args": [ + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0_0_5.out2_0_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.3.resnets.0.time_emb_proj.weight_7_8" + ], + "out_args": [ + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0_0_6.out2_0_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "down_blocks.3.resnets.1.time_emb_proj.weight_7_9" + ], + "out_args": [ + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0_0_7.out2_0_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "mid_block.resnets.0.time_emb_proj.weight_7_10" + ], + "out_args": [ + "/mid_block/resnets.0/Unsqueeze_1_output_0_0_8.out2_0_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "mid_block.resnets.1.time_emb_proj.weight_7_11" + ], + "out_args": [ + "/mid_block/resnets.1/Unsqueeze_1_output_0_0_9.out2_0_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.0.resnets.0.time_emb_proj.weight_7_12" + ], + "out_args": [ + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0_0_10.out2_0_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.0.resnets.1.time_emb_proj.weight_7_13" + ], + "out_args": [ + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0_0_11.out2_0_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.0.resnets.2.time_emb_proj.weight_7_14" + ], + "out_args": [ + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0_0_12.out2_0_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.1.resnets.0.time_emb_proj.weight_7_15" + ], + "out_args": [ + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0_0_13.out2_0_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.1.resnets.1.time_emb_proj.weight_7_16" + ], + "out_args": [ + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0_0_14.out2_0_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.1.resnets.2.time_emb_proj.weight_7_17" + ], + "out_args": [ + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0_0_15.out2_0_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.2.resnets.0.time_emb_proj.weight_7_18" + ], + "out_args": [ + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0_0_16.out2_0_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.2.resnets.1.time_emb_proj.weight_7_19" + ], + "out_args": [ + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0_0_17.out2_0_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.2.resnets.2.time_emb_proj.weight_7_20" + ], + "out_args": [ + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0_0_18.out2_0_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.3.resnets.0.time_emb_proj.weight_7_21" + ], + "out_args": [ + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0_0_19.out2_0_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.3.resnets.1.time_emb_proj.weight_7_22" + ], + "out_args": [ + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0_0_20.out2_0_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2" + ], + "const_args": [ + "up_blocks.3.resnets.2.time_emb_proj.weight_7_23" + ], + "out_args": [ + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0_0_21.out2_0_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/resnets.0/conv1/Conv_output_0_0_0.out0_1_1", + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0_0_0.out2_0_0" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.0/Add.out_12_1_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_1", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.0/resnets.0/Add.out_12_1_1" + ], + "const_args": [ + "GroupNorm_1_wts_7_1_1" + ], + "out_args": [ + "GroupNorm_1.out8_1.out7_1_1" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_1", + "type": "SDSilu", + "in_args": [ + "GroupNorm_1.out8_1.out7_1_1" + ], + "const_args": [ + "Sigmoid_1.weights10_3" + ], + "out_args": [ + "GroupNorm_1_sigmoid_out.8_1.out10_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_1-/down_blocks.0/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_1_sigmoid_out.8_1.out10_3" + ], + "const_args": [ + "NhwcConv_1_weight_NHWC" + ], + "out_args": [ + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0", + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.0/Add_1.out_12_1_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_2", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.0/resnets.0/Add_1.out_12_1_2" + ], + "const_args": [ + "GroupNorm_2_wts_7_1_2" + ], + "out_args": [ + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out7_1_2" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_2-/down_blocks.0/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out7_1_2" + ], + "const_args": [ + "NhwcConv_2_weight_NHWC" + ], + "out_args": [ + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0" + ], + "const_args": [ + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_0" + ], + "const_args": [ + "onnx::MatMul_5263" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_32" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_0" + ], + "const_args": [ + "onnx::MatMul_5262" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_33" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_0" + ], + "const_args": [ + "onnx::MatMul_5264" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_34" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_0", + "type": "SDMHA", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_33", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_32", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_34" + ], + "const_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_0_mask.8_0" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "4096" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0" + ], + "const_args": [ + "onnx::MatMul_5284" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2", + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_3" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_3" + ], + "const_args": [ + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_1" + ], + "const_args": [ + "onnx::MatMul_5285" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_1", + "type": "SDMHA", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1" + ], + "const_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_1_mask.8_1" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1" + ], + "const_args": [ + "onnx::MatMul_5307" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_4" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_4" + ], + "const_args": [ + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_0_0", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_2" + ], + "const_args": [ + "onnx::MatMul_5308_2_0_0" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_0_1", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_2" + ], + "const_args": [ + "onnx::MatMul_5308_2_0_1" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_1" + ], + "const_args": [ + "onnx::MatMul_5309" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_4" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_12_0_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_3-/down_blocks.0/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_12_0_0" + ], + "const_args": [ + "NhwcConv_3_weight_NHWC" + ], + "out_args": [ + "NhwcConv_3_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_3_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3", + "/down_blocks.0/resnets.0/Add_1.out_12_1_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/Add.out_12_1_5" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_3", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.0/attentions.0/Add.out_12_1_5" + ], + "const_args": [ + "GroupNorm_3_wts_7_1_3" + ], + "out_args": [ + "GroupNorm_3.out8_3.out7_1_3" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_2", + "type": "SDSilu", + "in_args": [ + "GroupNorm_3.out8_3.out7_1_3" + ], + "const_args": [ + "Sigmoid_2.weights10_4" + ], + "out_args": [ + "GroupNorm_3_sigmoid_out.8_3.out10_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.0/Add.out_12_1_5", + "timestep_cond_13_11_trans.out_12_1_6" + ], + "const_args": [], + "out_args": [ + "/Add_1_output_0_13_11.out_12_1_6" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_3_sigmoid_out.8_3.out10_4" + ], + "const_args": [ + "down_blocks.0.resnets.1.conv1.weight" + ], + "out_args": [ + "/down_blocks.0/resnets.1/conv1/Conv_output_0_0_1.out0_1_4" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/resnets.1/conv1/Conv_output_0_0_1.out0_1_4", + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0_0_1.out2_0_1" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.1/Add.out_12_1_7" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_4", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.0/resnets.1/Add.out_12_1_7" + ], + "const_args": [ + "GroupNorm_4_wts_7_1_4" + ], + "out_args": [ + "GroupNorm_4.out8_4.out7_1_4" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_3", + "type": "SDSilu", + "in_args": [ + "GroupNorm_4.out8_4.out7_1_4" + ], + "const_args": [ + "Sigmoid_3.weights10_5" + ], + "out_args": [ + "GroupNorm_4_sigmoid_out.8_4.out10_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_4-/down_blocks.0/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_4_sigmoid_out.8_4.out10_5" + ], + "const_args": [ + "NhwcConv_4_weight_NHWC" + ], + "out_args": [ + "NhwcConv_4_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.0/Add.out_12_1_5", + "NhwcConv_4_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.1/Add_1.out_12_1_8" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_5", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.0/resnets.1/Add_1.out_12_1_8" + ], + "const_args": [ + "GroupNorm_5_wts_7_1_5" + ], + "out_args": [ + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out7_1_5" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_5-/down_blocks.0/attentions.1/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out7_1_5" + ], + "const_args": [ + "NhwcConv_5_weight_NHWC" + ], + "out_args": [ + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1" + ], + "const_args": [ + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_3" + ], + "const_args": [ + "onnx::MatMul_5326" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_36" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_3" + ], + "const_args": [ + "onnx::MatMul_5325" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_37" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_3" + ], + "const_args": [ + "onnx::MatMul_5327" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_38" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_2", + "type": "SDMHA", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_37", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_36", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_38" + ], + "const_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_2_mask.8_2" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "4096" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2" + ], + "const_args": [ + "onnx::MatMul_5347" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6", + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_9" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_9" + ], + "const_args": [ + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_4" + ], + "const_args": [ + "onnx::MatMul_5348" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_3", + "type": "SDMHA", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3" + ], + "const_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_3_mask.8_3" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3" + ], + "const_args": [ + "onnx::MatMul_5370" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_9" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_10" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_10" + ], + "const_args": [ + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_1_0", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_5" + ], + "const_args": [ + "onnx::MatMul_5371_2_1_0" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_1_1", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_5" + ], + "const_args": [ + "onnx::MatMul_5371_2_1_1" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_2" + ], + "const_args": [ + "onnx::MatMul_5372" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_10" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_12_0_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_6-/down_blocks.0/attentions.1/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_12_0_1" + ], + "const_args": [ + "NhwcConv_6_weight_NHWC" + ], + "out_args": [ + "NhwcConv_6_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_6_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6", + "/down_blocks.0/resnets.1/Add_1.out_12_1_8" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/Add.out_12_1_11" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_7-/down_blocks.0/downsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.0/attentions.1/Add.out_12_1_11" + ], + "const_args": [ + "NhwcConv_7_weight_NHWC" + ], + "out_args": [ + "NhwcConv_7_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "2", + "2" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_8-/down_blocks.1/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "NhwcConv_7_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7" + ], + "const_args": [ + "NhwcConv_8_weight_NHWC" + ], + "out_args": [ + "NhwcConv_8_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.0/attentions.1/Add.out_12_1_11", + "attention_mask_13_10_trans.out_12_1_12" + ], + "const_args": [], + "out_args": [ + "/Add_2_output_0_13_10.out_12_1_12" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_3", + "type": "SDAdd", + "in_args": [ + "NhwcConv_7_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7", + "cross_attention_kwargs_13_9_trans.out_12_1_13" + ], + "const_args": [], + "out_args": [ + "/Add_3_output_0_13_9.out_12_1_13" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_6", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_7_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7" + ], + "const_args": [ + "GroupNorm_6_wts_7_1_6" + ], + "out_args": [ + "GroupNorm_6.out8_6.out7_1_6" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_4", + "type": "SDSilu", + "in_args": [ + "GroupNorm_6.out8_6.out7_1_6" + ], + "const_args": [ + "Sigmoid_4.weights10_6" + ], + "out_args": [ + "GroupNorm_6_sigmoid_out.8_6.out10_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_6_sigmoid_out.8_6.out10_6" + ], + "const_args": [ + "down_blocks.1.resnets.0.conv1.weight" + ], + "out_args": [ + "/down_blocks.1/resnets.0/conv1/Conv_output_0_0_2.out0_1_9" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/resnets.0/conv1/Conv_output_0_0_2.out0_1_9", + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0_0_2.out2_0_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.0/Add.out_12_1_14" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_7", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.1/resnets.0/Add.out_12_1_14" + ], + "const_args": [ + "GroupNorm_7_wts_7_1_7" + ], + "out_args": [ + "GroupNorm_7.out8_7.out7_1_7" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_5", + "type": "SDSilu", + "in_args": [ + "GroupNorm_7.out8_7.out7_1_7" + ], + "const_args": [ + "Sigmoid_5.weights10_7" + ], + "out_args": [ + "GroupNorm_7_sigmoid_out.8_7.out10_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_9-/down_blocks.1/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_7_sigmoid_out.8_7.out10_7" + ], + "const_args": [ + "NhwcConv_9_weight_NHWC" + ], + "out_args": [ + "NhwcConv_9_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_8_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8", + "NhwcConv_9_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.0/Add_1.out_12_1_15" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_8", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.1/resnets.0/Add_1.out_12_1_15" + ], + "const_args": [ + "GroupNorm_8_wts_7_1_8" + ], + "out_args": [ + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_8" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_10-/down_blocks.1/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_8" + ], + "const_args": [ + "NhwcConv_10_weight_NHWC" + ], + "out_args": [ + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2" + ], + "const_args": [ + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_6" + ], + "const_args": [ + "onnx::MatMul_5389" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_40" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_6" + ], + "const_args": [ + "onnx::MatMul_5388" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_41" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_6" + ], + "const_args": [ + "onnx::MatMul_5390" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_42" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_4", + "type": "SDMHA", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_41", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_40", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_42" + ], + "const_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_4_mask.8_4" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "1024" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4" + ], + "const_args": [ + "onnx::MatMul_5410" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10", + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_16" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_16" + ], + "const_args": [ + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_7" + ], + "const_args": [ + "onnx::MatMul_5411" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_5", + "type": "SDMHA", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5" + ], + "const_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_5_mask.8_5" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5" + ], + "const_args": [ + "onnx::MatMul_5433" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_16" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_17" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_17" + ], + "const_args": [ + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_2_0", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_8" + ], + "const_args": [ + "onnx::MatMul_5434_2_2_0" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_2_1", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_8" + ], + "const_args": [ + "onnx::MatMul_5434_2_2_1" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_3" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_3" + ], + "const_args": [ + "onnx::MatMul_5435" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_17" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_11-/down_blocks.1/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_2" + ], + "const_args": [ + "NhwcConv_11_weight_NHWC" + ], + "out_args": [ + "NhwcConv_11_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_11_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11", + "/down_blocks.1/resnets.0/Add_1.out_12_1_15" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/Add.out_12_1_18" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_9", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.1/attentions.0/Add.out_12_1_18" + ], + "const_args": [ + "GroupNorm_9_wts_7_1_9" + ], + "out_args": [ + "GroupNorm_9.out8_9.out7_1_9" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_6", + "type": "SDSilu", + "in_args": [ + "GroupNorm_9.out8_9.out7_1_9" + ], + "const_args": [ + "Sigmoid_6.weights10_8" + ], + "out_args": [ + "GroupNorm_9_sigmoid_out.8_9.out10_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_4", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.0/Add.out_12_1_18", + "added_cond_kwargs_13_8_trans.out_12_1_19" + ], + "const_args": [], + "out_args": [ + "/Add_4_output_0_13_8.out_12_1_19" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_9_sigmoid_out.8_9.out10_8" + ], + "const_args": [ + "down_blocks.1.resnets.1.conv1.weight" + ], + "out_args": [ + "/down_blocks.1/resnets.1/conv1/Conv_output_0_0_3.out0_1_12" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/resnets.1/conv1/Conv_output_0_0_3.out0_1_12", + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0_0_3.out2_0_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.1/Add.out_12_1_20" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_10", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.1/resnets.1/Add.out_12_1_20" + ], + "const_args": [ + "GroupNorm_10_wts_7_1_10" + ], + "out_args": [ + "GroupNorm_10.out8_10.out7_1_10" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_7", + "type": "SDSilu", + "in_args": [ + "GroupNorm_10.out8_10.out7_1_10" + ], + "const_args": [ + "Sigmoid_7.weights10_9" + ], + "out_args": [ + "GroupNorm_10_sigmoid_out.8_10.out10_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_12-/down_blocks.1/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_10_sigmoid_out.8_10.out10_9" + ], + "const_args": [ + "NhwcConv_12_weight_NHWC" + ], + "out_args": [ + "NhwcConv_12_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.0/Add.out_12_1_18", + "NhwcConv_12_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.1/Add_1.out_12_1_21" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_11", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.1/resnets.1/Add_1.out_12_1_21" + ], + "const_args": [ + "GroupNorm_11_wts_7_1_11" + ], + "out_args": [ + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_11" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_13-/down_blocks.1/attentions.1/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_11" + ], + "const_args": [ + "NhwcConv_13_weight_NHWC" + ], + "out_args": [ + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3" + ], + "const_args": [ + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_9" + ], + "const_args": [ + "onnx::MatMul_5452" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_44" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_9" + ], + "const_args": [ + "onnx::MatMul_5451" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_45" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_9" + ], + "const_args": [ + "onnx::MatMul_5453" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_46" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_6", + "type": "SDMHA", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_45", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_44", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_46" + ], + "const_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_6_mask.8_6" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "1024" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6" + ], + "const_args": [ + "onnx::MatMul_5473" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14", + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_22" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_22" + ], + "const_args": [ + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_10" + ], + "const_args": [ + "onnx::MatMul_5474" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_7", + "type": "SDMHA", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7" + ], + "const_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_7_mask.8_7" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7" + ], + "const_args": [ + "onnx::MatMul_5496" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_22" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_23" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_23" + ], + "const_args": [ + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_3_0", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_11" + ], + "const_args": [ + "onnx::MatMul_5497_2_3_0" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_3_1", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_11" + ], + "const_args": [ + "onnx::MatMul_5497_2_3_1" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_4" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_4" + ], + "const_args": [ + "onnx::MatMul_5498" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_23" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_3" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_14-/down_blocks.1/attentions.1/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_3" + ], + "const_args": [ + "NhwcConv_14_weight_NHWC" + ], + "out_args": [ + "NhwcConv_14_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_14_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14", + "/down_blocks.1/resnets.1/Add_1.out_12_1_21" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/Add.out_12_1_24" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_15-/down_blocks.1/downsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.1/attentions.1/Add.out_12_1_24" + ], + "const_args": [ + "NhwcConv_15_weight_NHWC" + ], + "out_args": [ + "NhwcConv_15_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "2", + "2" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_16-/down_blocks.2/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "NhwcConv_15_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15" + ], + "const_args": [ + "NhwcConv_16_weight_NHWC" + ], + "out_args": [ + "NhwcConv_16_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_5", + "type": "SDAdd", + "in_args": [ + "/down_blocks.1/attentions.1/Add.out_12_1_24", + "down_block_additional_residuals_13_7_trans.out_12_1_25" + ], + "const_args": [], + "out_args": [ + "/Add_5_output_0_13_7.out_12_1_25" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_6", + "type": "SDAdd", + "in_args": [ + "NhwcConv_15_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15", + "mid_block_additional_residual_13_6_trans.out_12_1_26" + ], + "const_args": [], + "out_args": [ + "/Add_6_output_0_13_6.out_12_1_26" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_12", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_15_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15" + ], + "const_args": [ + "GroupNorm_12_wts_7_1_12" + ], + "out_args": [ + "GroupNorm_12.out8_12.out7_1_12" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_8", + "type": "SDSilu", + "in_args": [ + "GroupNorm_12.out8_12.out7_1_12" + ], + "const_args": [ + "Sigmoid_8.weights10_10" + ], + "out_args": [ + "GroupNorm_12_sigmoid_out.8_12.out10_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_12_sigmoid_out.8_12.out10_10" + ], + "const_args": [ + "down_blocks.2.resnets.0.conv1.weight" + ], + "out_args": [ + "/down_blocks.2/resnets.0/conv1/Conv_output_0_0_4.out0_1_17" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/resnets.0/conv1/Conv_output_0_0_4.out0_1_17", + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0_0_4.out2_0_4" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.0/Add.out_12_1_27" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_13", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.2/resnets.0/Add.out_12_1_27" + ], + "const_args": [ + "GroupNorm_13_wts_7_1_13" + ], + "out_args": [ + "GroupNorm_13.out8_13.out7_1_13" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_9", + "type": "SDSilu", + "in_args": [ + "GroupNorm_13.out8_13.out7_1_13" + ], + "const_args": [ + "Sigmoid_9.weights10_11" + ], + "out_args": [ + "GroupNorm_13_sigmoid_out.8_13.out10_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_17-/down_blocks.2/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_13_sigmoid_out.8_13.out10_11" + ], + "const_args": [ + "NhwcConv_17_weight_NHWC" + ], + "out_args": [ + "NhwcConv_17_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_16_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16", + "NhwcConv_17_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.0/Add_1.out_12_1_28" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_14", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.2/resnets.0/Add_1.out_12_1_28" + ], + "const_args": [ + "GroupNorm_14_wts_7_1_14" + ], + "out_args": [ + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_14" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_18-/down_blocks.2/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_14" + ], + "const_args": [ + "NhwcConv_18_weight_NHWC" + ], + "out_args": [ + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4" + ], + "const_args": [ + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_12" + ], + "const_args": [ + "onnx::MatMul_5515" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_48" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_12" + ], + "const_args": [ + "onnx::MatMul_5514" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_49" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_12" + ], + "const_args": [ + "onnx::MatMul_5516" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_50" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_8", + "type": "SDMHA", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_49", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_48", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_50" + ], + "const_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_8_mask.8_8" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8" + ], + "const_args": [ + "onnx::MatMul_5536" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18", + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_29" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_29" + ], + "const_args": [ + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_13" + ], + "const_args": [ + "onnx::MatMul_5537" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_51" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_9", + "type": "SDMHA", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_51", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9" + ], + "const_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_9_mask.8_9" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9" + ], + "const_args": [ + "onnx::MatMul_5559" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_29" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_30" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_30" + ], + "const_args": [ + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_4_0", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_14" + ], + "const_args": [ + "onnx::MatMul_5560_2_4_0" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_4_1", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_14" + ], + "const_args": [ + "onnx::MatMul_5560_2_4_1" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_5" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_5" + ], + "const_args": [ + "onnx::MatMul_5561" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_30" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_4" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_19-/down_blocks.2/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_4" + ], + "const_args": [ + "NhwcConv_19_weight_NHWC" + ], + "out_args": [ + "NhwcConv_19_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_19_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19", + "/down_blocks.2/resnets.0/Add_1.out_12_1_28" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/Add.out_12_1_31" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_15", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.2/attentions.0/Add.out_12_1_31" + ], + "const_args": [ + "GroupNorm_15_wts_7_1_15" + ], + "out_args": [ + "GroupNorm_15.out8_15.out7_1_15" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_10", + "type": "SDSilu", + "in_args": [ + "GroupNorm_15.out8_15.out7_1_15" + ], + "const_args": [ + "Sigmoid_10.weights10_12" + ], + "out_args": [ + "GroupNorm_15_sigmoid_out.8_15.out10_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_7", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.0/Add.out_12_1_31", + "onnx::Add_10_13_5_trans.out_12_1_32" + ], + "const_args": [], + "out_args": [ + "/Add_7_output_0_13_5.out_12_1_32" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_15_sigmoid_out.8_15.out10_12" + ], + "const_args": [ + "down_blocks.2.resnets.1.conv1.weight" + ], + "out_args": [ + "/down_blocks.2/resnets.1/conv1/Conv_output_0_0_5.out0_1_20" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/resnets.1/conv1/Conv_output_0_0_5.out0_1_20", + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0_0_5.out2_0_5" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.1/Add.out_12_1_33" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_16", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.2/resnets.1/Add.out_12_1_33" + ], + "const_args": [ + "GroupNorm_16_wts_7_1_16" + ], + "out_args": [ + "GroupNorm_16.out8_16.out7_1_16" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_11", + "type": "SDSilu", + "in_args": [ + "GroupNorm_16.out8_16.out7_1_16" + ], + "const_args": [ + "Sigmoid_11.weights10_13" + ], + "out_args": [ + "GroupNorm_16_sigmoid_out.8_16.out10_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_20-/down_blocks.2/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_16_sigmoid_out.8_16.out10_13" + ], + "const_args": [ + "NhwcConv_20_weight_NHWC" + ], + "out_args": [ + "NhwcConv_20_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.0/Add.out_12_1_31", + "NhwcConv_20_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.1/Add_1.out_12_1_34" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_17", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.2/resnets.1/Add_1.out_12_1_34" + ], + "const_args": [ + "GroupNorm_17_wts_7_1_17" + ], + "out_args": [ + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_17" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_21-/down_blocks.2/attentions.1/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_17" + ], + "const_args": [ + "NhwcConv_21_weight_NHWC" + ], + "out_args": [ + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5" + ], + "const_args": [ + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_15" + ], + "const_args": [ + "onnx::MatMul_5578" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_52" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_15" + ], + "const_args": [ + "onnx::MatMul_5577" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_53" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_15" + ], + "const_args": [ + "onnx::MatMul_5579" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_54" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_10", + "type": "SDMHA", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_53", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_52", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_54" + ], + "const_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_10_mask.8_10" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10" + ], + "const_args": [ + "onnx::MatMul_5599" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22", + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_35" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_35" + ], + "const_args": [ + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_16" + ], + "const_args": [ + "onnx::MatMul_5600" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_55" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_11", + "type": "SDMHA", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_55", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11" + ], + "const_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_11_mask.8_11" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11" + ], + "const_args": [ + "onnx::MatMul_5622" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_35" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_36" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_36" + ], + "const_args": [ + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_5_0", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_17" + ], + "const_args": [ + "onnx::MatMul_5623_2_5_0" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_5_1", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_17" + ], + "const_args": [ + "onnx::MatMul_5623_2_5_1" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_6" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_6" + ], + "const_args": [ + "onnx::MatMul_5624" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_36" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_5" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_22-/down_blocks.2/attentions.1/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_5" + ], + "const_args": [ + "NhwcConv_22_weight_NHWC" + ], + "out_args": [ + "NhwcConv_22_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_22_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22", + "/down_blocks.2/resnets.1/Add_1.out_12_1_34" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/Add.out_12_1_37" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_23-/down_blocks.2/downsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/down_blocks.2/attentions.1/Add.out_12_1_37" + ], + "const_args": [ + "NhwcConv_23_weight_NHWC" + ], + "out_args": [ + "NhwcConv_23_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "2", + "2" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_8", + "type": "SDAdd", + "in_args": [ + "/down_blocks.2/attentions.1/Add.out_12_1_37", + "onnx::Add_11_13_4_trans.out_12_1_38" + ], + "const_args": [], + "out_args": [ + "/Add_8_output_0_13_4.out_12_1_38" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_9", + "type": "SDAdd", + "in_args": [ + "NhwcConv_23_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23", + "onnx::Add_12_13_3_trans.out_12_1_39" + ], + "const_args": [], + "out_args": [ + "/Add_9_output_0_13_3.out_12_1_39" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_18", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_23_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23" + ], + "const_args": [ + "GroupNorm_18_wts_7_1_18" + ], + "out_args": [ + "GroupNorm_18.out8_18.out7_1_18" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_12", + "type": "SDSilu", + "in_args": [ + "GroupNorm_18.out8_18.out7_1_18" + ], + "const_args": [ + "Sigmoid_12.weights10_14" + ], + "out_args": [ + "GroupNorm_18_sigmoid_out.8_18.out10_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_18_sigmoid_out.8_18.out10_14" + ], + "const_args": [ + "down_blocks.3.resnets.0.conv1.weight" + ], + "out_args": [ + "/down_blocks.3/resnets.0/conv1/Conv_output_0_0_6.out0_1_24" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.3/resnets.0/conv1/Conv_output_0_0_6.out0_1_24", + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0_0_6.out2_0_6" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.0/Add.out_12_1_40" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_19", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.3/resnets.0/Add.out_12_1_40" + ], + "const_args": [ + "GroupNorm_19_wts_7_1_19" + ], + "out_args": [ + "GroupNorm_19.out8_19.out7_1_19" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_13", + "type": "SDSilu", + "in_args": [ + "GroupNorm_19.out8_19.out7_1_19" + ], + "const_args": [ + "Sigmoid_13.weights10_15" + ], + "out_args": [ + "GroupNorm_19_sigmoid_out.8_19.out10_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_24-/down_blocks.3/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_19_sigmoid_out.8_19.out10_15" + ], + "const_args": [ + "NhwcConv_24_weight_NHWC" + ], + "out_args": [ + "NhwcConv_24_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_23_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23", + "NhwcConv_24_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.0/Add_1.out_12_1_41" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_20", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.3/resnets.0/Add_1.out_12_1_41" + ], + "const_args": [ + "GroupNorm_20_wts_7_1_20" + ], + "out_args": [ + "GroupNorm_20.out8_20.out7_1_20" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_14", + "type": "SDSilu", + "in_args": [ + "GroupNorm_20.out8_20.out7_1_20" + ], + "const_args": [ + "Sigmoid_14.weights10_16" + ], + "out_args": [ + "GroupNorm_20_sigmoid_out.8_20.out10_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_10", + "type": "SDAdd", + "in_args": [ + "/down_blocks.3/resnets.0/Add_1.out_12_1_41", + "onnx::Add_13_13_2_trans.out_12_1_42" + ], + "const_args": [], + "out_args": [ + "/Add_10_output_0_13_2.out_12_1_42" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_20_sigmoid_out.8_20.out10_16" + ], + "const_args": [ + "down_blocks.3.resnets.1.conv1.weight" + ], + "out_args": [ + "/down_blocks.3/resnets.1/conv1/Conv_output_0_0_7.out0_1_26" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/down_blocks.3/resnets.1/conv1/Conv_output_0_0_7.out0_1_26", + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0_0_7.out2_0_7" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.1/Add.out_12_1_43" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_21", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.3/resnets.1/Add.out_12_1_43" + ], + "const_args": [ + "GroupNorm_21_wts_7_1_21" + ], + "out_args": [ + "GroupNorm_21.out8_21.out7_1_21" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_15", + "type": "SDSilu", + "in_args": [ + "GroupNorm_21.out8_21.out7_1_21" + ], + "const_args": [ + "Sigmoid_15.weights10_17" + ], + "out_args": [ + "GroupNorm_21_sigmoid_out.8_21.out10_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_25-/down_blocks.3/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_21_sigmoid_out.8_21.out10_17" + ], + "const_args": [ + "NhwcConv_25_weight_NHWC" + ], + "out_args": [ + "NhwcConv_25_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.3/resnets.0/Add_1.out_12_1_41", + "NhwcConv_25_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.1/Add_1.out_12_1_44" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_22", + "type": "SDGroupNorm", + "in_args": [ + "/down_blocks.3/resnets.1/Add_1.out_12_1_44" + ], + "const_args": [ + "GroupNorm_22_wts_7_1_22" + ], + "out_args": [ + "GroupNorm_22.out8_22.out7_1_22" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_16", + "type": "SDSilu", + "in_args": [ + "GroupNorm_22.out8_22.out7_1_22" + ], + "const_args": [ + "Sigmoid_16.weights10_18" + ], + "out_args": [ + "GroupNorm_22_sigmoid_out.8_22.out10_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_11", + "type": "SDAdd", + "in_args": [ + "/down_blocks.3/resnets.1/Add_1.out_12_1_44", + "onnx::Add_14_13_1_trans.out_12_1_45" + ], + "const_args": [], + "out_args": [ + "/Add_11_output_0_13_1.out_12_1_45" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_22_sigmoid_out.8_22.out10_18" + ], + "const_args": [ + "mid_block.resnets.0.conv1.weight" + ], + "out_args": [ + "/mid_block/resnets.0/conv1/Conv_output_0_0_8.out0_1_28" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/mid_block/resnets.0/conv1/Conv_output_0_0_8.out0_1_28", + "/mid_block/resnets.0/Unsqueeze_1_output_0_0_8.out2_0_8" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.0/Add.out_12_1_46" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_23", + "type": "SDGroupNorm", + "in_args": [ + "/mid_block/resnets.0/Add.out_12_1_46" + ], + "const_args": [ + "GroupNorm_23_wts_7_1_23" + ], + "out_args": [ + "GroupNorm_23.out8_23.out7_1_23" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_17", + "type": "SDSilu", + "in_args": [ + "GroupNorm_23.out8_23.out7_1_23" + ], + "const_args": [ + "Sigmoid_17.weights10_19" + ], + "out_args": [ + "GroupNorm_23_sigmoid_out.8_23.out10_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_26-/mid_block/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_23_sigmoid_out.8_23.out10_19" + ], + "const_args": [ + "NhwcConv_26_weight_NHWC" + ], + "out_args": [ + "NhwcConv_26_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/down_blocks.3/resnets.1/Add_1.out_12_1_44", + "NhwcConv_26_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.0/Add_1.out_12_1_47" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_24", + "type": "SDGroupNorm", + "in_args": [ + "/mid_block/resnets.0/Add_1.out_12_1_47" + ], + "const_args": [ + "GroupNorm_24_wts_7_1_24" + ], + "out_args": [ + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out7_1_24" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_27-/mid_block/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out7_1_24" + ], + "const_args": [ + "NhwcConv_27_weight_NHWC" + ], + "out_args": [ + "/mid_block/attentions.0/Reshape_output_0.out0_0_6" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/mid_block/attentions.0/Reshape_output_0.out0_0_6" + ], + "const_args": [ + "mid_block.attentions.0.transformer_blocks.0.norm1.weight", + "mid_block.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_18" + ], + "const_args": [ + "onnx::MatMul_5649" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_56" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_18" + ], + "const_args": [ + "onnx::MatMul_5648" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_57" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_18" + ], + "const_args": [ + "onnx::MatMul_5650" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_58" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_12", + "type": "SDMHA", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_57", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_56", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_58" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_12_mask.8_12" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280", + "64" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12" + ], + "const_args": [ + "onnx::MatMul_5670" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26", + "/mid_block/attentions.0/Reshape_output_0.out0_0_6" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_48" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_48" + ], + "const_args": [ + "mid_block.attentions.0.transformer_blocks.0.norm2.weight", + "mid_block.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_19" + ], + "const_args": [ + "onnx::MatMul_5671" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_59" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_13", + "type": "SDMHA", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_59", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_13_mask.8_13" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13" + ], + "const_args": [ + "onnx::MatMul_5693" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27", + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_48" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_49" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_49" + ], + "const_args": [ + "mid_block.attentions.0.transformer_blocks.0.norm3.weight", + "mid_block.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_6_0", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_20" + ], + "const_args": [ + "onnx::MatMul_5694_2_6_0" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_6_1", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_20" + ], + "const_args": [ + "onnx::MatMul_5694_2_6_1" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_7" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_7" + ], + "const_args": [ + "onnx::MatMul_5695" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29", + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_49" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/Reshape_1_output_0.out_12_0_6" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_28-/mid_block/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/mid_block/attentions.0/Reshape_1_output_0.out_12_0_6" + ], + "const_args": [ + "NhwcConv_28_weight_NHWC" + ], + "out_args": [ + "NhwcConv_28_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_28_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30", + "/mid_block/resnets.0/Add_1.out_12_1_47" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/Add.out_12_1_50" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_25", + "type": "SDGroupNorm", + "in_args": [ + "/mid_block/attentions.0/Add.out_12_1_50" + ], + "const_args": [ + "GroupNorm_25_wts_7_1_25" + ], + "out_args": [ + "GroupNorm_25.out8_25.out7_1_25" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_18", + "type": "SDSilu", + "in_args": [ + "GroupNorm_25.out8_25.out7_1_25" + ], + "const_args": [ + "Sigmoid_18.weights10_20" + ], + "out_args": [ + "GroupNorm_25_sigmoid_out.8_25.out10_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_25_sigmoid_out.8_25.out10_20" + ], + "const_args": [ + "mid_block.resnets.1.conv1.weight" + ], + "out_args": [ + "/mid_block/resnets.1/conv1/Conv_output_0_0_9.out0_1_31" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/mid_block/resnets.1/conv1/Conv_output_0_0_9.out0_1_31", + "/mid_block/resnets.1/Unsqueeze_1_output_0_0_9.out2_0_9" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.1/Add.out_12_1_51" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_26", + "type": "SDGroupNorm", + "in_args": [ + "/mid_block/resnets.1/Add.out_12_1_51" + ], + "const_args": [ + "GroupNorm_26_wts_7_1_26" + ], + "out_args": [ + "GroupNorm_26.out8_26.out7_1_26" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_19", + "type": "SDSilu", + "in_args": [ + "GroupNorm_26.out8_26.out7_1_26" + ], + "const_args": [ + "Sigmoid_19.weights10_21" + ], + "out_args": [ + "GroupNorm_26_sigmoid_out.8_26.out10_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_29-/mid_block/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_26_sigmoid_out.8_26.out10_21" + ], + "const_args": [ + "NhwcConv_29_weight_NHWC" + ], + "out_args": [ + "NhwcConv_29_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "/mid_block/attentions.0/Add.out_12_1_50", + "NhwcConv_29_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.1/Add_1.out_12_1_52" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/Add_12", + "type": "SDAdd", + "in_args": [ + "/mid_block/resnets.1/Add_1.out_12_1_52", + "onnx::Add_15_13_0_trans.out_12_1_53" + ], + "const_args": [], + "out_args": [ + "/Add_12_output_0_13_0.out_12_1_53" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/Concat", + "type": "SDConcat", + "in_args": [ + "/Add_12_output_0_13_0.out_12_1_53", + "/Add_11_output_0_13_1.out_12_1_45" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/Concat_output_0_NHWC.out13_1" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_27", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.0/Concat_output_0_NHWC.out13_1" + ], + "const_args": [ + "GroupNorm_27_wts_7_1_27" + ], + "out_args": [ + "GroupNorm_27.out8_27.out7_1_27" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_30-/up_blocks.0/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.0/Concat_output_0_NHWC.out13_1" + ], + "const_args": [ + "NhwcConv_30_weight_NHWC" + ], + "out_args": [ + "NhwcConv_30_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_20", + "type": "SDSilu", + "in_args": [ + "GroupNorm_27.out8_27.out7_1_27" + ], + "const_args": [ + "Sigmoid_20.weights10_22" + ], + "out_args": [ + "GroupNorm_27_sigmoid_out.8_27.out10_22" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_27_sigmoid_out.8_27.out10_22" + ], + "const_args": [ + "up_blocks.0.resnets.0.conv1.weight" + ], + "out_args": [ + "/up_blocks.0/resnets.0/conv1/Conv_output_0_0_10.out0_1_34" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.0/resnets.0/conv1/Conv_output_0_0_10.out0_1_34", + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0_0_10.out2_0_10" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.0/Add.out_12_1_54" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_28", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.0/resnets.0/Add.out_12_1_54" + ], + "const_args": [ + "GroupNorm_28_wts_7_1_28" + ], + "out_args": [ + "GroupNorm_28.out8_28.out7_1_28" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_21", + "type": "SDSilu", + "in_args": [ + "GroupNorm_28.out8_28.out7_1_28" + ], + "const_args": [ + "Sigmoid_21.weights10_23" + ], + "out_args": [ + "GroupNorm_28_sigmoid_out.8_28.out10_23" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_31-/up_blocks.0/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_28_sigmoid_out.8_28.out10_23" + ], + "const_args": [ + "NhwcConv_31_weight_NHWC" + ], + "out_args": [ + "NhwcConv_31_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_30_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33", + "NhwcConv_31_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.0/Add_1.out_12_1_55" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/Concat_1", + "type": "SDConcat", + "in_args": [ + "/up_blocks.0/resnets.0/Add_1.out_12_1_55", + "/Add_10_output_0_13_2.out_12_1_42" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/Concat_1_output_0_NHWC.out13_2" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_29", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.0/Concat_1_output_0_NHWC.out13_2" + ], + "const_args": [ + "GroupNorm_29_wts_7_1_29" + ], + "out_args": [ + "GroupNorm_29.out8_29.out7_1_29" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_32-/up_blocks.0/resnets.1/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.0/Concat_1_output_0_NHWC.out13_2" + ], + "const_args": [ + "NhwcConv_32_weight_NHWC" + ], + "out_args": [ + "NhwcConv_32_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_22", + "type": "SDSilu", + "in_args": [ + "GroupNorm_29.out8_29.out7_1_29" + ], + "const_args": [ + "Sigmoid_22.weights10_24" + ], + "out_args": [ + "GroupNorm_29_sigmoid_out.8_29.out10_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_29_sigmoid_out.8_29.out10_24" + ], + "const_args": [ + "up_blocks.0.resnets.1.conv1.weight" + ], + "out_args": [ + "/up_blocks.0/resnets.1/conv1/Conv_output_0_0_11.out0_1_37" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.0/resnets.1/conv1/Conv_output_0_0_11.out0_1_37", + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0_0_11.out2_0_11" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.1/Add.out_12_1_56" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_30", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.0/resnets.1/Add.out_12_1_56" + ], + "const_args": [ + "GroupNorm_30_wts_7_1_30" + ], + "out_args": [ + "GroupNorm_30.out8_30.out7_1_30" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_23", + "type": "SDSilu", + "in_args": [ + "GroupNorm_30.out8_30.out7_1_30" + ], + "const_args": [ + "Sigmoid_23.weights10_25" + ], + "out_args": [ + "GroupNorm_30_sigmoid_out.8_30.out10_25" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_33-/up_blocks.0/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_30_sigmoid_out.8_30.out10_25" + ], + "const_args": [ + "NhwcConv_33_weight_NHWC" + ], + "out_args": [ + "NhwcConv_33_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_32_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36", + "NhwcConv_33_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.1/Add_1.out_12_1_57" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/Concat_2", + "type": "SDConcat", + "in_args": [ + "/up_blocks.0/resnets.1/Add_1.out_12_1_57", + "/Add_9_output_0_13_3.out_12_1_39" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/Concat_2_output_0_NHWC.out13_3" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_31", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.0/Concat_2_output_0_NHWC.out13_3" + ], + "const_args": [ + "GroupNorm_31_wts_7_1_31" + ], + "out_args": [ + "GroupNorm_31.out8_31.out7_1_31" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_34-/up_blocks.0/resnets.2/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.0/Concat_2_output_0_NHWC.out13_3" + ], + "const_args": [ + "NhwcConv_34_weight_NHWC" + ], + "out_args": [ + "NhwcConv_34_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_24", + "type": "SDSilu", + "in_args": [ + "GroupNorm_31.out8_31.out7_1_31" + ], + "const_args": [ + "Sigmoid_24.weights10_26" + ], + "out_args": [ + "GroupNorm_31_sigmoid_out.8_31.out10_26" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_31_sigmoid_out.8_31.out10_26" + ], + "const_args": [ + "up_blocks.0.resnets.2.conv1.weight" + ], + "out_args": [ + "/up_blocks.0/resnets.2/conv1/Conv_output_0_0_12.out0_1_40" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.0/resnets.2/conv1/Conv_output_0_0_12.out0_1_40", + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0_0_12.out2_0_12" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.2/Add.out_12_1_58" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_32", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.0/resnets.2/Add.out_12_1_58" + ], + "const_args": [ + "GroupNorm_32_wts_7_1_32" + ], + "out_args": [ + "GroupNorm_32.out8_32.out7_1_32" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_25", + "type": "SDSilu", + "in_args": [ + "GroupNorm_32.out8_32.out7_1_32" + ], + "const_args": [ + "Sigmoid_25.weights10_27" + ], + "out_args": [ + "GroupNorm_32_sigmoid_out.8_32.out10_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_35-/up_blocks.0/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_32_sigmoid_out.8_32.out10_27" + ], + "const_args": [ + "NhwcConv_35_weight_NHWC" + ], + "out_args": [ + "NhwcConv_35_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_34_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39", + "NhwcConv_35_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.2/Add_1.out_12_1_59" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/upsamplers.0/Resize", + "type": "SDResize", + "in_args": [ + "/up_blocks.0/resnets.2/Add_1.out_12_1_59" + ], + "const_args": [ + "/up_blocks.0/upsamplers.0/Resize.weights4_0" + ], + "out_args": [ + "/up_blocks.0/upsamplers.0/Resize.out_4_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_36-/up_blocks.0/upsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.0/upsamplers.0/Resize.out_4_0" + ], + "const_args": [ + "NhwcConv_36_weight_NHWC" + ], + "out_args": [ + "NhwcConv_36_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/Concat", + "type": "SDConcat", + "in_args": [ + "NhwcConv_36_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42", + "/Add_8_output_0_13_4.out_12_1_38" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/Concat_output_0_NHWC.out13_4" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_33", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/Concat_output_0_NHWC.out13_4" + ], + "const_args": [ + "GroupNorm_33_wts_7_1_33" + ], + "out_args": [ + "GroupNorm_33.out8_33.out7_1_33" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_37-/up_blocks.1/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/Concat_output_0_NHWC.out13_4" + ], + "const_args": [ + "NhwcConv_37_weight_NHWC" + ], + "out_args": [ + "NhwcConv_37_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_26", + "type": "SDSilu", + "in_args": [ + "GroupNorm_33.out8_33.out7_1_33" + ], + "const_args": [ + "Sigmoid_26.weights10_28" + ], + "out_args": [ + "GroupNorm_33_sigmoid_out.8_33.out10_28" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_33_sigmoid_out.8_33.out10_28" + ], + "const_args": [ + "up_blocks.1.resnets.0.conv1.weight" + ], + "out_args": [ + "/up_blocks.1/resnets.0/conv1/Conv_output_0_0_13.out0_1_44" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/resnets.0/conv1/Conv_output_0_0_13.out0_1_44", + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0_0_13.out2_0_13" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.0/Add.out_12_1_60" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_34", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/resnets.0/Add.out_12_1_60" + ], + "const_args": [ + "GroupNorm_34_wts_7_1_34" + ], + "out_args": [ + "GroupNorm_34.out8_34.out7_1_34" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_27", + "type": "SDSilu", + "in_args": [ + "GroupNorm_34.out8_34.out7_1_34" + ], + "const_args": [ + "Sigmoid_27.weights10_29" + ], + "out_args": [ + "GroupNorm_34_sigmoid_out.8_34.out10_29" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_38-/up_blocks.1/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_34_sigmoid_out.8_34.out10_29" + ], + "const_args": [ + "NhwcConv_38_weight_NHWC" + ], + "out_args": [ + "NhwcConv_38_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_37_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43", + "NhwcConv_38_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.0/Add_1.out_12_1_61" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_35", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/resnets.0/Add_1.out_12_1_61" + ], + "const_args": [ + "GroupNorm_35_wts_7_1_35" + ], + "out_args": [ + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_35" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_39-/up_blocks.1/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_35" + ], + "const_args": [ + "NhwcConv_39_weight_NHWC" + ], + "out_args": [ + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7" + ], + "const_args": [ + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_21" + ], + "const_args": [ + "onnx::MatMul_5729" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_60" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_21" + ], + "const_args": [ + "onnx::MatMul_5728" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_61" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_21" + ], + "const_args": [ + "onnx::MatMul_5730" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_62" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_14", + "type": "SDMHA", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_61", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_60", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_62" + ], + "const_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_14_mask.8_14" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14" + ], + "const_args": [ + "onnx::MatMul_5750" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30", + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_62" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_62" + ], + "const_args": [ + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_22" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_22" + ], + "const_args": [ + "onnx::MatMul_5751" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_63" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_15", + "type": "SDMHA", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_63", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15" + ], + "const_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_15_mask.8_15" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15" + ], + "const_args": [ + "onnx::MatMul_5773" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_62" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_63" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_63" + ], + "const_args": [ + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_23" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_7_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_23" + ], + "const_args": [ + "onnx::MatMul_5774_2_7_0" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_7_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_23" + ], + "const_args": [ + "onnx::MatMul_5774_2_7_1" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_8" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_8" + ], + "const_args": [ + "onnx::MatMul_5775" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_63" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_7" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_40-/up_blocks.1/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_7" + ], + "const_args": [ + "NhwcConv_40_weight_NHWC" + ], + "out_args": [ + "NhwcConv_40_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_40_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46", + "/up_blocks.1/resnets.0/Add_1.out_12_1_61" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/Add.out_12_1_64" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/Concat_1", + "type": "SDConcat", + "in_args": [ + "/up_blocks.1/attentions.0/Add.out_12_1_64", + "/Add_7_output_0_13_5.out_12_1_32" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/Concat_1_output_0_NHWC.out13_5" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_36", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/Concat_1_output_0_NHWC.out13_5" + ], + "const_args": [ + "GroupNorm_36_wts_7_1_36" + ], + "out_args": [ + "GroupNorm_36.out8_36.out7_1_36" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_41-/up_blocks.1/resnets.1/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/Concat_1_output_0_NHWC.out13_5" + ], + "const_args": [ + "NhwcConv_41_weight_NHWC" + ], + "out_args": [ + "NhwcConv_41_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_28", + "type": "SDSilu", + "in_args": [ + "GroupNorm_36.out8_36.out7_1_36" + ], + "const_args": [ + "Sigmoid_28.weights10_30" + ], + "out_args": [ + "GroupNorm_36_sigmoid_out.8_36.out10_30" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_36_sigmoid_out.8_36.out10_30" + ], + "const_args": [ + "up_blocks.1.resnets.1.conv1.weight" + ], + "out_args": [ + "/up_blocks.1/resnets.1/conv1/Conv_output_0_0_14.out0_1_48" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/resnets.1/conv1/Conv_output_0_0_14.out0_1_48", + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0_0_14.out2_0_14" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.1/Add.out_12_1_65" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_37", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/resnets.1/Add.out_12_1_65" + ], + "const_args": [ + "GroupNorm_37_wts_7_1_37" + ], + "out_args": [ + "GroupNorm_37.out8_37.out7_1_37" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_29", + "type": "SDSilu", + "in_args": [ + "GroupNorm_37.out8_37.out7_1_37" + ], + "const_args": [ + "Sigmoid_29.weights10_31" + ], + "out_args": [ + "GroupNorm_37_sigmoid_out.8_37.out10_31" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_42-/up_blocks.1/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_37_sigmoid_out.8_37.out10_31" + ], + "const_args": [ + "NhwcConv_42_weight_NHWC" + ], + "out_args": [ + "NhwcConv_42_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_41_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47", + "NhwcConv_42_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.1/Add_1.out_12_1_66" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_38", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/resnets.1/Add_1.out_12_1_66" + ], + "const_args": [ + "GroupNorm_38_wts_7_1_38" + ], + "out_args": [ + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_38" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_43-/up_blocks.1/attentions.1/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_38" + ], + "const_args": [ + "NhwcConv_43_weight_NHWC" + ], + "out_args": [ + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8" + ], + "const_args": [ + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_24" + ], + "const_args": [ + "onnx::MatMul_5792" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_64" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_24" + ], + "const_args": [ + "onnx::MatMul_5791" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_65" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_24" + ], + "const_args": [ + "onnx::MatMul_5793" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_66" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_16", + "type": "SDMHA", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_65", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_64", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_66" + ], + "const_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_16_mask.8_16" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16" + ], + "const_args": [ + "onnx::MatMul_5813" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34", + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_67" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_67" + ], + "const_args": [ + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_25" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_25" + ], + "const_args": [ + "onnx::MatMul_5814" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_67" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_17", + "type": "SDMHA", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_67", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17" + ], + "const_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_17_mask.8_17" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17" + ], + "const_args": [ + "onnx::MatMul_5836" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_67" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_68" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_68" + ], + "const_args": [ + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_26" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_8_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_26" + ], + "const_args": [ + "onnx::MatMul_5837_2_8_0" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_8_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_26" + ], + "const_args": [ + "onnx::MatMul_5837_2_8_1" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_9" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_9" + ], + "const_args": [ + "onnx::MatMul_5838" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_68" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_8" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_44-/up_blocks.1/attentions.1/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_8" + ], + "const_args": [ + "NhwcConv_44_weight_NHWC" + ], + "out_args": [ + "NhwcConv_44_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_44_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50", + "/up_blocks.1/resnets.1/Add_1.out_12_1_66" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/Add.out_12_1_69" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/Concat_2", + "type": "SDConcat", + "in_args": [ + "/up_blocks.1/attentions.1/Add.out_12_1_69", + "/Add_6_output_0_13_6.out_12_1_26" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/Concat_2_output_0_NHWC.out13_6" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_39", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/Concat_2_output_0_NHWC.out13_6" + ], + "const_args": [ + "GroupNorm_39_wts_7_1_39" + ], + "out_args": [ + "GroupNorm_39.out8_39.out7_1_39" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "3840" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_45-/up_blocks.1/resnets.2/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/Concat_2_output_0_NHWC.out13_6" + ], + "const_args": [ + "NhwcConv_45_weight_NHWC" + ], + "out_args": [ + "NhwcConv_45_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_30", + "type": "SDSilu", + "in_args": [ + "GroupNorm_39.out8_39.out7_1_39" + ], + "const_args": [ + "Sigmoid_30.weights10_32" + ], + "out_args": [ + "GroupNorm_39_sigmoid_out.8_39.out10_32" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_39_sigmoid_out.8_39.out10_32" + ], + "const_args": [ + "up_blocks.1.resnets.2.conv1.weight" + ], + "out_args": [ + "/up_blocks.1/resnets.2/conv1/Conv_output_0_0_15.out0_1_52" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/resnets.2/conv1/Conv_output_0_0_15.out0_1_52", + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0_0_15.out2_0_15" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.2/Add.out_12_1_70" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_40", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/resnets.2/Add.out_12_1_70" + ], + "const_args": [ + "GroupNorm_40_wts_7_1_40" + ], + "out_args": [ + "GroupNorm_40.out8_40.out7_1_40" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_31", + "type": "SDSilu", + "in_args": [ + "GroupNorm_40.out8_40.out7_1_40" + ], + "const_args": [ + "Sigmoid_31.weights10_33" + ], + "out_args": [ + "GroupNorm_40_sigmoid_out.8_40.out10_33" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_46-/up_blocks.1/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_40_sigmoid_out.8_40.out10_33" + ], + "const_args": [ + "NhwcConv_46_weight_NHWC" + ], + "out_args": [ + "NhwcConv_46_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_45_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51", + "NhwcConv_46_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.2/Add_1.out_12_1_71" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_41", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.1/resnets.2/Add_1.out_12_1_71" + ], + "const_args": [ + "GroupNorm_41_wts_7_1_41" + ], + "out_args": [ + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out7_1_41" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_47-/up_blocks.1/attentions.2/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out7_1_41" + ], + "const_args": [ + "NhwcConv_47_weight_NHWC" + ], + "out_args": [ + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9" + ], + "const_args": [ + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_27" + ], + "const_args": [ + "onnx::MatMul_5855" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_68" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_27" + ], + "const_args": [ + "onnx::MatMul_5854" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_69" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_27" + ], + "const_args": [ + "onnx::MatMul_5856" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_70" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_18", + "type": "SDMHA", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_69", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_68", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_70" + ], + "const_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_18_mask.8_18" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18" + ], + "const_args": [ + "onnx::MatMul_5876" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38", + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_72" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_72" + ], + "const_args": [ + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_28" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_28" + ], + "const_args": [ + "onnx::MatMul_5877" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_71" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_19", + "type": "SDMHA", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_71", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19" + ], + "const_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_19_mask.8_19" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19" + ], + "const_args": [ + "onnx::MatMul_5899" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_72" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_73" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_73" + ], + "const_args": [ + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_29" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul_2_9_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_29" + ], + "const_args": [ + "onnx::MatMul_5900_2_9_0" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul_2_9_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_29" + ], + "const_args": [ + "onnx::MatMul_5900_2_9_1" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_10" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_10" + ], + "const_args": [ + "onnx::MatMul_5901" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_73" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_12_0_9" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_48-/up_blocks.1/attentions.2/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_12_0_9" + ], + "const_args": [ + "NhwcConv_48_weight_NHWC" + ], + "out_args": [ + "NhwcConv_48_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_48_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54", + "/up_blocks.1/resnets.2/Add_1.out_12_1_71" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/Add.out_12_1_74" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/upsamplers.0/Resize", + "type": "SDResize", + "in_args": [ + "/up_blocks.1/attentions.2/Add.out_12_1_74" + ], + "const_args": [ + "/up_blocks.1/upsamplers.0/Resize.weights4_1" + ], + "out_args": [ + "/up_blocks.1/upsamplers.0/Resize.out_4_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_49-/up_blocks.1/upsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.1/upsamplers.0/Resize.out_4_1" + ], + "const_args": [ + "NhwcConv_49_weight_NHWC" + ], + "out_args": [ + "NhwcConv_49_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/Concat", + "type": "SDConcat", + "in_args": [ + "NhwcConv_49_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55", + "/Add_5_output_0_13_7.out_12_1_25" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/Concat_output_0_NHWC.out13_7" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_42", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/Concat_output_0_NHWC.out13_7" + ], + "const_args": [ + "GroupNorm_42_wts_7_1_42" + ], + "out_args": [ + "GroupNorm_42.out8_42.out7_1_42" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "3840" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_50-/up_blocks.2/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/Concat_output_0_NHWC.out13_7" + ], + "const_args": [ + "NhwcConv_50_weight_NHWC" + ], + "out_args": [ + "NhwcConv_50_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_32", + "type": "SDSilu", + "in_args": [ + "GroupNorm_42.out8_42.out7_1_42" + ], + "const_args": [ + "Sigmoid_32.weights10_34" + ], + "out_args": [ + "GroupNorm_42_sigmoid_out.8_42.out10_34" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_42_sigmoid_out.8_42.out10_34" + ], + "const_args": [ + "up_blocks.2.resnets.0.conv1.weight" + ], + "out_args": [ + "/up_blocks.2/resnets.0/conv1/Conv_output_0_0_16.out0_1_57" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/resnets.0/conv1/Conv_output_0_0_16.out0_1_57", + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0_0_16.out2_0_16" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.0/Add.out_12_1_75" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_43", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/resnets.0/Add.out_12_1_75" + ], + "const_args": [ + "GroupNorm_43_wts_7_1_43" + ], + "out_args": [ + "GroupNorm_43.out8_43.out7_1_43" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_33", + "type": "SDSilu", + "in_args": [ + "GroupNorm_43.out8_43.out7_1_43" + ], + "const_args": [ + "Sigmoid_33.weights10_35" + ], + "out_args": [ + "GroupNorm_43_sigmoid_out.8_43.out10_35" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_51-/up_blocks.2/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_43_sigmoid_out.8_43.out10_35" + ], + "const_args": [ + "NhwcConv_51_weight_NHWC" + ], + "out_args": [ + "NhwcConv_51_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_50_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56", + "NhwcConv_51_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.0/Add_1.out_12_1_76" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_44", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/resnets.0/Add_1.out_12_1_76" + ], + "const_args": [ + "GroupNorm_44_wts_7_1_44" + ], + "out_args": [ + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_44" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_52-/up_blocks.2/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_44" + ], + "const_args": [ + "NhwcConv_52_weight_NHWC" + ], + "out_args": [ + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10" + ], + "const_args": [ + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_30" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_30" + ], + "const_args": [ + "onnx::MatMul_5919" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_72" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_30" + ], + "const_args": [ + "onnx::MatMul_5918" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_73" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_30" + ], + "const_args": [ + "onnx::MatMul_5920" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_74" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_20", + "type": "SDMHA", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_73", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_72", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_74" + ], + "const_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_20_mask.8_20" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "1024" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20" + ], + "const_args": [ + "onnx::MatMul_5940" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42", + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_77" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_77" + ], + "const_args": [ + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_31" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_31" + ], + "const_args": [ + "onnx::MatMul_5941" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_75" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_21", + "type": "SDMHA", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_75", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21" + ], + "const_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_21_mask.8_21" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21" + ], + "const_args": [ + "onnx::MatMul_5963" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_77" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_78" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_78" + ], + "const_args": [ + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_32" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_10_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_32" + ], + "const_args": [ + "onnx::MatMul_5964_2_10_0" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_10_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_32" + ], + "const_args": [ + "onnx::MatMul_5964_2_10_1" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_11" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_11" + ], + "const_args": [ + "onnx::MatMul_5965" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_78" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_10" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_53-/up_blocks.2/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_10" + ], + "const_args": [ + "NhwcConv_53_weight_NHWC" + ], + "out_args": [ + "NhwcConv_53_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_53_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59", + "/up_blocks.2/resnets.0/Add_1.out_12_1_76" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/Add.out_12_1_79" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/Concat_1", + "type": "SDConcat", + "in_args": [ + "/up_blocks.2/attentions.0/Add.out_12_1_79", + "/Add_4_output_0_13_8.out_12_1_19" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/Concat_1_output_0_NHWC.out13_8" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_45", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/Concat_1_output_0_NHWC.out13_8" + ], + "const_args": [ + "GroupNorm_45_wts_7_1_45" + ], + "out_args": [ + "GroupNorm_45.out8_45.out7_1_45" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_54-/up_blocks.2/resnets.1/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/Concat_1_output_0_NHWC.out13_8" + ], + "const_args": [ + "NhwcConv_54_weight_NHWC" + ], + "out_args": [ + "NhwcConv_54_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_34", + "type": "SDSilu", + "in_args": [ + "GroupNorm_45.out8_45.out7_1_45" + ], + "const_args": [ + "Sigmoid_34.weights10_36" + ], + "out_args": [ + "GroupNorm_45_sigmoid_out.8_45.out10_36" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_45_sigmoid_out.8_45.out10_36" + ], + "const_args": [ + "up_blocks.2.resnets.1.conv1.weight" + ], + "out_args": [ + "/up_blocks.2/resnets.1/conv1/Conv_output_0_0_17.out0_1_61" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/resnets.1/conv1/Conv_output_0_0_17.out0_1_61", + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0_0_17.out2_0_17" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.1/Add.out_12_1_80" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_46", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/resnets.1/Add.out_12_1_80" + ], + "const_args": [ + "GroupNorm_46_wts_7_1_46" + ], + "out_args": [ + "GroupNorm_46.out8_46.out7_1_46" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_35", + "type": "SDSilu", + "in_args": [ + "GroupNorm_46.out8_46.out7_1_46" + ], + "const_args": [ + "Sigmoid_35.weights10_37" + ], + "out_args": [ + "GroupNorm_46_sigmoid_out.8_46.out10_37" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_55-/up_blocks.2/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_46_sigmoid_out.8_46.out10_37" + ], + "const_args": [ + "NhwcConv_55_weight_NHWC" + ], + "out_args": [ + "NhwcConv_55_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_54_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60", + "NhwcConv_55_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.1/Add_1.out_12_1_81" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_47", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/resnets.1/Add_1.out_12_1_81" + ], + "const_args": [ + "GroupNorm_47_wts_7_1_47" + ], + "out_args": [ + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_47" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_56-/up_blocks.2/attentions.1/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_47" + ], + "const_args": [ + "NhwcConv_56_weight_NHWC" + ], + "out_args": [ + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11" + ], + "const_args": [ + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_33" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_33" + ], + "const_args": [ + "onnx::MatMul_5982" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_76" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_33" + ], + "const_args": [ + "onnx::MatMul_5981" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_77" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_33" + ], + "const_args": [ + "onnx::MatMul_5983" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_78" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_22", + "type": "SDMHA", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_77", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_76", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_78" + ], + "const_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_22_mask.8_22" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "1024" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22" + ], + "const_args": [ + "onnx::MatMul_6003" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46", + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_82" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_82" + ], + "const_args": [ + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_34" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_34" + ], + "const_args": [ + "onnx::MatMul_6004" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_79" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_23", + "type": "SDMHA", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_79", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23" + ], + "const_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_23_mask.8_23" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23" + ], + "const_args": [ + "onnx::MatMul_6026" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_82" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_83" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_83" + ], + "const_args": [ + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_35" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_11_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_35" + ], + "const_args": [ + "onnx::MatMul_6027_2_11_0" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_11_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_35" + ], + "const_args": [ + "onnx::MatMul_6027_2_11_1" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_12" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_12" + ], + "const_args": [ + "onnx::MatMul_6028" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_83" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_11" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_57-/up_blocks.2/attentions.1/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_11" + ], + "const_args": [ + "NhwcConv_57_weight_NHWC" + ], + "out_args": [ + "NhwcConv_57_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_57_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63", + "/up_blocks.2/resnets.1/Add_1.out_12_1_81" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/Add.out_12_1_84" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/Concat_2", + "type": "SDConcat", + "in_args": [ + "/up_blocks.2/attentions.1/Add.out_12_1_84", + "/Add_3_output_0_13_9.out_12_1_13" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/Concat_2_output_0_NHWC.out13_9" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_48", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/Concat_2_output_0_NHWC.out13_9" + ], + "const_args": [ + "GroupNorm_48_wts_7_1_48" + ], + "out_args": [ + "GroupNorm_48.out8_48.out7_1_48" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_58-/up_blocks.2/resnets.2/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/Concat_2_output_0_NHWC.out13_9" + ], + "const_args": [ + "NhwcConv_58_weight_NHWC" + ], + "out_args": [ + "NhwcConv_58_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_36", + "type": "SDSilu", + "in_args": [ + "GroupNorm_48.out8_48.out7_1_48" + ], + "const_args": [ + "Sigmoid_36.weights10_38" + ], + "out_args": [ + "GroupNorm_48_sigmoid_out.8_48.out10_38" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_48_sigmoid_out.8_48.out10_38" + ], + "const_args": [ + "up_blocks.2.resnets.2.conv1.weight" + ], + "out_args": [ + "/up_blocks.2/resnets.2/conv1/Conv_output_0_0_18.out0_1_65" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/resnets.2/conv1/Conv_output_0_0_18.out0_1_65", + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0_0_18.out2_0_18" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.2/Add.out_12_1_85" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_49", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/resnets.2/Add.out_12_1_85" + ], + "const_args": [ + "GroupNorm_49_wts_7_1_49" + ], + "out_args": [ + "GroupNorm_49.out8_49.out7_1_49" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_37", + "type": "SDSilu", + "in_args": [ + "GroupNorm_49.out8_49.out7_1_49" + ], + "const_args": [ + "Sigmoid_37.weights10_39" + ], + "out_args": [ + "GroupNorm_49_sigmoid_out.8_49.out10_39" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_59-/up_blocks.2/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_49_sigmoid_out.8_49.out10_39" + ], + "const_args": [ + "NhwcConv_59_weight_NHWC" + ], + "out_args": [ + "NhwcConv_59_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_58_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64", + "NhwcConv_59_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.2/Add_1.out_12_1_86" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_50", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.2/resnets.2/Add_1.out_12_1_86" + ], + "const_args": [ + "GroupNorm_50_wts_7_1_50" + ], + "out_args": [ + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out7_1_50" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_60-/up_blocks.2/attentions.2/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out7_1_50" + ], + "const_args": [ + "NhwcConv_60_weight_NHWC" + ], + "out_args": [ + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12" + ], + "const_args": [ + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_36" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_36" + ], + "const_args": [ + "onnx::MatMul_6045" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_80" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_36" + ], + "const_args": [ + "onnx::MatMul_6044" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_81" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_36" + ], + "const_args": [ + "onnx::MatMul_6046" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_82" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_24", + "type": "SDMHA", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_81", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_80", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_82" + ], + "const_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_24_mask.8_24" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "1024" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24" + ], + "const_args": [ + "onnx::MatMul_6066" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50", + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_87" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_87" + ], + "const_args": [ + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_37" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_37" + ], + "const_args": [ + "onnx::MatMul_6067" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_83" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_25", + "type": "SDMHA", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_83", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25" + ], + "const_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_25_mask.8_25" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25" + ], + "const_args": [ + "onnx::MatMul_6089" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_87" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_88" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_88" + ], + "const_args": [ + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_38" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul_2_12_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_38" + ], + "const_args": [ + "onnx::MatMul_6090_2_12_0" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul_2_12_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_38" + ], + "const_args": [ + "onnx::MatMul_6090_2_12_1" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_13" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_13" + ], + "const_args": [ + "onnx::MatMul_6091" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_88" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_12_0_12" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_61-/up_blocks.2/attentions.2/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_12_0_12" + ], + "const_args": [ + "NhwcConv_61_weight_NHWC" + ], + "out_args": [ + "NhwcConv_61_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_61_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67", + "/up_blocks.2/resnets.2/Add_1.out_12_1_86" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/Add.out_12_1_89" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/upsamplers.0/Resize", + "type": "SDResize", + "in_args": [ + "/up_blocks.2/attentions.2/Add.out_12_1_89" + ], + "const_args": [ + "/up_blocks.2/upsamplers.0/Resize.weights4_2" + ], + "out_args": [ + "/up_blocks.2/upsamplers.0/Resize.out_4_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_62-/up_blocks.2/upsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.2/upsamplers.0/Resize.out_4_2" + ], + "const_args": [ + "NhwcConv_62_weight_NHWC" + ], + "out_args": [ + "NhwcConv_62_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/Concat", + "type": "SDConcat", + "in_args": [ + "NhwcConv_62_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68", + "/Add_2_output_0_13_10.out_12_1_12" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/Concat_output_0_NHWC.out13_10" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_51", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/Concat_output_0_NHWC.out13_10" + ], + "const_args": [ + "GroupNorm_51_wts_7_1_51" + ], + "out_args": [ + "GroupNorm_51.out8_51.out7_1_51" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_63-/up_blocks.3/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/Concat_output_0_NHWC.out13_10" + ], + "const_args": [ + "NhwcConv_63_weight_NHWC" + ], + "out_args": [ + "NhwcConv_63_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_38", + "type": "SDSilu", + "in_args": [ + "GroupNorm_51.out8_51.out7_1_51" + ], + "const_args": [ + "Sigmoid_38.weights10_40" + ], + "out_args": [ + "GroupNorm_51_sigmoid_out.8_51.out10_40" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_51_sigmoid_out.8_51.out10_40" + ], + "const_args": [ + "up_blocks.3.resnets.0.conv1.weight" + ], + "out_args": [ + "/up_blocks.3/resnets.0/conv1/Conv_output_0_0_19.out0_1_70" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/resnets.0/conv1/Conv_output_0_0_19.out0_1_70", + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0_0_19.out2_0_19" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.0/Add.out_12_1_90" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_52", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/resnets.0/Add.out_12_1_90" + ], + "const_args": [ + "GroupNorm_52_wts_7_1_52" + ], + "out_args": [ + "GroupNorm_52.out8_52.out7_1_52" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_39", + "type": "SDSilu", + "in_args": [ + "GroupNorm_52.out8_52.out7_1_52" + ], + "const_args": [ + "Sigmoid_39.weights10_41" + ], + "out_args": [ + "GroupNorm_52_sigmoid_out.8_52.out10_41" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_64-/up_blocks.3/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_52_sigmoid_out.8_52.out10_41" + ], + "const_args": [ + "NhwcConv_64_weight_NHWC" + ], + "out_args": [ + "NhwcConv_64_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_63_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69", + "NhwcConv_64_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.0/Add_1.out_12_1_91" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_53", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/resnets.0/Add_1.out_12_1_91" + ], + "const_args": [ + "GroupNorm_53_wts_7_1_53" + ], + "out_args": [ + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out7_1_53" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_65-/up_blocks.3/attentions.0/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out7_1_53" + ], + "const_args": [ + "NhwcConv_65_weight_NHWC" + ], + "out_args": [ + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13" + ], + "const_args": [ + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_39" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_39" + ], + "const_args": [ + "onnx::MatMul_6109" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_84" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_39" + ], + "const_args": [ + "onnx::MatMul_6108" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_85" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_39" + ], + "const_args": [ + "onnx::MatMul_6110" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_86" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_26", + "type": "SDMHA", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_85", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_84", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_86" + ], + "const_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_26_mask.8_26" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "4096" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26" + ], + "const_args": [ + "onnx::MatMul_6130" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54", + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_92" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_92" + ], + "const_args": [ + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_40" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_40" + ], + "const_args": [ + "onnx::MatMul_6131" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_87" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_27", + "type": "SDMHA", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_87", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27" + ], + "const_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_27_mask.8_27" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27" + ], + "const_args": [ + "onnx::MatMul_6153" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_92" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_93" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_93" + ], + "const_args": [ + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_41" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_13_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_41" + ], + "const_args": [ + "onnx::MatMul_6154_2_13_0" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul_2_13_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_41" + ], + "const_args": [ + "onnx::MatMul_6154_2_13_1" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_14" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_14" + ], + "const_args": [ + "onnx::MatMul_6155" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_93" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_12_0_13" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_66-/up_blocks.3/attentions.0/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_12_0_13" + ], + "const_args": [ + "NhwcConv_66_weight_NHWC" + ], + "out_args": [ + "NhwcConv_66_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_66_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72", + "/up_blocks.3/resnets.0/Add_1.out_12_1_91" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/Add.out_12_1_94" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/Concat_1", + "type": "SDConcat", + "in_args": [ + "/up_blocks.3/attentions.0/Add.out_12_1_94", + "/Add_1_output_0_13_11.out_12_1_6" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/Concat_1_output_0_NHWC.out13_11" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_54", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/Concat_1_output_0_NHWC.out13_11" + ], + "const_args": [ + "GroupNorm_54_wts_7_1_54" + ], + "out_args": [ + "GroupNorm_54.out8_54.out7_1_54" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_67-/up_blocks.3/resnets.1/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/Concat_1_output_0_NHWC.out13_11" + ], + "const_args": [ + "NhwcConv_67_weight_NHWC" + ], + "out_args": [ + "NhwcConv_67_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_40", + "type": "SDSilu", + "in_args": [ + "GroupNorm_54.out8_54.out7_1_54" + ], + "const_args": [ + "Sigmoid_40.weights10_42" + ], + "out_args": [ + "GroupNorm_54_sigmoid_out.8_54.out10_42" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_54_sigmoid_out.8_54.out10_42" + ], + "const_args": [ + "up_blocks.3.resnets.1.conv1.weight" + ], + "out_args": [ + "/up_blocks.3/resnets.1/conv1/Conv_output_0_0_20.out0_1_74" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/resnets.1/conv1/Conv_output_0_0_20.out0_1_74", + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0_0_20.out2_0_20" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.1/Add.out_12_1_95" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_55", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/resnets.1/Add.out_12_1_95" + ], + "const_args": [ + "GroupNorm_55_wts_7_1_55" + ], + "out_args": [ + "GroupNorm_55.out8_55.out7_1_55" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_41", + "type": "SDSilu", + "in_args": [ + "GroupNorm_55.out8_55.out7_1_55" + ], + "const_args": [ + "Sigmoid_41.weights10_43" + ], + "out_args": [ + "GroupNorm_55_sigmoid_out.8_55.out10_43" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_68-/up_blocks.3/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_55_sigmoid_out.8_55.out10_43" + ], + "const_args": [ + "NhwcConv_68_weight_NHWC" + ], + "out_args": [ + "NhwcConv_68_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_67_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73", + "NhwcConv_68_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.1/Add_1.out_12_1_96" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_56", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/resnets.1/Add_1.out_12_1_96" + ], + "const_args": [ + "GroupNorm_56_wts_7_1_56" + ], + "out_args": [ + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out7_1_56" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_69-/up_blocks.3/attentions.1/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out7_1_56" + ], + "const_args": [ + "NhwcConv_69_weight_NHWC" + ], + "out_args": [ + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14" + ], + "const_args": [ + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_42" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_42" + ], + "const_args": [ + "onnx::MatMul_6172" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_88" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_42" + ], + "const_args": [ + "onnx::MatMul_6171" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_89" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_42" + ], + "const_args": [ + "onnx::MatMul_6173" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_90" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_28", + "type": "SDMHA", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_89", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_88", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_90" + ], + "const_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_28_mask.8_28" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "4096" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28" + ], + "const_args": [ + "onnx::MatMul_6193" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58", + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_97" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_97" + ], + "const_args": [ + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_43" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_43" + ], + "const_args": [ + "onnx::MatMul_6194" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_91" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_29", + "type": "SDMHA", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_91", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29" + ], + "const_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_29_mask.8_29" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29" + ], + "const_args": [ + "onnx::MatMul_6216" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_97" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_98" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_98" + ], + "const_args": [ + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_44" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_14_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_44" + ], + "const_args": [ + "onnx::MatMul_6217_2_14_0" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul_2_14_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_44" + ], + "const_args": [ + "onnx::MatMul_6217_2_14_1" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_15" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_15" + ], + "const_args": [ + "onnx::MatMul_6218" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_98" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_12_0_14" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_70-/up_blocks.3/attentions.1/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_12_0_14" + ], + "const_args": [ + "NhwcConv_70_weight_NHWC" + ], + "out_args": [ + "NhwcConv_70_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_70_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76", + "/up_blocks.3/resnets.1/Add_1.out_12_1_96" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/Add.out_12_1_99" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/Concat_2", + "type": "SDConcat", + "in_args": [ + "/up_blocks.3/attentions.1/Add.out_12_1_99", + "/Add_output_0_13_12.out_12_1_0" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/Concat_2_output_0_NHWC.out13_12" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_57", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/Concat_2_output_0_NHWC.out13_12" + ], + "const_args": [ + "GroupNorm_57_wts_7_1_57" + ], + "out_args": [ + "GroupNorm_57.out8_57.out7_1_57" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_71-/up_blocks.3/resnets.2/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/Concat_2_output_0_NHWC.out13_12" + ], + "const_args": [ + "NhwcConv_71_weight_NHWC" + ], + "out_args": [ + "NhwcConv_71_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_42", + "type": "SDSilu", + "in_args": [ + "GroupNorm_57.out8_57.out7_1_57" + ], + "const_args": [ + "Sigmoid_42.weights10_44" + ], + "out_args": [ + "GroupNorm_57_sigmoid_out.8_57.out10_44" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_57_sigmoid_out.8_57.out10_44" + ], + "const_args": [ + "up_blocks.3.resnets.2.conv1.weight" + ], + "out_args": [ + "/up_blocks.3/resnets.2/conv1/Conv_output_0_0_21.out0_1_78" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/resnets.2/conv1/Conv_output_0_0_21.out0_1_78", + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0_0_21.out2_0_21" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.2/Add.out_12_1_100" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_58", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/resnets.2/Add.out_12_1_100" + ], + "const_args": [ + "GroupNorm_58_wts_7_1_58" + ], + "out_args": [ + "GroupNorm_58.out8_58.out7_1_58" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_43", + "type": "SDSilu", + "in_args": [ + "GroupNorm_58.out8_58.out7_1_58" + ], + "const_args": [ + "Sigmoid_43.weights10_45" + ], + "out_args": [ + "GroupNorm_58_sigmoid_out.8_58.out10_45" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_72-/up_blocks.3/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_58_sigmoid_out.8_58.out10_45" + ], + "const_args": [ + "NhwcConv_72_weight_NHWC" + ], + "out_args": [ + "NhwcConv_72_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/Add_1", + "type": "SDAdd", + "in_args": [ + "NhwcConv_71_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77", + "NhwcConv_72_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.2/Add_1.out_12_1_101" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_59", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/resnets.2/Add_1.out_12_1_101" + ], + "const_args": [ + "GroupNorm_59_wts_7_1_59" + ], + "out_args": [ + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out7_1_59" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_73-/up_blocks.3/attentions.2/proj_in/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out7_1_59" + ], + "const_args": [ + "NhwcConv_73_weight_NHWC" + ], + "out_args": [ + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15" + ], + "const_args": [ + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_45" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_45" + ], + "const_args": [ + "onnx::MatMul_6235" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_92" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_45" + ], + "const_args": [ + "onnx::MatMul_6234" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_93" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_45" + ], + "const_args": [ + "onnx::MatMul_6236" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_94" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_30", + "type": "SDMHA", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_93", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_92", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_94" + ], + "const_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_30_mask.8_30" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "4096" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30" + ], + "const_args": [ + "onnx::MatMul_6256" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62", + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_102" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_102" + ], + "const_args": [ + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_46" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_46" + ], + "const_args": [ + "onnx::MatMul_6257" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_95" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_31", + "type": "SDMHA", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_95", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31" + ], + "const_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_31_mask.8_31" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31" + ], + "const_args": [ + "onnx::MatMul_6279" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_102" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_103" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_103" + ], + "const_args": [ + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_47" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul_2_15_0", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_47" + ], + "const_args": [ + "onnx::MatMul_6280_2_15_0" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul_2_15_1", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_47" + ], + "const_args": [ + "onnx::MatMul_6280_2_15_1" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_16" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/MatMul", + "type": "SDGemm", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_16" + ], + "const_args": [ + "onnx::MatMul_6281" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add_2", + "type": "SDAdd", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_103" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_12_0_15" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_74-/up_blocks.3/attentions.2/proj_out/Conv", + "type": "SDConv", + "in_args": [ + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_12_0_15" + ], + "const_args": [ + "NhwcConv_74_weight_NHWC" + ], + "out_args": [ + "NhwcConv_74_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_74_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80", + "/up_blocks.3/resnets.2/Add_1.out_12_1_101" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/Add.out_12_1_104" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_60", + "type": "SDGroupNorm", + "in_args": [ + "/up_blocks.3/attentions.2/Add.out_12_1_104" + ], + "const_args": [ + "GroupNorm_60_wts_7_1_60" + ], + "out_args": [ + "GroupNorm_60.out8_60.out7_1_60" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_44", + "type": "SDSilu", + "in_args": [ + "GroupNorm_60.out8_60.out7_1_60" + ], + "const_args": [ + "Sigmoid_44.weights10_46" + ], + "out_args": [ + "GroupNorm_60_sigmoid_out.8_60.out10_46" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_75-/conv_out/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_60_sigmoid_out.8_60.out10_46" + ], + "const_args": [ + "NhwcConv_75_weight_NHWC" + ], + "out_args": [ + "NhwcConv_75_out-noise_pred.out0_1_81" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "4" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "4", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + } + ], + "fused_tensors": { + "in": { + "buffer_size": 34505984, + "xrt_arg_id": 0, + "packed_tensors": [ + "encoder_hidden_states.out2_6_0", + "Transpose_0_out-sample.out0_1_0", + "class_labels_13_12_trans.out_12_1_0", + "/time_proj/Concat_1_output_0.out2_3_0", + "timestep_cond_13_11_trans.out_12_1_6", + "attention_mask_13_10_trans.out_12_1_12", + "cross_attention_kwargs_13_9_trans.out_12_1_13", + "added_cond_kwargs_13_8_trans.out_12_1_19", + "down_block_additional_residuals_13_7_trans.out_12_1_25", + "mid_block_additional_residual_13_6_trans.out_12_1_26", + "onnx::Add_10_13_5_trans.out_12_1_32", + "onnx::Add_11_13_4_trans.out_12_1_38", + "onnx::Add_12_13_3_trans.out_12_1_39", + "onnx::Add_13_13_2_trans.out_12_1_42", + "onnx::Add_14_13_1_trans.out_12_1_45", + "onnx::Add_15_13_0_trans.out_12_1_53" + ] + }, + "out": { + "buffer_size": 65536, + "xrt_arg_id": 1, + "packed_tensors": [ + "NhwcConv_75_out-noise_pred.out0_1_81" + ] + }, + "scratch": { + "buffer_size": 2064636160, + "xrt_arg_id": 2, + "packed_tensors": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31", + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0", + "/Add_output_0_13_12.out_12_1_0", + "GroupNorm_0.out8_0.out7_1_0", + "GroupNorm_0_sigmoid_out.8_0.out10_0", + "/down_blocks.0/resnets.0/conv1/Conv_output_0_0_0.out0_1_1", + "/time_embedding/linear_1/Gemm_output_0.out2_3_0", + "/time_embedding/act/Sigmoid_output_0.out10_1", + "/time_embedding/linear_2/Gemm_output_0.out2_3_1", + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2", + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0_0_0.out2_0_0", + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0_0_1.out2_0_1", + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0_0_2.out2_0_2", + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0_0_3.out2_0_3", + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0_0_4.out2_0_4", + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0_0_5.out2_0_5", + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0_0_6.out2_0_6", + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0_0_7.out2_0_7", + "/mid_block/resnets.0/Unsqueeze_1_output_0_0_8.out2_0_8", + "/mid_block/resnets.1/Unsqueeze_1_output_0_0_9.out2_0_9", + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0_0_10.out2_0_10", + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0_0_11.out2_0_11", + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0_0_12.out2_0_12", + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0_0_13.out2_0_13", + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0_0_14.out2_0_14", + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0_0_15.out2_0_15", + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0_0_16.out2_0_16", + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0_0_17.out2_0_17", + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0_0_18.out2_0_18", + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0_0_19.out2_0_19", + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0_0_20.out2_0_20", + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0_0_21.out2_0_21", + "/down_blocks.0/resnets.0/Add.out_12_1_1", + "GroupNorm_1.out8_1.out7_1_1", + "GroupNorm_1_sigmoid_out.8_1.out10_3", + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2", + "/down_blocks.0/resnets.0/Add_1.out_12_1_2", + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out7_1_2", + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_32", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_33", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_34", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_3", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_1", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_4", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_2", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_1", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5", + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_12_0_0", + "NhwcConv_3_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3", + "/down_blocks.0/attentions.0/Add.out_12_1_5", + "GroupNorm_3.out8_3.out7_1_3", + "GroupNorm_3_sigmoid_out.8_3.out10_4", + "/Add_1_output_0_13_11.out_12_1_6", + "/down_blocks.0/resnets.1/conv1/Conv_output_0_0_1.out0_1_4", + "/down_blocks.0/resnets.1/Add.out_12_1_7", + "GroupNorm_4.out8_4.out7_1_4", + "GroupNorm_4_sigmoid_out.8_4.out10_5", + "NhwcConv_4_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5", + "/down_blocks.0/resnets.1/Add_1.out_12_1_8", + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out7_1_5", + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_3", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_36", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_37", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_38", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_9", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_4", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_10", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_5", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_2", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9", + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_12_0_1", + "NhwcConv_6_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6", + "/down_blocks.0/attentions.1/Add.out_12_1_11", + "NhwcConv_7_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7", + "NhwcConv_8_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8", + "/Add_2_output_0_13_10.out_12_1_12", + "/Add_3_output_0_13_9.out_12_1_13", + "GroupNorm_6.out8_6.out7_1_6", + "GroupNorm_6_sigmoid_out.8_6.out10_6", + "/down_blocks.1/resnets.0/conv1/Conv_output_0_0_2.out0_1_9", + "/down_blocks.1/resnets.0/Add.out_12_1_14", + "GroupNorm_7.out8_7.out7_1_7", + "GroupNorm_7_sigmoid_out.8_7.out10_7", + "NhwcConv_9_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10", + "/down_blocks.1/resnets.0/Add_1.out_12_1_15", + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_8", + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_6", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_40", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_41", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_42", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_16", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_7", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_17", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_8", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_3", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13", + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_2", + "NhwcConv_11_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11", + "/down_blocks.1/attentions.0/Add.out_12_1_18", + "GroupNorm_9.out8_9.out7_1_9", + "GroupNorm_9_sigmoid_out.8_9.out10_8", + "/Add_4_output_0_13_8.out_12_1_19", + "/down_blocks.1/resnets.1/conv1/Conv_output_0_0_3.out0_1_12", + "/down_blocks.1/resnets.1/Add.out_12_1_20", + "GroupNorm_10.out8_10.out7_1_10", + "GroupNorm_10_sigmoid_out.8_10.out10_9", + "NhwcConv_12_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13", + "/down_blocks.1/resnets.1/Add_1.out_12_1_21", + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_11", + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_9", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_44", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_45", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_46", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_22", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_10", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_23", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_11", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_4", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17", + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_3", + "NhwcConv_14_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14", + "/down_blocks.1/attentions.1/Add.out_12_1_24", + "NhwcConv_15_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15", + "NhwcConv_16_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16", + "/Add_5_output_0_13_7.out_12_1_25", + "/Add_6_output_0_13_6.out_12_1_26", + "GroupNorm_12.out8_12.out7_1_12", + "GroupNorm_12_sigmoid_out.8_12.out10_10", + "/down_blocks.2/resnets.0/conv1/Conv_output_0_0_4.out0_1_17", + "/down_blocks.2/resnets.0/Add.out_12_1_27", + "GroupNorm_13.out8_13.out7_1_13", + "GroupNorm_13_sigmoid_out.8_13.out10_11", + "NhwcConv_17_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18", + "/down_blocks.2/resnets.0/Add_1.out_12_1_28", + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_14", + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_12", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_48", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_49", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_50", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_29", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_13", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_51", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_30", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_14", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_5", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21", + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_4", + "NhwcConv_19_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19", + "/down_blocks.2/attentions.0/Add.out_12_1_31", + "GroupNorm_15.out8_15.out7_1_15", + "GroupNorm_15_sigmoid_out.8_15.out10_12", + "/Add_7_output_0_13_5.out_12_1_32", + "/down_blocks.2/resnets.1/conv1/Conv_output_0_0_5.out0_1_20", + "/down_blocks.2/resnets.1/Add.out_12_1_33", + "GroupNorm_16.out8_16.out7_1_16", + "GroupNorm_16_sigmoid_out.8_16.out10_13", + "NhwcConv_20_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21", + "/down_blocks.2/resnets.1/Add_1.out_12_1_34", + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_17", + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_15", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_52", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_53", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_54", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_35", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_16", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_55", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_36", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_17", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_6", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25", + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_5", + "NhwcConv_22_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22", + "/down_blocks.2/attentions.1/Add.out_12_1_37", + "NhwcConv_23_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23", + "/Add_8_output_0_13_4.out_12_1_38", + "/Add_9_output_0_13_3.out_12_1_39", + "GroupNorm_18.out8_18.out7_1_18", + "GroupNorm_18_sigmoid_out.8_18.out10_14", + "/down_blocks.3/resnets.0/conv1/Conv_output_0_0_6.out0_1_24", + "/down_blocks.3/resnets.0/Add.out_12_1_40", + "GroupNorm_19.out8_19.out7_1_19", + "GroupNorm_19_sigmoid_out.8_19.out10_15", + "NhwcConv_24_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25", + "/down_blocks.3/resnets.0/Add_1.out_12_1_41", + "GroupNorm_20.out8_20.out7_1_20", + "GroupNorm_20_sigmoid_out.8_20.out10_16", + "/Add_10_output_0_13_2.out_12_1_42", + "/down_blocks.3/resnets.1/conv1/Conv_output_0_0_7.out0_1_26", + "/down_blocks.3/resnets.1/Add.out_12_1_43", + "GroupNorm_21.out8_21.out7_1_21", + "GroupNorm_21_sigmoid_out.8_21.out10_17", + "NhwcConv_25_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27", + "/down_blocks.3/resnets.1/Add_1.out_12_1_44", + "GroupNorm_22.out8_22.out7_1_22", + "GroupNorm_22_sigmoid_out.8_22.out10_18", + "/Add_11_output_0_13_1.out_12_1_45", + "/mid_block/resnets.0/conv1/Conv_output_0_0_8.out0_1_28", + "/mid_block/resnets.0/Add.out_12_1_46", + "GroupNorm_23.out8_23.out7_1_23", + "GroupNorm_23_sigmoid_out.8_23.out10_19", + "NhwcConv_26_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29", + "/mid_block/resnets.0/Add_1.out_12_1_47", + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out7_1_24", + "/mid_block/attentions.0/Reshape_output_0.out0_0_6", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_18", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_56", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_57", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_58", + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26", + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_48", + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_19", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_59", + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27", + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_49", + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_20", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_7", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29", + "/mid_block/attentions.0/Reshape_1_output_0.out_12_0_6", + "NhwcConv_28_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30", + "/mid_block/attentions.0/Add.out_12_1_50", + "GroupNorm_25.out8_25.out7_1_25", + "GroupNorm_25_sigmoid_out.8_25.out10_20", + "/mid_block/resnets.1/conv1/Conv_output_0_0_9.out0_1_31", + "/mid_block/resnets.1/Add.out_12_1_51", + "GroupNorm_26.out8_26.out7_1_26", + "GroupNorm_26_sigmoid_out.8_26.out10_21", + "NhwcConv_29_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32", + "/mid_block/resnets.1/Add_1.out_12_1_52", + "/Add_12_output_0_13_0.out_12_1_53", + "/up_blocks.0/Concat_output_0_NHWC.out13_1", + "GroupNorm_27.out8_27.out7_1_27", + "NhwcConv_30_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33", + "GroupNorm_27_sigmoid_out.8_27.out10_22", + "/up_blocks.0/resnets.0/conv1/Conv_output_0_0_10.out0_1_34", + "/up_blocks.0/resnets.0/Add.out_12_1_54", + "GroupNorm_28.out8_28.out7_1_28", + "GroupNorm_28_sigmoid_out.8_28.out10_23", + "NhwcConv_31_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35", + "/up_blocks.0/resnets.0/Add_1.out_12_1_55", + "/up_blocks.0/Concat_1_output_0_NHWC.out13_2", + "GroupNorm_29.out8_29.out7_1_29", + "NhwcConv_32_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36", + "GroupNorm_29_sigmoid_out.8_29.out10_24", + "/up_blocks.0/resnets.1/conv1/Conv_output_0_0_11.out0_1_37", + "/up_blocks.0/resnets.1/Add.out_12_1_56", + "GroupNorm_30.out8_30.out7_1_30", + "GroupNorm_30_sigmoid_out.8_30.out10_25", + "NhwcConv_33_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38", + "/up_blocks.0/resnets.1/Add_1.out_12_1_57", + "/up_blocks.0/Concat_2_output_0_NHWC.out13_3", + "GroupNorm_31.out8_31.out7_1_31", + "NhwcConv_34_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39", + "GroupNorm_31_sigmoid_out.8_31.out10_26", + "/up_blocks.0/resnets.2/conv1/Conv_output_0_0_12.out0_1_40", + "/up_blocks.0/resnets.2/Add.out_12_1_58", + "GroupNorm_32.out8_32.out7_1_32", + "GroupNorm_32_sigmoid_out.8_32.out10_27", + "NhwcConv_35_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41", + "/up_blocks.0/resnets.2/Add_1.out_12_1_59", + "/up_blocks.0/upsamplers.0/Resize.out_4_0", + "NhwcConv_36_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42", + "/up_blocks.1/Concat_output_0_NHWC.out13_4", + "GroupNorm_33.out8_33.out7_1_33", + "NhwcConv_37_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43", + "GroupNorm_33_sigmoid_out.8_33.out10_28", + "/up_blocks.1/resnets.0/conv1/Conv_output_0_0_13.out0_1_44", + "/up_blocks.1/resnets.0/Add.out_12_1_60", + "GroupNorm_34.out8_34.out7_1_34", + "GroupNorm_34_sigmoid_out.8_34.out10_29", + "NhwcConv_38_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45", + "/up_blocks.1/resnets.0/Add_1.out_12_1_61", + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_35", + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_21", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_60", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_61", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_62", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_62", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_22", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_63", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_63", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_23", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_8", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33", + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_7", + "NhwcConv_40_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46", + "/up_blocks.1/attentions.0/Add.out_12_1_64", + "/up_blocks.1/Concat_1_output_0_NHWC.out13_5", + "GroupNorm_36.out8_36.out7_1_36", + "NhwcConv_41_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47", + "GroupNorm_36_sigmoid_out.8_36.out10_30", + "/up_blocks.1/resnets.1/conv1/Conv_output_0_0_14.out0_1_48", + "/up_blocks.1/resnets.1/Add.out_12_1_65", + "GroupNorm_37.out8_37.out7_1_37", + "GroupNorm_37_sigmoid_out.8_37.out10_31", + "NhwcConv_42_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49", + "/up_blocks.1/resnets.1/Add_1.out_12_1_66", + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_38", + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_24", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_64", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_65", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_66", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_67", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_25", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_67", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_68", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_26", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_9", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37", + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_8", + "NhwcConv_44_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50", + "/up_blocks.1/attentions.1/Add.out_12_1_69", + "/up_blocks.1/Concat_2_output_0_NHWC.out13_6", + "GroupNorm_39.out8_39.out7_1_39", + "NhwcConv_45_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51", + "GroupNorm_39_sigmoid_out.8_39.out10_32", + "/up_blocks.1/resnets.2/conv1/Conv_output_0_0_15.out0_1_52", + "/up_blocks.1/resnets.2/Add.out_12_1_70", + "GroupNorm_40.out8_40.out7_1_40", + "GroupNorm_40_sigmoid_out.8_40.out10_33", + "NhwcConv_46_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53", + "/up_blocks.1/resnets.2/Add_1.out_12_1_71", + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out7_1_41", + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_27", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_68", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_69", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_70", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_72", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_28", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_71", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_73", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_29", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_10", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41", + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_12_0_9", + "NhwcConv_48_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54", + "/up_blocks.1/attentions.2/Add.out_12_1_74", + "/up_blocks.1/upsamplers.0/Resize.out_4_1", + "NhwcConv_49_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55", + "/up_blocks.2/Concat_output_0_NHWC.out13_7", + "GroupNorm_42.out8_42.out7_1_42", + "NhwcConv_50_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56", + "GroupNorm_42_sigmoid_out.8_42.out10_34", + "/up_blocks.2/resnets.0/conv1/Conv_output_0_0_16.out0_1_57", + "/up_blocks.2/resnets.0/Add.out_12_1_75", + "GroupNorm_43.out8_43.out7_1_43", + "GroupNorm_43_sigmoid_out.8_43.out10_35", + "NhwcConv_51_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58", + "/up_blocks.2/resnets.0/Add_1.out_12_1_76", + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_44", + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_30", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_72", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_73", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_74", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_77", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_31", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_75", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_78", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_32", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_11", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45", + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_10", + "NhwcConv_53_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59", + "/up_blocks.2/attentions.0/Add.out_12_1_79", + "/up_blocks.2/Concat_1_output_0_NHWC.out13_8", + "GroupNorm_45.out8_45.out7_1_45", + "NhwcConv_54_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60", + "GroupNorm_45_sigmoid_out.8_45.out10_36", + "/up_blocks.2/resnets.1/conv1/Conv_output_0_0_17.out0_1_61", + "/up_blocks.2/resnets.1/Add.out_12_1_80", + "GroupNorm_46.out8_46.out7_1_46", + "GroupNorm_46_sigmoid_out.8_46.out10_37", + "NhwcConv_55_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62", + "/up_blocks.2/resnets.1/Add_1.out_12_1_81", + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_47", + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_33", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_76", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_77", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_78", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_82", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_34", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_79", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_83", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_35", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_12", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49", + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_11", + "NhwcConv_57_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63", + "/up_blocks.2/attentions.1/Add.out_12_1_84", + "/up_blocks.2/Concat_2_output_0_NHWC.out13_9", + "GroupNorm_48.out8_48.out7_1_48", + "NhwcConv_58_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64", + "GroupNorm_48_sigmoid_out.8_48.out10_38", + "/up_blocks.2/resnets.2/conv1/Conv_output_0_0_18.out0_1_65", + "/up_blocks.2/resnets.2/Add.out_12_1_85", + "GroupNorm_49.out8_49.out7_1_49", + "GroupNorm_49_sigmoid_out.8_49.out10_39", + "NhwcConv_59_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66", + "/up_blocks.2/resnets.2/Add_1.out_12_1_86", + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out7_1_50", + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_36", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_80", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_81", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_82", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_87", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_37", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_83", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_88", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_38", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_13", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53", + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_12_0_12", + "NhwcConv_61_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67", + "/up_blocks.2/attentions.2/Add.out_12_1_89", + "/up_blocks.2/upsamplers.0/Resize.out_4_2", + "NhwcConv_62_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68", + "/up_blocks.3/Concat_output_0_NHWC.out13_10", + "GroupNorm_51.out8_51.out7_1_51", + "NhwcConv_63_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69", + "GroupNorm_51_sigmoid_out.8_51.out10_40", + "/up_blocks.3/resnets.0/conv1/Conv_output_0_0_19.out0_1_70", + "/up_blocks.3/resnets.0/Add.out_12_1_90", + "GroupNorm_52.out8_52.out7_1_52", + "GroupNorm_52_sigmoid_out.8_52.out10_41", + "NhwcConv_64_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71", + "/up_blocks.3/resnets.0/Add_1.out_12_1_91", + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out7_1_53", + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_39", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_84", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_85", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_86", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_92", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_40", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_87", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_93", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_41", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_14", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57", + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_12_0_13", + "NhwcConv_66_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72", + "/up_blocks.3/attentions.0/Add.out_12_1_94", + "/up_blocks.3/Concat_1_output_0_NHWC.out13_11", + "GroupNorm_54.out8_54.out7_1_54", + "NhwcConv_67_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73", + "GroupNorm_54_sigmoid_out.8_54.out10_42", + "/up_blocks.3/resnets.1/conv1/Conv_output_0_0_20.out0_1_74", + "/up_blocks.3/resnets.1/Add.out_12_1_95", + "GroupNorm_55.out8_55.out7_1_55", + "GroupNorm_55_sigmoid_out.8_55.out10_43", + "NhwcConv_68_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75", + "/up_blocks.3/resnets.1/Add_1.out_12_1_96", + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out7_1_56", + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_42", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_88", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_89", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_90", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_97", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_43", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_91", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_98", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_44", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_15", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61", + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_12_0_14", + "NhwcConv_70_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76", + "/up_blocks.3/attentions.1/Add.out_12_1_99", + "/up_blocks.3/Concat_2_output_0_NHWC.out13_12", + "GroupNorm_57.out8_57.out7_1_57", + "NhwcConv_71_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77", + "GroupNorm_57_sigmoid_out.8_57.out10_44", + "/up_blocks.3/resnets.2/conv1/Conv_output_0_0_21.out0_1_78", + "/up_blocks.3/resnets.2/Add.out_12_1_100", + "GroupNorm_58.out8_58.out7_1_58", + "GroupNorm_58_sigmoid_out.8_58.out10_45", + "NhwcConv_72_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79", + "/up_blocks.3/resnets.2/Add_1.out_12_1_101", + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out7_1_59", + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_45", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_92", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_93", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_94", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_102", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_46", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_95", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_103", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_47", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_16", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65", + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_12_0_15", + "NhwcConv_74_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80", + "/up_blocks.3/attentions.2/Add.out_12_1_104", + "GroupNorm_60.out8_60.out7_1_60", + "GroupNorm_60_sigmoid_out.8_60.out10_46" + ] + }, + "const": { + "buffer_size": 1001425344, + "xrt_arg_id": 3, + "packed_tensors": [ + "onnx::MatMul_5286", + "onnx::MatMul_5287", + "onnx::MatMul_5349", + "onnx::MatMul_5350", + "onnx::MatMul_5412", + "onnx::MatMul_5413", + "onnx::MatMul_5475", + "onnx::MatMul_5476", + "onnx::MatMul_5538", + "onnx::MatMul_5539", + "onnx::MatMul_5601", + "onnx::MatMul_5602", + "onnx::MatMul_5672", + "onnx::MatMul_5673", + "onnx::MatMul_5752", + "onnx::MatMul_5753", + "onnx::MatMul_5815", + "onnx::MatMul_5816", + "onnx::MatMul_5878", + "onnx::MatMul_5879", + "onnx::MatMul_5942", + "onnx::MatMul_5943", + "onnx::MatMul_6005", + "onnx::MatMul_6006", + "onnx::MatMul_6068", + "onnx::MatMul_6069", + "onnx::MatMul_6132", + "onnx::MatMul_6133", + "onnx::MatMul_6195", + "onnx::MatMul_6196", + "onnx::MatMul_6258", + "onnx::MatMul_6259", + "NhwcConv_0_weight_NHWC", + "GroupNorm_0_wts_7_1_0", + "Sigmoid_0.weights10_0", + "down_blocks.0.resnets.0.conv1.weight", + "time_embedding.linear_1.weight_7_0", + "/time_embedding/act/Sigmoid.weights10_1", + "time_embedding.linear_2.weight_7_1", + "/down_blocks.0/resnets.0/act_1/Sigmoid.weights10_2", + "down_blocks.0.resnets.0.time_emb_proj.weight_7_2", + "down_blocks.0.resnets.1.time_emb_proj.weight_7_3", + "down_blocks.1.resnets.0.time_emb_proj.weight_7_4", + "down_blocks.1.resnets.1.time_emb_proj.weight_7_5", + "down_blocks.2.resnets.0.time_emb_proj.weight_7_6", + "down_blocks.2.resnets.1.time_emb_proj.weight_7_7", + "down_blocks.3.resnets.0.time_emb_proj.weight_7_8", + "down_blocks.3.resnets.1.time_emb_proj.weight_7_9", + "mid_block.resnets.0.time_emb_proj.weight_7_10", + "mid_block.resnets.1.time_emb_proj.weight_7_11", + "up_blocks.0.resnets.0.time_emb_proj.weight_7_12", + "up_blocks.0.resnets.1.time_emb_proj.weight_7_13", + "up_blocks.0.resnets.2.time_emb_proj.weight_7_14", + "up_blocks.1.resnets.0.time_emb_proj.weight_7_15", + "up_blocks.1.resnets.1.time_emb_proj.weight_7_16", + "up_blocks.1.resnets.2.time_emb_proj.weight_7_17", + "up_blocks.2.resnets.0.time_emb_proj.weight_7_18", + "up_blocks.2.resnets.1.time_emb_proj.weight_7_19", + "up_blocks.2.resnets.2.time_emb_proj.weight_7_20", + "up_blocks.3.resnets.0.time_emb_proj.weight_7_21", + "up_blocks.3.resnets.1.time_emb_proj.weight_7_22", + "up_blocks.3.resnets.2.time_emb_proj.weight_7_23", + "GroupNorm_1_wts_7_1_1", + "Sigmoid_1.weights10_3", + "NhwcConv_1_weight_NHWC", + "GroupNorm_2_wts_7_1_2", + "NhwcConv_2_weight_NHWC", + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5263", + "onnx::MatMul_5262", + "onnx::MatMul_5264", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_0_mask.8_0", + "onnx::MatMul_5284", + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5285", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_1_mask.8_1", + "onnx::MatMul_5307", + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5308_2_0_0", + "onnx::MatMul_5308_2_0_1", + "onnx::MatMul_5309", + "NhwcConv_3_weight_NHWC", + "GroupNorm_3_wts_7_1_3", + "Sigmoid_2.weights10_4", + "down_blocks.0.resnets.1.conv1.weight", + "GroupNorm_4_wts_7_1_4", + "Sigmoid_3.weights10_5", + "NhwcConv_4_weight_NHWC", + "GroupNorm_5_wts_7_1_5", + "NhwcConv_5_weight_NHWC", + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5326", + "onnx::MatMul_5325", + "onnx::MatMul_5327", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_2_mask.8_2", + "onnx::MatMul_5347", + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5348", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_3_mask.8_3", + "onnx::MatMul_5370", + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5371_2_1_0", + "onnx::MatMul_5371_2_1_1", + "onnx::MatMul_5372", + "NhwcConv_6_weight_NHWC", + "NhwcConv_7_weight_NHWC", + "NhwcConv_8_weight_NHWC", + "GroupNorm_6_wts_7_1_6", + "Sigmoid_4.weights10_6", + "down_blocks.1.resnets.0.conv1.weight", + "GroupNorm_7_wts_7_1_7", + "Sigmoid_5.weights10_7", + "NhwcConv_9_weight_NHWC", + "GroupNorm_8_wts_7_1_8", + "NhwcConv_10_weight_NHWC", + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5389", + "onnx::MatMul_5388", + "onnx::MatMul_5390", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_4_mask.8_4", + "onnx::MatMul_5410", + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5411", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_5_mask.8_5", + "onnx::MatMul_5433", + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5434_2_2_0", + "onnx::MatMul_5434_2_2_1", + "onnx::MatMul_5435", + "NhwcConv_11_weight_NHWC", + "GroupNorm_9_wts_7_1_9", + "Sigmoid_6.weights10_8", + "down_blocks.1.resnets.1.conv1.weight", + "GroupNorm_10_wts_7_1_10", + "Sigmoid_7.weights10_9", + "NhwcConv_12_weight_NHWC", + "GroupNorm_11_wts_7_1_11", + "NhwcConv_13_weight_NHWC", + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5452", + "onnx::MatMul_5451", + "onnx::MatMul_5453", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_6_mask.8_6", + "onnx::MatMul_5473", + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5474", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_7_mask.8_7", + "onnx::MatMul_5496", + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5497_2_3_0", + "onnx::MatMul_5497_2_3_1", + "onnx::MatMul_5498", + "NhwcConv_14_weight_NHWC", + "NhwcConv_15_weight_NHWC", + "NhwcConv_16_weight_NHWC", + "GroupNorm_12_wts_7_1_12", + "Sigmoid_8.weights10_10", + "down_blocks.2.resnets.0.conv1.weight", + "GroupNorm_13_wts_7_1_13", + "Sigmoid_9.weights10_11", + "NhwcConv_17_weight_NHWC", + "GroupNorm_14_wts_7_1_14", + "NhwcConv_18_weight_NHWC", + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5515", + "onnx::MatMul_5514", + "onnx::MatMul_5516", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_8_mask.8_8", + "onnx::MatMul_5536", + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5537", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_9_mask.8_9", + "onnx::MatMul_5559", + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5560_2_4_0", + "onnx::MatMul_5560_2_4_1", + "onnx::MatMul_5561", + "NhwcConv_19_weight_NHWC", + "GroupNorm_15_wts_7_1_15", + "Sigmoid_10.weights10_12", + "down_blocks.2.resnets.1.conv1.weight", + "GroupNorm_16_wts_7_1_16", + "Sigmoid_11.weights10_13", + "NhwcConv_20_weight_NHWC", + "GroupNorm_17_wts_7_1_17", + "NhwcConv_21_weight_NHWC", + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5578", + "onnx::MatMul_5577", + "onnx::MatMul_5579", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_10_mask.8_10", + "onnx::MatMul_5599", + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5600", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_11_mask.8_11", + "onnx::MatMul_5622", + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5623_2_5_0", + "onnx::MatMul_5623_2_5_1", + "onnx::MatMul_5624", + "NhwcConv_22_weight_NHWC", + "NhwcConv_23_weight_NHWC", + "GroupNorm_18_wts_7_1_18", + "Sigmoid_12.weights10_14", + "down_blocks.3.resnets.0.conv1.weight", + "GroupNorm_19_wts_7_1_19", + "Sigmoid_13.weights10_15", + "NhwcConv_24_weight_NHWC", + "GroupNorm_20_wts_7_1_20", + "Sigmoid_14.weights10_16", + "down_blocks.3.resnets.1.conv1.weight", + "GroupNorm_21_wts_7_1_21", + "Sigmoid_15.weights10_17", + "NhwcConv_25_weight_NHWC", + "GroupNorm_22_wts_7_1_22", + "Sigmoid_16.weights10_18", + "mid_block.resnets.0.conv1.weight", + "GroupNorm_23_wts_7_1_23", + "Sigmoid_17.weights10_19", + "NhwcConv_26_weight_NHWC", + "GroupNorm_24_wts_7_1_24", + "NhwcConv_27_weight_NHWC", + "mid_block.attentions.0.transformer_blocks.0.norm1.weight", + "mid_block.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5649", + "onnx::MatMul_5648", + "onnx::MatMul_5650", + "/mid_block/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_12_mask.8_12", + "onnx::MatMul_5670", + "mid_block.attentions.0.transformer_blocks.0.norm2.weight", + "mid_block.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5671", + "/mid_block/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_13_mask.8_13", + "onnx::MatMul_5693", + "mid_block.attentions.0.transformer_blocks.0.norm3.weight", + "mid_block.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5694_2_6_0", + "onnx::MatMul_5694_2_6_1", + "onnx::MatMul_5695", + "NhwcConv_28_weight_NHWC", + "GroupNorm_25_wts_7_1_25", + "Sigmoid_18.weights10_20", + "mid_block.resnets.1.conv1.weight", + "GroupNorm_26_wts_7_1_26", + "Sigmoid_19.weights10_21", + "NhwcConv_29_weight_NHWC", + "GroupNorm_27_wts_7_1_27", + "NhwcConv_30_weight_NHWC", + "Sigmoid_20.weights10_22", + "up_blocks.0.resnets.0.conv1.weight", + "GroupNorm_28_wts_7_1_28", + "Sigmoid_21.weights10_23", + "NhwcConv_31_weight_NHWC", + "GroupNorm_29_wts_7_1_29", + "NhwcConv_32_weight_NHWC", + "Sigmoid_22.weights10_24", + "up_blocks.0.resnets.1.conv1.weight", + "GroupNorm_30_wts_7_1_30", + "Sigmoid_23.weights10_25", + "NhwcConv_33_weight_NHWC", + "GroupNorm_31_wts_7_1_31", + "NhwcConv_34_weight_NHWC", + "Sigmoid_24.weights10_26", + "up_blocks.0.resnets.2.conv1.weight", + "GroupNorm_32_wts_7_1_32", + "Sigmoid_25.weights10_27", + "NhwcConv_35_weight_NHWC", + "/up_blocks.0/upsamplers.0/Resize.weights4_0", + "NhwcConv_36_weight_NHWC", + "GroupNorm_33_wts_7_1_33", + "NhwcConv_37_weight_NHWC", + "Sigmoid_26.weights10_28", + "up_blocks.1.resnets.0.conv1.weight", + "GroupNorm_34_wts_7_1_34", + "Sigmoid_27.weights10_29", + "NhwcConv_38_weight_NHWC", + "GroupNorm_35_wts_7_1_35", + "NhwcConv_39_weight_NHWC", + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5729", + "onnx::MatMul_5728", + "onnx::MatMul_5730", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_14_mask.8_14", + "onnx::MatMul_5750", + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5751", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_15_mask.8_15", + "onnx::MatMul_5773", + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5774_2_7_0", + "onnx::MatMul_5774_2_7_1", + "onnx::MatMul_5775", + "NhwcConv_40_weight_NHWC", + "GroupNorm_36_wts_7_1_36", + "NhwcConv_41_weight_NHWC", + "Sigmoid_28.weights10_30", + "up_blocks.1.resnets.1.conv1.weight", + "GroupNorm_37_wts_7_1_37", + "Sigmoid_29.weights10_31", + "NhwcConv_42_weight_NHWC", + "GroupNorm_38_wts_7_1_38", + "NhwcConv_43_weight_NHWC", + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5792", + "onnx::MatMul_5791", + "onnx::MatMul_5793", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_16_mask.8_16", + "onnx::MatMul_5813", + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5814", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_17_mask.8_17", + "onnx::MatMul_5836", + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5837_2_8_0", + "onnx::MatMul_5837_2_8_1", + "onnx::MatMul_5838", + "NhwcConv_44_weight_NHWC", + "GroupNorm_39_wts_7_1_39", + "NhwcConv_45_weight_NHWC", + "Sigmoid_30.weights10_32", + "up_blocks.1.resnets.2.conv1.weight", + "GroupNorm_40_wts_7_1_40", + "Sigmoid_31.weights10_33", + "NhwcConv_46_weight_NHWC", + "GroupNorm_41_wts_7_1_41", + "NhwcConv_47_weight_NHWC", + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5855", + "onnx::MatMul_5854", + "onnx::MatMul_5856", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_18_mask.8_18", + "onnx::MatMul_5876", + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5877", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_19_mask.8_19", + "onnx::MatMul_5899", + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5900_2_9_0", + "onnx::MatMul_5900_2_9_1", + "onnx::MatMul_5901", + "NhwcConv_48_weight_NHWC", + "/up_blocks.1/upsamplers.0/Resize.weights4_1", + "NhwcConv_49_weight_NHWC", + "GroupNorm_42_wts_7_1_42", + "NhwcConv_50_weight_NHWC", + "Sigmoid_32.weights10_34", + "up_blocks.2.resnets.0.conv1.weight", + "GroupNorm_43_wts_7_1_43", + "Sigmoid_33.weights10_35", + "NhwcConv_51_weight_NHWC", + "GroupNorm_44_wts_7_1_44", + "NhwcConv_52_weight_NHWC", + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5919", + "onnx::MatMul_5918", + "onnx::MatMul_5920", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_20_mask.8_20", + "onnx::MatMul_5940", + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5941", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_21_mask.8_21", + "onnx::MatMul_5963", + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5964_2_10_0", + "onnx::MatMul_5964_2_10_1", + "onnx::MatMul_5965", + "NhwcConv_53_weight_NHWC", + "GroupNorm_45_wts_7_1_45", + "NhwcConv_54_weight_NHWC", + "Sigmoid_34.weights10_36", + "up_blocks.2.resnets.1.conv1.weight", + "GroupNorm_46_wts_7_1_46", + "Sigmoid_35.weights10_37", + "NhwcConv_55_weight_NHWC", + "GroupNorm_47_wts_7_1_47", + "NhwcConv_56_weight_NHWC", + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias", + "onnx::MatMul_5982", + "onnx::MatMul_5981", + "onnx::MatMul_5983", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_22_mask.8_22", + "onnx::MatMul_6003", + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6004", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_23_mask.8_23", + "onnx::MatMul_6026", + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6027_2_11_0", + "onnx::MatMul_6027_2_11_1", + "onnx::MatMul_6028", + "NhwcConv_57_weight_NHWC", + "GroupNorm_48_wts_7_1_48", + "NhwcConv_58_weight_NHWC", + "Sigmoid_36.weights10_38", + "up_blocks.2.resnets.2.conv1.weight", + "GroupNorm_49_wts_7_1_49", + "Sigmoid_37.weights10_39", + "NhwcConv_59_weight_NHWC", + "GroupNorm_50_wts_7_1_50", + "NhwcConv_60_weight_NHWC", + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias", + "onnx::MatMul_6045", + "onnx::MatMul_6044", + "onnx::MatMul_6046", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_24_mask.8_24", + "onnx::MatMul_6066", + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6067", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_25_mask.8_25", + "onnx::MatMul_6089", + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6090_2_12_0", + "onnx::MatMul_6090_2_12_1", + "onnx::MatMul_6091", + "NhwcConv_61_weight_NHWC", + "/up_blocks.2/upsamplers.0/Resize.weights4_2", + "NhwcConv_62_weight_NHWC", + "GroupNorm_51_wts_7_1_51", + "NhwcConv_63_weight_NHWC", + "Sigmoid_38.weights10_40", + "up_blocks.3.resnets.0.conv1.weight", + "GroupNorm_52_wts_7_1_52", + "Sigmoid_39.weights10_41", + "NhwcConv_64_weight_NHWC", + "GroupNorm_53_wts_7_1_53", + "NhwcConv_65_weight_NHWC", + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias", + "onnx::MatMul_6109", + "onnx::MatMul_6108", + "onnx::MatMul_6110", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_26_mask.8_26", + "onnx::MatMul_6130", + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6131", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_27_mask.8_27", + "onnx::MatMul_6153", + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6154_2_13_0", + "onnx::MatMul_6154_2_13_1", + "onnx::MatMul_6155", + "NhwcConv_66_weight_NHWC", + "GroupNorm_54_wts_7_1_54", + "NhwcConv_67_weight_NHWC", + "Sigmoid_40.weights10_42", + "up_blocks.3.resnets.1.conv1.weight", + "GroupNorm_55_wts_7_1_55", + "Sigmoid_41.weights10_43", + "NhwcConv_68_weight_NHWC", + "GroupNorm_56_wts_7_1_56", + "NhwcConv_69_weight_NHWC", + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias", + "onnx::MatMul_6172", + "onnx::MatMul_6171", + "onnx::MatMul_6173", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_28_mask.8_28", + "onnx::MatMul_6193", + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6194", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_29_mask.8_29", + "onnx::MatMul_6216", + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6217_2_14_0", + "onnx::MatMul_6217_2_14_1", + "onnx::MatMul_6218", + "NhwcConv_70_weight_NHWC", + "GroupNorm_57_wts_7_1_57", + "NhwcConv_71_weight_NHWC", + "Sigmoid_42.weights10_44", + "up_blocks.3.resnets.2.conv1.weight", + "GroupNorm_58_wts_7_1_58", + "Sigmoid_43.weights10_45", + "NhwcConv_72_weight_NHWC", + "GroupNorm_59_wts_7_1_59", + "NhwcConv_73_weight_NHWC", + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias", + "onnx::MatMul_6235", + "onnx::MatMul_6234", + "onnx::MatMul_6236", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_30_mask.8_30", + "onnx::MatMul_6256", + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6257", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_31_mask.8_31", + "onnx::MatMul_6279", + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6280_2_15_0", + "onnx::MatMul_6280_2_15_1", + "onnx::MatMul_6281", + "NhwcConv_74_weight_NHWC", + "GroupNorm_60_wts_7_1_60", + "Sigmoid_44.weights10_46", + "NhwcConv_75_weight_NHWC" + ] + }, + "super_instr": { + "buffer_size": 0, + "xrt_arg_id": 4, + "packed_tensors": [] + } + }, + "tensor_map": { + "encoder_hidden_states.out2_6_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 768 + ], + "size_in_bytes": 236544, + "offset": 7332864 + }, + "Transpose_0_out-sample.out0_1_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 4 + ], + "size_in_bytes": 65536, + "offset": 7569408 + }, + "class_labels_13_12_trans.out_12_1_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 7634944 + }, + "/time_proj/Concat_1_output_0.out2_3_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 320 + ], + "size_in_bytes": 1280, + "offset": 12877824 + }, + "timestep_cond_13_11_trans.out_12_1_6": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 12879104 + }, + "attention_mask_13_10_trans.out_12_1_12": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 18121984 + }, + "cross_attention_kwargs_13_9_trans.out_12_1_13": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 1310720, + "offset": 23364864 + }, + "added_cond_kwargs_13_8_trans.out_12_1_19": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 24675584 + }, + "down_block_additional_residuals_13_7_trans.out_12_1_25": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 27297024 + }, + "mid_block_additional_residual_13_6_trans.out_12_1_26": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 655360, + "offset": 29918464 + }, + "onnx::Add_10_13_5_trans.out_12_1_32": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 30573824 + }, + "onnx::Add_11_13_4_trans.out_12_1_38": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 31884544 + }, + "onnx::Add_12_13_3_trans.out_12_1_39": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 33195264 + }, + "onnx::Add_13_13_2_trans.out_12_1_42": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 33522944 + }, + "onnx::Add_14_13_1_trans.out_12_1_45": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 33850624 + }, + "onnx::Add_15_13_0_trans.out_12_1_53": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 34178304 + }, + "NhwcConv_75_out-noise_pred.out0_1_81": { + "packed_buffer_label": "out", + "xrt_arg_id": 1, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 4 + ], + "size_in_bytes": 65536, + "offset": 0 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 0 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 98560 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 197120 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 295680 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 394240 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 591360 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 788480 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 985600 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 1182720 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 1576960 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 1971200 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 2365440 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 2759680 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 3153920 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 3548160 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 3942400 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 4336640 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 4730880 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 5125120 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 1280 + ], + "size_in_bytes": 394240, + "offset": 5519360 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 5913600 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 6110720 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 6307840 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 6504960 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 6702080 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 640 + ], + "size_in_bytes": 197120, + "offset": 6899200 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 7096320 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 7194880 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 7293440 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 7392000 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 7490560 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 320 + ], + "size_in_bytes": 98560, + "offset": 7589120 + }, + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 7687680 + }, + "/Add_output_0_13_12.out_12_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 12930560 + }, + "GroupNorm_0.out8_0.out7_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 18173440 + }, + "GroupNorm_0_sigmoid_out.8_0.out10_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 23416320 + }, + "/down_blocks.0/resnets.0/conv1/Conv_output_0_0_0.out0_1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 28659200 + }, + "/time_embedding/linear_1/Gemm_output_0.out2_3_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33902080 + }, + "/time_embedding/act/Sigmoid_output_0.out10_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33907200 + }, + "/time_embedding/linear_2/Gemm_output_0.out2_3_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33912320 + }, + "/down_blocks.0/resnets.0/act_1/Sigmoid_output_0.out10_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33917440 + }, + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0_0_0.out2_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "offset": 33922560 + }, + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0_0_1.out2_0_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "offset": 33923840 + }, + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0_0_2.out2_0_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "offset": 33925120 + }, + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0_0_3.out2_0_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "offset": 33927680 + }, + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0_0_4.out2_0_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33930240 + }, + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0_0_5.out2_0_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33935360 + }, + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0_0_6.out2_0_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33940480 + }, + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0_0_7.out2_0_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33945600 + }, + "/mid_block/resnets.0/Unsqueeze_1_output_0_0_8.out2_0_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33950720 + }, + "/mid_block/resnets.1/Unsqueeze_1_output_0_0_9.out2_0_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33955840 + }, + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0_0_10.out2_0_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33960960 + }, + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0_0_11.out2_0_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33966080 + }, + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0_0_12.out2_0_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33971200 + }, + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0_0_13.out2_0_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33976320 + }, + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0_0_14.out2_0_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33981440 + }, + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0_0_15.out2_0_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "offset": 33986560 + }, + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0_0_16.out2_0_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "offset": 33991680 + }, + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0_0_17.out2_0_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "offset": 33994240 + }, + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0_0_18.out2_0_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "offset": 33996800 + }, + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0_0_19.out2_0_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "offset": 33999360 + }, + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0_0_20.out2_0_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "offset": 34000640 + }, + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0_0_21.out2_0_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "offset": 34001920 + }, + "/down_blocks.0/resnets.0/Add.out_12_1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 34003200 + }, + "GroupNorm_1.out8_1.out7_1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 39246080 + }, + "GroupNorm_1_sigmoid_out.8_1.out10_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 44488960 + }, + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 49731840 + }, + "/down_blocks.0/resnets.0/Add_1.out_12_1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 54974720 + }, + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out7_1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 60217600 + }, + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 65460480 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 70703360 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 75946240 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 81189120 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 86432000 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 91674880 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 96917760 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 102160640 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 107403520 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 112646400 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 117889280 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 123132160 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 128375040 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 133617920 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 138860800 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 159832320 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 180803840 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 201775360 + }, + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_12_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 207018240 + }, + "NhwcConv_3_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 212261120 + }, + "/down_blocks.0/attentions.0/Add.out_12_1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 217504000 + }, + "GroupNorm_3.out8_3.out7_1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 222746880 + }, + "GroupNorm_3_sigmoid_out.8_3.out10_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 227989760 + }, + "/Add_1_output_0_13_11.out_12_1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 233232640 + }, + "/down_blocks.0/resnets.1/conv1/Conv_output_0_0_1.out0_1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 238475520 + }, + "/down_blocks.0/resnets.1/Add.out_12_1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 243718400 + }, + "GroupNorm_4.out8_4.out7_1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 248961280 + }, + "GroupNorm_4_sigmoid_out.8_4.out10_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 254204160 + }, + "NhwcConv_4_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 259447040 + }, + "/down_blocks.0/resnets.1/Add_1.out_12_1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 264689920 + }, + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out7_1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 269932800 + }, + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 275175680 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 280418560 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 285661440 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 290904320 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 296147200 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 301390080 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 306632960 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 311875840 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 317118720 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 322361600 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 327604480 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 332847360 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 338090240 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 343333120 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 348576000 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 369547520 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 390519040 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 411490560 + }, + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_12_0_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 416733440 + }, + "NhwcConv_6_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 421976320 + }, + "/down_blocks.0/attentions.1/Add.out_12_1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 427219200 + }, + "NhwcConv_7_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 1310720, + "offset": 432462080 + }, + "NhwcConv_8_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 433772800 + }, + "/Add_2_output_0_13_10.out_12_1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 436394240 + }, + "/Add_3_output_0_13_9.out_12_1_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 1310720, + "offset": 441637120 + }, + "GroupNorm_6.out8_6.out7_1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 1310720, + "offset": 442947840 + }, + "GroupNorm_6_sigmoid_out.8_6.out10_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 1310720, + "offset": 444258560 + }, + "/down_blocks.1/resnets.0/conv1/Conv_output_0_0_2.out0_1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 445569280 + }, + "/down_blocks.1/resnets.0/Add.out_12_1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 448190720 + }, + "GroupNorm_7.out8_7.out7_1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 450812160 + }, + "GroupNorm_7_sigmoid_out.8_7.out10_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 453433600 + }, + "NhwcConv_9_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 456055040 + }, + "/down_blocks.1/resnets.0/Add_1.out_12_1_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 458676480 + }, + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 461297920 + }, + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 463919360 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 466540800 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 469162240 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 471783680 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 474405120 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 477026560 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 479648000 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 482269440 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 484890880 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 487512320 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 490133760 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 492755200 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 495376640 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 497998080 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 500619520 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 511105280 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 521591040 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 532076800 + }, + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 534698240 + }, + "NhwcConv_11_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 537319680 + }, + "/down_blocks.1/attentions.0/Add.out_12_1_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 539941120 + }, + "GroupNorm_9.out8_9.out7_1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 542562560 + }, + "GroupNorm_9_sigmoid_out.8_9.out10_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 545184000 + }, + "/Add_4_output_0_13_8.out_12_1_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 547805440 + }, + "/down_blocks.1/resnets.1/conv1/Conv_output_0_0_3.out0_1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 550426880 + }, + "/down_blocks.1/resnets.1/Add.out_12_1_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 553048320 + }, + "GroupNorm_10.out8_10.out7_1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 555669760 + }, + "GroupNorm_10_sigmoid_out.8_10.out10_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 558291200 + }, + "NhwcConv_12_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 560912640 + }, + "/down_blocks.1/resnets.1/Add_1.out_12_1_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 563534080 + }, + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 566155520 + }, + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 568776960 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 571398400 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 574019840 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 576641280 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 579262720 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 581884160 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 584505600 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 587127040 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 589748480 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 592369920 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 594991360 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 597612800 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 600234240 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 602855680 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 605477120 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 615962880 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 626448640 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 636934400 + }, + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 639555840 + }, + "NhwcConv_14_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 642177280 + }, + "/down_blocks.1/attentions.1/Add.out_12_1_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 644798720 + }, + "NhwcConv_15_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 655360, + "offset": 647420160 + }, + "NhwcConv_16_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 648075520 + }, + "/Add_5_output_0_13_7.out_12_1_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 649386240 + }, + "/Add_6_output_0_13_6.out_12_1_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 655360, + "offset": 652007680 + }, + "GroupNorm_12.out8_12.out7_1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 655360, + "offset": 652663040 + }, + "GroupNorm_12_sigmoid_out.8_12.out10_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 655360, + "offset": 653318400 + }, + "/down_blocks.2/resnets.0/conv1/Conv_output_0_0_4.out0_1_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 653973760 + }, + "/down_blocks.2/resnets.0/Add.out_12_1_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 655284480 + }, + "GroupNorm_13.out8_13.out7_1_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 656595200 + }, + "GroupNorm_13_sigmoid_out.8_13.out10_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 657905920 + }, + "NhwcConv_17_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 659216640 + }, + "/down_blocks.2/resnets.0/Add_1.out_12_1_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 660527360 + }, + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 661838080 + }, + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 663148800 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 664459520 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 665770240 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 667080960 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 668391680 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 669702400 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 671013120 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 672323840 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 673634560 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 674945280 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 676256000 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 677566720 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 678877440 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 680188160 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 681498880 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 686741760 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 691984640 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 697227520 + }, + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 698538240 + }, + "NhwcConv_19_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 699848960 + }, + "/down_blocks.2/attentions.0/Add.out_12_1_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 701159680 + }, + "GroupNorm_15.out8_15.out7_1_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 702470400 + }, + "GroupNorm_15_sigmoid_out.8_15.out10_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 703781120 + }, + "/Add_7_output_0_13_5.out_12_1_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 705091840 + }, + "/down_blocks.2/resnets.1/conv1/Conv_output_0_0_5.out0_1_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 706402560 + }, + "/down_blocks.2/resnets.1/Add.out_12_1_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 707713280 + }, + "GroupNorm_16.out8_16.out7_1_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 709024000 + }, + "GroupNorm_16_sigmoid_out.8_16.out10_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 710334720 + }, + "NhwcConv_20_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 711645440 + }, + "/down_blocks.2/resnets.1/Add_1.out_12_1_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 712956160 + }, + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 714266880 + }, + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 715577600 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 716888320 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 718199040 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 719509760 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 720820480 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 722131200 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 723441920 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 724752640 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 726063360 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 727374080 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 728684800 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 729995520 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 731306240 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 732616960 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 733927680 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 739170560 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 744413440 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 749656320 + }, + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 750967040 + }, + "NhwcConv_22_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 752277760 + }, + "/down_blocks.2/attentions.1/Add.out_12_1_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 753588480 + }, + "NhwcConv_23_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 754899200 + }, + "/Add_8_output_0_13_4.out_12_1_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 755226880 + }, + "/Add_9_output_0_13_3.out_12_1_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 756537600 + }, + "GroupNorm_18.out8_18.out7_1_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 756865280 + }, + "GroupNorm_18_sigmoid_out.8_18.out10_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 757192960 + }, + "/down_blocks.3/resnets.0/conv1/Conv_output_0_0_6.out0_1_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 757520640 + }, + "/down_blocks.3/resnets.0/Add.out_12_1_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 757848320 + }, + "GroupNorm_19.out8_19.out7_1_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 758176000 + }, + "GroupNorm_19_sigmoid_out.8_19.out10_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 758503680 + }, + "NhwcConv_24_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 758831360 + }, + "/down_blocks.3/resnets.0/Add_1.out_12_1_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 759159040 + }, + "GroupNorm_20.out8_20.out7_1_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 759486720 + }, + "GroupNorm_20_sigmoid_out.8_20.out10_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 759814400 + }, + "/Add_10_output_0_13_2.out_12_1_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 760142080 + }, + "/down_blocks.3/resnets.1/conv1/Conv_output_0_0_7.out0_1_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 760469760 + }, + "/down_blocks.3/resnets.1/Add.out_12_1_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 760797440 + }, + "GroupNorm_21.out8_21.out7_1_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 761125120 + }, + "GroupNorm_21_sigmoid_out.8_21.out10_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 761452800 + }, + "NhwcConv_25_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 761780480 + }, + "/down_blocks.3/resnets.1/Add_1.out_12_1_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 762108160 + }, + "GroupNorm_22.out8_22.out7_1_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 762435840 + }, + "GroupNorm_22_sigmoid_out.8_22.out10_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 762763520 + }, + "/Add_11_output_0_13_1.out_12_1_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 763091200 + }, + "/mid_block/resnets.0/conv1/Conv_output_0_0_8.out0_1_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 763418880 + }, + "/mid_block/resnets.0/Add.out_12_1_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 763746560 + }, + "GroupNorm_23.out8_23.out7_1_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 764074240 + }, + "GroupNorm_23_sigmoid_out.8_23.out10_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 764401920 + }, + "NhwcConv_26_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 764729600 + }, + "/mid_block/resnets.0/Add_1.out_12_1_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 765057280 + }, + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out7_1_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 765384960 + }, + "/mid_block/attentions.0/Reshape_output_0.out0_0_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 765712640 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 766040320 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 766368000 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 766695680 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 767023360 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 767351040 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 767678720 + }, + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 768006400 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 768334080 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 768661760 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 768989440 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 769317120 + }, + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 769644800 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 769972480 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 5120 + ], + "size_in_bytes": 1310720, + "offset": 770300160 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 5120 + ], + "size_in_bytes": 1310720, + "offset": 771610880 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 5120 + ], + "size_in_bytes": 1310720, + "offset": 772921600 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "offset": 774232320 + }, + "/mid_block/attentions.0/Reshape_1_output_0.out_12_0_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 774560000 + }, + "NhwcConv_28_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 774887680 + }, + "/mid_block/attentions.0/Add.out_12_1_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 775215360 + }, + "GroupNorm_25.out8_25.out7_1_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 775543040 + }, + "GroupNorm_25_sigmoid_out.8_25.out10_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 775870720 + }, + "/mid_block/resnets.1/conv1/Conv_output_0_0_9.out0_1_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 776198400 + }, + "/mid_block/resnets.1/Add.out_12_1_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 776526080 + }, + "GroupNorm_26.out8_26.out7_1_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 776853760 + }, + "GroupNorm_26_sigmoid_out.8_26.out10_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 777181440 + }, + "NhwcConv_29_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 777509120 + }, + "/mid_block/resnets.1/Add_1.out_12_1_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 777836800 + }, + "/Add_12_output_0_13_0.out_12_1_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 778164480 + }, + "/up_blocks.0/Concat_output_0_NHWC.out13_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 778492160 + }, + "GroupNorm_27.out8_27.out7_1_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 779147520 + }, + "NhwcConv_30_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 779802880 + }, + "GroupNorm_27_sigmoid_out.8_27.out10_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 780130560 + }, + "/up_blocks.0/resnets.0/conv1/Conv_output_0_0_10.out0_1_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 780785920 + }, + "/up_blocks.0/resnets.0/Add.out_12_1_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 781113600 + }, + "GroupNorm_28.out8_28.out7_1_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 781441280 + }, + "GroupNorm_28_sigmoid_out.8_28.out10_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 781768960 + }, + "NhwcConv_31_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 782096640 + }, + "/up_blocks.0/resnets.0/Add_1.out_12_1_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 782424320 + }, + "/up_blocks.0/Concat_1_output_0_NHWC.out13_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 782752000 + }, + "GroupNorm_29.out8_29.out7_1_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 783407360 + }, + "NhwcConv_32_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 784062720 + }, + "GroupNorm_29_sigmoid_out.8_29.out10_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 784390400 + }, + "/up_blocks.0/resnets.1/conv1/Conv_output_0_0_11.out0_1_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 785045760 + }, + "/up_blocks.0/resnets.1/Add.out_12_1_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 785373440 + }, + "GroupNorm_30.out8_30.out7_1_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 785701120 + }, + "GroupNorm_30_sigmoid_out.8_30.out10_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 786028800 + }, + "NhwcConv_33_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 786356480 + }, + "/up_blocks.0/resnets.1/Add_1.out_12_1_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 786684160 + }, + "/up_blocks.0/Concat_2_output_0_NHWC.out13_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 787011840 + }, + "GroupNorm_31.out8_31.out7_1_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 787667200 + }, + "NhwcConv_34_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 788322560 + }, + "GroupNorm_31_sigmoid_out.8_31.out10_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 655360, + "offset": 788650240 + }, + "/up_blocks.0/resnets.2/conv1/Conv_output_0_0_12.out0_1_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 789305600 + }, + "/up_blocks.0/resnets.2/Add.out_12_1_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 789633280 + }, + "GroupNorm_32.out8_32.out7_1_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 789960960 + }, + "GroupNorm_32_sigmoid_out.8_32.out10_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 790288640 + }, + "NhwcConv_35_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 790616320 + }, + "/up_blocks.0/resnets.2/Add_1.out_12_1_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 327680, + "offset": 790944000 + }, + "/up_blocks.0/upsamplers.0/Resize.out_4_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 791271680 + }, + "NhwcConv_36_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 792582400 + }, + "/up_blocks.1/Concat_output_0_NHWC.out13_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 2621440, + "offset": 793893120 + }, + "GroupNorm_33.out8_33.out7_1_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 2621440, + "offset": 796514560 + }, + "NhwcConv_37_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 799136000 + }, + "GroupNorm_33_sigmoid_out.8_33.out10_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 2621440, + "offset": 800446720 + }, + "/up_blocks.1/resnets.0/conv1/Conv_output_0_0_13.out0_1_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 803068160 + }, + "/up_blocks.1/resnets.0/Add.out_12_1_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 804378880 + }, + "GroupNorm_34.out8_34.out7_1_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 805689600 + }, + "GroupNorm_34_sigmoid_out.8_34.out10_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 807000320 + }, + "NhwcConv_38_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 808311040 + }, + "/up_blocks.1/resnets.0/Add_1.out_12_1_61": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 809621760 + }, + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out7_1_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 810932480 + }, + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 812243200 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 813553920 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 814864640 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_61": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 816175360 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_62": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 817486080 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 818796800 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 820107520 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_62": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 821418240 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 822728960 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_63": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 824039680 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 825350400 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 826661120 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_63": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 827971840 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 829282560 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 830593280 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 835836160 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 841079040 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 846321920 + }, + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_12_0_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 847632640 + }, + "NhwcConv_40_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 848943360 + }, + "/up_blocks.1/attentions.0/Add.out_12_1_64": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 850254080 + }, + "/up_blocks.1/Concat_1_output_0_NHWC.out13_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 2621440, + "offset": 851564800 + }, + "GroupNorm_36.out8_36.out7_1_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 2621440, + "offset": 854186240 + }, + "NhwcConv_41_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 856807680 + }, + "GroupNorm_36_sigmoid_out.8_36.out10_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 2621440, + "offset": 858118400 + }, + "/up_blocks.1/resnets.1/conv1/Conv_output_0_0_14.out0_1_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 860739840 + }, + "/up_blocks.1/resnets.1/Add.out_12_1_65": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 862050560 + }, + "GroupNorm_37.out8_37.out7_1_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 863361280 + }, + "GroupNorm_37_sigmoid_out.8_37.out10_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 864672000 + }, + "NhwcConv_42_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 865982720 + }, + "/up_blocks.1/resnets.1/Add_1.out_12_1_66": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 867293440 + }, + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out7_1_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 868604160 + }, + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 869914880 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 871225600 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_64": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 872536320 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_65": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 873847040 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_66": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 875157760 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 876468480 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 877779200 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_67": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 879089920 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 880400640 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_67": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 881711360 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 883022080 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 884332800 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_68": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 885643520 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 886954240 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 888264960 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 893507840 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 898750720 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 903993600 + }, + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_12_0_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 905304320 + }, + "NhwcConv_44_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 906615040 + }, + "/up_blocks.1/attentions.1/Add.out_12_1_69": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 907925760 + }, + "/up_blocks.1/Concat_2_output_0_NHWC.out13_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1920 + ], + "size_in_bytes": 1966080, + "offset": 909236480 + }, + "GroupNorm_39.out8_39.out7_1_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1920 + ], + "size_in_bytes": 1966080, + "offset": 911202560 + }, + "NhwcConv_45_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 913168640 + }, + "GroupNorm_39_sigmoid_out.8_39.out10_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1920 + ], + "size_in_bytes": 1966080, + "offset": 914479360 + }, + "/up_blocks.1/resnets.2/conv1/Conv_output_0_0_15.out0_1_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 916445440 + }, + "/up_blocks.1/resnets.2/Add.out_12_1_70": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 917756160 + }, + "GroupNorm_40.out8_40.out7_1_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 919066880 + }, + "GroupNorm_40_sigmoid_out.8_40.out10_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 920377600 + }, + "NhwcConv_46_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 921688320 + }, + "/up_blocks.1/resnets.2/Add_1.out_12_1_71": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 922999040 + }, + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out7_1_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 924309760 + }, + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 925620480 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 926931200 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_68": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 928241920 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_69": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 929552640 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_70": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 930863360 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 932174080 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 933484800 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_72": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 934795520 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 936106240 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_71": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 937416960 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 938727680 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 940038400 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_73": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 941349120 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 942659840 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 943970560 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 949213440 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 5242880, + "offset": 954456320 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 959699200 + }, + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_12_0_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 961009920 + }, + "NhwcConv_48_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 962320640 + }, + "/up_blocks.1/attentions.2/Add.out_12_1_74": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 1310720, + "offset": 963631360 + }, + "/up_blocks.1/upsamplers.0/Resize.out_4_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 5242880, + "offset": 964942080 + }, + "NhwcConv_49_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 5242880, + "offset": 970184960 + }, + "/up_blocks.2/Concat_output_0_NHWC.out13_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1920 + ], + "size_in_bytes": 7864320, + "offset": 975427840 + }, + "GroupNorm_42.out8_42.out7_1_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1920 + ], + "size_in_bytes": 7864320, + "offset": 983292160 + }, + "NhwcConv_50_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 991156480 + }, + "GroupNorm_42_sigmoid_out.8_42.out10_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1920 + ], + "size_in_bytes": 7864320, + "offset": 993777920 + }, + "/up_blocks.2/resnets.0/conv1/Conv_output_0_0_16.out0_1_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1001642240 + }, + "/up_blocks.2/resnets.0/Add.out_12_1_75": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1004263680 + }, + "GroupNorm_43.out8_43.out7_1_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1006885120 + }, + "GroupNorm_43_sigmoid_out.8_43.out10_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1009506560 + }, + "NhwcConv_51_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1012128000 + }, + "/up_blocks.2/resnets.0/Add_1.out_12_1_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1014749440 + }, + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out7_1_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1017370880 + }, + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1019992320 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1022613760 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_72": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1025235200 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_73": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1027856640 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_74": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1030478080 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1033099520 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1035720960 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_77": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1038342400 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1040963840 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_75": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1043585280 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1046206720 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1048828160 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_78": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1051449600 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1054071040 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1056692480 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1067178240 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1077664000 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1088149760 + }, + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_12_0_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1090771200 + }, + "NhwcConv_53_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1093392640 + }, + "/up_blocks.2/attentions.0/Add.out_12_1_79": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1096014080 + }, + "/up_blocks.2/Concat_1_output_0_NHWC.out13_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 5242880, + "offset": 1098635520 + }, + "GroupNorm_45.out8_45.out7_1_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 5242880, + "offset": 1103878400 + }, + "NhwcConv_54_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1109121280 + }, + "GroupNorm_45_sigmoid_out.8_45.out10_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 5242880, + "offset": 1111742720 + }, + "/up_blocks.2/resnets.1/conv1/Conv_output_0_0_17.out0_1_61": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1116985600 + }, + "/up_blocks.2/resnets.1/Add.out_12_1_80": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1119607040 + }, + "GroupNorm_46.out8_46.out7_1_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1122228480 + }, + "GroupNorm_46_sigmoid_out.8_46.out10_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1124849920 + }, + "NhwcConv_55_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1127471360 + }, + "/up_blocks.2/resnets.1/Add_1.out_12_1_81": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1130092800 + }, + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out7_1_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1132714240 + }, + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1135335680 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1137957120 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1140578560 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_77": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1143200000 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_78": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1145821440 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1148442880 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1151064320 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_82": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1153685760 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1156307200 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_79": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1158928640 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1161550080 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1164171520 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_83": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1166792960 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1169414400 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1172035840 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1182521600 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1193007360 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1203493120 + }, + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_12_0_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1206114560 + }, + "NhwcConv_57_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1208736000 + }, + "/up_blocks.2/attentions.1/Add.out_12_1_84": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1211357440 + }, + "/up_blocks.2/Concat_2_output_0_NHWC.out13_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 960 + ], + "size_in_bytes": 3932160, + "offset": 1213978880 + }, + "GroupNorm_48.out8_48.out7_1_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 960 + ], + "size_in_bytes": 3932160, + "offset": 1217911040 + }, + "NhwcConv_58_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1221843200 + }, + "GroupNorm_48_sigmoid_out.8_48.out10_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 960 + ], + "size_in_bytes": 3932160, + "offset": 1224464640 + }, + "/up_blocks.2/resnets.2/conv1/Conv_output_0_0_18.out0_1_65": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1228396800 + }, + "/up_blocks.2/resnets.2/Add.out_12_1_85": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1231018240 + }, + "GroupNorm_49.out8_49.out7_1_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1233639680 + }, + "GroupNorm_49_sigmoid_out.8_49.out10_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1236261120 + }, + "NhwcConv_59_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1238882560 + }, + "/up_blocks.2/resnets.2/Add_1.out_12_1_86": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1241504000 + }, + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out7_1_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1244125440 + }, + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1246746880 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1249368320 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_80": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1251989760 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_81": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1254611200 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_82": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1257232640 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1259854080 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1262475520 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_87": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1265096960 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1267718400 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_83": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1270339840 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1272961280 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1275582720 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_88": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1278204160 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1280825600 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1283447040 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1293932800 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 10485760, + "offset": 1304418560 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1314904320 + }, + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_12_0_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1317525760 + }, + "NhwcConv_61_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1320147200 + }, + "/up_blocks.2/attentions.2/Add.out_12_1_89": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 2621440, + "offset": 1322768640 + }, + "/up_blocks.2/upsamplers.0/Resize.out_4_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1325390080 + }, + "NhwcConv_62_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1335875840 + }, + "/up_blocks.3/Concat_output_0_NHWC.out13_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 960 + ], + "size_in_bytes": 15728640, + "offset": 1346361600 + }, + "GroupNorm_51.out8_51.out7_1_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 960 + ], + "size_in_bytes": 15728640, + "offset": 1362090240 + }, + "NhwcConv_63_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1377818880 + }, + "GroupNorm_51_sigmoid_out.8_51.out10_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 960 + ], + "size_in_bytes": 15728640, + "offset": 1383061760 + }, + "/up_blocks.3/resnets.0/conv1/Conv_output_0_0_19.out0_1_70": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1398790400 + }, + "/up_blocks.3/resnets.0/Add.out_12_1_90": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1404033280 + }, + "GroupNorm_52.out8_52.out7_1_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1409276160 + }, + "GroupNorm_52_sigmoid_out.8_52.out10_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1414519040 + }, + "NhwcConv_64_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1419761920 + }, + "/up_blocks.3/resnets.0/Add_1.out_12_1_91": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1425004800 + }, + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out7_1_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1430247680 + }, + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1435490560 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1440733440 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_84": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1445976320 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_85": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1451219200 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_86": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1456462080 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1461704960 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1466947840 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_12_1_92": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1472190720 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1477433600 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_87": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1482676480 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1487919360 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1493162240 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_12_1_93": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1498405120 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1503648000 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1508890880 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1529862400 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1550833920 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1571805440 + }, + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_12_0_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1577048320 + }, + "NhwcConv_66_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1582291200 + }, + "/up_blocks.3/attentions.0/Add.out_12_1_94": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1587534080 + }, + "/up_blocks.3/Concat_1_output_0_NHWC.out13_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1592776960 + }, + "GroupNorm_54.out8_54.out7_1_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1603262720 + }, + "NhwcConv_67_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1613748480 + }, + "GroupNorm_54_sigmoid_out.8_54.out10_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1618991360 + }, + "/up_blocks.3/resnets.1/conv1/Conv_output_0_0_20.out0_1_74": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1629477120 + }, + "/up_blocks.3/resnets.1/Add.out_12_1_95": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1634720000 + }, + "GroupNorm_55.out8_55.out7_1_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1639962880 + }, + "GroupNorm_55_sigmoid_out.8_55.out10_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1645205760 + }, + "NhwcConv_68_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1650448640 + }, + "/up_blocks.3/resnets.1/Add_1.out_12_1_96": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1655691520 + }, + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out7_1_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1660934400 + }, + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1666177280 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1671420160 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_88": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1676663040 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_89": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1681905920 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_90": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1687148800 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1692391680 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1697634560 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_12_1_97": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1702877440 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1708120320 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_91": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1713363200 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1718606080 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1723848960 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_12_1_98": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1729091840 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1734334720 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1739577600 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1760549120 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1781520640 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1802492160 + }, + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_12_0_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1807735040 + }, + "NhwcConv_70_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1812977920 + }, + "/up_blocks.3/attentions.1/Add.out_12_1_99": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1818220800 + }, + "/up_blocks.3/Concat_2_output_0_NHWC.out13_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1823463680 + }, + "GroupNorm_57.out8_57.out7_1_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1833949440 + }, + "NhwcConv_71_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1844435200 + }, + "GroupNorm_57_sigmoid_out.8_57.out10_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 10485760, + "offset": 1849678080 + }, + "/up_blocks.3/resnets.2/conv1/Conv_output_0_0_21.out0_1_78": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1860163840 + }, + "/up_blocks.3/resnets.2/Add.out_12_1_100": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1865406720 + }, + "GroupNorm_58.out8_58.out7_1_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1870649600 + }, + "GroupNorm_58_sigmoid_out.8_58.out10_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1875892480 + }, + "NhwcConv_72_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1881135360 + }, + "/up_blocks.3/resnets.2/Add_1.out_12_1_101": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1886378240 + }, + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out7_1_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1891621120 + }, + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1896864000 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out9_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1902106880 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_k/MatMul_output_0.out2_6_92": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1907349760 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_q/MatMul_output_0.out2_6_93": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1912592640 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_v/MatMul_output_0.out2_6_94": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1917835520 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1923078400 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1928321280 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_12_1_102": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1933564160 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out9_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1938807040 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_95": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1944049920 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1949292800 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1954535680 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_12_1_103": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1959778560 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out9_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 1965021440 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1970264320 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 1991235840 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out14_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 20971520, + "offset": 2012207360 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "offset": 2033178880 + }, + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_12_0_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 2038421760 + }, + "NhwcConv_74_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 2043664640 + }, + "/up_blocks.3/attentions.2/Add.out_12_1_104": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 2048907520 + }, + "GroupNorm_60.out8_60.out7_1_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 2054150400 + }, + "GroupNorm_60_sigmoid_out.8_60.out10_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "offset": 2059393280 + }, + "onnx::MatMul_5286": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 0, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_0.const", + "file_size": 281600 + }, + "onnx::MatMul_5287": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 281600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_1.const", + "file_size": 281600 + }, + "onnx::MatMul_5349": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 563200, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_2.const", + "file_size": 281600 + }, + "onnx::MatMul_5350": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 844800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_3.const", + "file_size": 281600 + }, + "onnx::MatMul_5412": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 1126400, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_4.const", + "file_size": 563200 + }, + "onnx::MatMul_5413": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 1689600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_5.const", + "file_size": 563200 + }, + "onnx::MatMul_5475": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 2252800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_6.const", + "file_size": 563200 + }, + "onnx::MatMul_5476": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 2816000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_7.const", + "file_size": 563200 + }, + "onnx::MatMul_5538": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 3379200, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_8.const", + "file_size": 1121280 + }, + "onnx::MatMul_5539": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 4500480, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_9.const", + "file_size": 1121280 + }, + "onnx::MatMul_5601": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 5621760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_10.const", + "file_size": 1121280 + }, + "onnx::MatMul_5602": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 6743040, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_11.const", + "file_size": 1121280 + }, + "onnx::MatMul_5672": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 7864320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_12.const", + "file_size": 1121280 + }, + "onnx::MatMul_5673": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 8985600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_13.const", + "file_size": 1121280 + }, + "onnx::MatMul_5752": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 10106880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_14.const", + "file_size": 1121280 + }, + "onnx::MatMul_5753": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 11228160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_15.const", + "file_size": 1121280 + }, + "onnx::MatMul_5815": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 12349440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_16.const", + "file_size": 1121280 + }, + "onnx::MatMul_5816": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 13470720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_17.const", + "file_size": 1121280 + }, + "onnx::MatMul_5878": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 14592000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_18.const", + "file_size": 1121280 + }, + "onnx::MatMul_5879": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "offset": 15713280, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_19.const", + "file_size": 1121280 + }, + "onnx::MatMul_5942": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 16834560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_20.const", + "file_size": 563200 + }, + "onnx::MatMul_5943": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 17397760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_21.const", + "file_size": 563200 + }, + "onnx::MatMul_6005": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 17960960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_22.const", + "file_size": 563200 + }, + "onnx::MatMul_6006": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 18524160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_23.const", + "file_size": 563200 + }, + "onnx::MatMul_6068": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 19087360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_24.const", + "file_size": 563200 + }, + "onnx::MatMul_6069": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "offset": 19650560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_25.const", + "file_size": 563200 + }, + "onnx::MatMul_6132": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 20213760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_26.const", + "file_size": 281600 + }, + "onnx::MatMul_6133": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 20495360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_27.const", + "file_size": 281600 + }, + "onnx::MatMul_6195": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 20776960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_28.const", + "file_size": 281600 + }, + "onnx::MatMul_6196": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 21058560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_29.const", + "file_size": 281600 + }, + "onnx::MatMul_6258": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 21340160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_30.const", + "file_size": 281600 + }, + "onnx::MatMul_6259": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "offset": 21621760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_31.const", + "file_size": 281600 + }, + "NhwcConv_0_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 31040 + ], + "size_in_bytes": 31040, + "offset": 21903360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_32.const", + "file_size": 31040 + }, + "GroupNorm_0_wts_7_1_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 21934400, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_33.const", + "file_size": 1280 + }, + "Sigmoid_0.weights10_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 21935680, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_34.const", + "file_size": 256 + }, + "down_blocks.0.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 21935936, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_35.const", + "file_size": 1088000 + }, + "time_embedding.linear_1.weight_7_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 23023936, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_36.const", + "file_size": 471040 + }, + "/time_embedding/act/Sigmoid.weights10_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 23494976, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_37.const", + "file_size": 256 + }, + "time_embedding.linear_2.weight_7_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 23495232, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_38.const", + "file_size": 1868800 + }, + "/down_blocks.0/resnets.0/act_1/Sigmoid.weights10_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 25364032, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_39.const", + "file_size": 256 + }, + "down_blocks.0.resnets.0.time_emb_proj.weight_7_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "offset": 25364288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_40.const", + "file_size": 467200 + }, + "down_blocks.0.resnets.1.time_emb_proj.weight_7_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "offset": 25831488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_41.const", + "file_size": 467200 + }, + "down_blocks.1.resnets.0.time_emb_proj.weight_7_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "offset": 26298688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_42.const", + "file_size": 934400 + }, + "down_blocks.1.resnets.1.time_emb_proj.weight_7_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "offset": 27233088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_43.const", + "file_size": 934400 + }, + "down_blocks.2.resnets.0.time_emb_proj.weight_7_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 28167488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_44.const", + "file_size": 1868800 + }, + "down_blocks.2.resnets.1.time_emb_proj.weight_7_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 30036288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_45.const", + "file_size": 1868800 + }, + "down_blocks.3.resnets.0.time_emb_proj.weight_7_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 31905088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_46.const", + "file_size": 1868800 + }, + "down_blocks.3.resnets.1.time_emb_proj.weight_7_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 33773888, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_47.const", + "file_size": 1868800 + }, + "mid_block.resnets.0.time_emb_proj.weight_7_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 35642688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_48.const", + "file_size": 1868800 + }, + "mid_block.resnets.1.time_emb_proj.weight_7_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 37511488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_49.const", + "file_size": 1868800 + }, + "up_blocks.0.resnets.0.time_emb_proj.weight_7_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 39380288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_50.const", + "file_size": 1868800 + }, + "up_blocks.0.resnets.1.time_emb_proj.weight_7_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 41249088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_51.const", + "file_size": 1868800 + }, + "up_blocks.0.resnets.2.time_emb_proj.weight_7_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 43117888, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_52.const", + "file_size": 1868800 + }, + "up_blocks.1.resnets.0.time_emb_proj.weight_7_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 44986688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_53.const", + "file_size": 1868800 + }, + "up_blocks.1.resnets.1.time_emb_proj.weight_7_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 46855488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_54.const", + "file_size": 1868800 + }, + "up_blocks.1.resnets.2.time_emb_proj.weight_7_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 48724288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_55.const", + "file_size": 1868800 + }, + "up_blocks.2.resnets.0.time_emb_proj.weight_7_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "offset": 50593088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_56.const", + "file_size": 934400 + }, + "up_blocks.2.resnets.1.time_emb_proj.weight_7_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "offset": 51527488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_57.const", + "file_size": 934400 + }, + "up_blocks.2.resnets.2.time_emb_proj.weight_7_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "offset": 52461888, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_58.const", + "file_size": 934400 + }, + "up_blocks.3.resnets.0.time_emb_proj.weight_7_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "offset": 53396288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_59.const", + "file_size": 467200 + }, + "up_blocks.3.resnets.1.time_emb_proj.weight_7_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "offset": 53863488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_60.const", + "file_size": 467200 + }, + "up_blocks.3.resnets.2.time_emb_proj.weight_7_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "offset": 54330688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_61.const", + "file_size": 467200 + }, + "GroupNorm_1_wts_7_1_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 54797888, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_62.const", + "file_size": 1280 + }, + "Sigmoid_1.weights10_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 54799168, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_63.const", + "file_size": 256 + }, + "NhwcConv_1_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 54799424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_64.const", + "file_size": 1088000 + }, + "GroupNorm_2_wts_7_1_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 55887424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_65.const", + "file_size": 1280 + }, + "NhwcConv_2_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 55888704, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_66.const", + "file_size": 135680 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 56024384, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_67.const", + "file_size": 640 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 56025024, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_68.const", + "file_size": 640 + }, + "onnx::MatMul_5263": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 56025664, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_69.const", + "file_size": 117760 + }, + "onnx::MatMul_5262": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 56143424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_70.const", + "file_size": 117760 + }, + "onnx::MatMul_5264": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 56261184, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_71.const", + "file_size": 117760 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_0_mask.8_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 4096 + ], + "size_in_bytes": 8192, + "offset": 56378944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_72.const", + "file_size": 8192 + }, + "onnx::MatMul_5284": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 56387136, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_73.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 56504896, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_74.const", + "file_size": 640 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 56505536, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_75.const", + "file_size": 640 + }, + "onnx::MatMul_5285": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 56506176, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_76.const", + "file_size": 117760 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_1_mask.8_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 56623936, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_77.const", + "file_size": 512 + }, + "onnx::MatMul_5307": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 56624448, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_78.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 56742208, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_79.const", + "file_size": 640 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 56742848, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_80.const", + "file_size": 640 + }, + "onnx::MatMul_5308_2_0_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 56743488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_81.const", + "file_size": 471040 + }, + "onnx::MatMul_5308_2_0_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "offset": 57214528, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_82.const", + "file_size": 473600 + }, + "onnx::MatMul_5309": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 57688128, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_83.const", + "file_size": 471040 + }, + "NhwcConv_3_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 58159168, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_84.const", + "file_size": 135680 + }, + "GroupNorm_3_wts_7_1_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 58294848, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_85.const", + "file_size": 1280 + }, + "Sigmoid_2.weights10_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 58296128, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_86.const", + "file_size": 256 + }, + "down_blocks.0.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 58296384, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_87.const", + "file_size": 1088000 + }, + "GroupNorm_4_wts_7_1_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 59384384, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_88.const", + "file_size": 1280 + }, + "Sigmoid_3.weights10_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 59385664, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_89.const", + "file_size": 256 + }, + "NhwcConv_4_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 59385920, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_90.const", + "file_size": 1088000 + }, + "GroupNorm_5_wts_7_1_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 60473920, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_91.const", + "file_size": 1280 + }, + "NhwcConv_5_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 60475200, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_92.const", + "file_size": 135680 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 60610880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_93.const", + "file_size": 640 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 60611520, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_94.const", + "file_size": 640 + }, + "onnx::MatMul_5326": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 60612160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_95.const", + "file_size": 117760 + }, + "onnx::MatMul_5325": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 60729920, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_96.const", + "file_size": 117760 + }, + "onnx::MatMul_5327": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 60847680, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_97.const", + "file_size": 117760 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_2_mask.8_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 4096 + ], + "size_in_bytes": 8192, + "offset": 60965440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_98.const", + "file_size": 8192 + }, + "onnx::MatMul_5347": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 60973632, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_99.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 61091392, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_100.const", + "file_size": 640 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 61092032, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_101.const", + "file_size": 640 + }, + "onnx::MatMul_5348": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 61092672, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_102.const", + "file_size": 117760 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_3_mask.8_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 61210432, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_103.const", + "file_size": 512 + }, + "onnx::MatMul_5370": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 61210944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_104.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 61328704, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_105.const", + "file_size": 640 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 61329344, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_106.const", + "file_size": 640 + }, + "onnx::MatMul_5371_2_1_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 61329984, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_107.const", + "file_size": 471040 + }, + "onnx::MatMul_5371_2_1_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "offset": 61801024, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_108.const", + "file_size": 473600 + }, + "onnx::MatMul_5372": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 62274624, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_109.const", + "file_size": 471040 + }, + "NhwcConv_6_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 62745664, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_110.const", + "file_size": 135680 + }, + "NhwcConv_7_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "offset": 62881344, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_111.const", + "file_size": 1077760 + }, + "NhwcConv_8_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 271360 + ], + "size_in_bytes": 271360, + "offset": 63959104, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_112.const", + "file_size": 271360 + }, + "GroupNorm_6_wts_7_1_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 64230464, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_113.const", + "file_size": 1280 + }, + "Sigmoid_4.weights10_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 64231744, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_114.const", + "file_size": 256 + }, + "down_blocks.1.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2176000 + ], + "size_in_bytes": 2176000, + "offset": 64232000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_115.const", + "file_size": 2176000 + }, + "GroupNorm_7_wts_7_1_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 66408000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_116.const", + "file_size": 2560 + }, + "Sigmoid_5.weights10_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 66410560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_117.const", + "file_size": 256 + }, + "NhwcConv_9_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 66410816, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_118.const", + "file_size": 4352000 + }, + "GroupNorm_8_wts_7_1_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 70762816, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_119.const", + "file_size": 2560 + }, + "NhwcConv_10_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 70765376, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_120.const", + "file_size": 512000 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 71277376, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_121.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 71278656, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_122.const", + "file_size": 1280 + }, + "onnx::MatMul_5389": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 71279936, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_123.const", + "file_size": 471040 + }, + "onnx::MatMul_5388": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 71750976, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_124.const", + "file_size": 471040 + }, + "onnx::MatMul_5390": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 72222016, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_125.const", + "file_size": 471040 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_4_mask.8_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 72693056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_126.const", + "file_size": 2048 + }, + "onnx::MatMul_5410": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 72695104, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_127.const", + "file_size": 471040 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 73166144, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_128.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 73167424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_129.const", + "file_size": 1280 + }, + "onnx::MatMul_5411": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 73168704, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_130.const", + "file_size": 471040 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_5_mask.8_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 73639744, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_131.const", + "file_size": 512 + }, + "onnx::MatMul_5433": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 73640256, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_132.const", + "file_size": 471040 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 74111296, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_133.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 74112576, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_134.const", + "file_size": 1280 + }, + "onnx::MatMul_5434_2_2_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 74113856, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_135.const", + "file_size": 1894400 + }, + "onnx::MatMul_5434_2_2_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 76008256, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_136.const", + "file_size": 1894400 + }, + "onnx::MatMul_5435": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 77902656, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_137.const", + "file_size": 1868800 + }, + "NhwcConv_11_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 79771456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_138.const", + "file_size": 512000 + }, + "GroupNorm_9_wts_7_1_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 80283456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_139.const", + "file_size": 2560 + }, + "Sigmoid_6.weights10_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 80286016, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_140.const", + "file_size": 256 + }, + "down_blocks.1.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 80286272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_141.const", + "file_size": 4352000 + }, + "GroupNorm_10_wts_7_1_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 84638272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_142.const", + "file_size": 2560 + }, + "Sigmoid_7.weights10_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 84640832, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_143.const", + "file_size": 256 + }, + "NhwcConv_12_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 84641088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_144.const", + "file_size": 4352000 + }, + "GroupNorm_11_wts_7_1_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 88993088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_145.const", + "file_size": 2560 + }, + "NhwcConv_13_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 88995648, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_146.const", + "file_size": 512000 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 89507648, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_147.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 89508928, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_148.const", + "file_size": 1280 + }, + "onnx::MatMul_5452": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 89510208, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_149.const", + "file_size": 471040 + }, + "onnx::MatMul_5451": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 89981248, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_150.const", + "file_size": 471040 + }, + "onnx::MatMul_5453": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 90452288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_151.const", + "file_size": 471040 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_6_mask.8_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 90923328, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_152.const", + "file_size": 2048 + }, + "onnx::MatMul_5473": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 90925376, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_153.const", + "file_size": 471040 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 91396416, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_154.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 91397696, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_155.const", + "file_size": 1280 + }, + "onnx::MatMul_5474": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 91398976, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_156.const", + "file_size": 471040 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_7_mask.8_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 91870016, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_157.const", + "file_size": 512 + }, + "onnx::MatMul_5496": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 91870528, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_158.const", + "file_size": 471040 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 92341568, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_159.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 92342848, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_160.const", + "file_size": 1280 + }, + "onnx::MatMul_5497_2_3_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 92344128, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_161.const", + "file_size": 1894400 + }, + "onnx::MatMul_5497_2_3_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 94238528, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_162.const", + "file_size": 1894400 + }, + "onnx::MatMul_5498": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 96132928, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_163.const", + "file_size": 1868800 + }, + "NhwcConv_14_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 98001728, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_164.const", + "file_size": 512000 + }, + "NhwcConv_15_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "offset": 98513728, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_165.const", + "file_size": 4311040 + }, + "NhwcConv_16_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1024000 + ], + "size_in_bytes": 1024000, + "offset": 102824768, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_166.const", + "file_size": 1024000 + }, + "GroupNorm_12_wts_7_1_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 103848768, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_167.const", + "file_size": 2560 + }, + "Sigmoid_8.weights10_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 103851328, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_168.const", + "file_size": 256 + }, + "down_blocks.2.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 8622080 + ], + "size_in_bytes": 8622080, + "offset": 103851584, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_169.const", + "file_size": 8622080 + }, + "GroupNorm_13_wts_7_1_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 112473664, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_170.const", + "file_size": 5120 + }, + "Sigmoid_9.weights10_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 112478784, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_171.const", + "file_size": 256 + }, + "NhwcConv_17_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 112479040, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_172.const", + "file_size": 17244160 + }, + "GroupNorm_14_wts_7_1_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 129723200, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_173.const", + "file_size": 5120 + }, + "NhwcConv_18_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 129728320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_174.const", + "file_size": 2048000 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 131776320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_175.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 131778880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_176.const", + "file_size": 2560 + }, + "onnx::MatMul_5515": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 131781440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_177.const", + "file_size": 1868800 + }, + "onnx::MatMul_5514": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 133650240, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_178.const", + "file_size": 1868800 + }, + "onnx::MatMul_5516": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 135519040, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_179.const", + "file_size": 1868800 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_8_mask.8_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 137387840, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_180.const", + "file_size": 512 + }, + "onnx::MatMul_5536": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 137388352, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_181.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 139257152, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_182.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 139259712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_183.const", + "file_size": 2560 + }, + "onnx::MatMul_5537": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 139262272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_184.const", + "file_size": 1868800 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_9_mask.8_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 141131072, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_185.const", + "file_size": 512 + }, + "onnx::MatMul_5559": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 141131584, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_186.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 143000384, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_187.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 143002944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_188.const", + "file_size": 2560 + }, + "onnx::MatMul_5560_2_4_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 143005504, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_189.const", + "file_size": 7536640 + }, + "onnx::MatMul_5560_2_4_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 150542144, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_190.const", + "file_size": 7577600 + }, + "onnx::MatMul_5561": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 158119744, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_191.const", + "file_size": 7577600 + }, + "NhwcConv_19_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 165697344, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_192.const", + "file_size": 2048000 + }, + "GroupNorm_15_wts_7_1_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 167745344, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_193.const", + "file_size": 5120 + }, + "Sigmoid_10.weights10_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 167750464, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_194.const", + "file_size": 256 + }, + "down_blocks.2.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 167750720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_195.const", + "file_size": 17244160 + }, + "GroupNorm_16_wts_7_1_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 184994880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_196.const", + "file_size": 5120 + }, + "Sigmoid_11.weights10_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 185000000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_197.const", + "file_size": 256 + }, + "NhwcConv_20_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 185000256, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_198.const", + "file_size": 17244160 + }, + "GroupNorm_17_wts_7_1_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 202244416, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_199.const", + "file_size": 5120 + }, + "NhwcConv_21_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 202249536, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_200.const", + "file_size": 2048000 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 204297536, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_201.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 204300096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_202.const", + "file_size": 2560 + }, + "onnx::MatMul_5578": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 204302656, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_203.const", + "file_size": 1868800 + }, + "onnx::MatMul_5577": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 206171456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_204.const", + "file_size": 1868800 + }, + "onnx::MatMul_5579": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 208040256, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_205.const", + "file_size": 1868800 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_10_mask.8_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 209909056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_206.const", + "file_size": 512 + }, + "onnx::MatMul_5599": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 209909568, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_207.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 211778368, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_208.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 211780928, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_209.const", + "file_size": 2560 + }, + "onnx::MatMul_5600": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 211783488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_210.const", + "file_size": 1868800 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_11_mask.8_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 213652288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_211.const", + "file_size": 512 + }, + "onnx::MatMul_5622": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 213652800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_212.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 215521600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_213.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 215524160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_214.const", + "file_size": 2560 + }, + "onnx::MatMul_5623_2_5_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 215526720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_215.const", + "file_size": 7536640 + }, + "onnx::MatMul_5623_2_5_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 223063360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_216.const", + "file_size": 7577600 + }, + "onnx::MatMul_5624": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 230640960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_217.const", + "file_size": 7577600 + }, + "NhwcConv_22_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 238218560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_218.const", + "file_size": 2048000 + }, + "NhwcConv_23_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 240266560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_219.const", + "file_size": 17244160 + }, + "GroupNorm_18_wts_7_1_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 257510720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_220.const", + "file_size": 5120 + }, + "Sigmoid_12.weights10_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 257515840, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_221.const", + "file_size": 256 + }, + "down_blocks.3.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 257516096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_222.const", + "file_size": 16998400 + }, + "GroupNorm_19_wts_7_1_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 274514496, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_223.const", + "file_size": 5120 + }, + "Sigmoid_13.weights10_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 274519616, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_224.const", + "file_size": 256 + }, + "NhwcConv_24_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 274519872, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_225.const", + "file_size": 16998400 + }, + "GroupNorm_20_wts_7_1_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 291518272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_226.const", + "file_size": 5120 + }, + "Sigmoid_14.weights10_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 291523392, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_227.const", + "file_size": 256 + }, + "down_blocks.3.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 291523648, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_228.const", + "file_size": 16998400 + }, + "GroupNorm_21_wts_7_1_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 308522048, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_229.const", + "file_size": 5120 + }, + "Sigmoid_15.weights10_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 308527168, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_230.const", + "file_size": 256 + }, + "NhwcConv_25_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 308527424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_231.const", + "file_size": 16998400 + }, + "GroupNorm_22_wts_7_1_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 325525824, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_232.const", + "file_size": 5120 + }, + "Sigmoid_16.weights10_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 325530944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_233.const", + "file_size": 256 + }, + "mid_block.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 325531200, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_234.const", + "file_size": 16998400 + }, + "GroupNorm_23_wts_7_1_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 342529600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_235.const", + "file_size": 5120 + }, + "Sigmoid_17.weights10_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 342534720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_236.const", + "file_size": 256 + }, + "NhwcConv_26_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 342534976, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_237.const", + "file_size": 16998400 + }, + "GroupNorm_24_wts_7_1_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 359533376, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_238.const", + "file_size": 5120 + }, + "NhwcConv_27_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 359538496, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_239.const", + "file_size": 2048000 + }, + "mid_block.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 361586496, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_240.const", + "file_size": 2560 + }, + "mid_block.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 361589056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_241.const", + "file_size": 2560 + }, + "onnx::MatMul_5649": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "offset": 361591616, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_242.const", + "file_size": 1884160 + }, + "onnx::MatMul_5648": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "offset": 363475776, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_243.const", + "file_size": 1884160 + }, + "onnx::MatMul_5650": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "offset": 365359936, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_244.const", + "file_size": 1884160 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_12_mask.8_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 367244096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_245.const", + "file_size": 512 + }, + "onnx::MatMul_5670": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "offset": 367244608, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_246.const", + "file_size": 1884160 + }, + "mid_block.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 369128768, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_247.const", + "file_size": 2560 + }, + "mid_block.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 369131328, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_248.const", + "file_size": 2560 + }, + "onnx::MatMul_5671": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "offset": 369133888, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_249.const", + "file_size": 1884160 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_13_mask.8_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 371018048, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_250.const", + "file_size": 512 + }, + "onnx::MatMul_5693": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "offset": 371018560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_251.const", + "file_size": 1884160 + }, + "mid_block.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 372902720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_252.const", + "file_size": 2560 + }, + "mid_block.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 372905280, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_253.const", + "file_size": 2560 + }, + "onnx::MatMul_5694_2_6_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "offset": 372907840, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_254.const", + "file_size": 7475200 + }, + "onnx::MatMul_5694_2_6_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 380383040, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_255.const", + "file_size": 7536640 + }, + "onnx::MatMul_5695": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 387919680, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_256.const", + "file_size": 7536640 + }, + "NhwcConv_28_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 395456320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_257.const", + "file_size": 2048000 + }, + "GroupNorm_25_wts_7_1_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 397504320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_258.const", + "file_size": 5120 + }, + "Sigmoid_18.weights10_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 397509440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_259.const", + "file_size": 256 + }, + "mid_block.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 397509696, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_260.const", + "file_size": 16998400 + }, + "GroupNorm_26_wts_7_1_26": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 414508096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_261.const", + "file_size": 5120 + }, + "Sigmoid_19.weights10_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 414513216, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_262.const", + "file_size": 256 + }, + "NhwcConv_29_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 414513472, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_263.const", + "file_size": 16998400 + }, + "GroupNorm_27_wts_7_1_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "offset": 431511872, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_264.const", + "file_size": 10240 + }, + "NhwcConv_30_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "offset": 431522112, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_265.const", + "file_size": 4096000 + }, + "Sigmoid_20.weights10_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 435618112, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_266.const", + "file_size": 256 + }, + "up_blocks.0.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 34488320 + ], + "size_in_bytes": 34488320, + "offset": 435618368, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_267.const", + "file_size": 34488320 + }, + "GroupNorm_28_wts_7_1_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 470106688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_268.const", + "file_size": 5120 + }, + "Sigmoid_21.weights10_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 470111808, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_269.const", + "file_size": 256 + }, + "NhwcConv_31_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 470112064, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_270.const", + "file_size": 16998400 + }, + "GroupNorm_29_wts_7_1_29": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "offset": 487110464, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_271.const", + "file_size": 10240 + }, + "NhwcConv_32_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "offset": 487120704, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_272.const", + "file_size": 4096000 + }, + "Sigmoid_22.weights10_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 491216704, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_273.const", + "file_size": 256 + }, + "up_blocks.0.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 34488320 + ], + "size_in_bytes": 34488320, + "offset": 491216960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_274.const", + "file_size": 34488320 + }, + "GroupNorm_30_wts_7_1_30": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 525705280, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_275.const", + "file_size": 5120 + }, + "Sigmoid_23.weights10_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 525710400, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_276.const", + "file_size": 256 + }, + "NhwcConv_33_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 525710656, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_277.const", + "file_size": 16998400 + }, + "GroupNorm_31_wts_7_1_31": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "offset": 542709056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_278.const", + "file_size": 10240 + }, + "NhwcConv_34_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "offset": 542719296, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_279.const", + "file_size": 4096000 + }, + "Sigmoid_24.weights10_26": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 546815296, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_280.const", + "file_size": 256 + }, + "up_blocks.0.resnets.2.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 34488320 + ], + "size_in_bytes": 34488320, + "offset": 546815552, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_281.const", + "file_size": 34488320 + }, + "GroupNorm_32_wts_7_1_32": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 581303872, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_282.const", + "file_size": 5120 + }, + "Sigmoid_25.weights10_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 581308992, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_283.const", + "file_size": 256 + }, + "NhwcConv_35_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16998400 + ], + "size_in_bytes": 16998400, + "offset": 581309248, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_284.const", + "file_size": 16998400 + }, + "/up_blocks.0/upsamplers.0/Resize.weights4_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 598307648, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_285.const", + "file_size": 256 + }, + "NhwcConv_36_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 598307904, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_286.const", + "file_size": 17244160 + }, + "GroupNorm_33_wts_7_1_33": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "offset": 615552064, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_287.const", + "file_size": 10240 + }, + "NhwcConv_37_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "offset": 615562304, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_288.const", + "file_size": 4096000 + }, + "Sigmoid_26.weights10_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 619658304, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_289.const", + "file_size": 256 + }, + "up_blocks.1.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 34488320 + ], + "size_in_bytes": 34488320, + "offset": 619658560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_290.const", + "file_size": 34488320 + }, + "GroupNorm_34_wts_7_1_34": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 654146880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_291.const", + "file_size": 5120 + }, + "Sigmoid_27.weights10_29": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 654152000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_292.const", + "file_size": 256 + }, + "NhwcConv_38_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 654152256, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_293.const", + "file_size": 17244160 + }, + "GroupNorm_35_wts_7_1_35": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 671396416, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_294.const", + "file_size": 5120 + }, + "NhwcConv_39_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 671401536, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_295.const", + "file_size": 2048000 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 673449536, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_296.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 673452096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_297.const", + "file_size": 2560 + }, + "onnx::MatMul_5729": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 673454656, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_298.const", + "file_size": 1868800 + }, + "onnx::MatMul_5728": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 675323456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_299.const", + "file_size": 1868800 + }, + "onnx::MatMul_5730": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 677192256, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_300.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_14_mask.8_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 679061056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_301.const", + "file_size": 512 + }, + "onnx::MatMul_5750": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 679061568, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_302.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 680930368, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_303.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 680932928, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_304.const", + "file_size": 2560 + }, + "onnx::MatMul_5751": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 680935488, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_305.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_15_mask.8_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 682804288, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_306.const", + "file_size": 512 + }, + "onnx::MatMul_5773": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 682804800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_307.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 684673600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_308.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 684676160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_309.const", + "file_size": 2560 + }, + "onnx::MatMul_5774_2_7_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 684678720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_310.const", + "file_size": 7536640 + }, + "onnx::MatMul_5774_2_7_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 692215360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_311.const", + "file_size": 7577600 + }, + "onnx::MatMul_5775": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 699792960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_312.const", + "file_size": 7577600 + }, + "NhwcConv_40_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 707370560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_313.const", + "file_size": 2048000 + }, + "GroupNorm_36_wts_7_1_36": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "offset": 709418560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_314.const", + "file_size": 10240 + }, + "NhwcConv_41_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "offset": 709428800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_315.const", + "file_size": 4096000 + }, + "Sigmoid_28.weights10_30": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 713524800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_316.const", + "file_size": 256 + }, + "up_blocks.1.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 34488320 + ], + "size_in_bytes": 34488320, + "offset": 713525056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_317.const", + "file_size": 34488320 + }, + "GroupNorm_37_wts_7_1_37": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 748013376, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_318.const", + "file_size": 5120 + }, + "Sigmoid_29.weights10_31": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 748018496, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_319.const", + "file_size": 256 + }, + "NhwcConv_42_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 748018752, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_320.const", + "file_size": 17244160 + }, + "GroupNorm_38_wts_7_1_38": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 765262912, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_321.const", + "file_size": 5120 + }, + "NhwcConv_43_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 765268032, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_322.const", + "file_size": 2048000 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 767316032, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_323.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 767318592, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_324.const", + "file_size": 2560 + }, + "onnx::MatMul_5792": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 767321152, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_325.const", + "file_size": 1868800 + }, + "onnx::MatMul_5791": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 769189952, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_326.const", + "file_size": 1868800 + }, + "onnx::MatMul_5793": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 771058752, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_327.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_16_mask.8_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 772927552, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_328.const", + "file_size": 512 + }, + "onnx::MatMul_5813": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 772928064, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_329.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 774796864, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_330.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 774799424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_331.const", + "file_size": 2560 + }, + "onnx::MatMul_5814": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 774801984, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_332.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_17_mask.8_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 776670784, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_333.const", + "file_size": 512 + }, + "onnx::MatMul_5836": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 776671296, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_334.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 778540096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_335.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 778542656, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_336.const", + "file_size": 2560 + }, + "onnx::MatMul_5837_2_8_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 778545216, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_337.const", + "file_size": 7536640 + }, + "onnx::MatMul_5837_2_8_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 786081856, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_338.const", + "file_size": 7577600 + }, + "onnx::MatMul_5838": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 793659456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_339.const", + "file_size": 7577600 + }, + "NhwcConv_44_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 801237056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_340.const", + "file_size": 2048000 + }, + "GroupNorm_39_wts_7_1_39": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 3840 + ], + "size_in_bytes": 7680, + "offset": 803285056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_341.const", + "file_size": 7680 + }, + "NhwcConv_45_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 3072000 + ], + "size_in_bytes": 3072000, + "offset": 803292736, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_342.const", + "file_size": 3072000 + }, + "Sigmoid_30.weights10_32": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 806364736, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_343.const", + "file_size": 256 + }, + "up_blocks.1.resnets.2.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 25702400 + ], + "size_in_bytes": 25702400, + "offset": 806364992, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_344.const", + "file_size": 25702400 + }, + "GroupNorm_40_wts_7_1_40": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 832067392, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_345.const", + "file_size": 5120 + }, + "Sigmoid_31.weights10_33": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 832072512, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_346.const", + "file_size": 256 + }, + "NhwcConv_46_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "offset": 832072768, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_347.const", + "file_size": 17244160 + }, + "GroupNorm_41_wts_7_1_41": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 849316928, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_348.const", + "file_size": 5120 + }, + "NhwcConv_47_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 849322048, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_349.const", + "file_size": 2048000 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 851370048, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_350.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 851372608, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_351.const", + "file_size": 2560 + }, + "onnx::MatMul_5855": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 851375168, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_352.const", + "file_size": 1868800 + }, + "onnx::MatMul_5854": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 853243968, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_353.const", + "file_size": 1868800 + }, + "onnx::MatMul_5856": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 855112768, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_354.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_18_mask.8_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 856981568, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_355.const", + "file_size": 512 + }, + "onnx::MatMul_5876": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 856982080, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_356.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 858850880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_357.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 858853440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_358.const", + "file_size": 2560 + }, + "onnx::MatMul_5877": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 858856000, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_359.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_19_mask.8_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 860724800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_360.const", + "file_size": 512 + }, + "onnx::MatMul_5899": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 860725312, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_361.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 862594112, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_362.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 862596672, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_363.const", + "file_size": 2560 + }, + "onnx::MatMul_5900_2_9_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7536640 + ], + "size_in_bytes": 7536640, + "offset": 862599232, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_364.const", + "file_size": 7536640 + }, + "onnx::MatMul_5900_2_9_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 870135872, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_365.const", + "file_size": 7577600 + }, + "onnx::MatMul_5901": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7577600 + ], + "size_in_bytes": 7577600, + "offset": 877713472, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_366.const", + "file_size": 7577600 + }, + "NhwcConv_48_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "offset": 885291072, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_367.const", + "file_size": 2048000 + }, + "/up_blocks.1/upsamplers.0/Resize.weights4_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 887339072, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_368.const", + "file_size": 256 + }, + "NhwcConv_49_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17408000 + ], + "size_in_bytes": 17408000, + "offset": 887339328, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_369.const", + "file_size": 17408000 + }, + "GroupNorm_42_wts_7_1_42": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 3840 + ], + "size_in_bytes": 7680, + "offset": 904747328, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_370.const", + "file_size": 7680 + }, + "NhwcConv_50_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1546240 + ], + "size_in_bytes": 1546240, + "offset": 904755008, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_371.const", + "file_size": 1546240 + }, + "Sigmoid_32.weights10_34": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 906301248, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_372.const", + "file_size": 256 + }, + "up_blocks.2.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 13056000 + ], + "size_in_bytes": 13056000, + "offset": 906301504, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_373.const", + "file_size": 13056000 + }, + "GroupNorm_43_wts_7_1_43": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 919357504, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_374.const", + "file_size": 2560 + }, + "Sigmoid_33.weights10_35": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 919360064, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_375.const", + "file_size": 256 + }, + "NhwcConv_51_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 919360320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_376.const", + "file_size": 4352000 + }, + "GroupNorm_44_wts_7_1_44": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 923712320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_377.const", + "file_size": 2560 + }, + "NhwcConv_52_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 923714880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_378.const", + "file_size": 512000 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 924226880, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_379.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 924228160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_380.const", + "file_size": 1280 + }, + "onnx::MatMul_5919": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 924229440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_381.const", + "file_size": 471040 + }, + "onnx::MatMul_5918": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 924700480, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_382.const", + "file_size": 471040 + }, + "onnx::MatMul_5920": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 925171520, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_383.const", + "file_size": 471040 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_20_mask.8_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 925642560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_384.const", + "file_size": 2048 + }, + "onnx::MatMul_5940": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 925644608, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_385.const", + "file_size": 471040 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 926115648, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_386.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 926116928, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_387.const", + "file_size": 1280 + }, + "onnx::MatMul_5941": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 926118208, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_388.const", + "file_size": 471040 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_21_mask.8_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 926589248, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_389.const", + "file_size": 512 + }, + "onnx::MatMul_5963": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 926589760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_390.const", + "file_size": 471040 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 927060800, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_391.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 927062080, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_392.const", + "file_size": 1280 + }, + "onnx::MatMul_5964_2_10_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 927063360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_393.const", + "file_size": 1894400 + }, + "onnx::MatMul_5964_2_10_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 928957760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_394.const", + "file_size": 1894400 + }, + "onnx::MatMul_5965": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 930852160, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_395.const", + "file_size": 1868800 + }, + "NhwcConv_53_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 932720960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_396.const", + "file_size": 512000 + }, + "GroupNorm_45_wts_7_1_45": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "offset": 933232960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_397.const", + "file_size": 5120 + }, + "NhwcConv_54_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1024000 + ], + "size_in_bytes": 1024000, + "offset": 933238080, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_398.const", + "file_size": 1024000 + }, + "Sigmoid_34.weights10_36": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 934262080, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_399.const", + "file_size": 256 + }, + "up_blocks.2.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 8704000 + ], + "size_in_bytes": 8704000, + "offset": 934262336, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_400.const", + "file_size": 8704000 + }, + "GroupNorm_46_wts_7_1_46": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 942966336, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_401.const", + "file_size": 2560 + }, + "Sigmoid_35.weights10_37": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 942968896, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_402.const", + "file_size": 256 + }, + "NhwcConv_55_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 942969152, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_403.const", + "file_size": 4352000 + }, + "GroupNorm_47_wts_7_1_47": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 947321152, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_404.const", + "file_size": 2560 + }, + "NhwcConv_56_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 947323712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_405.const", + "file_size": 512000 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 947835712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_406.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 947836992, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_407.const", + "file_size": 1280 + }, + "onnx::MatMul_5982": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 947838272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_408.const", + "file_size": 471040 + }, + "onnx::MatMul_5981": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 948309312, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_409.const", + "file_size": 471040 + }, + "onnx::MatMul_5983": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 948780352, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_410.const", + "file_size": 471040 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_22_mask.8_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 949251392, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_411.const", + "file_size": 2048 + }, + "onnx::MatMul_6003": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 949253440, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_412.const", + "file_size": 471040 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 949724480, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_413.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 949725760, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_414.const", + "file_size": 1280 + }, + "onnx::MatMul_6004": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 949727040, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_415.const", + "file_size": 471040 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_23_mask.8_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 950198080, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_416.const", + "file_size": 512 + }, + "onnx::MatMul_6026": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 950198592, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_417.const", + "file_size": 471040 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 950669632, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_418.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 950670912, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_419.const", + "file_size": 1280 + }, + "onnx::MatMul_6027_2_11_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 950672192, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_420.const", + "file_size": 1894400 + }, + "onnx::MatMul_6027_2_11_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 952566592, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_421.const", + "file_size": 1894400 + }, + "onnx::MatMul_6028": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 954460992, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_422.const", + "file_size": 1868800 + }, + "NhwcConv_57_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 956329792, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_423.const", + "file_size": 512000 + }, + "GroupNorm_48_wts_7_1_48": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1920 + ], + "size_in_bytes": 3840, + "offset": 956841792, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_424.const", + "file_size": 3840 + }, + "NhwcConv_58_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 773120 + ], + "size_in_bytes": 773120, + "offset": 956845632, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_425.const", + "file_size": 773120 + }, + "Sigmoid_36.weights10_38": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 957618752, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_426.const", + "file_size": 256 + }, + "up_blocks.2.resnets.2.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 6528000 + ], + "size_in_bytes": 6528000, + "offset": 957619008, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_427.const", + "file_size": 6528000 + }, + "GroupNorm_49_wts_7_1_49": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 964147008, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_428.const", + "file_size": 2560 + }, + "Sigmoid_37.weights10_39": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 964149568, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_429.const", + "file_size": 256 + }, + "NhwcConv_59_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 964149824, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_430.const", + "file_size": 4352000 + }, + "GroupNorm_50_wts_7_1_50": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 968501824, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_431.const", + "file_size": 2560 + }, + "NhwcConv_60_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 968504384, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_432.const", + "file_size": 512000 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 969016384, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_433.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 969017664, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_434.const", + "file_size": 1280 + }, + "onnx::MatMul_6045": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 969018944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_435.const", + "file_size": 471040 + }, + "onnx::MatMul_6044": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 969489984, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_436.const", + "file_size": 471040 + }, + "onnx::MatMul_6046": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 969961024, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_437.const", + "file_size": 471040 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_24_mask.8_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 970432064, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_438.const", + "file_size": 2048 + }, + "onnx::MatMul_6066": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 970434112, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_439.const", + "file_size": 471040 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 970905152, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_440.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 970906432, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_441.const", + "file_size": 1280 + }, + "onnx::MatMul_6067": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 970907712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_442.const", + "file_size": 471040 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_25_mask.8_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 971378752, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_443.const", + "file_size": 512 + }, + "onnx::MatMul_6089": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 971379264, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_444.const", + "file_size": 471040 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 971850304, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_445.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 971851584, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_446.const", + "file_size": 1280 + }, + "onnx::MatMul_6090_2_12_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 971852864, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_447.const", + "file_size": 1894400 + }, + "onnx::MatMul_6090_2_12_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "offset": 973747264, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_448.const", + "file_size": 1894400 + }, + "onnx::MatMul_6091": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "offset": 975641664, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_449.const", + "file_size": 1868800 + }, + "NhwcConv_61_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 512000 + ], + "size_in_bytes": 512000, + "offset": 977510464, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_450.const", + "file_size": 512000 + }, + "/up_blocks.2/upsamplers.0/Resize.weights4_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 978022464, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_451.const", + "file_size": 256 + }, + "NhwcConv_62_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4352000 + ], + "size_in_bytes": 4352000, + "offset": 978022720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_452.const", + "file_size": 4352000 + }, + "GroupNorm_51_wts_7_1_51": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1920 + ], + "size_in_bytes": 3840, + "offset": 982374720, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_453.const", + "file_size": 3840 + }, + "NhwcConv_63_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 386560 + ], + "size_in_bytes": 386560, + "offset": 982378560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_454.const", + "file_size": 386560 + }, + "Sigmoid_38.weights10_40": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 982765120, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_455.const", + "file_size": 256 + }, + "up_blocks.3.resnets.0.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 3212800 + ], + "size_in_bytes": 3212800, + "offset": 982765376, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_456.const", + "file_size": 3212800 + }, + "GroupNorm_52_wts_7_1_52": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 985978176, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_457.const", + "file_size": 1280 + }, + "Sigmoid_39.weights10_41": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 985979456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_458.const", + "file_size": 256 + }, + "NhwcConv_64_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 985979712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_459.const", + "file_size": 1088000 + }, + "GroupNorm_53_wts_7_1_53": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 987067712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_460.const", + "file_size": 1280 + }, + "NhwcConv_65_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 987068992, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_461.const", + "file_size": 135680 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 987204672, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_462.const", + "file_size": 640 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 987205312, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_463.const", + "file_size": 640 + }, + "onnx::MatMul_6109": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 987205952, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_464.const", + "file_size": 117760 + }, + "onnx::MatMul_6108": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 987323712, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_465.const", + "file_size": 117760 + }, + "onnx::MatMul_6110": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 987441472, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_466.const", + "file_size": 117760 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/MatMulmha_0_26_mask.8_26": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 4096 + ], + "size_in_bytes": 8192, + "offset": 987559232, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_467.const", + "file_size": 8192 + }, + "onnx::MatMul_6130": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 987567424, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_468.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 987685184, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_469.const", + "file_size": 640 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 987685824, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_470.const", + "file_size": 640 + }, + "onnx::MatMul_6131": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 987686464, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_471.const", + "file_size": 117760 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/MatMulmha_0_27_mask.8_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 987804224, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_472.const", + "file_size": 512 + }, + "onnx::MatMul_6153": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 987804736, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_473.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 987922496, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_474.const", + "file_size": 640 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 987923136, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_475.const", + "file_size": 640 + }, + "onnx::MatMul_6154_2_13_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 987923776, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_476.const", + "file_size": 471040 + }, + "onnx::MatMul_6154_2_13_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "offset": 988394816, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_477.const", + "file_size": 473600 + }, + "onnx::MatMul_6155": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 988868416, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_478.const", + "file_size": 471040 + }, + "NhwcConv_66_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 989339456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_479.const", + "file_size": 135680 + }, + "GroupNorm_54_wts_7_1_54": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 989475136, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_480.const", + "file_size": 2560 + }, + "NhwcConv_67_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 271360 + ], + "size_in_bytes": 271360, + "offset": 989477696, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_481.const", + "file_size": 271360 + }, + "Sigmoid_40.weights10_42": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 989749056, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_482.const", + "file_size": 256 + }, + "up_blocks.3.resnets.1.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2176000 + ], + "size_in_bytes": 2176000, + "offset": 989749312, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_483.const", + "file_size": 2176000 + }, + "GroupNorm_55_wts_7_1_55": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 991925312, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_484.const", + "file_size": 1280 + }, + "Sigmoid_41.weights10_43": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 991926592, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_485.const", + "file_size": 256 + }, + "NhwcConv_68_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 991926848, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_486.const", + "file_size": 1088000 + }, + "GroupNorm_56_wts_7_1_56": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 993014848, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_487.const", + "file_size": 1280 + }, + "NhwcConv_69_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 993016128, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_488.const", + "file_size": 135680 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 993151808, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_489.const", + "file_size": 640 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 993152448, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_490.const", + "file_size": 640 + }, + "onnx::MatMul_6172": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 993153088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_491.const", + "file_size": 117760 + }, + "onnx::MatMul_6171": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 993270848, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_492.const", + "file_size": 117760 + }, + "onnx::MatMul_6173": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 993388608, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_493.const", + "file_size": 117760 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/MatMulmha_0_28_mask.8_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 4096 + ], + "size_in_bytes": 8192, + "offset": 993506368, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_494.const", + "file_size": 8192 + }, + "onnx::MatMul_6193": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 993514560, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_495.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 993632320, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_496.const", + "file_size": 640 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 993632960, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_497.const", + "file_size": 640 + }, + "onnx::MatMul_6194": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 993633600, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_498.const", + "file_size": 117760 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/MatMulmha_0_29_mask.8_29": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 993751360, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_499.const", + "file_size": 512 + }, + "onnx::MatMul_6216": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 993751872, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_500.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 993869632, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_501.const", + "file_size": 640 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 993870272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_502.const", + "file_size": 640 + }, + "onnx::MatMul_6217_2_14_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 993870912, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_503.const", + "file_size": 471040 + }, + "onnx::MatMul_6217_2_14_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "offset": 994341952, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_504.const", + "file_size": 473600 + }, + "onnx::MatMul_6218": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 994815552, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_505.const", + "file_size": 471040 + }, + "NhwcConv_70_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 995286592, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_506.const", + "file_size": 135680 + }, + "GroupNorm_57_wts_7_1_57": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "offset": 995422272, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_507.const", + "file_size": 2560 + }, + "NhwcConv_71_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 271360 + ], + "size_in_bytes": 271360, + "offset": 995424832, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_508.const", + "file_size": 271360 + }, + "Sigmoid_42.weights10_44": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 995696192, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_509.const", + "file_size": 256 + }, + "up_blocks.3.resnets.2.conv1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2176000 + ], + "size_in_bytes": 2176000, + "offset": 995696448, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_510.const", + "file_size": 2176000 + }, + "GroupNorm_58_wts_7_1_58": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 997872448, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_511.const", + "file_size": 1280 + }, + "Sigmoid_43.weights10_45": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 997873728, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_512.const", + "file_size": 256 + }, + "NhwcConv_72_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1088000 + ], + "size_in_bytes": 1088000, + "offset": 997873984, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_513.const", + "file_size": 1088000 + }, + "GroupNorm_59_wts_7_1_59": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 998961984, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_514.const", + "file_size": 1280 + }, + "NhwcConv_73_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 998963264, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_515.const", + "file_size": 135680 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 999098944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_516.const", + "file_size": 640 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 999099584, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_517.const", + "file_size": 640 + }, + "onnx::MatMul_6235": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 999100224, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_518.const", + "file_size": 117760 + }, + "onnx::MatMul_6234": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 999217984, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_519.const", + "file_size": 117760 + }, + "onnx::MatMul_6236": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 999335744, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_520.const", + "file_size": 117760 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/MatMulmha_0_30_mask.8_30": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 4096 + ], + "size_in_bytes": 8192, + "offset": 999453504, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_521.const", + "file_size": 8192 + }, + "onnx::MatMul_6256": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 999461696, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_522.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 999579456, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_523.const", + "file_size": 640 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 999580096, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_524.const", + "file_size": 640 + }, + "onnx::MatMul_6257": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 999580736, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_525.const", + "file_size": 117760 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/MatMulmha_0_31_mask.8_31": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 999698496, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_526.const", + "file_size": 512 + }, + "onnx::MatMul_6279": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "offset": 999699008, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_527.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 999816768, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_528.const", + "file_size": 640 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "offset": 999817408, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_529.const", + "file_size": 640 + }, + "onnx::MatMul_6280_2_15_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 999818048, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_530.const", + "file_size": 471040 + }, + "onnx::MatMul_6280_2_15_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "offset": 1000289088, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_531.const", + "file_size": 473600 + }, + "onnx::MatMul_6281": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "offset": 1000762688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_532.const", + "file_size": 471040 + }, + "NhwcConv_74_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 135680 + ], + "size_in_bytes": 135680, + "offset": 1001233728, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_533.const", + "file_size": 135680 + }, + "GroupNorm_60_wts_7_1_60": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "offset": 1001369408, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_534.const", + "file_size": 1280 + }, + "Sigmoid_44.weights10_46": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 1001370688, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_535.const", + "file_size": 256 + }, + "NhwcConv_75_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 54400 + ], + "size_in_bytes": 54400, + "offset": 1001370944, + "file_name": ".cache\\down_blocks.0attentions.0transformer_blocks.0attn2to_kMatMul_536.const", + "file_size": 54400 + } + }, + "aux_info": {} +} \ No newline at end of file