youfengy committed on
Commit
6082038
·
verified ·
1 Parent(s): fe93ef8

Upload 15 files

Browse files
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f02dbc32615cb67509fc56a8b632cd089ce83763c4fdd0684a0db2ea75d6d92e
3
  size 166670441
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b17677a8e52be9f0a924f0e45f4c160aa5b90df9f8b5ea56ec37318f6b645044
3
  size 166670441
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7f873f936a3df005ec66a0bdb59ec46867abee46299d851931ac58a8e50ff51
3
  size 166832634
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a5d16285704a1c060d4f88ed78c981647d27e8663b5fccf7d853f00b3a3bcaa
3
  size 166832634
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:360c22e8d266e3c78e33f8a6fd84aeb6888bd4f6bc0f89bc4f6e3313a97f00a5
3
  size 42431444
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85822fdb4b29ab4b628f1028d4c488030b08eed68bbe37eadc6df9f72587ca19
3
  size 42431444
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7f3596e68f9fbd78d88a2d74b31781feb01f9d3a815f058ab0e36434f8c9fd1
3
  size 42154677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee7220db64f55f166559461cffc2141468af4615da0543bf659f65442e9fe17c
3
  size 42154677
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b661a1113f4ff1449cf633aa8f68c15ddb16b6d2df57e898b59a9b5f40fa00cf
3
  size 154076576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56b85be5d484a1ea402fb68ee70cb9f10a8ebf31db582f4650c04c24d7d36aa5
3
  size 154076576
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3608448e65af845b3a34d6fbaed226ffc4f8b774cf969777a024929636a6fe11
3
  size 38952139
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1412f385659a38913bb1c366f58dfd817f752283f911b64b7320d22c9a4973d5
3
  size 38952139
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2816dcb1b5df89b4c5099288652d25850ccf10d2bce626fe29166c02c4da8ec
3
  size 141404308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bd48a64d314c8f74e541b676bbe9847ec4a24796a095b12e67fee6dda596cc5
3
  size 141404308
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2615f0642add5ca2a89c7a748823ead83c9ef895600d312a25f850c435e60326
3
  size 35640025
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:991e20004a6478ca0388c048dd6c440ea8f7c42208576519761146bdd3b20974
3
  size 35640025
quantize_config.json CHANGED
@@ -4,134 +4,134 @@
4
  "per_model_config": {
5
  "decoder_model": {
6
  "op_types": [
7
- "Mul",
8
- "Pow",
9
- "Softmax",
10
- "Reshape",
11
- "Min",
12
- "Less",
13
- "ConstantOfShape",
14
- "Div",
15
- "MatMul",
16
  "Unsqueeze",
17
- "Range",
18
- "Gather",
 
 
19
  "Shape",
20
  "Tile",
21
- "ReduceMean",
22
- "LessOrEqual",
23
- "Sub",
24
- "Sqrt",
25
  "Cast",
 
26
  "Where",
27
- "Log",
 
28
  "Add",
 
 
 
 
29
  "Relu",
30
- "Transpose",
31
- "Expand",
 
 
32
  "Neg",
33
- "Constant",
34
- "Concat"
 
35
  ],
36
  "weight_type": "QInt8"
37
  },
38
  "decoder_model_merged": {
39
  "op_types": [
40
- "Mul",
41
- "Pow",
42
- "Softmax",
43
  "Reshape",
44
- "Min",
45
- "Less",
46
- "ConstantOfShape",
47
- "Div",
48
- "MatMul",
49
  "Slice",
50
- "Unsqueeze",
51
- "Range",
52
- "Gather",
53
  "Shape",
 
54
  "Tile",
55
- "ReduceMean",
56
- "LessOrEqual",
57
- "Sub",
58
- "Sqrt",
59
  "Cast",
 
60
  "Where",
61
- "Log",
62
- "If",
63
  "Add",
 
 
 
 
64
  "Relu",
65
- "Transpose",
66
- "Expand",
 
 
67
  "Neg",
68
- "Constant",
69
- "Concat"
 
70
  ],
71
  "weight_type": "QInt8"
72
  },
73
  "decoder_with_past_model": {
74
  "op_types": [
75
- "Mul",
76
- "Pow",
77
- "Softmax",
78
  "Reshape",
79
- "Min",
80
- "Less",
81
- "ConstantOfShape",
82
- "Div",
83
- "MatMul",
84
  "Slice",
85
- "Unsqueeze",
86
- "Range",
87
- "Gather",
88
  "Shape",
89
  "Tile",
90
- "ReduceMean",
91
- "LessOrEqual",
92
- "Sub",
93
- "Sqrt",
94
  "Cast",
 
95
  "Where",
96
- "Log",
 
97
  "Add",
 
 
 
 
98
  "Relu",
99
- "Transpose",
100
- "Expand",
 
 
101
  "Neg",
102
- "Constant",
103
- "Concat"
 
104
  ],
105
  "weight_type": "QInt8"
106
  },
107
  "encoder_model": {
108
  "op_types": [
109
- "Mul",
110
- "Pow",
111
- "Softmax",
112
- "Reshape",
113
- "Min",
114
- "Less",
115
- "ConstantOfShape",
116
- "Div",
117
- "MatMul",
118
  "Unsqueeze",
119
- "Range",
120
- "Gather",
121
- "Shape",
122
- "ReduceMean",
123
- "Sub",
124
  "Sqrt",
 
 
125
  "Abs",
 
 
 
126
  "Cast",
 
127
  "Where",
128
- "Log",
 
129
  "Add",
130
- "Relu",
131
- "Greater",
132
- "Transpose",
133
  "Constant",
134
- "Concat"
 
 
 
 
 
 
 
 
 
135
  ],
136
  "weight_type": "QInt8"
137
  }
 
4
  "per_model_config": {
5
  "decoder_model": {
6
  "op_types": [
 
 
 
 
 
 
 
 
 
7
  "Unsqueeze",
8
+ "Sqrt",
9
+ "ReduceMean",
10
+ "Reshape",
11
+ "Expand",
12
  "Shape",
13
  "Tile",
14
+ "Transpose",
15
+ "Gather",
 
 
16
  "Cast",
17
+ "Range",
18
  "Where",
19
+ "ConstantOfShape",
20
+ "Concat",
21
  "Add",
22
+ "Constant",
23
+ "Sub",
24
+ "Pow",
25
+ "Less",
26
  "Relu",
27
+ "Log",
28
+ "Div",
29
+ "Mul",
30
+ "MatMul",
31
  "Neg",
32
+ "Softmax",
33
+ "LessOrEqual",
34
+ "Min"
35
  ],
36
  "weight_type": "QInt8"
37
  },
38
  "decoder_model_merged": {
39
  "op_types": [
40
+ "Unsqueeze",
41
+ "Sqrt",
42
+ "ReduceMean",
43
  "Reshape",
 
 
 
 
 
44
  "Slice",
45
+ "Expand",
 
 
46
  "Shape",
47
+ "If",
48
  "Tile",
49
+ "Transpose",
50
+ "Gather",
 
 
51
  "Cast",
52
+ "Range",
53
  "Where",
54
+ "ConstantOfShape",
55
+ "Concat",
56
  "Add",
57
+ "Constant",
58
+ "Sub",
59
+ "Pow",
60
+ "Less",
61
  "Relu",
62
+ "Log",
63
+ "Div",
64
+ "Mul",
65
+ "MatMul",
66
  "Neg",
67
+ "Softmax",
68
+ "LessOrEqual",
69
+ "Min"
70
  ],
71
  "weight_type": "QInt8"
72
  },
73
  "decoder_with_past_model": {
74
  "op_types": [
75
+ "Unsqueeze",
76
+ "Sqrt",
77
+ "ReduceMean",
78
  "Reshape",
 
 
 
 
 
79
  "Slice",
80
+ "Expand",
 
 
81
  "Shape",
82
  "Tile",
83
+ "Transpose",
84
+ "Gather",
 
 
85
  "Cast",
86
+ "Range",
87
  "Where",
88
+ "ConstantOfShape",
89
+ "Concat",
90
  "Add",
91
+ "Constant",
92
+ "Sub",
93
+ "Pow",
94
+ "Less",
95
  "Relu",
96
+ "Log",
97
+ "Div",
98
+ "Mul",
99
+ "MatMul",
100
  "Neg",
101
+ "Softmax",
102
+ "LessOrEqual",
103
+ "Min"
104
  ],
105
  "weight_type": "QInt8"
106
  },
107
  "encoder_model": {
108
  "op_types": [
109
+ "Greater",
 
 
 
 
 
 
 
 
110
  "Unsqueeze",
 
 
 
 
 
111
  "Sqrt",
112
+ "ReduceMean",
113
+ "Reshape",
114
  "Abs",
115
+ "Shape",
116
+ "Transpose",
117
+ "Gather",
118
  "Cast",
119
+ "Range",
120
  "Where",
121
+ "ConstantOfShape",
122
+ "Concat",
123
  "Add",
 
 
 
124
  "Constant",
125
+ "Sub",
126
+ "Pow",
127
+ "Less",
128
+ "Relu",
129
+ "Log",
130
+ "Div",
131
+ "Mul",
132
+ "MatMul",
133
+ "Softmax",
134
+ "Min"
135
  ],
136
  "weight_type": "QInt8"
137
  }