spolivin commited on
Commit
d43ffba
1 Parent(s): 2a84090

Upload quantize_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. quantize_config.json +35 -0
quantize_config.json ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Unsqueeze",
8
+ "Div",
9
+ "Conv",
10
+ "Mul",
11
+ "MatMul",
12
+ "ConstantOfShape",
13
+ "Expand",
14
+ "Equal",
15
+ "Where",
16
+ "Sqrt",
17
+ "Sub",
18
+ "Add",
19
+ "Slice",
20
+ "Shape",
21
+ "Gather",
22
+ "ReduceMean",
23
+ "Softmax",
24
+ "Pow",
25
+ "Constant",
26
+ "Concat",
27
+ "Transpose",
28
+ "Gemm",
29
+ "Reshape",
30
+ "Erf"
31
+ ],
32
+ "weight_type": "QUInt8"
33
+ }
34
+ }
35
+ }