karming-wan committed on
Commit
67fe56c
·
1 Parent(s): ba8902f

qconfig.weights_dtype = QuantType.QUInt8

Browse files
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ece90752365fc7744870a223a3d0ab2132e17c3256f17c0cb3ab9c1a3c1fd122
3
- size 9588132
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2052543792a2e3fa2b9cda3a2bba1479f60c7a412b42b2728c766a299c9a83a2
3
+ size 9588203
quantize_config.json CHANGED
@@ -27,7 +27,7 @@
27
  "MatMul": 1
28
  },
29
  "reduce_range": false,
30
- "weights_dtype": "QInt8",
31
  "weights_symmetric": true
32
  },
33
  "transformers_version": "4.35.2",
 
27
  "MatMul": 1
28
  },
29
  "reduce_range": false,
30
+ "weights_dtype": "QUInt8",
31
  "weights_symmetric": true
32
  },
33
  "transformers_version": "4.35.2",