qconfig.weights_dtype = QuantType.QUInt8

Files changed (2)

onnx/model_quantized.onnx CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ece90752365fc7744870a223a3d0ab2132e17c3256f17c0cb3ab9c1a3c1fd122
-size 9588132

 version https://git-lfs.github.com/spec/v1
+oid sha256:2052543792a2e3fa2b9cda3a2bba1479f60c7a412b42b2728c766a299c9a83a2
+size 9588203

quantize_config.json CHANGED

@@ -27,7 +27,7 @@
       "MatMul": 1
     },
     "reduce_range": false,
-    "weights_dtype": "QInt8",
     "weights_symmetric": true
   },
   "transformers_version": "4.35.2",

       "MatMul": 1
     },
     "reduce_range": false,
+    "weights_dtype": "QUInt8",
     "weights_symmetric": true
   },
   "transformers_version": "4.35.2",