Upload folder using huggingface_hub

Browse files

Files changed (8) hide show

onnx/model.onnx +3 -0
onnx/model_bnb4.onnx +3 -0
onnx/model_fp16.onnx +3 -0
onnx/model_int8.onnx +3 -0
onnx/model_q4.onnx +3 -0
onnx/model_quantized.onnx +3 -0
onnx/model_uint8.onnx +3 -0
quantize_config.json +129 -0

onnx/model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:30b37c72933c37c1dcbbd58abf613845ace73fef92e8dec4ff78903a03aaa881
+size 176581010

onnx/model_bnb4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb4f3688801b2996b76f708e4d5625c2d669ff254a78428f839f594ad49bf290
+size 146085627

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3216c0aa38d61b9e59659e737d5c5f2a966f65bfeafd5913ef1d3d8fb4fa3d81
+size 88576823

onnx/model_int8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d49e880a41129d2f442b92bf95dc914826b0c3169a62ee55c83ec8f8fce6e1fd
+size 45391656

onnx/model_q4.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f20615398dceb5aa47d6b35d36fec990cda2d647ac4682ed3cc9f94b9ae85c5f
+size 146640027

onnx/model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7595346cadedf91130719b87bff3073eff181c3fdd1e63f62310de4c6895ba40
+size 45391749

onnx/model_uint8.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7595346cadedf91130719b87bff3073eff181c3fdd1e63f62310de4c6895ba40
+size 45391749

quantize_config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gather",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "MatMul",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gather",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "MatMul",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "BatchNormalization",
+                    "Cast",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Flatten",
+                    "Gather",
+                    "Gemm",
+                    "GlobalAveragePool",
+                    "Identity",
+                    "MatMul",
+                    "Mul",
+                    "ReduceMean",
+                    "Relu",
+                    "Reshape",
+                    "Shape",
+                    "Sigmoid",
+                    "Slice",
+                    "Softmax",
+                    "Split",
+                    "Sqrt",
+                    "Squeeze",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
+    }
+}