Upload folder using huggingface_hub

Files changed (14) hide show

decoder_model.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d24bcccc1112825def21cf4241933aae2c89187b3663928e9a083faeaed92249
-size 5437678

decoder_model.onnx_data DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:58e859c15c13e65b9a5478e3a4e3dc81f5b0d5500d5d18c942064a447f6af150
-size 26953662464

decoder_model_merged.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:48a4703bff0b9eff305ece6e15f20ab52d52d48eccaa28bbb2159f38cebeacc4
-size 10888493

decoder_model_merged.onnx_data DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:58e859c15c13e65b9a5478e3a4e3dc81f5b0d5500d5d18c942064a447f6af150
-size 26953662464

decoder_model_merged_quantized.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f1266c653f7026aa4126cac8eadae4eb82e617e37ed65cd60bfda5a490dcd305
-size 19045741

decoder_model_merged_quantized.onnx_data DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:0f57f92dce820666b27faace4a325a7d8d41691b4f9d3e3540ba70e696b42a06
-size 6739214336

decoder_with_past_model.onnx DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:4425410e11031c394eb76701bc8c82c0fdf74273934e62d6028d9d3242a67ce7
-size 5471136

decoder_with_past_model.onnx_data DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:58e859c15c13e65b9a5478e3a4e3dc81f5b0d5500d5d18c942064a447f6af150
-size 26953662464

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:97ef03e1d46da5972d3324761e9b16a43112bb48a7eaa62658d2a4e2141b370f
-size 19048364

 version https://git-lfs.github.com/spec/v1
+oid sha256:f1266c653f7026aa4126cac8eadae4eb82e617e37ed65cd60bfda5a490dcd305
+size 19045741

onnx/decoder_model_merged_quantized.onnx_data CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dab778698ac3bc754db6291ecc0c43d92278f6a69a7d5d006e39a4e98349c2b8
 size 6739214336

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f57f92dce820666b27faace4a325a7d8d41691b4f9d3e3540ba70e696b42a06
 size 6739214336

{q1 → onnx/q1}/decoder_model_merged_quantized.onnx RENAMED Viewed

File without changes

{q1 → onnx/q1}/decoder_model_merged_quantized.onnx_data RENAMED Viewed

File without changes

onnx/quantize_config.json ADDED Viewed

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "use_external_data_format": true,
+    "per_model_config": {
+        "decoder_model_merged": {
+            "op_types": [
+                "Concat",
+                "Transpose",
+                "Neg",
+                "Sigmoid",
+                "ReduceMean",
+                "Identity",
+                "Expand",
+                "Shape",
+                "Equal",
+                "Sqrt",
+                "Range",
+                "Where",
+                "Gather",
+                "Pow",
+                "Constant",
+                "Sub",
+                "Less",
+                "Div",
+                "MatMul",
+                "Cast",
+                "Unsqueeze",
+                "If",
+                "Softmax",
+                "Add",
+                "ConstantOfShape",
+                "Squeeze",
+                "Mul",
+                "Reshape",
+                "Slice"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

quantize_config.json CHANGED Viewed

@@ -5,34 +5,34 @@
     "per_model_config": {
         "decoder_model_merged": {
             "op_types": [
-                "Concat",
-                "Transpose",
-                "Neg",
                 "Sigmoid",
-                "ReduceMean",
-                "Identity",
-                "Expand",
-                "Shape",
-                "Equal",
-                "Sqrt",
-                "Range",
-                "Where",
-                "Gather",
-                "Pow",
-                "Constant",
-                "Sub",
-                "Less",
                 "Div",
                 "MatMul",
                 "Cast",
                 "Unsqueeze",
-                "If",
                 "Softmax",
-                "Add",
-                "ConstantOfShape",
                 "Squeeze",
-                "Mul",
-                "Reshape",
                 "Slice"
             ],
             "weight_type": "QInt8"

     "per_model_config": {
         "decoder_model_merged": {
             "op_types": [
                 "Sigmoid",
+                "If",
+                "Reshape",
                 "Div",
                 "MatMul",
                 "Cast",
+                "ConstantOfShape",
+                "Constant",
+                "Neg",
+                "Gather",
+                "Mul",
+                "Add",
+                "Where",
+                "Less",
+                "Expand",
+                "Concat",
+                "Sub",
+                "Equal",
                 "Unsqueeze",
+                "Pow",
+                "Sqrt",
+                "Transpose",
                 "Softmax",
+                "Identity",
+                "Range",
+                "Shape",
                 "Squeeze",
+                "ReduceMean",
                 "Slice"
             ],
             "weight_type": "QInt8"