Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +1 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +83 -83

config.json CHANGED Viewed

@@ -54,7 +54,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 53685
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 53685
 }

generation_config.json CHANGED Viewed

@@ -12,5 +12,5 @@
   "num_beams": 4,
   "pad_token_id": 53684,
   "renormalize_logits": true,
-  "transformers_version": "4.33.0.dev0"
 }

   "num_beams": 4,
   "pad_token_id": 53684,
   "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2f0d893453f8a43d23b576dd6bf3fa1115f1518e3b91d9c40c14dbccb43b7343
-size 322330060

 version https://git-lfs.github.com/spec/v1
+oid sha256:6749fbaa057790f6aa24044d6c4c8e9e9866c4c09643c7a626a212423ef62ef6
+size 212383237

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f01ded3e54e0bd052238352ffd14242b6a59a843fa1a6c51413ea4f232c3f1
-size 322565542

 version https://git-lfs.github.com/spec/v1
+oid sha256:baf572c55c5201340cd91802ae3c3032c8dfcdc7f25ed27446a6a644cffce622
+size 212618804

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1db1532aa7e2ac44e4fc4b5b7a239133c13589aff7ae5af2ebe9ef1df812a123
-size 82130305

 version https://git-lfs.github.com/spec/v1
+oid sha256:1cfc6a84f9c189e6928c9710b281fae3f1f42d4ffbba109e7b4ec8e31ceb06dd
+size 54373748

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7e20ba038bf624f634480c1ad20e466d8b2c83d976ff97040df0af794004632e
-size 81758949

 version https://git-lfs.github.com/spec/v1
+oid sha256:cde3e02aaca72cfaf2267f6c31c4dcc1b323d769bf90c273f2a1c1d56198ddba
+size 54003046

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:283f351d005aba8e3922fed2d646f898dadbed4809602d62469f9ed4e6b62eba
-size 309679551

 version https://git-lfs.github.com/spec/v1
+oid sha256:3efadf66d7039a6a5c42f565f9e99ac1f270f46535ab7363e0004ec635891b4d
+size 199732728

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e6bcc438c2493a8e6aaa818acf203ddd2884785fcbc9ab711fcdba4d29c4aa25
-size 78487485

 version https://git-lfs.github.com/spec/v1
+oid sha256:e8f3945a5b393a3533930f920d0e98c5cb4d3804646611534360aa918b2489f2
+size 50731582

quantize_config.json CHANGED Viewed

@@ -2,122 +2,122 @@
     "per_channel": true,
     "reduce_range": true,
     "per_model_config": {
-        "decoder_model_merged": {
             "op_types": [
-                "Sqrt",
-                "Equal",
-                "Cast",
-                "Mul",
-                "Slice",
-                "Gather",
-                "Constant",
-                "ReduceMean",
-                "Div",
-                "Squeeze",
-                "MatMul",
-                "ConstantOfShape",
-                "Reshape",
                 "Pow",
-                "Transpose",
-                "Range",
-                "Sub",
                 "Shape",
-                "If",
-                "Unsqueeze",
                 "Concat",
                 "Add",
                 "Where",
                 "Less",
-                "Sigmoid",
-                "Expand",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Sqrt",
-                "Equal",
-                "Cast",
-                "Mul",
-                "Slice",
-                "Gather",
-                "Constant",
-                "ReduceMean",
-                "Div",
-                "Squeeze",
-                "MatMul",
-                "ConstantOfShape",
-                "Reshape",
                 "Pow",
-                "Transpose",
-                "Range",
-                "Sub",
                 "Shape",
-                "Unsqueeze",
                 "Concat",
                 "Add",
-                "Where",
-                "Less",
-                "Sigmoid",
                 "Expand",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_with_past_model": {
             "op_types": [
-                "Sqrt",
-                "Equal",
-                "Cast",
-                "Mul",
-                "Gather",
-                "Constant",
-                "ReduceMean",
-                "Div",
-                "MatMul",
-                "ConstantOfShape",
-                "Reshape",
                 "Pow",
-                "Transpose",
-                "Range",
-                "Sub",
                 "Shape",
-                "Unsqueeze",
                 "Concat",
                 "Add",
-                "Where",
-                "Sigmoid",
                 "Expand",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
-        "encoder_model": {
             "op_types": [
-                "Sqrt",
-                "Equal",
-                "Cast",
-                "Mul",
-                "Gather",
-                "Constant",
-                "ReduceMean",
-                "Div",
-                "MatMul",
-                "ConstantOfShape",
-                "Reshape",
                 "Pow",
-                "Transpose",
-                "Range",
-                "Sub",
                 "Shape",
-                "Unsqueeze",
-                "Concat",
                 "Add",
-                "Where",
-                "Sigmoid",
                 "Expand",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         }

     "per_channel": true,
     "reduce_range": true,
     "per_model_config": {
+        "decoder_model": {
             "op_types": [
                 "Pow",
                 "Shape",
+                "ReduceMean",
+                "Mul",
+                "Reshape",
                 "Concat",
                 "Add",
+                "Sqrt",
+                "Sub",
+                "Slice",
+                "Div",
+                "Cast",
+                "Expand",
                 "Where",
+                "Range",
+                "Softmax",
+                "MatMul",
+                "Unsqueeze",
+                "Transpose",
+                "Squeeze",
+                "ConstantOfShape",
                 "Less",
+                "Gather",
+                "Equal",
+                "Constant",
+                "Sigmoid"
             ],
             "weight_type": "QInt8"
         },
+        "encoder_model": {
             "op_types": [
                 "Pow",
                 "Shape",
+                "ReduceMean",
+                "Mul",
+                "Reshape",
                 "Concat",
                 "Add",
+                "Sqrt",
+                "Sub",
+                "Div",
+                "Cast",
                 "Expand",
+                "Where",
+                "Range",
+                "Softmax",
+                "MatMul",
+                "Unsqueeze",
+                "Transpose",
+                "ConstantOfShape",
+                "Gather",
+                "Equal",
+                "Constant",
+                "Sigmoid"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
                 "Pow",
                 "Shape",
+                "ReduceMean",
+                "Mul",
+                "Reshape",
                 "Concat",
                 "Add",
+                "Sqrt",
+                "Sub",
+                "Slice",
+                "Div",
+                "Cast",
                 "Expand",
+                "Where",
+                "Range",
+                "Softmax",
+                "MatMul",
+                "Unsqueeze",
+                "Transpose",
+                "Squeeze",
+                "If",
+                "ConstantOfShape",
+                "Less",
+                "Gather",
+                "Equal",
+                "Constant",
+                "Sigmoid"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_with_past_model": {
             "op_types": [
                 "Pow",
                 "Shape",
+                "ReduceMean",
+                "Mul",
+                "Reshape",
                 "Add",
+                "Concat",
+                "Sqrt",
+                "Sub",
+                "Div",
+                "Cast",
                 "Expand",
+                "Where",
+                "Range",
+                "Softmax",
+                "MatMul",
+                "Unsqueeze",
+                "Transpose",
+                "ConstantOfShape",
+                "Gather",
+                "Equal",
+                "Constant",
+                "Sigmoid"
             ],
             "weight_type": "QInt8"
         }