Upload folder using huggingface_hub

Browse files

Files changed (10)

config.json +2 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +139 -0
tokenizer_config.json +1 -0

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "MT5ForConditionalGeneration"
   ],
   "d_ff": 1024,
   "d_kv": 64,
   "d_model": 512,
@@ -24,7 +25,7 @@
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
   "tokenizer_class": "T5Tokenizer",
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 250112
 }

   "architectures": [
     "MT5ForConditionalGeneration"
   ],
+  "classifier_dropout": 0.0,
   "d_ff": 1024,
   "d_kv": 64,
   "d_model": 512,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
   "tokenizer_class": "T5Tokenizer",
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 250112
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.29.2"
 }

   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58fb09e90e612342c6134ea6cfb3d373a0c0a3830d0151b62374342e9b19d338
-size 1125416416

 version https://git-lfs.github.com/spec/v1
+oid sha256:701b93c03fdcc3c243fd7a8be4b3373eaf80a4b7878ab5f6472b34fc6faf4ea5
+size 1125416109

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d575c570aa9cee2a91c4dfe39df28236ef7b1bc78a24c665d409953bdaf3dd6
-size 1125647482

 version https://git-lfs.github.com/spec/v1
+oid sha256:37907b00bbf37057c8a6443d02461dd9330db268beb2233ad113a65a6fe23d93
+size 1125646795

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e11ff57dbcb4e64ff79786549502179af3591cc7f90eba50e3e5cfee4f186492
-size 283645709

 version https://git-lfs.github.com/spec/v1
+oid sha256:61b2e843dd174874268cccd17aa1f6445bcd739af98507b2ac4758bd81c1c9be
+size 283644868

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:37e433df2928d430614db560b90c989c568374e776b3767fabadf409c0d5757c
-size 283249243

 version https://git-lfs.github.com/spec/v1
+oid sha256:69e0a3e53dad4cf0702233e991490d3f359188122e20bbf04b67244d15a042b4
+size 283248855

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e0c8eb8670ff73978a1e048da89bbd5acab340ae7b5e002d69664b779e4a63db
-size 1112816728

 version https://git-lfs.github.com/spec/v1
+oid sha256:755bcd2d76017e69dea38bb864d7d2a0d0f3808481dd57206907bd411c41516e
+size 1112816423

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a949cad5bf7ae4f7bf9163e2b509991979914d036ff5ada8a11bd0fadf2a02eb
-size 280035095

 version https://git-lfs.github.com/spec/v1
+oid sha256:89c588bf6fa8b168a6d2c780a854bc192ff994ae6a65006946415abd372410af
+size 280034718

quantize_config.json ADDED Viewed

@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Tile",
+                "MatMul",
+                "ConstantOfShape",
+                "Sub",
+                "Expand",
+                "Cast",
+                "LessOrEqual",
+                "Log",
+                "Sqrt",
+                "Less",
+                "Tanh",
+                "Shape",
+                "Neg",
+                "Mul",
+                "Softmax",
+                "Constant",
+                "Pow",
+                "Reshape",
+                "ReduceMean",
+                "Gather",
+                "Add",
+                "Where",
+                "Transpose",
+                "Concat",
+                "Range",
+                "Div",
+                "Unsqueeze",
+                "Min"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "MatMul",
+                "ConstantOfShape",
+                "Sub",
+                "Cast",
+                "Log",
+                "Sqrt",
+                "Less",
+                "Tanh",
+                "Shape",
+                "Mul",
+                "Softmax",
+                "Constant",
+                "Pow",
+                "Reshape",
+                "ReduceMean",
+                "Gather",
+                "Add",
+                "Where",
+                "Transpose",
+                "Concat",
+                "Range",
+                "Div",
+                "Unsqueeze",
+                "Min",
+                "Abs",
+                "Greater"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Tile",
+                "MatMul",
+                "ConstantOfShape",
+                "Sub",
+                "Expand",
+                "Cast",
+                "LessOrEqual",
+                "Log",
+                "Sqrt",
+                "Less",
+                "Tanh",
+                "Shape",
+                "Neg",
+                "Mul",
+                "If",
+                "Softmax",
+                "Constant",
+                "Slice",
+                "Pow",
+                "Reshape",
+                "ReduceMean",
+                "Gather",
+                "Add",
+                "Where",
+                "Transpose",
+                "Concat",
+                "Range",
+                "Div",
+                "Unsqueeze",
+                "Min"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Tile",
+                "MatMul",
+                "ConstantOfShape",
+                "Sub",
+                "Expand",
+                "Cast",
+                "LessOrEqual",
+                "Log",
+                "Sqrt",
+                "Less",
+                "Tanh",
+                "Shape",
+                "Neg",
+                "Mul",
+                "Softmax",
+                "Constant",
+                "Slice",
+                "Pow",
+                "Reshape",
+                "ReduceMean",
+                "Gather",
+                "Add",
+                "Where",
+                "Transpose",
+                "Concat",
+                "Range",
+                "Div",
+                "Unsqueeze",
+                "Min"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

tokenizer_config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 0,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 0,
+  "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},