Upload folder using huggingface_hub

Browse files

Files changed (10)

config.json +1 -1
generation_config.json +2 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +71 -71
tokenizer.json +0 -0

config.json CHANGED Viewed

@@ -53,7 +53,7 @@
   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
-  "transformers_version": "4.32.0.dev0",
   "use_cache": true,
   "vocab_size": 65001
 }

   "scale_embedding": true,
   "share_encoder_decoder_embeddings": true,
   "static_position_embeddings": true,
+  "transformers_version": "4.34.0.dev0",
   "use_cache": true,
   "vocab_size": 65001
 }

generation_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "_from_model_config": true,
   "bad_words_ids": [
     [
       65000
@@ -12,5 +11,6 @@
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 65000,
-  "transformers_version": "4.32.0.dev0"
 }

 {
   "bad_words_ids": [
     [
       65000
   "max_length": 512,
   "num_beams": 4,
   "pad_token_id": 65000,
+  "renormalize_logits": true,
+  "transformers_version": "4.34.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4da2ebc17ce162357c04c25c32eb6084c0dfcd95b14dc559a757c8eb75040a04
-size 368725660

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab393f34abc9bae71ae77d2a182f77cf005952f85f797ef4fc89e1f4e487b10f
+size 235603669

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:328116e3814e87a9add8565e4d946fbb569d5aa61e0025078bd8ac0db0487241
-size 368961142

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef093b1e79a7fd68bdd884e2986a14614b9885cb5e1ced8a590df0ac241cde61
+size 235839236

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9f6f03ba3bd3ee4561aab1f3498ad84d35960765ff727e1f975ee32ba7815873
-size 93819732

 version https://git-lfs.github.com/spec/v1
+oid sha256:5c0d95a8072a463c747343cf25ac9b4a17e9a90e08131e7efab12691ca13c979
+size 60212803

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d64ef6ef74489ddd308ac0b467359de02791142e794774dbfba093107c5378e
-size 93448376

 version https://git-lfs.github.com/spec/v1
+oid sha256:955cc7be5a942ddef39e9721b7abd888837f41ba65983a86eb428b1bbf23e05c
+size 59842101

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af45f8d12a7784061292298cb38b7e9efc706c704098bde6cb231254681a146b
-size 356075151

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6c8c4448b8bfd45b33cbdf07120e62cf8f60b69c9e301de749952098b445413
+size 222953160

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6221accfbf793beedb15af5e75612b6bf8ad81bafc68d77f47f530f08f0a79ec
-size 90176912

 version https://git-lfs.github.com/spec/v1
+oid sha256:2e28a6de8ad245fd27673d676ab8ee54e3fdb24a32cb634877f906f4d2939bac
+size 56570637

quantize_config.json CHANGED Viewed

@@ -4,120 +4,120 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "Constant",
-                "Range",
-                "Pow",
-                "Div",
-                "ReduceMean",
                 "Reshape",
                 "Gather",
                 "Equal",
-                "Softmax",
-                "ConstantOfShape",
                 "Cast",
-                "Transpose",
                 "Add",
-                "Sqrt",
-                "Shape",
-                "Sigmoid",
-                "Unsqueeze",
-                "Mul",
-                "Sub",
-                "Where",
                 "MatMul",
                 "Expand",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Constant",
-                "Range",
-                "Pow",
-                "Div",
-                "ReduceMean",
                 "Reshape",
                 "Gather",
                 "Equal",
-                "Softmax",
-                "ConstantOfShape",
                 "Cast",
-                "Transpose",
                 "Add",
-                "Sqrt",
-                "Shape",
-                "Sigmoid",
-                "Unsqueeze",
-                "Mul",
-                "Sub",
-                "Where",
                 "MatMul",
                 "Expand",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model": {
             "op_types": [
-                "Constant",
                 "Range",
-                "Pow",
                 "Squeeze",
-                "Less",
-                "Slice",
                 "Div",
-                "Gather",
-                "Reshape",
-                "ReduceMean",
                 "Equal",
-                "Softmax",
-                "ConstantOfShape",
                 "Cast",
-                "Transpose",
                 "Add",
-                "Sqrt",
-                "Shape",
-                "Sigmoid",
-                "Unsqueeze",
-                "Mul",
-                "Sub",
-                "Where",
                 "MatMul",
                 "Expand",
-                "Concat"
             ],
             "weight_type": "QInt8"
         },
-        "decoder_model_merged": {
             "op_types": [
-                "Constant",
-                "If",
                 "Range",
-                "Pow",
                 "Squeeze",
-                "Less",
-                "Slice",
                 "Div",
-                "Gather",
-                "Reshape",
-                "ReduceMean",
                 "Equal",
-                "Softmax",
-                "ConstantOfShape",
                 "Cast",
-                "Transpose",
                 "Add",
-                "Sqrt",
-                "Shape",
-                "Sigmoid",
-                "Unsqueeze",
-                "Mul",
-                "Sub",
-                "Where",
                 "MatMul",
                 "Expand",
-                "Concat"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Sigmoid",
                 "Reshape",
+                "Range",
+                "Sqrt",
+                "Where",
+                "Unsqueeze",
+                "Constant",
                 "Gather",
+                "Div",
+                "Shape",
+                "Pow",
                 "Equal",
+                "ReduceMean",
+                "Mul",
                 "Cast",
                 "Add",
                 "MatMul",
+                "Softmax",
+                "Sub",
+                "Concat",
                 "Expand",
+                "Transpose",
+                "ConstantOfShape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Sigmoid",
                 "Reshape",
+                "Range",
+                "Sqrt",
+                "Where",
+                "Unsqueeze",
+                "Constant",
                 "Gather",
+                "Div",
+                "Shape",
+                "Pow",
                 "Equal",
+                "ReduceMean",
+                "Mul",
                 "Cast",
                 "Add",
                 "MatMul",
+                "Softmax",
+                "Sub",
+                "Concat",
                 "Expand",
+                "Transpose",
+                "ConstantOfShape"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model_merged": {
             "op_types": [
+                "Sigmoid",
+                "Reshape",
                 "Range",
+                "Sqrt",
+                "Where",
+                "Unsqueeze",
+                "Constant",
+                "Gather",
                 "Squeeze",
                 "Div",
+                "If",
+                "Shape",
+                "Pow",
                 "Equal",
+                "ReduceMean",
+                "Slice",
+                "Less",
+                "Mul",
                 "Cast",
                 "Add",
                 "MatMul",
+                "Softmax",
+                "Sub",
+                "Concat",
                 "Expand",
+                "Transpose",
+                "ConstantOfShape"
             ],
             "weight_type": "QInt8"
         },
+        "decoder_model": {
             "op_types": [
+                "Sigmoid",
+                "Reshape",
                 "Range",
+                "Sqrt",
+                "Where",
+                "Unsqueeze",
+                "Constant",
+                "Gather",
                 "Squeeze",
                 "Div",
+                "Shape",
+                "Pow",
                 "Equal",
+                "ReduceMean",
+                "Slice",
+                "Less",
+                "Mul",
                 "Cast",
                 "Add",
                 "MatMul",
+                "Softmax",
+                "Sub",
+                "Concat",
                 "Expand",
+                "Transpose",
+                "ConstantOfShape"
             ],
             "weight_type": "QInt8"
         }

tokenizer.json CHANGED Viewed

The diff for this file is too large to render; see the raw diff.