Xenova HF staff committed on
Commit
c35ee1c
·
1 Parent(s): 79ee17d

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -53,7 +53,7 @@
53
  "scale_embedding": true,
54
  "share_encoder_decoder_embeddings": true,
55
  "static_position_embeddings": true,
56
- "transformers_version": "4.32.0.dev0",
57
  "use_cache": true,
58
  "vocab_size": 65001
59
  }
 
53
  "scale_embedding": true,
54
  "share_encoder_decoder_embeddings": true,
55
  "static_position_embeddings": true,
56
+ "transformers_version": "4.34.0.dev0",
57
  "use_cache": true,
58
  "vocab_size": 65001
59
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  65000
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 4,
14
  "pad_token_id": 65000,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  65000
 
11
  "max_length": 512,
12
  "num_beams": 4,
13
  "pad_token_id": 65000,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4da2ebc17ce162357c04c25c32eb6084c0dfcd95b14dc559a757c8eb75040a04
3
- size 368725660
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab393f34abc9bae71ae77d2a182f77cf005952f85f797ef4fc89e1f4e487b10f
3
+ size 235603669
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:328116e3814e87a9add8565e4d946fbb569d5aa61e0025078bd8ac0db0487241
3
- size 368961142
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef093b1e79a7fd68bdd884e2986a14614b9885cb5e1ced8a590df0ac241cde61
3
+ size 235839236
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f6f03ba3bd3ee4561aab1f3498ad84d35960765ff727e1f975ee32ba7815873
3
- size 93819732
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c0d95a8072a463c747343cf25ac9b4a17e9a90e08131e7efab12691ca13c979
3
+ size 60212803
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d64ef6ef74489ddd308ac0b467359de02791142e794774dbfba093107c5378e
3
- size 93448376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955cc7be5a942ddef39e9721b7abd888837f41ba65983a86eb428b1bbf23e05c
3
+ size 59842101
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af45f8d12a7784061292298cb38b7e9efc706c704098bde6cb231254681a146b
3
- size 356075151
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c8c4448b8bfd45b33cbdf07120e62cf8f60b69c9e301de749952098b445413
3
+ size 222953160
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6221accfbf793beedb15af5e75612b6bf8ad81bafc68d77f47f530f08f0a79ec
3
- size 90176912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e28a6de8ad245fd27673d676ab8ee54e3fdb24a32cb634877f906f4d2939bac
3
+ size 56570637
quantize_config.json CHANGED
@@ -4,120 +4,120 @@
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
- "Constant",
8
- "Range",
9
- "Pow",
10
- "Div",
11
- "ReduceMean",
12
  "Reshape",
 
 
 
 
 
13
  "Gather",
 
 
 
14
  "Equal",
15
- "Softmax",
16
- "ConstantOfShape",
17
  "Cast",
18
- "Transpose",
19
  "Add",
20
- "Sqrt",
21
- "Shape",
22
- "Sigmoid",
23
- "Unsqueeze",
24
- "Mul",
25
- "Sub",
26
- "Where",
27
  "MatMul",
 
 
 
28
  "Expand",
29
- "Concat"
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
- "Constant",
36
- "Range",
37
- "Pow",
38
- "Div",
39
- "ReduceMean",
40
  "Reshape",
 
 
 
 
 
41
  "Gather",
 
 
 
42
  "Equal",
43
- "Softmax",
44
- "ConstantOfShape",
45
  "Cast",
46
- "Transpose",
47
  "Add",
48
- "Sqrt",
49
- "Shape",
50
- "Sigmoid",
51
- "Unsqueeze",
52
- "Mul",
53
- "Sub",
54
- "Where",
55
  "MatMul",
 
 
 
56
  "Expand",
57
- "Concat"
 
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
- "Constant",
 
64
  "Range",
65
- "Pow",
 
 
 
 
66
  "Squeeze",
67
- "Less",
68
- "Slice",
69
  "Div",
70
- "Gather",
71
- "Reshape",
72
- "ReduceMean",
73
  "Equal",
74
- "Softmax",
75
- "ConstantOfShape",
 
 
76
  "Cast",
77
- "Transpose",
78
  "Add",
79
- "Sqrt",
80
- "Shape",
81
- "Sigmoid",
82
- "Unsqueeze",
83
- "Mul",
84
- "Sub",
85
- "Where",
86
  "MatMul",
 
 
 
87
  "Expand",
88
- "Concat"
 
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
- "Constant",
95
- "If",
96
  "Range",
97
- "Pow",
 
 
 
 
98
  "Squeeze",
99
- "Less",
100
- "Slice",
101
  "Div",
102
- "Gather",
103
- "Reshape",
104
- "ReduceMean",
105
  "Equal",
106
- "Softmax",
107
- "ConstantOfShape",
 
 
108
  "Cast",
109
- "Transpose",
110
  "Add",
111
- "Sqrt",
112
- "Shape",
113
- "Sigmoid",
114
- "Unsqueeze",
115
- "Mul",
116
- "Sub",
117
- "Where",
118
  "MatMul",
 
 
 
119
  "Expand",
120
- "Concat"
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
4
  "per_model_config": {
5
  "encoder_model": {
6
  "op_types": [
7
+ "Sigmoid",
 
 
 
 
8
  "Reshape",
9
+ "Range",
10
+ "Sqrt",
11
+ "Where",
12
+ "Unsqueeze",
13
+ "Constant",
14
  "Gather",
15
+ "Div",
16
+ "Shape",
17
+ "Pow",
18
  "Equal",
19
+ "ReduceMean",
20
+ "Mul",
21
  "Cast",
 
22
  "Add",
 
 
 
 
 
 
 
23
  "MatMul",
24
+ "Softmax",
25
+ "Sub",
26
+ "Concat",
27
  "Expand",
28
+ "Transpose",
29
+ "ConstantOfShape"
30
  ],
31
  "weight_type": "QInt8"
32
  },
33
  "decoder_with_past_model": {
34
  "op_types": [
35
+ "Sigmoid",
 
 
 
 
36
  "Reshape",
37
+ "Range",
38
+ "Sqrt",
39
+ "Where",
40
+ "Unsqueeze",
41
+ "Constant",
42
  "Gather",
43
+ "Div",
44
+ "Shape",
45
+ "Pow",
46
  "Equal",
47
+ "ReduceMean",
48
+ "Mul",
49
  "Cast",
 
50
  "Add",
 
 
 
 
 
 
 
51
  "MatMul",
52
+ "Softmax",
53
+ "Sub",
54
+ "Concat",
55
  "Expand",
56
+ "Transpose",
57
+ "ConstantOfShape"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
+ "Sigmoid",
64
+ "Reshape",
65
  "Range",
66
+ "Sqrt",
67
+ "Where",
68
+ "Unsqueeze",
69
+ "Constant",
70
+ "Gather",
71
  "Squeeze",
 
 
72
  "Div",
73
+ "If",
74
+ "Shape",
75
+ "Pow",
76
  "Equal",
77
+ "ReduceMean",
78
+ "Slice",
79
+ "Less",
80
+ "Mul",
81
  "Cast",
 
82
  "Add",
 
 
 
 
 
 
 
83
  "MatMul",
84
+ "Softmax",
85
+ "Sub",
86
+ "Concat",
87
  "Expand",
88
+ "Transpose",
89
+ "ConstantOfShape"
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
95
+ "Sigmoid",
96
+ "Reshape",
97
  "Range",
98
+ "Sqrt",
99
+ "Where",
100
+ "Unsqueeze",
101
+ "Constant",
102
+ "Gather",
103
  "Squeeze",
 
 
104
  "Div",
105
+ "Shape",
106
+ "Pow",
 
107
  "Equal",
108
+ "ReduceMean",
109
+ "Slice",
110
+ "Less",
111
+ "Mul",
112
  "Cast",
 
113
  "Add",
 
 
 
 
 
 
 
114
  "MatMul",
115
+ "Softmax",
116
+ "Sub",
117
+ "Concat",
118
  "Expand",
119
+ "Transpose",
120
+ "ConstantOfShape"
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff