Xenova HF staff committed on
Commit
f301282
·
1 Parent(s): 7cf10f4

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -54,7 +54,7 @@
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
- "transformers_version": "4.32.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 67028
60
  }
 
54
  "scale_embedding": true,
55
  "share_encoder_decoder_embeddings": true,
56
  "static_position_embeddings": true,
57
+ "transformers_version": "4.34.0.dev0",
58
  "use_cache": true,
59
  "vocab_size": 67028
60
  }
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "bad_words_ids": [
4
  [
5
  67027
@@ -12,5 +11,6 @@
12
  "max_length": 512,
13
  "num_beams": 4,
14
  "pad_token_id": 67027,
15
- "transformers_version": "4.32.0.dev0"
 
16
  }
 
1
  {
 
2
  "bad_words_ids": [
3
  [
4
  67027
 
11
  "max_length": 512,
12
  "num_beams": 4,
13
  "pad_token_id": 67027,
14
+ "renormalize_logits": true,
15
+ "transformers_version": "4.34.0.dev0"
16
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9fa1dfdd43118d561ac282b8e1f74e58c28e45001c209cd4b6551c30a515caf
3
- size 377036360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b2b4eec6dda4695a5292107723d15e54aebec7b40a9921e0bcd928a889b522f
3
+ size 239763073
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b0555dc7bbe2dd30791f4206f6b8e1f57520f4c80d9fc0e6677aa89a8295714
3
- size 377271842
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c860569f64844dfe9a70c3859675ad9864c09541038dd5a9139f3794e68dc1
3
+ size 239998640
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ee206b32a54d889090eef15169c72a84a6bfcc40cc7c18cec65a68746818c2e
3
- size 95913623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f8034fddc4cdcb6fa6c3b64a06e1cd9b1955c0c6dcd13e0e47610ab99ac4a99
3
+ size 61258735
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71f4e889fbe597a3e83faf2fe4394cb258827640639893f1d1865b42273ca486
3
- size 95542267
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9d1474106c1bdf8aaf236eb7ace8a29edf6fee655c583132f521e5b63ccbf97
3
+ size 60888033
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:222a405da1e39837db12b265095f9784bc070156804b5397fdbb3e5633810046
3
- size 364385851
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54aaeeb859239e5c108cbeb7451bdbe46e5a8298e97c88353034b22a2781b65
3
+ size 227112564
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c4e12d1e536e84002fb6fd39771fb6ca44b7138b3a99265542f096149dfb134
3
- size 92270803
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64503e3da43ba222635cd22eff35baec2599f4e8e1575ef95d22ae0a8df77d8
3
+ size 57616569
quantize_config.json CHANGED
@@ -6,27 +6,27 @@
6
  "op_types": [
7
  "Pow",
8
  "Mul",
 
 
 
 
 
 
 
9
  "Sigmoid",
10
- "Transpose",
11
- "Sub",
12
- "Equal",
13
- "Constant",
14
  "Sqrt",
 
 
15
  "Softmax",
16
- "ReduceMean",
17
- "Shape",
18
- "Unsqueeze",
19
- "Concat",
20
- "Gather",
21
- "Reshape",
22
- "MatMul",
23
  "Where",
24
- "Range",
 
25
  "Add",
26
- "ConstantOfShape",
27
- "Div",
28
- "Expand",
29
- "Cast"
 
30
  ],
31
  "weight_type": "QInt8"
32
  },
@@ -34,90 +34,90 @@
34
  "op_types": [
35
  "Pow",
36
  "Mul",
 
 
 
 
 
 
 
37
  "Sigmoid",
38
- "Transpose",
39
- "Sub",
40
- "Equal",
41
- "Constant",
42
  "Sqrt",
 
 
43
  "Softmax",
44
- "ReduceMean",
45
- "Shape",
46
- "Unsqueeze",
47
- "Concat",
48
- "Gather",
49
- "Reshape",
50
- "MatMul",
51
  "Where",
 
 
52
  "Add",
53
- "Range",
54
- "ConstantOfShape",
55
- "Div",
56
- "Expand",
57
- "Cast"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
- "decoder_model": {
62
  "op_types": [
63
  "Pow",
64
  "Mul",
65
- "Sigmoid",
66
- "Squeeze",
67
- "Transpose",
68
- "Sub",
69
- "Equal",
70
- "Constant",
71
- "Slice",
72
- "Sqrt",
73
- "Softmax",
74
- "ReduceMean",
75
- "Shape",
76
- "Unsqueeze",
77
- "Concat",
78
  "Gather",
79
- "Reshape",
80
- "MatMul",
81
- "Where",
82
  "Range",
83
- "Add",
84
  "ConstantOfShape",
 
 
 
85
  "Less",
 
86
  "Expand",
87
- "Div",
88
- "Cast"
 
 
 
 
 
 
 
 
 
 
 
89
  ],
90
  "weight_type": "QInt8"
91
  },
92
- "decoder_model_merged": {
93
  "op_types": [
94
  "Pow",
95
  "Mul",
96
- "Sigmoid",
97
- "Squeeze",
98
- "Transpose",
99
- "Sub",
100
- "Equal",
101
- "Constant",
102
- "Slice",
103
- "Sqrt",
104
- "Softmax",
105
- "ReduceMean",
106
- "Shape",
107
- "Unsqueeze",
108
- "Concat",
109
  "Gather",
110
- "Reshape",
111
- "MatMul",
112
- "Where",
113
- "If",
114
  "Range",
115
- "Add",
116
  "ConstantOfShape",
 
 
 
117
  "Less",
 
118
  "Expand",
119
- "Div",
120
- "Cast"
 
 
 
 
 
 
 
 
 
 
121
  ],
122
  "weight_type": "QInt8"
123
  }
 
6
  "op_types": [
7
  "Pow",
8
  "Mul",
9
+ "Div",
10
+ "Gather",
11
+ "ReduceMean",
12
+ "Range",
13
+ "ConstantOfShape",
14
+ "Concat",
15
+ "Unsqueeze",
16
  "Sigmoid",
 
 
 
 
17
  "Sqrt",
18
+ "Expand",
19
+ "Equal",
20
  "Softmax",
 
 
 
 
 
 
 
21
  "Where",
22
+ "Cast",
23
+ "Shape",
24
  "Add",
25
+ "Constant",
26
+ "MatMul",
27
+ "Reshape",
28
+ "Sub",
29
+ "Transpose"
30
  ],
31
  "weight_type": "QInt8"
32
  },
 
34
  "op_types": [
35
  "Pow",
36
  "Mul",
37
+ "Div",
38
+ "Gather",
39
+ "ReduceMean",
40
+ "Range",
41
+ "ConstantOfShape",
42
+ "Concat",
43
+ "Unsqueeze",
44
  "Sigmoid",
 
 
 
 
45
  "Sqrt",
46
+ "Expand",
47
+ "Equal",
48
  "Softmax",
 
 
 
 
 
 
 
49
  "Where",
50
+ "Cast",
51
+ "Shape",
52
  "Add",
53
+ "Constant",
54
+ "MatMul",
55
+ "Reshape",
56
+ "Sub",
57
+ "Transpose"
58
  ],
59
  "weight_type": "QInt8"
60
  },
61
+ "decoder_model_merged": {
62
  "op_types": [
63
  "Pow",
64
  "Mul",
65
+ "Div",
 
 
 
 
 
 
 
 
 
 
 
 
66
  "Gather",
67
+ "ReduceMean",
 
 
68
  "Range",
69
+ "Slice",
70
  "ConstantOfShape",
71
+ "Concat",
72
+ "Unsqueeze",
73
+ "Sigmoid",
74
  "Less",
75
+ "Sqrt",
76
  "Expand",
77
+ "Equal",
78
+ "Softmax",
79
+ "Squeeze",
80
+ "Cast",
81
+ "Shape",
82
+ "Add",
83
+ "Where",
84
+ "Constant",
85
+ "MatMul",
86
+ "Reshape",
87
+ "Sub",
88
+ "Transpose",
89
+ "If"
90
  ],
91
  "weight_type": "QInt8"
92
  },
93
+ "decoder_model": {
94
  "op_types": [
95
  "Pow",
96
  "Mul",
97
+ "Div",
 
 
 
 
 
 
 
 
 
 
 
 
98
  "Gather",
99
+ "ReduceMean",
 
 
 
100
  "Range",
101
+ "Slice",
102
  "ConstantOfShape",
103
+ "Concat",
104
+ "Unsqueeze",
105
+ "Sigmoid",
106
  "Less",
107
+ "Sqrt",
108
  "Expand",
109
+ "Equal",
110
+ "Softmax",
111
+ "Squeeze",
112
+ "Cast",
113
+ "Shape",
114
+ "Add",
115
+ "Where",
116
+ "Constant",
117
+ "MatMul",
118
+ "Reshape",
119
+ "Sub",
120
+ "Transpose"
121
  ],
122
  "weight_type": "QInt8"
123
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff