Xenova HF staff committed on
Commit
aa09803
1 Parent(s): b82e34d

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -23,7 +23,7 @@
23
  "pooler_size_per_head": 128,
24
  "pooler_type": "first_token_transform",
25
  "position_embedding_type": "absolute",
26
- "transformers_version": "4.29.2",
27
  "type_vocab_size": 2,
28
  "use_cache": true,
29
  "vocab_size": 105879
 
23
  "pooler_size_per_head": 128,
24
  "pooler_type": "first_token_transform",
25
  "position_embedding_type": "absolute",
26
+ "transformers_version": "4.33.0.dev0",
27
  "type_vocab_size": 2,
28
  "use_cache": true,
29
  "vocab_size": 105879
generation_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
  "_from_model_config": true,
3
  "pad_token_id": 0,
4
- "transformers_version": "4.29.2"
5
  }
 
1
  {
2
  "_from_model_config": true,
3
  "pad_token_id": 0,
4
+ "transformers_version": "4.33.0.dev0"
5
  }
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8bb56c1c0b8468cddfab60c87b57b43eb43b6ccc3bb41e251dfef7c6c7c7b03
3
- size 995386085
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8b0ea2376868d5393163b87fedc6da0a83b2a2378922cfead2d80049de8501d
3
+ size 670125922
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc95dcdf605709e469c2858eb2243a4827ca39c90d9b45f8ebec22f6667d952b
3
- size 250869303
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6dcae35e1de2d31e7afb13a2a9b4b43d2c9a63f9a438ea5f75d66d359036da7
3
+ size 169024183
quantize_config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Reshape",
8
+ "Add",
9
+ "Concat",
10
+ "Constant",
11
+ "Transpose",
12
+ "Sub",
13
+ "Div",
14
+ "Pow",
15
+ "ReduceMean",
16
+ "Softmax",
17
+ "Gather",
18
+ "Sqrt",
19
+ "Unsqueeze",
20
+ "Erf",
21
+ "Mul",
22
+ "MatMul",
23
+ "Shape",
24
+ "Slice",
25
+ "Cast"
26
+ ],
27
+ "weight_type": "QInt8"
28
+ }
29
+ }
30
+ }