Xenova HF staff committed on
Commit
9036bb2
·
verified ·
1 Parent(s): 4cba548

Upload folder using huggingface_hub

Browse files
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1682658b3fc5be1b0e1d7b3018833604db33cdeb7fb10a5ce07e7958ffb1e36
3
+ size 37970693
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fee7820c761beedbe19b7a739ca606afc07f0360802eb7c9d51911532b8ea82
3
+ size 37970712
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e990fb3d3dcaf886d14618ae7b21f72b7df3a65f8c135f7f50bd222850919dd
3
+ size 19069292
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8ab85392fc00980864d6361feae10d5edf46fb8d5cbfd2cb4e33ab262c60cb7
3
+ size 9919544
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fee7820c761beedbe19b7a739ca606afc07f0360802eb7c9d51911532b8ea82
3
+ size 37970712
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fcd24d064bfea9139f631cab894d7dfbe93df862be7a5e9fecdc2064a293e79
3
+ size 9919589
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fcd24d064bfea9139f631cab894d7dfbe93df862be7a5e9fecdc2064a293e79
3
+ size 9919589
quantize_config.json ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fp16": {},
3
+ "q8": {
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Add",
8
+ "BatchNormalization",
9
+ "Constant",
10
+ "Conv",
11
+ "Div",
12
+ "Erf",
13
+ "Flatten",
14
+ "Gemm",
15
+ "GlobalAveragePool",
16
+ "Identity",
17
+ "Mul",
18
+ "ReduceMean",
19
+ "Relu",
20
+ "Sigmoid",
21
+ "Sub"
22
+ ],
23
+ "weight_type": "QUInt8"
24
+ }
25
+ },
26
+ "per_channel": false,
27
+ "reduce_range": false
28
+ },
29
+ "int8": {
30
+ "per_model_config": {
31
+ "model": {
32
+ "op_types": [
33
+ "Add",
34
+ "BatchNormalization",
35
+ "Constant",
36
+ "Conv",
37
+ "Div",
38
+ "Erf",
39
+ "Flatten",
40
+ "Gemm",
41
+ "GlobalAveragePool",
42
+ "Identity",
43
+ "Mul",
44
+ "ReduceMean",
45
+ "Relu",
46
+ "Sigmoid",
47
+ "Sub"
48
+ ],
49
+ "weight_type": "QInt8"
50
+ }
51
+ },
52
+ "per_channel": false,
53
+ "reduce_range": false
54
+ },
55
+ "uint8": {
56
+ "per_model_config": {
57
+ "model": {
58
+ "op_types": [
59
+ "Add",
60
+ "BatchNormalization",
61
+ "Constant",
62
+ "Conv",
63
+ "Div",
64
+ "Erf",
65
+ "Flatten",
66
+ "Gemm",
67
+ "GlobalAveragePool",
68
+ "Identity",
69
+ "Mul",
70
+ "ReduceMean",
71
+ "Relu",
72
+ "Sigmoid",
73
+ "Sub"
74
+ ],
75
+ "weight_type": "QUInt8"
76
+ }
77
+ },
78
+ "per_channel": false,
79
+ "reduce_range": false
80
+ },
81
+ "q4": {
82
+ "block_size": 32,
83
+ "is_symmetric": true,
84
+ "accuracy_level": null
85
+ },
86
+ "bnb4": {
87
+ "block_size": 64,
88
+ "quant_type": 1
89
+ }
90
+ }