raspi0124
committed on
Commit
·
8ce4b2f
1
Parent(s):
a5d6fa0
ONNXっぽいやつができたのでコミット
Browse files
- config.json +27 -0
- onnx/model.onnx +3 -0
- onnx/model_bnb4.onnx +3 -0
- onnx/model_fp16.onnx +3 -0
- onnx/model_int8.onnx +3 -0
- onnx/model_q4.onnx +3 -0
- onnx/model_q4f16.onnx +3 -0
- onnx/model_quantized.onnx +3 -0
- onnx/model_uint8.onnx +3 -0
- quantize_config.json +18 -0
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_attn_implementation_autoset": true,
|
3 |
+
"_name_or_path": "cl-nagoya/ruri-small",
|
4 |
+
"activation": "gelu",
|
5 |
+
"architectures": [
|
6 |
+
"DistilBertModel"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"dim": 768,
|
10 |
+
"dropout": 0.1,
|
11 |
+
"export_model_type": "transformer",
|
12 |
+
"hidden_dim": 3072,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"max_position_embeddings": 512,
|
15 |
+
"model_type": "distilbert",
|
16 |
+
"n_heads": 12,
|
17 |
+
"n_layers": 6,
|
18 |
+
"output_hidden_states": true,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"qa_dropout": 0.1,
|
21 |
+
"seq_classif_dropout": 0.2,
|
22 |
+
"sinusoidal_pos_embds": true,
|
23 |
+
"tie_weights_": true,
|
24 |
+
"torch_dtype": "bfloat16",
|
25 |
+
"transformers_version": "4.46.3",
|
26 |
+
"vocab_size": 32768
|
27 |
+
}
|
onnx/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc3a2fc698d0ec5aa7ab45f0b10517aab972dfede0243a31b9430659609334da
|
3 |
+
size 272490076
|
onnx/model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0600443d7191cf5c7aa7a22f78a80397e16ab1264b7d03fcf862e79b3b02705
|
3 |
+
size 126514174
|
onnx/model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:492b59f1a59751f77559d0f569dc9572b61ef97e50b737f73005524199b9b154
|
3 |
+
size 136314565
|
onnx/model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38a2813abf640e6d0aa9ce004edc380fdebe87c84258494f8e2f6412d79ac9e6
|
3 |
+
size 68668245
|
onnx/model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7bc29cca42120fc9a226c6137a3f030abd5698c313e685f285f23af8c8c551e
|
3 |
+
size 129168118
|
onnx/model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b55a7be79de330304ba2e0b37fa832ca7e411d91f3beb722fdfc65ad81d5320a
|
3 |
+
size 75273104
|
onnx/model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38a2813abf640e6d0aa9ce004edc380fdebe87c84258494f8e2f6412d79ac9e6
|
3 |
+
size 68668245
|
onnx/model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15688908de5bc58d3d0e9c7e3ab2c8504d6b2e05ff96df8411b1fac147122311
|
3 |
+
size 68668245
|
quantize_config.json
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"modes": [
|
3 |
+
"fp16",
|
4 |
+
"q8",
|
5 |
+
"int8",
|
6 |
+
"uint8",
|
7 |
+
"q4",
|
8 |
+
"q4f16",
|
9 |
+
"bnb4"
|
10 |
+
],
|
11 |
+
"per_channel": true,
|
12 |
+
"reduce_range": true,
|
13 |
+
"block_size": null,
|
14 |
+
"is_symmetric": true,
|
15 |
+
"accuracy_level": null,
|
16 |
+
"quant_type": 1,
|
17 |
+
"op_block_list": null
|
18 |
+
}
|