raspi0124 committed on
Commit
8ce4b2f
·
1 Parent(s): a5d6fa0

ONNXっぽいやつができたのでコミット

Browse files
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "_name_or_path": "cl-nagoya/ruri-small",
4
+ "activation": "gelu",
5
+ "architectures": [
6
+ "DistilBertModel"
7
+ ],
8
+ "attention_dropout": 0.1,
9
+ "dim": 768,
10
+ "dropout": 0.1,
11
+ "export_model_type": "transformer",
12
+ "hidden_dim": 3072,
13
+ "initializer_range": 0.02,
14
+ "max_position_embeddings": 512,
15
+ "model_type": "distilbert",
16
+ "n_heads": 12,
17
+ "n_layers": 6,
18
+ "output_hidden_states": true,
19
+ "pad_token_id": 0,
20
+ "qa_dropout": 0.1,
21
+ "seq_classif_dropout": 0.2,
22
+ "sinusoidal_pos_embds": true,
23
+ "tie_weights_": true,
24
+ "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.46.3",
26
+ "vocab_size": 32768
27
+ }
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc3a2fc698d0ec5aa7ab45f0b10517aab972dfede0243a31b9430659609334da
3
+ size 272490076
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0600443d7191cf5c7aa7a22f78a80397e16ab1264b7d03fcf862e79b3b02705
3
+ size 126514174
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:492b59f1a59751f77559d0f569dc9572b61ef97e50b737f73005524199b9b154
3
+ size 136314565
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a2813abf640e6d0aa9ce004edc380fdebe87c84258494f8e2f6412d79ac9e6
3
+ size 68668245
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7bc29cca42120fc9a226c6137a3f030abd5698c313e685f285f23af8c8c551e
3
+ size 129168118
onnx/model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b55a7be79de330304ba2e0b37fa832ca7e411d91f3beb722fdfc65ad81d5320a
3
+ size 75273104
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a2813abf640e6d0aa9ce004edc380fdebe87c84258494f8e2f6412d79ac9e6
3
+ size 68668245
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15688908de5bc58d3d0e9c7e3ab2c8504d6b2e05ff96df8411b1fac147122311
3
+ size 68668245
quantize_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "modes": [
3
+ "fp16",
4
+ "q8",
5
+ "int8",
6
+ "uint8",
7
+ "q4",
8
+ "q4f16",
9
+ "bnb4"
10
+ ],
11
+ "per_channel": true,
12
+ "reduce_range": true,
13
+ "block_size": null,
14
+ "is_symmetric": true,
15
+ "accuracy_level": null,
16
+ "quant_type": 1,
17
+ "op_block_list": null
18
+ }