Upload ONNX weights (#7)
Browse files
- Upload ONNX weights (a254de22948510b593ecf4258a1d9a4d60c310b4)
- Update config.json (60375ee206ef2bd0467088e5511c84888f3db3ee)
- Upload folder using huggingface_hub (009620751b7925e8012cb72d1ad824c101433abd)
Co-authored-by: Joshua <[email protected]>
- config.json +6 -0
- onnx/decoder_model_merged.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +3 -0
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_q4f16.onnx +3 -0
- onnx/decoder_model_merged_quantized.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/embed_tokens.onnx +3 -0
- onnx/embed_tokens_bnb4.onnx +3 -0
- onnx/embed_tokens_fp16.onnx +3 -0
- onnx/embed_tokens_int8.onnx +3 -0
- onnx/embed_tokens_q4.onnx +3 -0
- onnx/embed_tokens_q4f16.onnx +3 -0
- onnx/embed_tokens_quantized.onnx +3 -0
- onnx/embed_tokens_uint8.onnx +3 -0
- onnx/vision_encoder.onnx +3 -0
- onnx/vision_encoder_bnb4.onnx +3 -0
- onnx/vision_encoder_fp16.onnx +3 -0
- onnx/vision_encoder_int8.onnx +3 -0
- onnx/vision_encoder_q4.onnx +3 -0
- onnx/vision_encoder_q4f16.onnx +3 -0
- onnx/vision_encoder_quantized.onnx +3 -0
- onnx/vision_encoder_uint8.onnx +3 -0
config.json
CHANGED
@@ -116,6 +116,12 @@
|
|
116 |
"tie_word_embeddings": false,
|
117 |
"torch_dtype": "bfloat16",
|
118 |
"transformers_version": "4.50.0.dev0",
|
|
|
|
|
|
|
|
|
|
|
|
|
119 |
"use_cache": true,
|
120 |
"vision_config": {
|
121 |
"hidden_size": 768,
|
|
|
116 |
"tie_word_embeddings": false,
|
117 |
"torch_dtype": "bfloat16",
|
118 |
"transformers_version": "4.50.0.dev0",
|
119 |
+
"transformers.js_config": {
|
120 |
+
"kv_cache_dtype": {
|
121 |
+
"q4f16": "float16",
|
122 |
+
"fp16": "float16"
|
123 |
+
}
|
124 |
+
},
|
125 |
"use_cache": true,
|
126 |
"vision_config": {
|
127 |
"hidden_size": 768,
|
onnx/decoder_model_merged.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c75155e5e121b9d89bf5435d396ccd9e817572d8a0e4589e1c0eb5574bb3c69e
|
3 |
+
size 540972236
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51ef8fa60e201a412c1a0b24333bfa2a6c73d4f45e58b9e2411866cfc6fc707b
|
3 |
+
size 78486831
|
onnx/decoder_model_merged_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccd0761dc1e061c706381fb345a01977d4ec4db2ee97d3acb6886f65fbe2ba81
|
3 |
+
size 270764878
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fdce1ec841ad5b730d2c220ff2147f2114cecf7b5518c27cc050c29bf75e997
|
3 |
+
size 137553254
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef6045cf8e613277a745f5b56eaf1cc2dda00c64d984acaa005fa5ef706efcc5
|
3 |
+
size 86894835
|
onnx/decoder_model_merged_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9cda6976be0f2b446a01ace90aa04a520116b4641e544cbc74dd8a70335b606
|
3 |
+
size 77385255
|
onnx/decoder_model_merged_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88d2ef3239d292224065443e7dc6a8b87195db94a38280e23bd4b5ca18c1d3b5
|
3 |
+
size 137553365
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88d2ef3239d292224065443e7dc6a8b87195db94a38280e23bd4b5ca18c1d3b5
|
3 |
+
size 137553365
|
onnx/embed_tokens.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:816939a02a48a540330655f6cc1a33cb47b2021aec0ebb356a016c50b826f3f6
|
3 |
+
size 113541419
|
onnx/embed_tokens_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b6ad5d0ac29dc4bd893b61606f760fac40481a4eecbcb318502b05e3562aa37
|
3 |
+
size 113541438
|
onnx/embed_tokens_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f08a824993fe5ea9d5affd34a986a3700c4c5cb0fd21993182c03a58c4a0ee3a
|
3 |
+
size 56770887
|
onnx/embed_tokens_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74e69c670cb770eb3b430c7fdd770a9e4e0f174edef568e6aa67df4276c398e5
|
3 |
+
size 28385824
|
onnx/embed_tokens_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b6ad5d0ac29dc4bd893b61606f760fac40481a4eecbcb318502b05e3562aa37
|
3 |
+
size 113541438
|
onnx/embed_tokens_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:664289fb111a87112cf97c9ac4d9122119740bc5da3a6eb8305fa1063dec65a4
|
3 |
+
size 56770906
|
onnx/embed_tokens_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74e69c670cb770eb3b430c7fdd770a9e4e0f174edef568e6aa67df4276c398e5
|
3 |
+
size 28385824
|
onnx/embed_tokens_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74e69c670cb770eb3b430c7fdd770a9e4e0f174edef568e6aa67df4276c398e5
|
3 |
+
size 28385824
|
onnx/vision_encoder.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c97aafac0543632c778938e2870afb73a81c7cc3a3e01e84b43a096bd668820
|
3 |
+
size 374316454
|
onnx/vision_encoder_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcc3b8bf6e0b12be05c5ce66adc5d504fb0efb4a00dbfc53a8f8dbc1cca1516e
|
3 |
+
size 58034696
|
onnx/vision_encoder_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f86f88e185e231b91232147206771e267d8ab038aa4e30fb29e376d9ec4db4fb
|
3 |
+
size 187295327
|
onnx/vision_encoder_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3251860101c63f90c44ec475c874346c461de48421aacc13b5f5741004282240
|
3 |
+
size 94247884
|
onnx/vision_encoder_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbcfa73fba2477b564a364123bc066922c9e692a9389c24eb904009f922e9aa0
|
3 |
+
size 63784944
|
onnx/vision_encoder_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0e3c83edfaf3c946e592f50d9b238eb422c0c4ef62643883a46d7c5ebb7284a
|
3 |
+
size 55038218
|
onnx/vision_encoder_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5e42cf6c8719dba60582c3722cba72673de5e2b739c01e5147bc34d9193ae20
|
3 |
+
size 94247926
|
onnx/vision_encoder_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5e42cf6c8719dba60582c3722cba72673de5e2b739c01e5147bc34d9193ae20
|
3 |
+
size 94247926
|