nintwentydo committed on
Commit
90b9193
·
verified ·
1 Parent(s): cae0645

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +42 -0
  2. config.json +38 -0
  3. generation_config.json +6 -0
  4. model-00001-of-00052.safetensors +3 -0
  5. model-00002-of-00052.safetensors +3 -0
  6. model-00003-of-00052.safetensors +3 -0
  7. model-00004-of-00052.safetensors +3 -0
  8. model-00005-of-00052.safetensors +3 -0
  9. model-00006-of-00052.safetensors +3 -0
  10. model-00007-of-00052.safetensors +3 -0
  11. model-00008-of-00052.safetensors +3 -0
  12. model-00009-of-00052.safetensors +3 -0
  13. model-00010-of-00052.safetensors +3 -0
  14. model-00011-of-00052.safetensors +3 -0
  15. model-00012-of-00052.safetensors +3 -0
  16. model-00013-of-00052.safetensors +3 -0
  17. model-00014-of-00052.safetensors +3 -0
  18. model-00015-of-00052.safetensors +3 -0
  19. model-00016-of-00052.safetensors +3 -0
  20. model-00017-of-00052.safetensors +3 -0
  21. model-00018-of-00052.safetensors +3 -0
  22. model-00019-of-00052.safetensors +3 -0
  23. model-00020-of-00052.safetensors +3 -0
  24. model-00021-of-00052.safetensors +3 -0
  25. model-00022-of-00052.safetensors +3 -0
  26. model-00023-of-00052.safetensors +3 -0
  27. model-00024-of-00052.safetensors +3 -0
  28. model-00025-of-00052.safetensors +3 -0
  29. model-00026-of-00052.safetensors +3 -0
  30. model-00027-of-00052.safetensors +3 -0
  31. model-00028-of-00052.safetensors +3 -0
  32. model-00029-of-00052.safetensors +3 -0
  33. model-00030-of-00052.safetensors +3 -0
  34. model-00031-of-00052.safetensors +3 -0
  35. model-00032-of-00052.safetensors +3 -0
  36. model-00033-of-00052.safetensors +3 -0
  37. model-00034-of-00052.safetensors +3 -0
  38. model-00035-of-00052.safetensors +3 -0
  39. model-00036-of-00052.safetensors +3 -0
  40. model-00037-of-00052.safetensors +3 -0
  41. model-00038-of-00052.safetensors +3 -0
  42. model-00039-of-00052.safetensors +3 -0
  43. model-00040-of-00052.safetensors +3 -0
  44. model-00041-of-00052.safetensors +3 -0
  45. model-00042-of-00052.safetensors +3 -0
  46. model-00043-of-00052.safetensors +3 -0
  47. model-00044-of-00052.safetensors +3 -0
  48. model-00045-of-00052.safetensors +3 -0
  49. model-00046-of-00052.safetensors +3 -0
  50. model-00047-of-00052.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - en
4
+ - fr
5
+ - de
6
+ - es
7
+ - it
8
+ - pt
9
+ - zh
10
+ - ja
11
+ - ru
12
+ - ko
13
+ license: other
14
+ license_name: mrl
15
+ base_model: mistralai/Pixtral-Large-Instruct-2411
16
+ inference: false
17
+ license_link: https://mistral.ai/licenses/MRL-0.1.md
18
+ library_name: transformers
19
+ pipeline_tag: image-text-to-text
20
+ ---
21
+
22
+ # Pixtral-Large-Instruct-2411 🧡
23
+
24
+ Transformers implementation of [Pixtral-Large-Instruct-2411](https://huggingface.co/mistralai/Pixtral-Large-Instruct-2411).
25
+
26
+
27
+ ## Tokenizer And Prompt Template
28
+ Uses a conversion of the v7m1 tokenizer with a 32k vocab size.
29
+
30
+ Chat template in tokenizer_config.json uses the v7 instruct template:
31
+
32
+ ```
33
+ <s>[SYSTEM_PROMPT] <system prompt>[/SYSTEM_PROMPT][INST] <user message>[/INST] <assistant response></s>[INST] <user message>[/INST]
34
+ ```
35
+
36
+ ## Notes
37
+ *- tool use hasn't been implemented in the template yet.*
38
+ *- I've added extra stop tokens between consecutive user messages. Helps contexts where there'll be multiple speakers etc but your mileage may vary.*
39
+ *- If you have a better implementation of the tokenizer let me know and I'm happy to swap it out.*
40
+ *- As always pls respect the model license.*
41
+
42
+ Currently doing a fresh measurement run ahead of re-doing my exl2 quants which I'll upload. Apologies in advance if anything is wonky, tbh this is just a personal learning exercise for me and I decided to make this model my fixation to freshen up on my knowledge lol.
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LlavaForConditionalGeneration"
4
+ ],
5
+ "ignore_index": -100,
6
+ "image_seq_length": 1,
7
+ "image_token_index": 10,
8
+ "model_type": "llava",
9
+ "projector_hidden_act": "gelu",
10
+ "text_config": {
11
+ "hidden_size": 12288,
12
+ "intermediate_size": 28672,
13
+ "max_position_embeddings": 131072,
14
+ "model_type": "mistral",
15
+ "num_attention_heads": 96,
16
+ "num_hidden_layers": 88,
17
+ "num_key_value_heads": 8,
18
+ "rms_norm_eps": 1e-05,
19
+ "rope_theta": 1000000.0,
20
+ "sliding_window": null,
21
+ "vocab_size": 32768
22
+ },
23
+ "transformers_version": "4.48.0.dev0",
24
+ "vision_config": {
25
+ "head_dim": 88,
26
+ "num_attention_heads": 16,
27
+ "hidden_act": "silu",
28
+ "hidden_size": 1408,
29
+ "image_size": 1024,
30
+ "intermediate_size": 6144,
31
+ "model_type": "pixtral",
32
+ "num_hidden_layers": 40,
33
+ "patch_size": 16,
34
+ "rope_theta": 10000.0
35
+ },
36
+ "vision_feature_layer": -1,
37
+ "vision_feature_select_strategy": "full"
38
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.48.0.dev0"
6
+ }
model-00001-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14f0870e452149f4dcf6dd3b8bd2473598dfd51152cb11d7e20414056cd0831b
3
+ size 4509270008
model-00002-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fcbbe01e14828c044cf0ae930c826acff6ee3b8e81fd6ca5ef6c97a42fd7f3a
3
+ size 4882270024
model-00003-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e84a1a7c117ecee5b9be23ace65ff17aa7dcd55350794a02820a80d9e2c3a07
3
+ size 4831889368
model-00004-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cd040875f38bc94db33c01c68af083f6288a0e8f883a6a3f2579ce01a95cd90
3
+ size 4831938776
model-00005-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9338c97508c94cfd6fe5d92e9285622d46d14d7ac97fa8dec6199d3569e764d5
3
+ size 4831938776
model-00006-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:540fb77c3fc0150cbe012a285afc57918957f2ed92542910e876ae14235143b8
3
+ size 4882270024
model-00007-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c53b5751a6f73e070752bc8d7c9409442c0e1e8e3d6902c377026f71b9cfcd9b
3
+ size 4831889384
model-00008-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194ce36f2dbeb4b391857b32579d579bb668637a26f19b1ac48252f55accb753
3
+ size 4831938792
model-00009-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abb1b4063d634fdb4ee19894e89e5f9c9e21019a2b80adfb6ba14c13fa3c5406
3
+ size 4831938800
model-00010-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a4fc55163298b3882aa6aa1f8f229bd9857e1494cd1ea543e4f257376bd1c49
3
+ size 4882270040
model-00011-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa3f51e16047a320259ae21c6d9506266ce9bec2be0c49508f7d99386d68d5bd
3
+ size 4831889376
model-00012-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19b5737821632a06fc0e61e24718094be4bf361cb3fc57fbaa82a6f7019f08cb
3
+ size 4831938792
model-00013-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cea09a3e29d77fddd25d7e55992d8f17a49bcf8ed9c38ca4cba517e0045d45f5
3
+ size 4831938800
model-00014-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:075167a29ae960189491f0f250e9c0bc3d9491bc3d3c46ee6d0089c46e43f4ec
3
+ size 4882270040
model-00015-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42588f8fe11c0846cfd9e96603828256cc4e8f101e54a7f24bed2f5c28cb9fe5
3
+ size 4831889376
model-00016-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7281b0ee3f2590bc6c19130ed8f233887f136f8fdfab9c64b34402e9919d7db5
3
+ size 4831938792
model-00017-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06e442f95527ea9a5f82f193e9781bbbd376e305019b28d52f84426f10928d8c
3
+ size 4831938800
model-00018-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dbfb7bbd99bc0d0d44b1c34112b71a81fdf1c5354835176a4fe187d00bfce1b
3
+ size 4882270040
model-00019-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:791b54d8e7ff38c2e575df46115c7cd21a3a9defe544b9f943cdd0cdc78f3fb3
3
+ size 4831889376
model-00020-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35df3afdd407778ae26e1f9df6f6ea12681acd90de4d9525f4b4cde2ef30662d
3
+ size 4831938792
model-00021-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd7991d7936b08bf468f2f2da9dbac46224b732bedd9ab09c2ba4ff06a82557c
3
+ size 4831938800
model-00022-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4a4473980e3bc05a3366fa638bb861519a4665f33bc1512ac6cd0cbdc7711a5
3
+ size 4882270040
model-00023-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ca1eb9328ada88ad65e08c8b18d526d298bab6965a7372be537a994c5205eb
3
+ size 4831889376
model-00024-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba34028c5979cfd3781ca70aead3b1b2b55180d93394ce2857db4e5b0e9af8b6
3
+ size 4831938792
model-00025-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b1dee0420ed6c93f7bcaed4197655344303b338f3d9d1027fd7f036738bf932
3
+ size 4831938800
model-00026-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cb83cb476282252ffddddabc69ea27fc08f3f7a022acefe4335419f28050e6c
3
+ size 4882270040
model-00027-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05f852d81895c3ba645c106f21ab9fb63d2988baed0967b17266955e65c9e95a
3
+ size 4831889376
model-00028-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1859871627e14661d1ee731005e87b312d4af7aa25a436f468a7b7e4bf329dd4
3
+ size 4831938792
model-00029-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b7d2b168b2caa8a0445fedf597478d62dbd6850a777b0c08e7eebed3b0d9a6a
3
+ size 4831938800
model-00030-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4c20b8e733f6dbd8d5a300eea95b0afa3a1bc2a780768a6e274ea08cfeb1020
3
+ size 4882270040
model-00031-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:400f4c047a67586f764af4ae0abba7440df8107ceba3ac0fd4166f5bcaab34e1
3
+ size 4831889376
model-00032-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ac94d3d776f9882c868cb20db22e8bcf79e5f0abb134d06e64ddcf6e652b81c
3
+ size 4831938792
model-00033-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ed94b8ba78c5d51635a47d724d64a3959e955c71187ecc23747f686dbc33d3a
3
+ size 4831938800
model-00034-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc84284a1541d12eb8d6a113a68f978a255151dffb021c86e8d4f3ec08c1f480
3
+ size 4882270040
model-00035-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24493e298808e6481a72a8dbc8a4ee173d7a2bd7657f78987bbaafe85f3d5221
3
+ size 4831889376
model-00036-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8fcdde3f303bae55b414633dbaf047f6f00806976a5b726e2d73fdd6fc14564
3
+ size 4831938792
model-00037-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb44645fc87b76f6b69ef97217d7760955e1fd0402efa68b24fd9ffd1ee3c9a5
3
+ size 4831938800
model-00038-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a62587682a17ba3d030c6479661d01932afe76c2eaade70383e0ed4bece8213
3
+ size 4882270040
model-00039-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ea5f4b55c5dde56308cd14ab941c8912b2c71c971feda89cd199993bfef36d3
3
+ size 4831889376
model-00040-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf6a29d3af8c20a2a70676407d5f8581df4e849af24eaf2760a9c38fafe8779f
3
+ size 4831938792
model-00041-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bff31ed650cf76fbad236fb6685f2a4c4f86db6da037cea3a73ebc5e28a1c93a
3
+ size 4831938800
model-00042-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f090172fa822725090d97b55d31873fecd1ecc01606fbc4fb1357704f6760ac
3
+ size 4882270040
model-00043-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2390076a1035012086880648ee9cbc9a6f3407ac411bf79ebef557641964fc69
3
+ size 4831889376
model-00044-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:785ba85d22ecc3d3b6b62dbcb1e843e57fa57bf0bba7877e15f5d3fda9f6100f
3
+ size 4831938792
model-00045-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f6470663d2e7c12a1af0f1c54fb2fb5176de2d47de0e6ee06bb652738ee3421
3
+ size 4831938800
model-00046-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f28328f36a9ac4a470716488589812b656badad04877e4bfec2288660771fd9
3
+ size 4882270040
model-00047-of-00052.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4450bdb8aac77ef388cb192dbd78a949aa18d7e2800ce112d00894a31466b7ec
3
+ size 4831889376