Gunulhona committed on
Commit
0bba956
·
verified ·
1 Parent(s): 20b2b47

Upload folder using huggingface_hub

Browse files
Files changed (47) hide show
  1. config.json +32 -0
  2. mergekit_moe_config.yml +16 -0
  3. model-00001-of-00040.safetensors +3 -0
  4. model-00002-of-00040.safetensors +3 -0
  5. model-00003-of-00040.safetensors +3 -0
  6. model-00004-of-00040.safetensors +3 -0
  7. model-00005-of-00040.safetensors +3 -0
  8. model-00006-of-00040.safetensors +3 -0
  9. model-00007-of-00040.safetensors +3 -0
  10. model-00008-of-00040.safetensors +3 -0
  11. model-00009-of-00040.safetensors +3 -0
  12. model-00010-of-00040.safetensors +3 -0
  13. model-00011-of-00040.safetensors +3 -0
  14. model-00012-of-00040.safetensors +3 -0
  15. model-00013-of-00040.safetensors +3 -0
  16. model-00014-of-00040.safetensors +3 -0
  17. model-00015-of-00040.safetensors +3 -0
  18. model-00016-of-00040.safetensors +3 -0
  19. model-00017-of-00040.safetensors +3 -0
  20. model-00018-of-00040.safetensors +3 -0
  21. model-00019-of-00040.safetensors +3 -0
  22. model-00020-of-00040.safetensors +3 -0
  23. model-00021-of-00040.safetensors +3 -0
  24. model-00022-of-00040.safetensors +3 -0
  25. model-00023-of-00040.safetensors +3 -0
  26. model-00024-of-00040.safetensors +3 -0
  27. model-00025-of-00040.safetensors +3 -0
  28. model-00026-of-00040.safetensors +3 -0
  29. model-00027-of-00040.safetensors +3 -0
  30. model-00028-of-00040.safetensors +3 -0
  31. model-00029-of-00040.safetensors +3 -0
  32. model-00030-of-00040.safetensors +3 -0
  33. model-00031-of-00040.safetensors +3 -0
  34. model-00032-of-00040.safetensors +3 -0
  35. model-00033-of-00040.safetensors +3 -0
  36. model-00034-of-00040.safetensors +3 -0
  37. model-00035-of-00040.safetensors +3 -0
  38. model-00036-of-00040.safetensors +3 -0
  39. model-00037-of-00040.safetensors +3 -0
  40. model-00038-of-00040.safetensors +3 -0
  41. model-00039-of-00040.safetensors +3 -0
  42. model-00040-of-00040.safetensors +3 -0
  43. model.safetensors.index.json +0 -0
  44. special_tokens_map.json +24 -0
  45. tokenizer.json +0 -0
  46. tokenizer.model +3 -0
  47. tokenizer_config.json +0 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.3",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mixtral",
16
+ "num_attention_heads": 32,
17
+ "num_experts_per_tok": 2,
18
+ "num_hidden_layers": 32,
19
+ "num_key_value_heads": 8,
20
+ "num_local_experts": 10,
21
+ "output_router_logits": false,
22
+ "rms_norm_eps": 1e-05,
23
+ "rope_theta": 1000000.0,
24
+ "router_aux_loss_coef": 0.001,
25
+ "router_jitter_noise": 0.0,
26
+ "sliding_window": null,
27
+ "tie_word_embeddings": false,
28
+ "torch_dtype": "bfloat16",
29
+ "transformers_version": "4.46.0.dev0",
30
+ "use_cache": true,
31
+ "vocab_size": 32768
32
+ }
mergekit_moe_config.yml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: mistralai/Mistral-7B-Instruct-v0.3
2
+ gate_mode: random
3
+ dtype: bfloat16
4
+ experts:
5
+ - source_model: mistralai/Mistral-7B-Instruct-v0.3
6
+ - source_model: teknium/OpenHermes-2.5-Mistral-7B
7
+ - source_model: NousResearch/Hermes-2-Pro-Mistral-7B
8
+ - source_model: Open-Orca/Mistral-7B-OpenOrca
9
+ - source_model: Open-Orca/Mistral-7B-OpenOrca
10
+ - source_model: mistralai/Mistral-7B-Instruct-v0.3
11
+ - source_model: teknium/OpenHermes-2.5-Mistral-7B
12
+ - source_model: NousResearch/Hermes-2-Pro-Mistral-7B
13
+ - source_model: Open-Orca/Mistral-7B-OpenOrca
14
+ - source_model: Open-Orca/Mistral-7B-OpenOrca
15
+
16
+ # gate_mode is random, so the router gates are untrained: fine-tune the merged model before use.
model-00001-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8fb9bfa7cfe312f07ceedafc5b26f8f11903fa1e5b99cd015ee2e0ab4f3aa37
3
+ size 2936032888
model-00002-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ebae345aefe406a2e520a3bbbc4a440c76cc2da4fafb7d76234c5b04f8addf
3
+ size 2902478616
model-00003-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7350fd54f5f707807e04ecc13a1d4d455bf17f530f3261bf2d33451170fc9b4c
3
+ size 2902478616
model-00004-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0ea56f45322c4f07acaf5c7c32ef157f5f42f8094075dd0c198d10dad276ad8
3
+ size 2902478616
model-00005-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1b4846b4fb51b75cbf223380058f69ccbed8517bf0a862a57d4a33cba014995
3
+ size 2936016096
model-00006-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f43c922315663ee0511765f6bd9cee63545add7fd7626eddbb7a27fb884a3d9
3
+ size 2902478616
model-00007-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db617bc1608e5ad82e8c3ea6153ed44c56d0a2f5ef45df01392f8c8ed2f5cf1
3
+ size 2902478616
model-00008-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97945d80779f994d831b5147039d2a9ed4c8a14833f2c38d9d5401f9468cf940
3
+ size 2902478616
model-00009-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cfeb605dc7526752e34c73f6aa462dd7891fe3415a841d5a7a7b2033b1dd23b
3
+ size 2902478616
model-00010-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fb8cadb76fc6967ee3884fe19ae5ec1e65929f871f47e38a3ca0012c84461ad
3
+ size 2986356392
model-00011-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d69d1a0112394c647de1804a138dabef4f0b1876c1dfb4b7311b7772ea10262e
3
+ size 2969578952
model-00012-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18debd762e827d2f1ca8f672ddd3d844839f256b3ded8103be9a3b06108a5613
3
+ size 2902478616
model-00013-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a268f586b245a3dfed2b5590898108d0946378b89feab0fbb251db3af0364ec
3
+ size 2902478632
model-00014-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7241165fe3afb5bd8cad55b07908ed84cd8ace8b95268b344df6500c9f5339da
3
+ size 2902478640
model-00015-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cde0608f5defa621df1dfb299f4f3f186937e237dccc602f6199a934d3410929
3
+ size 2902478640
model-00016-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:257c2b48ed6e74c22921f4d2950184c14c8597c8fd9a9fcb3f8255a376a1e030
3
+ size 2936016120
model-00017-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09776ab08f52a29dbf99860da975bdf8be916904fc42d363212c8af1259e16b9
3
+ size 2902478640
model-00018-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc2517dc3ec5d1a95adc51222ae44799a9bde467a8bb2906099e9da640d575df
3
+ size 2902478640
model-00019-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a41f104b0125ce23bce2e39c4756eab0ef9516d9f4f8a88713feafe4049cfece
3
+ size 2902478640
model-00020-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a9f6c167a70bbbb3036338b72a07aa3a191917321add35a9a621df4bc1d5da2
3
+ size 2902478640
model-00021-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b709d9583895f70ff3e07a1a706c194fad2fd843f15005d4b2dbb7b4a1362c7
3
+ size 2936016120
model-00022-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef4a4ab0fc4a936c83204f74732b38cbaa140b27c0154dbcb191d5926c914971
3
+ size 2902478640
model-00023-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6332f913f017cc57c26744b4224295af23f29ff7eaf0119c487ccea9876a8b7
3
+ size 2902478640
model-00024-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a85416526c990ef05bbd6f185536a9afcedf90bfb6f11266987e310f48fdb56
3
+ size 2902478640
model-00025-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92eadb591dee4ec70be272002bc4d254a7295cfe108caa1f86b5c2158816faeb
3
+ size 2902478640
model-00026-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:122d2ae2d0f2135f4634125d51957e41161eaf41c3b9ebd6212db73a29ade5b4
3
+ size 2936016120
model-00027-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dac0fc0e325953112c3c0e16acfb1212f3ec348c5f8ff9c193bef95b5869f1c8
3
+ size 2902478640
model-00028-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3211def6df371199a00beccdfb70eb607dac78cc9b30f686f33a967d70e51d95
3
+ size 2902478640
model-00029-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fa99c0daf197ae117fa7e0d9ae5ebde309c4bffba1f5e8fa68b411fc18b0a24
3
+ size 2902478640
model-00030-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04a7f767a1073cb67ff1fd84a5753f34b12c40c5a1bb7663b0aaf150b0c76a66
3
+ size 2902478640
model-00031-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9376ac639def573799b49dd11117dc398493ed967dadb95cca9a92b24208ccb
3
+ size 2936016120
model-00032-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83c61f6fa2cf78656de3167e08585d6628281ba5724e36d5578401a0c65cc016
3
+ size 2902478640
model-00033-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5238ccad324113fc4dd7939514dcd304bcc31250d4e2a2615292d373699b23da
3
+ size 2902478640
model-00034-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d982fe7fc921f83814c6d6e99f89419a0142a9965dd13b0f9cff395654c4389
3
+ size 2902478640
model-00035-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7d32b2d324e9f2978c3efeb52f97d28f5c50d51296e5539466cb15710ed5ed2
3
+ size 2902478640
model-00036-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6dff05f8738ce9dd65bc4a52fde19ce1249cbc62f077c9277132a4184624520
3
+ size 2986356424
model-00037-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f618bc31dfcb1523c2ef1bed20a7f7e058870d494a608b4c3dc0072075782a0c
3
+ size 2969578984
model-00038-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6150a8540cdbe6756cfb4af973a058e5107de83065579ea6c2bfcacecf2d1459
3
+ size 2902478640
model-00039-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a775f1654d3778934a38475dd2d3d6b889c2a386efc3d7b37ed88b3dd47dc620
3
+ size 2902478640
model-00040-of-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2105e7d9b617b28b4dc53094d60f9ceac473a7dc3e2786146c2608cd9f69d92
3
+ size 2267560056
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<s>",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
3
+ size 587404
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff