Wtzwho committed on Feb 15, 2024

Commit

b518f38

1 Parent(s): 0f6b786

Initial commit with model files

Browse files

Files changed (33)

.gitattributes +27 -35
config.json +33 -0
mergekit_moe_config.yml +104 -0
model-00001-of-00025.safetensors +3 -0
model-00002-of-00025.safetensors +3 -0
model-00003-of-00025.safetensors +3 -0
model-00004-of-00025.safetensors +3 -0
model-00005-of-00025.safetensors +3 -0
model-00006-of-00025.safetensors +3 -0
model-00007-of-00025.safetensors +3 -0
model-00008-of-00025.safetensors +3 -0
model-00009-of-00025.safetensors +3 -0
model-00010-of-00025.safetensors +3 -0
model-00011-of-00025.safetensors +3 -0
model-00012-of-00025.safetensors +3 -0
model-00013-of-00025.safetensors +3 -0
model-00014-of-00025.safetensors +3 -0
model-00015-of-00025.safetensors +3 -0
model-00016-of-00025.safetensors +3 -0
model-00017-of-00025.safetensors +3 -0
model-00018-of-00025.safetensors +3 -0
model-00019-of-00025.safetensors +3 -0
model-00020-of-00025.safetensors +3 -0
model-00021-of-00025.safetensors +3 -0
model-00022-of-00025.safetensors +3 -0
model-00023-of-00025.safetensors +3 -0
model-00024-of-00025.safetensors +3 -0
model-00025-of-00025.safetensors +3 -0
model.safetensors.index.json +0 -0
special_tokens_map.json +24 -0
tokenizer.json +0 -0
tokenizer.model +3 -0
tokenizer_config.json +42 -0

.gitattributes CHANGED Viewed

@@ -1,35 +1,27 @@
-*.7z filter=lfs diff=lfs merge=lfs -text
-*.arrow filter=lfs diff=lfs merge=lfs -text
-*.bin filter=lfs diff=lfs merge=lfs -text
-*.bz2 filter=lfs diff=lfs merge=lfs -text
-*.ckpt filter=lfs diff=lfs merge=lfs -text
-*.ftz filter=lfs diff=lfs merge=lfs -text
-*.gz filter=lfs diff=lfs merge=lfs -text
-*.h5 filter=lfs diff=lfs merge=lfs -text
-*.joblib filter=lfs diff=lfs merge=lfs -text
-*.lfs.* filter=lfs diff=lfs merge=lfs -text
-*.mlmodel filter=lfs diff=lfs merge=lfs -text
-*.model filter=lfs diff=lfs merge=lfs -text
-*.msgpack filter=lfs diff=lfs merge=lfs -text
-*.npy filter=lfs diff=lfs merge=lfs -text
-*.npz filter=lfs diff=lfs merge=lfs -text
-*.onnx filter=lfs diff=lfs merge=lfs -text
-*.ot filter=lfs diff=lfs merge=lfs -text
-*.parquet filter=lfs diff=lfs merge=lfs -text
-*.pb filter=lfs diff=lfs merge=lfs -text
-*.pickle filter=lfs diff=lfs merge=lfs -text
-*.pkl filter=lfs diff=lfs merge=lfs -text
-*.pt filter=lfs diff=lfs merge=lfs -text
-*.pth filter=lfs diff=lfs merge=lfs -text
-*.rar filter=lfs diff=lfs merge=lfs -text
-*.safetensors filter=lfs diff=lfs merge=lfs -text
-saved_model/**/* filter=lfs diff=lfs merge=lfs -text
-*.tar.* filter=lfs diff=lfs merge=lfs -text
-*.tar filter=lfs diff=lfs merge=lfs -text
-*.tflite filter=lfs diff=lfs merge=lfs -text
-*.tgz filter=lfs diff=lfs merge=lfs -text
-*.wasm filter=lfs diff=lfs merge=lfs -text
-*.xz filter=lfs diff=lfs merge=lfs -text
-*.zip filter=lfs diff=lfs merge=lfs -text
-*.zst filter=lfs diff=lfs merge=lfs -text
-*tfevents* filter=lfs diff=lfs merge=lfs -text

+*.iso filter=lfs diff=lfs merge=lfs -text
+model-00001-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00002-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00003-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00004-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00005-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00006-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00007-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00008-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00009-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00010-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00011-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00012-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00013-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00014-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00015-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00016-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00017-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00018-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00019-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00020-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00021-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00022-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00023-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00024-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+model-00025-of-00025.safetensors filter=lfs diff=lfs merge=lfs -text
+tokenizer.model filter=lfs diff=lfs merge=lfs -text

config.json ADDED Viewed

	@@ -0,0 +1,33 @@

+{
+  "_name_or_path": "TinyLlama/TinyLlama-1.1B-Chat-v1.0",
+  "architectures": [
+    "MixtralForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 5632,
+  "max_position_embeddings": 2048,
+  "model_type": "mixtral",
+  "num_attention_heads": 32,
+  "num_experts_per_tok": 2,
+  "num_hidden_layers": 22,
+  "num_key_value_heads": 4,
+  "num_local_experts": 32,
+  "output_router_logits": false,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 10000.0,
+  "router_aux_loss_coef": 0.001,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.37.2",
+  "use_cache": true,
+  "vocab_size": 32000
+}

mergekit_moe_config.yml ADDED Viewed

	@@ -0,0 +1,104 @@

+base_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+gate_mode: hidden
+dtype: bfloat16
+experts_per_token: 2
+experts:
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You understand and manage emotions effectively."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You devise innovative solutions for complex problems."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You possess extensive knowledge of world history."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You appreciate and critique art with depth."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You apply scientific methods to question and explore."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You analyze and interpret literary works insightfully."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You engage in deep philosophical thought and discussion."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You master multiple languages and their nuances."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You understand and create complex musical compositions."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You advocate for and contribute to environmental sustainability."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You offer deep psychological insights and advice."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You innovate with technology to solve modern challenges."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You guide on health, wellness, and fitness."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You navigate and advise on complex financial matters."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You maintain an informed perspective on global affairs."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You reason through ethical dilemmas with clarity."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You possess expertise in culinary arts and nutrition."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You understand and teach sports and physical health."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You advocate for human rights and social justice."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You strategize and advise on entrepreneurial endeavors."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You offer insights on travel and geographical exploration."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You examine and celebrate cultural diversity."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You explore and explain astronomical phenomena."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You apply effective teaching and learning techniques."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You offer insights on travel and geographical exploration."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You examine and celebrate cultural diversity."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You explore and explain astronomical phenomena."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You apply effective teaching and learning techniques."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You create engaging digital content and media."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You navigate and foster social and professional networks."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You provide guidelines for emergency preparedness and response."
+  - source_model: TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    positive_prompts:
+      - "You reason and advise on complex legal matters."

model-00001-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22d62e0babf5670db638adf372d3211e78da726df4edf735f1124370dcb5d41b
+size 1992401112

model-00002-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:69cf5d4888090d17dfed838ccbe1141efa60cca59d6527e5c642d86ad18a0a70
+size 1983916976

model-00003-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:db7c8f3bbc5c2601fdc8881cf45bd8f07491705774007c655a4697b38c9e6b0d
+size 1983916968

model-00004-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:48aeabee97d265a308b44f03fc21ac5bef852244921ef9b619660f59092a465f
+size 1983916984

model-00005-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1c796a4ddc92db9f2b960645db029b38933b13d76809deafbd25a248f5beb1b
+size 1983917064

model-00006-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5d6e81cda5bd36d1dc01858f6df939be2a7a9290778aeac1bc1ad1ae04fc8f7
+size 1983917056

model-00007-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e29fe468dd69ea748296bae8587a693093c7bffc9fe66ea77bc0fc0de73aca1
+size 1983917056

model-00008-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eeb6f1b147c91e787ae41d204b2c077c0d08c54b4200b79bccc437bc84619a63
+size 1983917056

model-00009-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bad77edcdc61e36d029a51945fd3a619a6f415b49dda768dddfa27bcbf0b00ef
+size 1983917000

model-00010-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5de80f571f7f6341d0bc505c4caeddb027d6366d33a499ca9bd6386c449e5199
+size 1983916968

model-00011-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5e29fd066eb72ff6addc170fb8fa3aedd691f4b5cf364ab765ba1b4eaf4f830
+size 1983916968

model-00012-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8cd4e9e4d0904fd2a57eacd7ec8dd5dc9b2fe687ac5a0ffec5391e54dd208d82
+size 1983916976

model-00013-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c43ce7163b93c7bc1489896bcc7fa02004d37c8c03519473c7bd8ab6e16b1ecd
+size 1983917048

model-00014-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22c4a325d1abe18742e3a3e4cf8fb6fe605fe24bb44ee0b76b6676bffae410f6
+size 1983917056

model-00015-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72136bf6d1eee595e0a475f9fc266db1d5d57a9e93f0541c20a75ddccaffcd3d
+size 1983917064

model-00016-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:afc7e8be98b19045edf1764734501519cf180d18b6c54ac9850dd2ca08a5b6ab
+size 1983917056

model-00017-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a2b9e68863f734ccfd52bcc78c4799aa88bf8b2c45a97c8294bf316b89c894f9
+size 1983917008

model-00018-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:317b3363c8730ebab9b914eae6b3142d2df0e7945d99b0f7a10535b0a75636eb
+size 1983916976

model-00019-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:878208c880e74943296fc2af5078cd4207eb6c9cc359118e18ba6fc1cf04ab8c
+size 1983916968

model-00020-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88d19b1915cc57b4523fa26644437f2664f323eecfdb86c5ea9a5e02faa6301d
+size 1983916968

model-00021-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1406d9693950a7e053f36afd8bf2b9d25b57f28746bf99185ecbba42811b1d1
+size 1983917040

model-00022-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a6ad9ab101881c914601959d0349b339ff85dbe21cd1be0efa4c4df98570fad
+size 1983917056

model-00023-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41f82d4fc804b0e9a8f59e6424985b0bd486ebce89ded28b7909d3b615e97cee
+size 1983917056

model-00024-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96486445279865737ff67f5524c51c4cbb5aad0dc2f1e47f2a26c99e3d75bc2c
+size 1983917056

model-00025-of-00025.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df09326a276aa6f4e0dbfb4c1e7c1d1a9fea9f359e4a6c0ad8ded456c59f52d4
+size 1779284544

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<s>",
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n'  + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "legacy": false,
+  "model_max_length": 2048,
+  "pad_token": "<s>",
+  "padding_side": "left",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}