Upload 153 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- merges.txt +0 -0
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "mistral",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 5120,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 131072,
|
12 |
+
"position_embedding_base": 1000000.0,
|
13 |
+
"num_key_value_heads": 8,
|
14 |
+
"head_dim": 128,
|
15 |
+
"context_window_size": 1024000,
|
16 |
+
"sliding_window_size": -1,
|
17 |
+
"prefill_chunk_size": 2048,
|
18 |
+
"attention_sink_size": 4,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 80
|
21 |
+
},
|
22 |
+
"vocab_size": 131072,
|
23 |
+
"context_window_size": 1024000,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 2048,
|
26 |
+
"attention_sink_size": 4,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"pipeline_parallel_stages": 1,
|
29 |
+
"temperature": 1.0,
|
30 |
+
"presence_penalty": 0.0,
|
31 |
+
"frequency_penalty": 0.0,
|
32 |
+
"repetition_penalty": 1.0,
|
33 |
+
"top_p": 1.0,
|
34 |
+
"tokenizer_files": [
|
35 |
+
"tokenizer.json",
|
36 |
+
"vocab.json",
|
37 |
+
"merges.txt",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_level",
|
42 |
+
"prepend_space_in_encode": false,
|
43 |
+
"strip_space_in_decode": false
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "chatml",
|
47 |
+
"system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
|
48 |
+
"system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
49 |
+
"system_prefix_token_ids": null,
|
50 |
+
"add_role_after_system_message": true,
|
51 |
+
"roles": {
|
52 |
+
"user": "<|im_start|>user",
|
53 |
+
"assistant": "<|im_start|>assistant"
|
54 |
+
},
|
55 |
+
"role_templates": {
|
56 |
+
"user": "{user_message}",
|
57 |
+
"assistant": "{assistant_message}",
|
58 |
+
"tool": "{tool_message}"
|
59 |
+
},
|
60 |
+
"messages": [],
|
61 |
+
"seps": [
|
62 |
+
"<|im_end|>\n"
|
63 |
+
],
|
64 |
+
"role_content_sep": "\n",
|
65 |
+
"role_empty_sep": "\n",
|
66 |
+
"stop_str": [
|
67 |
+
"<|im_end|>"
|
68 |
+
],
|
69 |
+
"stop_token_ids": [
|
70 |
+
2
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 1,
|
77 |
+
"eos_token_id": 2
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab58bad6d1380b5cc26efa8902410d836953b381317993ab9a9777f0bad6322
|
3 |
+
size 335544320
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89f3c317202a58085ca4f537bec06ffafd576face6a7be1dd449b77924fec5be
|
3 |
+
size 41943040
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98d8cb18d785f6b042b4137481286e7c1bd533c69b711b8873c3f3ce4672057a
|
3 |
+
size 31467520
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d10b799de707bf99b9c378d8c101ce7b81120fd360636f6d65e11b5409629f3
|
3 |
+
size 25579520
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1516881ecb49591d33754e18a16975bdd4efb62b0cb3ae3e7bf6ac7c7913a49
|
3 |
+
size 36700160
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f725c09aa6405013eee10a6348e174d97e0302fdf585eea21c4f4d960ff4e7d
|
3 |
+
size 29501440
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1759239c9196fdf9e2abcde4d90dbabb7cfa372dccd4618497c9beb8a8374b18
|
3 |
+
size 73400320
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:738341334a6e9f5b70f6b338eca04feec90b576c4d220f01d8b2598d6d6e1c7b
|
3 |
+
size 31467520
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:449589546c11200f56de204f9abe6be91f3582f3202adefa20188defb9dbe2e0
|
3 |
+
size 36700160
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44a294ec8e8cc602af91caf16e7e31441a96f203f2ac5052170469d2e508724a
|
3 |
+
size 73400320
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a08238c22bd07811bc99283eeaf0e72400bfd54cb0a37e2dc747979d5d6b2392
|
3 |
+
size 25579520
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b07cd01b8a2492c1f196a57e83ef8e1db54f5161478ec75bd4433df218bdaeb7
|
3 |
+
size 36700160
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f6d58d3e79ebd8f772831c5481cf760dd4e5f68894cf5c4c7bb140f70bd579
|
3 |
+
size 29501440
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:495fc155de9e7a1031316613014dc30b63a5424daec33df0a77c18987f05e5ae
|
3 |
+
size 36700160
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:977bc423638e2902ca69fd0e901c268b53cef855061c633d533916d9eb597db1
|
3 |
+
size 73400320
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f01406a86aec1489d5a5cfb78c118cc333bc9d5ab9445ee82915da1679b6c7e
|
3 |
+
size 31467520
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60a463e862176f5e8e92ebf2dccbe8631a396b27cb7ad746d192ac78f0591e55
|
3 |
+
size 73400320
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd2d339aca40bc337e0f53692c65a2539c639385a7c12b813fd80d998c0c9dbf
|
3 |
+
size 20971520
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed6bc9e365cf58cd53c76e92d83843ae957b18f542f4f285660d15a7b5ae774e
|
3 |
+
size 36700160
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97aa5cd27e99cd809977846196c924357f914240c97675f2be5449ff6a9ac3be
|
3 |
+
size 29501440
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e2333e3456303013733afa93459d7a92b50a4db450de631bb32a625fdf8ab61
|
3 |
+
size 36700160
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dcd7cef372e843bc13c53fd2df7a279be38484c17375fd5c8d145824025284f
|
3 |
+
size 73400320
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86577ad67c83cef4d364961ba8864c67e593527b6ff04d19baba15cd5a03cb2c
|
3 |
+
size 18380800
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:923225355e4b608ba51bcd012170f8c32047ea08fa9ba1c57813eb9d1bf1a099
|
3 |
+
size 36700160
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8442bc8babbe0ee1869e0241ea68bdf3b03b10a116da2fa4c4ab1c65c8f2501
|
3 |
+
size 73400320
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d8b2c2e80f2d0f60aebf48f3da090a22d3c99a918acf268c113d089178f6d47
|
3 |
+
size 29501440
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:780bf4b0ef18595747b4532f593157520b444e7448c213568d711e9b294d7035
|
3 |
+
size 73400320
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:236e1796d3a3af057db9b03f0f9caea8a382cade6f112c7d975a184e6b330e50
|
3 |
+
size 31467520
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:108343c3c7e52bb916294c56be3e8f9c49b8091f09e63b32f5e53f42f3c3794e
|
3 |
+
size 36700160
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:368a2e615dcce9c932d11a5525ba25856adaf5678520f7632ab7997a6094df9f
|
3 |
+
size 73400320
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:090ae854a5924e29d3093721569751ca3948061eef6acf08078b2f07dea3d1db
|
3 |
+
size 25579520
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:211af88ab14691d49522e70e97a8156e97b633e236668fab70c18ecc72e9ae27
|
3 |
+
size 36700160
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd0e4cb3e75f01c352e1cd46da29183c5134f9b08e0dd084df61c49ce80425a7
|
3 |
+
size 29501440
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:551f4388003fd5779e5ac3620cd8033dfbbb836b167e92da4d6093db1ed78925
|
3 |
+
size 73400320
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdc1a58ff74eabe9ea7834987c73b042290409617f09646557a35ec7e245d9d8
|
3 |
+
size 31467520
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6790b575da773a3ed7de24174a302abb40843e8fd384b36f8ffb27467aedc70
|
3 |
+
size 25579520
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecf1c116a7a210a72091913556e9c86503cdaf17bb9e02de54f21a8ecff3c0b8
|
3 |
+
size 36700160
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f43a7f341030266bb8a97e6d8668023ce23be9abb32262865c7e9e52911c9b84
|
3 |
+
size 73400320
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bee34cd69ca60a1ee4bcfdbe18a324d344ced5674f9dbc3fa9bacf380151e4ec
|
3 |
+
size 25579520
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88e177e09e1bcacba6360510bda2d5b85fee6df9ed9c981169264f32552cd1f6
|
3 |
+
size 36700160
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b70ec5e581e86b2c5ab652ca108f9c18df826bae43e0a4f7eb16cef4cbb37f0e
|
3 |
+
size 29501440
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c2ef74a98697dfddf3fc8d687bea0efc2ba7d61cc2f7662cd7ba7c11b30ec16
|
3 |
+
size 73400320
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ef12236f53fd7fdd8663a5f24b2d90cdfeda1fc725555c021b27263f8fd0573
|
3 |
+
size 31467520
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ce9a87d9b7bbe84ac7ccbc8c24e35b07e33123894bfdada5862366b05fad314
|
3 |
+
size 36700160
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec2b3d9f22f3c3b036be1fa342016ef3beac6e421355b9378eef4fd06d9e37a9
|
3 |
+
size 73400320
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c3b384a5d5fa8c9ccfb041d4c315b0d8a41ddb5916cb963361c8d638a8c45d7
|
3 |
+
size 25579520
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db3ed7fbb9646acdb991f067551129df577f4c2922e44c5be0acb2b684e1f7b3
|
3 |
+
size 36700160
|