Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- merges.txt +0 -0
- mlc-chat-config.json +40 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_bigcode",
|
3 |
+
"quantization": "q3f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"n_embd": 6144,
|
6 |
+
"n_inner": 24576,
|
7 |
+
"n_head": 48,
|
8 |
+
"n_layer": 40,
|
9 |
+
"n_positions": 8192,
|
10 |
+
"layer_norm_epsilon": 1e-05,
|
11 |
+
"vocab_size": 49152,
|
12 |
+
"context_window_size": 8192,
|
13 |
+
"prefill_chunk_size": 8192,
|
14 |
+
"tensor_parallel_shards": 1
|
15 |
+
},
|
16 |
+
"vocab_size": 49152,
|
17 |
+
"context_window_size": 8192,
|
18 |
+
"sliding_window_size": -1,
|
19 |
+
"prefill_chunk_size": 8192,
|
20 |
+
"attention_sink_size": -1,
|
21 |
+
"tensor_parallel_shards": 1,
|
22 |
+
"max_batch_size": 80,
|
23 |
+
"mean_gen_len": 128,
|
24 |
+
"max_gen_len": 512,
|
25 |
+
"shift_fill_factor": 0.3,
|
26 |
+
"temperature": 0.7,
|
27 |
+
"repetition_penalty": 1.0,
|
28 |
+
"top_p": 0.95,
|
29 |
+
"conv_template": "LM",
|
30 |
+
"pad_token_id": 0,
|
31 |
+
"bos_token_id": 0,
|
32 |
+
"eos_token_id": 0,
|
33 |
+
"tokenizer_files": [
|
34 |
+
"tokenizer.json",
|
35 |
+
"vocab.json",
|
36 |
+
"merges.txt",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"version": "0.1.0"
|
40 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15ca670a6f0a3ccb8207659c2a2c6826d49b4643647c3759706f7e5f036c889b
|
3 |
+
size 121110528
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0fd7576f7486176d3673abde4e288e7243f7bb60fce5d9ca5f679988959a3d2
|
3 |
+
size 60555264
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ce8cb6fa68ccf3bc97445897e22a5bbe137f41ea39d38cdc72851dec7080369
|
3 |
+
size 60456960
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:949383c191a8a3148bad56a54ad8aeac6c5b0eae1b4ec0f4243e453a5aede576
|
3 |
+
size 60456960
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec27eb74b19ef22637bb1aca686d2359193b2e72a587f06474521c9410699ab4
|
3 |
+
size 32281088
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c00da470581e9499d301058638fd2b5e8af8058bff271b5adca634cd501cb4ee
|
3 |
+
size 32916480
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:245d4ba12939c60bc08ec937a6b6735d3c903b5fd73b6c95efe5d5a0b00a9407
|
3 |
+
size 60555264
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d2800eb2767e61300dc679e768269e0c6f97603373b355aeeeea7fa65857fb6
|
3 |
+
size 60456960
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83b5cb7eb124dd23f851c192ba2ef9593a6f4f330c7bdd730d9ab55190b74da8
|
3 |
+
size 32887296
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38bef13cbdd301b66e1fffbaba810fbba336842562b8ec8686a05ac98cf11927
|
3 |
+
size 60555264
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fb8d57d792b771fd9627c69fb9fada6fd8c000d6b1a18412d551185c25a4775
|
3 |
+
size 60456960
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:264bc53b1c6ecba4d5329079d0850fa2a7e20d74b7012cd6d09e02e5ee5cf382
|
3 |
+
size 26694656
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5300a80eb168c3e4266cf708b091278341e137ce513ea7ebb4c53db062ac0703
|
3 |
+
size 25323008
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f96cafa0a5117635b55a001076443dcba59f0293cee53664dd374f41f594cec
|
3 |
+
size 32911872
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ba81918fd58f28632a0428bee819a92c84dcde8925c9a06195267b23c16ae1d
|
3 |
+
size 60555264
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df0d84fad37731c69f691fe33bb7446f0ddf9902fa4d77665b9bdd6638196b4d
|
3 |
+
size 60456960
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b508561e07eb400ca2f6fdf965de896aa98b4e3e8528a244fb2b9c1659bd5eab
|
3 |
+
size 32281088
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:885fca677ceafa212d8bf8c5aeaccc3946bc4992871f9f4959bbec197ef2c04d
|
3 |
+
size 32891904
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17e589acd5ed5644cf38f63b69a7e9e4a7600774d52ec526cbce86b5f7720e97
|
3 |
+
size 60555264
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86d41d28589b4531d3b9e1a8d9ad48ef3a2cc67144d0dc71b45e46f62f9b51e3
|
3 |
+
size 60456960
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c34930168f480b872a174211c38229ca3a8784e8b87a2bc56210c617d435a9f
|
3 |
+
size 32911872
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07b2d5db1033e924c4efea8652d30450cfdf447ec8c2c78c276a834ff31fddb1
|
3 |
+
size 60555264
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:375f0d232ad4bd1fc7ae090bb0ffa6fcfb3dfdc8f952cd8ad967316944aec9b1
|
3 |
+
size 60456960
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:116c1e9df56d53181b9d5e0fe5ede0d1fd0b35dce4d897a787929eb30895c842
|
3 |
+
size 26694656
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:825d97d2b5ab1f9cde910097ffdeca0f863e86a3a8bec2d7a32e4b27abd459a3
|
3 |
+
size 60555264
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:942dc40a3b3c69d39550f37e4ca087966a6ac013c0fe3fe325e744c16234297a
|
3 |
+
size 25323008
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc7ee276cd114720cc3653decba13e43c90f087174b3ae4c9ad6361d49154749
|
3 |
+
size 60555264
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d210f8ea46d095528f2c42cd08a8e3c691e962a25bbc5cf4c1ce8cb19f73c066
|
3 |
+
size 60456960
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ba1d96111877e5ceae266bfb08d9ff52c5e5b8e9840acd73ebdad556594c3d4
|
3 |
+
size 32281088
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ee1f7cc8911d175742f56444ce1dbfc065ce9b782e98e8c2d12ef7c17cd0245
|
3 |
+
size 32891904
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:891b5ec811fe70107138335a6cdc5f76457fea8bf4e01427e449c018e3ea3ad4
|
3 |
+
size 60555264
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55357a214808152b5bc343fe63f0dd2ad1967efd57fb5af9186fd9c2f30c002f
|
3 |
+
size 60456960
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe7144cd9da62f7ad6d731f56f175df215b8eda085f9c9721fa41463ced469f9
|
3 |
+
size 32911872
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:320d67922c785f4d130a02ff05a977089e6fe3e957d9c459354f6340b046fb7a
|
3 |
+
size 60555264
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de43a38b133134d75c835c2d865093ada32c15ba46c37d030bd020cfd89f5377
|
3 |
+
size 60456960
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e95142d0c2641449f57a3f70e97b528f3893b769c6ac63ac4485fcadb18337ae
|
3 |
+
size 60456960
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50501f8f83c00741698cc86f961d0fd0d416dc5ec54270a8f30db7a5c583c7e1
|
3 |
+
size 26694656
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdb93a1bf779c3f6f6daa3772978a548e77655c3b1916f751fcd43f7dd13bf50
|
3 |
+
size 25323008
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aea794f328a7b825de99e53ce9044bdbfd7520489dce395fa2e8a9d69a9de196
|
3 |
+
size 60555264
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaf1a1e740ffe61c39f02d7b1cf455a9b8dce6b3b62642ddac61c74874121fda
|
3 |
+
size 60456960
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6b09dacd9c4dd441aacf160a136177a2f77e580e7b5e30190e03efc666854
|
3 |
+
size 32281088
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c4a1f6dbe753f78d40b87dfdb555d74aa0884139498db240e2bdf0970ff7951
|
3 |
+
size 32891904
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea9f007924f39af0817dec871ef9f9a8b1589898dbfa7754eeed4ade1af94f51
|
3 |
+
size 60555264
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15952b62598b4632f2476cae3cbaea9fa188fb0d83678b981fd3c7702c5b8850
|
3 |
+
size 60456960
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99decd2473b82808ab1aa64f8f6d097712dd549536685223c2684a13bccc9bd5
|
3 |
+
size 32911872
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e37f777bf4f1b33072402357d5ab621f8ab2580f5e36c8e6ad5686d7e64d9531
|
3 |
+
size 60555264
|