ruihanglai
committed on
Commit
•
6459e62
1
Parent(s):
229ec85
init
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_0",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"position_embedding_base": 10000,
|
13 |
+
"context_window_size": 4096,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 32,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 32000,
|
21 |
+
"context_window_size": 4096,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 0.6,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 0.9,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.model",
|
33 |
+
"tokenizer.json",
|
34 |
+
"tokenizer_config.json"
|
35 |
+
],
|
36 |
+
"tokenizer_info": {
|
37 |
+
"token_postproc_method": "byte_fallback",
|
38 |
+
"prepend_space_in_encode": true,
|
39 |
+
"strip_space_in_decode": true
|
40 |
+
},
|
41 |
+
"conv_template": {
|
42 |
+
"name": "llama-2",
|
43 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n",
|
44 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
45 |
+
"system_prefix_token_ids": [
|
46 |
+
1
|
47 |
+
],
|
48 |
+
"add_role_after_system_message": false,
|
49 |
+
"roles": {
|
50 |
+
"user": "<s>[INST]",
|
51 |
+
"assistant": "[/INST]",
|
52 |
+
"tool": "[INST]"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
" ",
|
62 |
+
" </s>"
|
63 |
+
],
|
64 |
+
"role_content_sep": " ",
|
65 |
+
"role_empty_sep": " ",
|
66 |
+
"stop_str": [
|
67 |
+
"[INST]"
|
68 |
+
],
|
69 |
+
"stop_token_ids": [
|
70 |
+
2
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 1,
|
77 |
+
"eos_token_id": 2
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dedb962bc87dfe7171f75f0e126602347a8f9b6331b994946a0a12cb8b4f4a4
|
3 |
+
size 65536000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22047e093ee9a69f6842875f570540cc7a8fef6397614234e1da6fadabf031df
|
3 |
+
size 30744576
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93846694af104dfd85bb17f4444dc61d364bdb7ff71836f19228ce1d024e489c
|
3 |
+
size 25165824
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3e8a2d6e0ae41dd066d88aca92005369e87012d9268adc5e851929db1debfb4
|
3 |
+
size 22544384
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7598d6fd8e28e2224dfd096640012c71f057b24a2fc15f9827261d66f0e95730
|
3 |
+
size 45088768
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74351c8b5831f745a25167f15d106270614be3694b1745a9a3a3f409a9ce9606
|
3 |
+
size 25165824
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1c11d35662a36361d522013a027394c9ace8d9c82fcd1866da5829cf2f63ed9
|
3 |
+
size 32661504
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bbd59adc287b5819e2fe614c575eabe96069c5666cdbc5b2d18213820569d8a
|
3 |
+
size 31989760
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24c47356de927bfe4b43a6851e149f4c2d8dcf1d2bb1385bf872524845f413b3
|
3 |
+
size 45088768
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2911e97040d097a7ca06e5bb5a1e0550e98b3e7b0b898b15651b969e25e7da94
|
3 |
+
size 25165824
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73bf756d6426e68f2136c619928d3946e3bbe1702608fdad356348cb54a45ad4
|
3 |
+
size 22544384
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1315fab7fdc472dd59d4ab16e254726fedce9176de76ff4da04dc820a3209419
|
3 |
+
size 45088768
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fda97f90e0854534616ede161fa7d07f1c501cd04d7390dd1ee2238a70ee0267
|
3 |
+
size 25165824
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3bb5b214d437b15ee9a4bd5eba8d27fc8e6c42f086815d1e066f9aa033e015e
|
3 |
+
size 22544384
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21d2d3bcfbf89a6bfade041924ec58b89ea2212e3825528c99158b125224ced9
|
3 |
+
size 32661504
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7d8eae0c41d0a67689cfd576a0c03ae7a3896a8fd87e70baf8e5eac74bc3836
|
3 |
+
size 31989760
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10e8f236868420ec99315ef9a4ccc13c639d2f24b20ec6b75aedd137c016513d
|
3 |
+
size 45088768
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73178f4e6b1372576d67844e8b414ab080398998f4cf76b50dc1a7bc1839399d
|
3 |
+
size 25165824
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0b54f2729e68c4a76b70e69801912e5b93da55981bea14e615769c24974f08d
|
3 |
+
size 21045248
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99c711a186b399334f36e4869f097f5478ee13a7eeaf302beae4238233096b34
|
3 |
+
size 45088768
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad82a1d467b4b7b8994c95ec2869b4978f56dbd671cd6f858771a663c277a843
|
3 |
+
size 25165824
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91f963cf504dba45d7a0f08162277e86fc9daccfb8a6a789054de1bbfad20134
|
3 |
+
size 32661504
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:262c89dbaa3623930fe72a381a5dc34dcae3bbe1cadb65f13bd04f21fe8df625
|
3 |
+
size 31989760
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cd8fe523ec2a5a545bf2c6b74cd6781926ebc3fc7d9f6c0b46817287297b9fb
|
3 |
+
size 45088768
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3be8154e99949c9f48dcd80403669e20b84bc5a266f42a592d2c09b7c6c2f3e
|
3 |
+
size 25165824
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dac6a051d20fcdd2028f10fb2a6b270051944a4c4a18e0f1db2dbf73df6fd8cb
|
3 |
+
size 22544384
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cf0cf9510b3fef468bf4b80bab87dd6300bcfe346c0f24d2fd15b3dfb5e24b6
|
3 |
+
size 45088768
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:093834ed61cd75ae51d098c3b75b97c465683b351633221721b1f398ac08f650
|
3 |
+
size 45088768
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38ddd0e6bb21341c2f1047f0afcf45c39b25cee98d215fc132823e9bab4afc40
|
3 |
+
size 25165824
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc5fce49a5e9f9ace3392c1c40c0494fa72ecb218b101334a298e847052e6dec
|
3 |
+
size 32661504
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f50b3cdc331fd1a0fbb4f7f3f0f2b9588f4f7936d422e2bb752b460f64ca756e
|
3 |
+
size 31989760
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfcb94f8bf3e8e6f1a99f0ef838fa987624410099377acfed873c2ed6a38eef5
|
3 |
+
size 45088768
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85371dc989af7d8b9838147e919a6b147d2cd324aacde112be75a2c48ac6dec2
|
3 |
+
size 25165824
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0673fdd02e18dda0b182f9c3d564e56279988bc337f7d7a88e0421e51817515
|
3 |
+
size 22544384
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:621ca81d84ac012e5acfb09840d9ae03a8ff912f29223d8edae5878e1a15e250
|
3 |
+
size 45088768
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d959aeb79408a3e649ec41e6be63eacb83a69b002f59e6030951ccdafde7e75c
|
3 |
+
size 25165824
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b252bc57364b0105a64c2234d673e1498f7b16a670115d33460a020bbccdc36
|
3 |
+
size 32661504
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58b654596fdc4059658d1b43c1f089524b4b6ba6543543b2950497760f2eaa46
|
3 |
+
size 65536000
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d26507fb81c8afab025ebbc2127708131f7b32a24f147e982c558c02e2e5c114
|
3 |
+
size 25165824
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c08df61202685c8596103763ed52828189414556c3f081b06471bdc619ed41cb
|
3 |
+
size 22544384
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11499649671971d2610e9693a9d2aade3badcc1d665add9c1db2b2d90728cb56
|
3 |
+
size 45088768
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b12a175e8978ba3d0f1219b0d800e91b2b71c7231e5551b2fa9a454c90e3a6f3
|
3 |
+
size 25165824
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a3fac344eb8bff848e468e6ba896cd67e2e009681ed8df7f60f0341c255cc6b
|
3 |
+
size 29253632
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8b18563ddf89929c6b055c255e08f5b85783106fe638751485fbc7962c62803
|
3 |
+
size 31989760
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23981371c4f7c0fa6ca9fdf3e5d95aa6fb553e3f9a20ef19264a48f3a07feec3
|
3 |
+
size 45088768
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6606818a40252bcec21c644b8247b8d68ff69e06825a6b4e6842e2e0db7c5f6
|
3 |
+
size 25165824
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be7216cb1bc689e818b2958d890bb044941c35865a66ad06d8d51c05efc06216
|
3 |
+
size 22544384
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87b8acdbede84ffa54bbb68a669037f6af846f2801c451230dc9fc6f206565bf
|
3 |
+
size 45088768
|