Upload 247 files
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_140.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "svdllama",
|
4 |
+
"quantization": "q0f16",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 11008,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-06,
|
11 |
+
"vocab_size": 32000,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"rope_scaling": null,
|
14 |
+
"pipeline_parallel_stages": 1,
|
15 |
+
"position_embedding_base": 10000.0,
|
16 |
+
"context_window_size": 2048,
|
17 |
+
"prefill_chunk_size": 2048,
|
18 |
+
"num_key_value_heads": 32,
|
19 |
+
"head_dim": 128,
|
20 |
+
"tensor_parallel_shards": 1,
|
21 |
+
"max_batch_size": 128,
|
22 |
+
"ratio": 0.6
|
23 |
+
},
|
24 |
+
"vocab_size": 32000,
|
25 |
+
"context_window_size": 2048,
|
26 |
+
"sliding_window_size": -1,
|
27 |
+
"prefill_chunk_size": 2048,
|
28 |
+
"attention_sink_size": -1,
|
29 |
+
"tensor_parallel_shards": 1,
|
30 |
+
"pipeline_parallel_stages": 1,
|
31 |
+
"temperature": 1.0,
|
32 |
+
"presence_penalty": 0.0,
|
33 |
+
"frequency_penalty": 0.0,
|
34 |
+
"repetition_penalty": 1.0,
|
35 |
+
"top_p": 1.0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.model",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"tokenizer_info": {
|
41 |
+
"token_postproc_method": "byte_fallback",
|
42 |
+
"prepend_space_in_encode": false,
|
43 |
+
"strip_space_in_decode": false
|
44 |
+
},
|
45 |
+
"conv_template": {
|
46 |
+
"name": "LM",
|
47 |
+
"system_template": "{system_message}",
|
48 |
+
"system_message": "",
|
49 |
+
"system_prefix_token_ids": [
|
50 |
+
1
|
51 |
+
],
|
52 |
+
"add_role_after_system_message": true,
|
53 |
+
"roles": {
|
54 |
+
"user": "",
|
55 |
+
"assistant": ""
|
56 |
+
},
|
57 |
+
"role_templates": {
|
58 |
+
"user": "{user_message}",
|
59 |
+
"assistant": "{assistant_message}",
|
60 |
+
"tool": "{tool_message}"
|
61 |
+
},
|
62 |
+
"messages": [],
|
63 |
+
"seps": [
|
64 |
+
""
|
65 |
+
],
|
66 |
+
"role_content_sep": "",
|
67 |
+
"role_empty_sep": "",
|
68 |
+
"stop_str": [],
|
69 |
+
"stop_token_ids": [
|
70 |
+
2
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 1,
|
77 |
+
"eos_token_id": 2
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29815774f62ac838ba8e8efdfca108bc1de046f4424492dc7dc64d87fa34e6f6
|
3 |
+
size 262144000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d0c7bbaf979f748cde2079238e14a14bb15171454963fc8b394d7fc8c5d8bc7
|
3 |
+
size 39430656
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b4bf60cfdf89497eae1d0256db0b4fe71bb37ae72a8273d8c9a19ad51f7d1e0
|
3 |
+
size 30179328
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:156f42791b22a336534b02faa899d0f179f0781d130a21d7dd93df3644b98e75
|
3 |
+
size 30179328
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50d942fd076a97a33df7306ef557190ce303e6eee324bb99c318f503ef2199f2
|
3 |
+
size 30179328
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eff6ea43770dbe022aafa97acf7b7e6daf04e7e044b2d1eb76c77d24f5461074
|
3 |
+
size 20127744
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cdba9fcbe81814fa014156c32ec95a4338eeda816900075b3f857c92c907f90
|
3 |
+
size 39430656
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a670fc8956ee5a05a35245340a573b938457fb9e8504238fec735969d8603c7a
|
3 |
+
size 39430656
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:003f05eaa7d75f740714fa103757398ada6091acf095024e02d0c36fc2b2365d
|
3 |
+
size 39430656
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64aa499b411ace5bcedd155fefb4281c8bf5158996908d1a7041a39cf572cac1
|
3 |
+
size 29343744
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1765c30470bff7118409d31e9d2cea9c185b644adff1af83f52d4ca974f103f
|
3 |
+
size 24739840
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaa5fab8b0534318fd3048cfaac5a617ae3fddc31322cd7b3c5137b24ed6f4d1
|
3 |
+
size 30179328
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:387ebbbc4217d45c5bacb102f8fe29649d580a3b7c91d464e9fbfe72c95c2c20
|
3 |
+
size 30179328
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:228dfcc20d5fec66ea6bb54d10c510b1ceeb98e25fc498f8b0c417a659749832
|
3 |
+
size 20127744
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a0814a35ef7e73b55b68704c3e92d964d21d73288050e2c1caa59bdb04d2d7d
|
3 |
+
size 39430656
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40d55ecf9c1c6e6a4d911229b949d64f3904c6c6905b0f6f4d6a8cdb22703807
|
3 |
+
size 39430656
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3517cc9a503f2bfcbe850f3c90d04b834505f62bc721e075b8725e02ffa1f976
|
3 |
+
size 24739840
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:148ffc324c19963550aae3aad68c2b52a01d59090396d71bbe9468891ba53ac3
|
3 |
+
size 39430656
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:058560adcf9f6fd2834ae2c53d3e8a09b2b4201730ec39989570a11eff2a5edd
|
3 |
+
size 29351936
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18da4e6c019795597596de0a3fa3b716007f4f8721d68840a70413155ec66edf
|
3 |
+
size 30179328
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6e1b62b21eaeddbe1816e55a7c89ed1b0b2c8eb22411b7c5d1bfacbb3a2642c
|
3 |
+
size 30179328
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6525c6bde8656680ee9a8b1026759a252376bdb97a677d169df46281f5ad6b9d
|
3 |
+
size 20127744
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea96233e50c3c6fd1a94a2aab51b101ab1ca931757132bf774969fbf9f18388b
|
3 |
+
size 39430656
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8202045330d2fe7b5790a420e106523264372c57131c0f4641be0e4888999b25
|
3 |
+
size 39430656
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b8e207fde303c403285515d4917d50f4dcc408b9685b0fe79255116393226b0
|
3 |
+
size 39430656
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc919deb15432f1950dc44bd8b4b3e36704fd79f875500521cf5588316201c1c
|
3 |
+
size 39430656
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a7ed66d19f048a7c6e0e689c30934aa69286449dfbc6ef3378c6767658e011b
|
3 |
+
size 29343744
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2540a27df7d9f301aea2c391fb65bc2c3fe4e7a26b534c9f67794950a516c41f
|
3 |
+
size 24739840
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c4aeeb5e2700175f5a047213c21f38338f366d05b08b5103ba85d44e461857f
|
3 |
+
size 30179328
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63744658689c95bb002a6522ea777dc590212a3306efd7e3891ceee8a2b3abef
|
3 |
+
size 30179328
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59446c1a823e38e48d08bc4a9228a621cdebe6f4c1a03b135a272395c985efd0
|
3 |
+
size 39430656
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee91f71d5b7497b1e0e2cc80984083e49fc4a201a170477fbd6ecedd8c6bf9ec
|
3 |
+
size 39430656
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e617d490de34c4595e80615313d8b6a6ce42c85f25596a5252418c7de7de03f
|
3 |
+
size 24739840
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d096fbc7783469905eeccb5941bf65c1830d8b3782a963085546f55313724f33
|
3 |
+
size 39430656
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d6b9c4220969af149128ca9925f666c2b54aa95252d55b10ef474f82bd2e4d
|
3 |
+
size 29351936
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bdaf413dfa62481ce22ea279f9755dc7e8acc251a8e56ca6dcc05870cfe949f
|
3 |
+
size 39430656
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0abb461332e958225dcdcc681aea21c4fb0167123dbe780b2b8816c218360ee
|
3 |
+
size 30179328
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aeb7297ed66fa6e938433be7ed68ca77eed567d18b0f7565c1277138c7f69b2d
|
3 |
+
size 30179328
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33fdea2a9ebb44c06f9a8c645d2fbd108d6e44f8de95849b5aceb91051663072
|
3 |
+
size 20127744
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:185873737f52b4852009312f58ed13ae9a2b3ff5b147b17d132be254da9852c8
|
3 |
+
size 39430656
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13085c705d565fb4d635563ede30c56a1b02f44d2a465d20b264053a5c7cc9de
|
3 |
+
size 39430656
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60b2e71362e4e0a5bf34195125b28868233f5b3bc281075b66cbaaf65a25c364
|
3 |
+
size 39430656
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c665cd18b50a3255ca011016f255f4b49bb8c755718165983cbcba8db94c1dc
|
3 |
+
size 29343744
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3746c36cc3b030cba7858ed67314c06e096cbce762fa7975ea99877df69a503
|
3 |
+
size 24739840
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83da8e4ef6541564ee8fd13a17483e8ee5ceed9b02d18a7a645c81c97b6d7afb
|
3 |
+
size 30179328
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a22798521b94de1396334eaec24b4ea1ec156fd6b42087e68e72fa51200118b
|
3 |
+
size 30179328
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45e8288fc0761f49591a1d90c5717913892972124bc44b9f985abcf8023ea71f
|
3 |
+
size 39430656
|
params_shard_140.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec36888bee6e1b5cadf1f7004d15dfd1f6959415e8a98ca4b34538199ed198aa
|
3 |
+
size 39430656
|