Add model weights
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +80 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128256,
|
12 |
+
"position_embedding_base": 500000.0,
|
13 |
+
"context_window_size": 8192,
|
14 |
+
"prefill_chunk_size": 2048,
|
15 |
+
"num_key_value_heads": 8,
|
16 |
+
"head_dim": 128,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"max_batch_size": 80
|
19 |
+
},
|
20 |
+
"vocab_size": 128256,
|
21 |
+
"context_window_size": 8192,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"temperature": 1.0,
|
27 |
+
"presence_penalty": 0.0,
|
28 |
+
"frequency_penalty": 0.0,
|
29 |
+
"repetition_penalty": 1.0,
|
30 |
+
"top_p": 1.0,
|
31 |
+
"tokenizer_files": [
|
32 |
+
"tokenizer.json",
|
33 |
+
"tokenizer_config.json"
|
34 |
+
],
|
35 |
+
"tokenizer_info": {
|
36 |
+
"token_postproc_method": "byte_level",
|
37 |
+
"prepend_space_in_encode": false,
|
38 |
+
"strip_space_in_decode": false
|
39 |
+
},
|
40 |
+
"conv_template": {
|
41 |
+
"name": "llama-3",
|
42 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>\n",
|
43 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
44 |
+
"system_prefix_token_ids": [
|
45 |
+
128000
|
46 |
+
],
|
47 |
+
"add_role_after_system_message": true,
|
48 |
+
"roles": {
|
49 |
+
"user": "<|start_header_id|>user",
|
50 |
+
"assistant": "<|start_header_id|>assistant"
|
51 |
+
},
|
52 |
+
"role_templates": {
|
53 |
+
"user": "{user_message}",
|
54 |
+
"assistant": "{assistant_message}",
|
55 |
+
"tool": "{tool_message}"
|
56 |
+
},
|
57 |
+
"messages": [],
|
58 |
+
"seps": [
|
59 |
+
"<|eot_id|>"
|
60 |
+
],
|
61 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
62 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
63 |
+
"stop_str": [
|
64 |
+
"<|end_of_text|>",
|
65 |
+
"<|eot_id|>"
|
66 |
+
],
|
67 |
+
"stop_token_ids": [
|
68 |
+
128001,
|
69 |
+
128009
|
70 |
+
],
|
71 |
+
"function_string": "",
|
72 |
+
"use_function_calling": false
|
73 |
+
},
|
74 |
+
"pad_token_id": 0,
|
75 |
+
"bos_token_id": 128000,
|
76 |
+
"eos_token_id": [
|
77 |
+
128001,
|
78 |
+
128009
|
79 |
+
]
|
80 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:857135d05507431e76ef68864ca1e838f8c44db9e76070d49bc55ff3290745cb
|
3 |
+
size 262668288
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2981c674ea795c52cb3560ed6b083efdc8000d3835eeb4258d2fa92d368268c
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32bb4c640f08430de4ef5aeee44aba6ca2513961ae5aa6ce38c55a8ef795f510
|
3 |
+
size 29360128
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bccf8d1b0a2f85e31383fdccc0e7ac8caa09d94e45d0c7f8c6140ff4eb72837
|
3 |
+
size 29360128
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66c49cbafaae13db5df2bc95c68bf1a77c8aaf0ba88e55356ab3940f0f29316f
|
3 |
+
size 58720256
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bee2d0ea9ecc2f6569bad1e06c8c1023799d170e7bbec193a58bc9c7182a14fc
|
3 |
+
size 33046528
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60127667748ef46e28b670071e314a66ae562f4eb6ded79fadcc0dd62fc0e9c6
|
3 |
+
size 29360128
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e13b9f4849c77111f49bf23673607e7a990907f0a99c1616a874669a9e45c8fb
|
3 |
+
size 58720256
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:debeda54c6abe491a39508fdea186f6b14527e85d87416adb6955bb8096b74dd
|
3 |
+
size 22036480
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25c0ce834fee1e57d221a1017c1906792511a8a3854c7568b557beea7ce83ccb
|
3 |
+
size 23592960
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72411a1ce95bee6f23842d15a55719fb5775f0b2b219730720e17cd98878d160
|
3 |
+
size 23592960
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e2781b7520034ced5b89a98e814e9812f53c4ce131fddb111d2bf5fbabe921b
|
3 |
+
size 30949376
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:011d7b54897ecd070aa61091a241c33f3bab3223526d2d2d3ad397c59305f8f4
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:776a7561ffa37f1150f8b2d5eb566c5435e456cf16f8de0120ea99cc68197144
|
3 |
+
size 25174016
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:721892a1771fd7cc14f116366b08e4311cce9b4f36e747a260f84eea01046561
|
3 |
+
size 262668288
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2328a9e043f74b15f0843a8b02637a4b1b6e5925809c2dc53dd131aeefdc2958
|
3 |
+
size 32833536
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0a90f4f68e9c81c85c7917885655e06ddef610d1320b716e154af9b4d934c70
|
3 |
+
size 29360128
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c41c137040565fb754fb207e90efc1a86ef105963eeb320e6fd4fa168a8819bb
|
3 |
+
size 58720256
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78a601d0781f6582c0038c69b279cbdbe5745e13a11a5898c42967e614c81704
|
3 |
+
size 33054720
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9da18e6dcdcf66ba92571777ab103454fc015f40cdd33285f7ca6db13884ff66
|
3 |
+
size 29360128
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e41aa0f79f5eaee1028c72676620880387da4675bd02f9be04791d35adeee8b
|
3 |
+
size 32841728
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74b7911c97552ac12667b22c644bbe492005104edbb5deb62dc703a588bb22b1
|
3 |
+
size 58720256
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcb45d24a727acb75dea3faeadd71c6799feb0cb1745ac9a8f377d3072801f1a
|
3 |
+
size 22036480
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d0b82dc970cd1e729011a647b9456d610648bd1a19e7f43ed1448822d7941b9
|
3 |
+
size 29360128
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b7a537c59f9a6fbefc0a182caf4a152be997aa96d6677fcbcb7dc317b65c3d0
|
3 |
+
size 58720256
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d40f77195460c6dec23e98d565afd81111fd3185fcde203e56ddbdc7e95e18d
|
3 |
+
size 27271168
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b15c6929a8669278ee4b9da89a29cd6165198803be2590cb221d342ff7abed69
|
3 |
+
size 29360128
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1240b65ede2c3ac18c26e44bb642818926d068477a7b4f2504577f6b559ffa7f
|
3 |
+
size 30949376
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeb18791f603ca1179287a6f86eb73d91631f70fbba27e8928f6d2e05d3fe427
|
3 |
+
size 58720256
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15e9bdb63dafea50100dc37b0dbfc98018cf23f28d0bae63957a7c6c12a30a3a
|
3 |
+
size 25174016
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de0bff2eec54891eae88d88a06c3ea1b56f65d834cdd95af94029c6090796a98
|
3 |
+
size 29360128
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47605db8276b2353b88a0ad13c6db6ec50daaa500a38cc02fd0daca9d339831e
|
3 |
+
size 58720256
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa205a817002deb0d3a4bd83887cee3222444ef6c1c56af34697f4f793fa6349
|
3 |
+
size 58720256
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b8fdf1e88bce8b93f8cdd234935cc4c8d9b41d4b631e46696cb20cdf11cac0b
|
3 |
+
size 33046528
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dc565bd6a05ff75b7f35a4850472e35d1b3ae17c3b21792b5e1f322ae94c981
|
3 |
+
size 29360128
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09df1db31951ba2079f574751f9e600c274285d5d18035a1fd9e55e009fcfe03
|
3 |
+
size 58720256
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0761d39c72930427eed8cc552f89eb4d4eab72cf8bbbb268a1bb555c4cdb718c
|
3 |
+
size 22036480
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79004078dadc09fe810e619fe1db8ba563dd6d92f152443e25f07b25ab4cd426
|
3 |
+
size 29360128
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f819c3c50b4c6e7a324e811bf63ad8e05c96291b608078e071d4a5b063b3d3ce
|
3 |
+
size 58720256
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ecfd682d9abbc804d3b345ecc18e6b2b050b36629b17629f27dce1431cc85e8
|
3 |
+
size 27271168
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67ae606f5dc36996dd7de664f0acd37e1d89adcd5d6b565cad0b072498be03dd
|
3 |
+
size 29360128
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e824ac5d1d0353cd150ea13d3575f057f653556986202b7c231c65102632ede3
|
3 |
+
size 30949376
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a32364b39110504129a3867f4c682150e4ac9491f252639c349c02b62309d6eb
|
3 |
+
size 29360128
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df7cf86f8737a99b78988fbce47678b3a1e8cadd71e005fb50a6d6f40ca017bb
|
3 |
+
size 58720256
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8046b6fef1e627a063ccab0b8cbdd98644eb1ff1329de2cd436ebb7b38ad1bb
|
3 |
+
size 25174016
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a37bd28abd311301bad5cb51e641a4119e370c87672a5d07a64122a9a3f0368e
|
3 |
+
size 29360128
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e92c9eb0fc75f40834973350f42eef25d0fd6a2ec3e9f78a62bc00fc58986f71
|
3 |
+
size 58720256
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb2b383c6c46347a66484c6ed7cd91cae6f1ba1e3ff5b9b05bba588d3b5af507
|
3 |
+
size 33046528
|