Upload MLC weights
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +81 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "llama",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 4096,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"rms_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 128258,
|
12 |
+
"tie_word_embeddings": false,
|
13 |
+
"position_embedding_base": 500000.0,
|
14 |
+
"rope_scaling": null,
|
15 |
+
"context_window_size": 8192,
|
16 |
+
"prefill_chunk_size": 128,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"head_dim": 128,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"pipeline_parallel_stages": 1,
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 128258,
|
24 |
+
"context_window_size": 8192,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 128,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 0.6,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 0.9,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "llama-3",
|
46 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
|
47 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
48 |
+
"system_prefix_token_ids": [
|
49 |
+
128000
|
50 |
+
],
|
51 |
+
"add_role_after_system_message": true,
|
52 |
+
"roles": {
|
53 |
+
"user": "<|start_header_id|>user",
|
54 |
+
"assistant": "<|start_header_id|>assistant"
|
55 |
+
},
|
56 |
+
"role_templates": {
|
57 |
+
"user": "{user_message}",
|
58 |
+
"assistant": "{assistant_message}",
|
59 |
+
"tool": "{tool_message}"
|
60 |
+
},
|
61 |
+
"messages": [],
|
62 |
+
"seps": [
|
63 |
+
"<|eot_id|>"
|
64 |
+
],
|
65 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
66 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
67 |
+
"stop_str": [
|
68 |
+
"<|end_of_text|>",
|
69 |
+
"<|eot_id|>"
|
70 |
+
],
|
71 |
+
"stop_token_ids": [
|
72 |
+
128001,
|
73 |
+
128009
|
74 |
+
],
|
75 |
+
"function_string": "",
|
76 |
+
"use_function_calling": false
|
77 |
+
},
|
78 |
+
"pad_token_id": 128257,
|
79 |
+
"bos_token_id": 128256,
|
80 |
+
"eos_token_id": 128257
|
81 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c034b705ba695c6a97f36d5dea3d33d0ee1a7ce471db301d5650c6ae9514366c
|
3 |
+
size 262672384
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46206be6bec85b6466681a960c73f2f52213b1d33ef33b1939d0b0ff830bc77c
|
3 |
+
size 29360128
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45b64163c7561a8c6e5d95f3b923c1db03833802b02e0819ae6f1beff0807e33
|
3 |
+
size 33046528
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f18033e12d45c711bcb473b64e1d32257326c6b2d7393ec972e619246a4293a3
|
3 |
+
size 58720256
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7829c83eb66f216f67dd050da6ac5c6435b8923def29daad9b5b90ec991712a3
|
3 |
+
size 25174016
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33a36fae376f5d12608068eda0a61c8ab3cefe6f96e4648f3bd4923119935f8c
|
3 |
+
size 29360128
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38aebedadd7432f90b4f33efbf8b2132a0d7ac0c8ddd41a551c9a7aa1781cd26
|
3 |
+
size 58720256
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66b5a79632a8ab059378df9baf2429fea0ecd671c02c7be361b82892eba1a242
|
3 |
+
size 33046528
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:579e33d1558735b58622894e5c21c7c643bcabaa8bae9b9a0962c914259cb7d1
|
3 |
+
size 58720256
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f2f68a66f063b04c14a517410f96f96ccdb4f64094a1026720fde9760f7cc00
|
3 |
+
size 32505856
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:085fa3566e94d93e3702a6fc00a7f1cba79ca224492d4904eb1d143bde5ea183
|
3 |
+
size 9437184
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80bdf1f6251410d2cf6bd1b3ca7b4ae61f56d5cf3e8d3ed857e1321248a7a41f
|
3 |
+
size 29360128
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4793e55b91eceb4ad3525859852c749a2541dccde4156b90fe90a46768daf53e
|
3 |
+
size 58720256
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97e1ae7b9b8fb1de75e29f84c1de395b9bd578fba985efd5f83877298942af0e
|
3 |
+
size 22036480
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e05784ac52898e4aa1de326245601512e665e2d26feeb9c5bafa49c767746aa8
|
3 |
+
size 29360128
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bc3ab64cffca66324c65d559f9335b7be8519301c41fa848d43f7b50af1b630
|
3 |
+
size 58720256
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fd937d34ed2328e590111270648d190f6a80e290486e1879dda2fe4763c75d5
|
3 |
+
size 27271168
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:140a1ac31328340026993e482fc44864141e0853021a855207542ca6ae25c464
|
3 |
+
size 29360128
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b9cdb23f25c54c2dd84fc13a88e48a6fa9882c612ec17d178b6b66dccfb3cc8
|
3 |
+
size 30949376
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:093726b8cc4a0d2997a0ba49e4d0f0af5c0465c391ad603aeb35d0ebef518de6
|
3 |
+
size 58720256
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:198d676292857014ac631ca9acdb65984e1d70f170889b2b6f037fab456bdecb
|
3 |
+
size 32842240
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f891b49d39434d22cfe0ba6ce9fb9347a4b36823bcecba0837b39beef166a82d
|
3 |
+
size 25174016
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30c21fdc54de611de65d692996a98a650994711016406bb0f01ddab9ccc9c0f0
|
3 |
+
size 29360128
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:444037d3834cc814150c3e4bb240b503b4b5c0066dd2ae3dc6c505fb2664ac71
|
3 |
+
size 58720256
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a78229493b73deaa76da549d04460ac216a8b4351c96c452546a9e80e63b0dd
|
3 |
+
size 33046528
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15299964b9d2a37444f5df66f27236da182f399653fa79aefec034de8ebb23a4
|
3 |
+
size 29360128
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc37634fbacaac2b63ba5d27b9c231cc8ce8934e7dbbfdf47cef6b69e1d62799
|
3 |
+
size 58720256
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8a09cf6e971ebb553dbc93c52cdfdd80fbdd73f5bfeeb71753801900ff0420a
|
3 |
+
size 22036480
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43932ffde8ddeb48834fba02ce10be76683c821dd846cc21c5c893abc2c4edd6
|
3 |
+
size 29360128
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f69eb3ff4efee66ccdd6dcd771db7e62209f5a4f1df202222c6c306f81fa224a
|
3 |
+
size 58720256
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5aac8d86dcd57babceb43c2eb45316db140cbec7538fa8df8d1e3bd91198e22
|
3 |
+
size 27271168
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f883fd6f1b8cd23ab8b285c0a998604320a07931b00a3412f74caa6af41ed8e6
|
3 |
+
size 262672384
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fea21e8b19f608660c2506dcfa8f8e44d3c229b481abca948dfde826cb53eff9
|
3 |
+
size 29360128
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7586ad7898e8f40819ef5165e46c1280b9625b67cdfa9f522347498d04efbadf
|
3 |
+
size 30949376
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efb58b952140dd3d76a129d449cb17f88a6573c09cc801749164f453e8a9d928
|
3 |
+
size 58720256
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffb42df3154fab18612e7d6e15e81873a88e792fdac97b9244e1dbbca3e2462a
|
3 |
+
size 25174016
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15e8ceafa23e1b8335928c7b08ea7b8224f83961c2aa6303a9c3048fcdf82d8d
|
3 |
+
size 29360128
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c30a0f348a353ec6009dd7f1c97b08a3db0768c9779c0cb939918b8024aeb575
|
3 |
+
size 58720256
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36ef5a44bf5c4761736418d3c8164954c81418682a215c446f213db0f5bd8719
|
3 |
+
size 33046528
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:840166c641019a508c890503e4a6e3d0d4daa24e85871c595d8bc26e4b98e19a
|
3 |
+
size 29360128
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02a32e7d051af5048fe81d52f7b1d83e788aba2fa526fea5fac262c012846ca5
|
3 |
+
size 58720256
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f9010318d027faa7be53c6cae4c1dd31f96cbf9dfbbb009f960e6d7a6074614
|
3 |
+
size 22036480
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4b808c3ec0afdd3f056d84fc168b4f94b849fccfbd05f31f6abb62b62701359
|
3 |
+
size 32834048
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2c3381a502cfce772fb59457f2c4b69928047249c952e7e6771eafd3c39670c
|
3 |
+
size 29360128
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba00a47b7e34ae3e36f8cece3fdbc5a52795bb72b0f81612a27b00dbae1b5006
|
3 |
+
size 58720256
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:227f1b70f6f3220cb93cbc356a70b6008f5f4a3dc7534d5686ac4a7fd22f781d
|
3 |
+
size 27271168
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e030391d7437ad6f5c3ff77e913d6b87283aec4ef0714e2de91d416e090b1cc
|
3 |
+
size 29360128
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76d983e738e86d12364d34900780ac95dbcd2ed1571929d2fcbb63b9338b5a58
|
3 |
+
size 30949376
|