Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +100 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,100 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "deepseek_v2",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"vocab_size": 102400,
|
7 |
+
"hidden_size": 2048,
|
8 |
+
"intermediate_size": 10944,
|
9 |
+
"moe_intermediate_size": 1408,
|
10 |
+
"num_hidden_layers": 27,
|
11 |
+
"num_attention_heads": 16,
|
12 |
+
"num_key_value_heads": 16,
|
13 |
+
"n_shared_experts": 2,
|
14 |
+
"n_routed_experts": 64,
|
15 |
+
"num_experts_per_tok": 6,
|
16 |
+
"norm_topk_prob": false,
|
17 |
+
"first_k_dense_replace": 1,
|
18 |
+
"moe_layer_freq": 1,
|
19 |
+
"routed_scaling_factor": 1.0,
|
20 |
+
"attention_bias": false,
|
21 |
+
"kv_lora_rank": 512,
|
22 |
+
"qk_rope_head_dim": 64,
|
23 |
+
"v_head_dim": 128,
|
24 |
+
"qk_nope_head_dim": 128,
|
25 |
+
"rms_norm_eps": 1e-06,
|
26 |
+
"rope_theta": 10000,
|
27 |
+
"q_lora_rank": null,
|
28 |
+
"rope_scaling": {
|
29 |
+
"beta_fast": 32,
|
30 |
+
"beta_slow": 1,
|
31 |
+
"factor": 40,
|
32 |
+
"mscale": 0.707,
|
33 |
+
"mscale_all_dim": 0.707,
|
34 |
+
"original_max_position_embeddings": 4096,
|
35 |
+
"type": "yarn"
|
36 |
+
},
|
37 |
+
"context_window_size": 163840,
|
38 |
+
"prefill_chunk_size": 8192,
|
39 |
+
"tensor_parallel_shards": 1,
|
40 |
+
"dtype": "float32",
|
41 |
+
"max_batch_size": 128
|
42 |
+
},
|
43 |
+
"vocab_size": 102400,
|
44 |
+
"context_window_size": 163840,
|
45 |
+
"sliding_window_size": -1,
|
46 |
+
"prefill_chunk_size": 8192,
|
47 |
+
"attention_sink_size": -1,
|
48 |
+
"tensor_parallel_shards": 1,
|
49 |
+
"pipeline_parallel_stages": 1,
|
50 |
+
"temperature": 0.3,
|
51 |
+
"presence_penalty": 0.0,
|
52 |
+
"frequency_penalty": 0.0,
|
53 |
+
"repetition_penalty": 1.0,
|
54 |
+
"top_p": 0.95,
|
55 |
+
"tokenizer_files": [
|
56 |
+
"tokenizer.json",
|
57 |
+
"tokenizer_config.json"
|
58 |
+
],
|
59 |
+
"tokenizer_info": {
|
60 |
+
"token_postproc_method": "byte_level",
|
61 |
+
"prepend_space_in_encode": false,
|
62 |
+
"strip_space_in_decode": false
|
63 |
+
},
|
64 |
+
"conv_template": {
|
65 |
+
"name": "deepseek_v2",
|
66 |
+
"system_template": "{system_message}",
|
67 |
+
"system_message": "",
|
68 |
+
"system_prefix_token_ids": [
|
69 |
+
100000
|
70 |
+
],
|
71 |
+
"add_role_after_system_message": true,
|
72 |
+
"roles": {
|
73 |
+
"user": "User",
|
74 |
+
"assistant": "Assistant"
|
75 |
+
},
|
76 |
+
"role_templates": {
|
77 |
+
"user": "{user_message}",
|
78 |
+
"assistant": "{assistant_message}",
|
79 |
+
"tool": "{tool_message}"
|
80 |
+
},
|
81 |
+
"messages": [],
|
82 |
+
"seps": [
|
83 |
+
"\n\n",
|
84 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
85 |
+
],
|
86 |
+
"role_content_sep": ": ",
|
87 |
+
"role_empty_sep": ":",
|
88 |
+
"stop_str": [
|
89 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
90 |
+
],
|
91 |
+
"stop_token_ids": [
|
92 |
+
100001
|
93 |
+
],
|
94 |
+
"function_string": "",
|
95 |
+
"use_function_calling": false
|
96 |
+
},
|
97 |
+
"pad_token_id": 0,
|
98 |
+
"bos_token_id": 100000,
|
99 |
+
"eos_token_id": 100001
|
100 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58bef94f47e3f00df16df141b0fcc29092b3866998b87640c92f43d43327e4aa
|
3 |
+
size 104857600
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98f02a99345a887878493d91180a06d6b30228fe73b5c0a034a10347c2a81b0f
|
3 |
+
size 104857600
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc0b6aca01de02a697064e77d8e9d7c658764fbebc0efbd51bb241004d25cc6e
|
3 |
+
size 92274688
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3adade9eff5a6e5e9a8891d927faec1b66c7c33597b2279091d4bc97430dc53
|
3 |
+
size 184549376
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0a3ccd1da5eec0f6950903a99f746f0ebc3fd1459e62290a7a0383ce4d44e05
|
3 |
+
size 23068672
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ba023e276e6139558d1838deac37af97618b4873b2999bc2398157e79713c51
|
3 |
+
size 92274688
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3ae2bc23ed85a73b7fea53f7c186d813cdfd46b281841dd14323ee81e1c7db4
|
3 |
+
size 29279232
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:365386e59aaa1e0a92afcec044f13d2627db6a0f80b8a9328823144fcd334799
|
3 |
+
size 184549376
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19593fc62d3fc794436ea52e3ddaf0c156724cffdcfde424dc46d460d37c62a2
|
3 |
+
size 23068672
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39ecde72839a5dce594ceda33cb36f93d13eec17b22cf1e9ae4fcc286b30b295
|
3 |
+
size 92274688
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e86563b0196d8cab54ed3cde41b5ad35033e9d2b465a7b7670d063a877bbb74
|
3 |
+
size 29279232
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d8db0b39ba15a0394ab9d3cd1b468321e72eb187dcc6a08b6b3d57e59392fe5
|
3 |
+
size 11542528
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca593c94db3d4520dbe8fbe4b89f35019a73547dcf5519884cf39a9dd5efad08
|
3 |
+
size 29279232
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58692f31c20477dd6f48033427f8586edc5a3ef68c52652d7b963430fd67fdfe
|
3 |
+
size 184549376
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bda294953f03ef9d52a1e55972c121c0d2d1e39133180cb8530cbf5df3e2e72
|
3 |
+
size 23068672
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09cbc2373b9672f18488cac73afdabf02610eb7cf3b8803a9c662b37fd02bdc5
|
3 |
+
size 92274688
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3df4cb478ac8e3612cbe13389bc61f87f007b8004e664d282235f524ecbacf64
|
3 |
+
size 29279232
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa4e9f2c5034a80759b782084deb2dcbadea83ba7e00a684dcdc6538c7203450
|
3 |
+
size 184549376
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:339d2aff30041b8245d482b869efd06840c2c876c6f95474663aecefc97e56f9
|
3 |
+
size 23068672
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f60d1cd5716f34e0b6c3da3d11afab8a876fb1ad20f39e8e33b04a46bbe1c0d3
|
3 |
+
size 92274688
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f119458239fd510939817bbf2daab6827ab1ad00368a5e39fd56e39eb8129e23
|
3 |
+
size 29279232
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb83dcc7c4df277516e1cc6246c3bb17db17ebb4a8c4f548b3b05b835ed6dbb4
|
3 |
+
size 31601664
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58501f3e2476cb773943491e75827efc8cdd9c3c3782b740ca7ffabdaccb81b7
|
3 |
+
size 184549376
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6d78b6c96b767c77cdf647cd90bc78e3e9d7459b383045241d81da8b1430feb
|
3 |
+
size 23068672
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ec2f44ddf9cd62444fadae530798985954cb4745d76bc7d54e4c0f5cd9a56a1
|
3 |
+
size 92274688
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecb9986e8aa55a6fc765578813dced5266516705e7392cf3166947e6f48fa230
|
3 |
+
size 29279232
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:650da1ef81d4e7212b8b605538facf9ba6521c6480267c3da2e481603c99db5d
|
3 |
+
size 184549376
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:249cddcfd341860f9aa55ef4c8c5f08a0a5f69eb51eca52ce6586a916be6a7cd
|
3 |
+
size 23068672
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50fbe71e0d154aa209bd10e79849492639cd86510047626a5d94ec0bf549b552
|
3 |
+
size 92274688
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:098524d143293dc83fbed0935bd997c166fe823d8868d112bf1593048b04499c
|
3 |
+
size 29279232
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3da67a1405e2119683f37eb6d2abb65813c301e8a457589f62c2854c3c877a7a
|
3 |
+
size 184549376
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e9dc45dc3c80576e0fea9d5f90a7fe44f14d846eefce73dae41c2ee18eb36e8
|
3 |
+
size 23068672
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4d1ead56b3e3483934fd328f918e14914adeeff352833b9ad3e9ec4e995ba75
|
3 |
+
size 27574272
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a482a07af1d791afd0e95278fae0f7c7b133cd65f62243a8cddadf584b81296
|
3 |
+
size 92274688
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26db7a6b7baf3ba7f6b4b396af3cd525dc7c3cc115154411e4691fe78d07e5f0
|
3 |
+
size 29279232
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49f3ee0c50474524e75b99d28715c80819a77326fe66997d6aa6038a7082e293
|
3 |
+
size 184549376
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e439eb088fa8636653bb56e94a4c3b5a4b29aed85292dedf0a1897de553ba6f6
|
3 |
+
size 23068672
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82afeb1ee96ac116f6ed060c3c18bd4b39a2052abee02cc56610d9745a73dbb1
|
3 |
+
size 92274688
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aa5e20783f07a527d7905ea7ddfeda06543c9fe81fce8100ef0497162ee3130
|
3 |
+
size 29279232
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeec3ba3c1eb8f810eabf4469fae29a21adfab0dc567ee1b14de8bcc15a0383d
|
3 |
+
size 184549376
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57a8df94b13e3d6aab108cbc52bd276dcd7736e5ab5f6de7f5db38bb9efda6f7
|
3 |
+
size 23068672
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9d68b95b16535532b942f9dede89ccf8c7f89e121d0eaafd75c4a398c64be36
|
3 |
+
size 92274688
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37212807c1857a7adc56e0bc382ea6eb10381319f7ea39e16649439842c24af7
|
3 |
+
size 29279232
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b9391ed25af742d8d0e5921a034a7398bde3d075988de14fbdd8d81b8c54c53
|
3 |
+
size 184549376
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90402dc35180173f939ddec2cce52c531411432f29c01015127874664516c671
|
3 |
+
size 184549376
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b456f546c6a5099f9d57b3e87ec5ba43fc8b98d188724565afa83dd7c7a3b72
|
3 |
+
size 23068672
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69785e51fcb0466b1380dddfb3ff0a825cd7b2e72d03bfd9afc9052badb10623
|
3 |
+
size 92274688
|