riczhou committed on
Commit
f492e43
·
verified ·
1 Parent(s): 73370e8

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
mlc-chat-config.json ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "deepseek_v2",
4
+ "quantization": "q4f32_1",
5
+ "model_config": {
6
+ "vocab_size": 102400,
7
+ "hidden_size": 2048,
8
+ "intermediate_size": 10944,
9
+ "moe_intermediate_size": 1408,
10
+ "num_hidden_layers": 27,
11
+ "num_attention_heads": 16,
12
+ "num_key_value_heads": 16,
13
+ "n_shared_experts": 2,
14
+ "n_routed_experts": 64,
15
+ "num_experts_per_tok": 6,
16
+ "norm_topk_prob": false,
17
+ "first_k_dense_replace": 1,
18
+ "moe_layer_freq": 1,
19
+ "routed_scaling_factor": 1.0,
20
+ "attention_bias": false,
21
+ "kv_lora_rank": 512,
22
+ "qk_rope_head_dim": 64,
23
+ "v_head_dim": 128,
24
+ "qk_nope_head_dim": 128,
25
+ "rms_norm_eps": 1e-06,
26
+ "rope_theta": 10000,
27
+ "q_lora_rank": null,
28
+ "rope_scaling": {
29
+ "beta_fast": 32,
30
+ "beta_slow": 1,
31
+ "factor": 40,
32
+ "mscale": 0.707,
33
+ "mscale_all_dim": 0.707,
34
+ "original_max_position_embeddings": 4096,
35
+ "type": "yarn"
36
+ },
37
+ "context_window_size": 163840,
38
+ "prefill_chunk_size": 8192,
39
+ "tensor_parallel_shards": 1,
40
+ "dtype": "float32",
41
+ "max_batch_size": 128
42
+ },
43
+ "vocab_size": 102400,
44
+ "context_window_size": 163840,
45
+ "sliding_window_size": -1,
46
+ "prefill_chunk_size": 8192,
47
+ "attention_sink_size": -1,
48
+ "tensor_parallel_shards": 1,
49
+ "pipeline_parallel_stages": 1,
50
+ "temperature": 0.3,
51
+ "presence_penalty": 0.0,
52
+ "frequency_penalty": 0.0,
53
+ "repetition_penalty": 1.0,
54
+ "top_p": 0.95,
55
+ "tokenizer_files": [
56
+ "tokenizer.json",
57
+ "tokenizer_config.json"
58
+ ],
59
+ "tokenizer_info": {
60
+ "token_postproc_method": "byte_level",
61
+ "prepend_space_in_encode": false,
62
+ "strip_space_in_decode": false
63
+ },
64
+ "conv_template": {
65
+ "name": "deepseek_v2",
66
+ "system_template": "{system_message}",
67
+ "system_message": "",
68
+ "system_prefix_token_ids": [
69
+ 100000
70
+ ],
71
+ "add_role_after_system_message": true,
72
+ "roles": {
73
+ "user": "User",
74
+ "assistant": "Assistant"
75
+ },
76
+ "role_templates": {
77
+ "user": "{user_message}",
78
+ "assistant": "{assistant_message}",
79
+ "tool": "{tool_message}"
80
+ },
81
+ "messages": [],
82
+ "seps": [
83
+ "\n\n",
84
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
85
+ ],
86
+ "role_content_sep": ": ",
87
+ "role_empty_sep": ":",
88
+ "stop_str": [
89
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
90
+ ],
91
+ "stop_token_ids": [
92
+ 100001
93
+ ],
94
+ "function_string": "",
95
+ "use_function_calling": false
96
+ },
97
+ "pad_token_id": 0,
98
+ "bos_token_id": 100000,
99
+ "eos_token_id": 100001
100
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58bef94f47e3f00df16df141b0fcc29092b3866998b87640c92f43d43327e4aa
3
+ size 104857600
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98f02a99345a887878493d91180a06d6b30228fe73b5c0a034a10347c2a81b0f
3
+ size 104857600
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc0b6aca01de02a697064e77d8e9d7c658764fbebc0efbd51bb241004d25cc6e
3
+ size 92274688
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3adade9eff5a6e5e9a8891d927faec1b66c7c33597b2279091d4bc97430dc53
3
+ size 184549376
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0a3ccd1da5eec0f6950903a99f746f0ebc3fd1459e62290a7a0383ce4d44e05
3
+ size 23068672
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ba023e276e6139558d1838deac37af97618b4873b2999bc2398157e79713c51
3
+ size 92274688
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ae2bc23ed85a73b7fea53f7c186d813cdfd46b281841dd14323ee81e1c7db4
3
+ size 29279232
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:365386e59aaa1e0a92afcec044f13d2627db6a0f80b8a9328823144fcd334799
3
+ size 184549376
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19593fc62d3fc794436ea52e3ddaf0c156724cffdcfde424dc46d460d37c62a2
3
+ size 23068672
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39ecde72839a5dce594ceda33cb36f93d13eec17b22cf1e9ae4fcc286b30b295
3
+ size 92274688
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e86563b0196d8cab54ed3cde41b5ad35033e9d2b465a7b7670d063a877bbb74
3
+ size 29279232
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8db0b39ba15a0394ab9d3cd1b468321e72eb187dcc6a08b6b3d57e59392fe5
3
+ size 11542528
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca593c94db3d4520dbe8fbe4b89f35019a73547dcf5519884cf39a9dd5efad08
3
+ size 29279232
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58692f31c20477dd6f48033427f8586edc5a3ef68c52652d7b963430fd67fdfe
3
+ size 184549376
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bda294953f03ef9d52a1e55972c121c0d2d1e39133180cb8530cbf5df3e2e72
3
+ size 23068672
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09cbc2373b9672f18488cac73afdabf02610eb7cf3b8803a9c662b37fd02bdc5
3
+ size 92274688
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3df4cb478ac8e3612cbe13389bc61f87f007b8004e664d282235f524ecbacf64
3
+ size 29279232
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa4e9f2c5034a80759b782084deb2dcbadea83ba7e00a684dcdc6538c7203450
3
+ size 184549376
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:339d2aff30041b8245d482b869efd06840c2c876c6f95474663aecefc97e56f9
3
+ size 23068672
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f60d1cd5716f34e0b6c3da3d11afab8a876fb1ad20f39e8e33b04a46bbe1c0d3
3
+ size 92274688
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f119458239fd510939817bbf2daab6827ab1ad00368a5e39fd56e39eb8129e23
3
+ size 29279232
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb83dcc7c4df277516e1cc6246c3bb17db17ebb4a8c4f548b3b05b835ed6dbb4
3
+ size 31601664
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58501f3e2476cb773943491e75827efc8cdd9c3c3782b740ca7ffabdaccb81b7
3
+ size 184549376
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6d78b6c96b767c77cdf647cd90bc78e3e9d7459b383045241d81da8b1430feb
3
+ size 23068672
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ec2f44ddf9cd62444fadae530798985954cb4745d76bc7d54e4c0f5cd9a56a1
3
+ size 92274688
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecb9986e8aa55a6fc765578813dced5266516705e7392cf3166947e6f48fa230
3
+ size 29279232
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:650da1ef81d4e7212b8b605538facf9ba6521c6480267c3da2e481603c99db5d
3
+ size 184549376
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:249cddcfd341860f9aa55ef4c8c5f08a0a5f69eb51eca52ce6586a916be6a7cd
3
+ size 23068672
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50fbe71e0d154aa209bd10e79849492639cd86510047626a5d94ec0bf549b552
3
+ size 92274688
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:098524d143293dc83fbed0935bd997c166fe823d8868d112bf1593048b04499c
3
+ size 29279232
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3da67a1405e2119683f37eb6d2abb65813c301e8a457589f62c2854c3c877a7a
3
+ size 184549376
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e9dc45dc3c80576e0fea9d5f90a7fe44f14d846eefce73dae41c2ee18eb36e8
3
+ size 23068672
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4d1ead56b3e3483934fd328f918e14914adeeff352833b9ad3e9ec4e995ba75
3
+ size 27574272
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a482a07af1d791afd0e95278fae0f7c7b133cd65f62243a8cddadf584b81296
3
+ size 92274688
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26db7a6b7baf3ba7f6b4b396af3cd525dc7c3cc115154411e4691fe78d07e5f0
3
+ size 29279232
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49f3ee0c50474524e75b99d28715c80819a77326fe66997d6aa6038a7082e293
3
+ size 184549376
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e439eb088fa8636653bb56e94a4c3b5a4b29aed85292dedf0a1897de553ba6f6
3
+ size 23068672
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82afeb1ee96ac116f6ed060c3c18bd4b39a2052abee02cc56610d9745a73dbb1
3
+ size 92274688
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aa5e20783f07a527d7905ea7ddfeda06543c9fe81fce8100ef0497162ee3130
3
+ size 29279232
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeec3ba3c1eb8f810eabf4469fae29a21adfab0dc567ee1b14de8bcc15a0383d
3
+ size 184549376
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57a8df94b13e3d6aab108cbc52bd276dcd7736e5ab5f6de7f5db38bb9efda6f7
3
+ size 23068672
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9d68b95b16535532b942f9dede89ccf8c7f89e121d0eaafd75c4a398c64be36
3
+ size 92274688
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37212807c1857a7adc56e0bc382ea6eb10381319f7ea39e16649439842c24af7
3
+ size 29279232
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b9391ed25af742d8d0e5921a034a7398bde3d075988de14fbdd8d81b8c54c53
3
+ size 184549376
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90402dc35180173f939ddec2cce52c531411432f29c01015127874664516c671
3
+ size 184549376
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b456f546c6a5099f9d57b3e87ec5ba43fc8b98d188724565afa83dd7c7a3b72
3
+ size 23068672
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69785e51fcb0466b1380dddfb3ff0a825cd7b2e72d03bfd9afc9052badb10623
3
+ size 92274688