Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- merges.txt +0 -0
- mlc-chat-config.json +80 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,80 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen2",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 8192,
|
8 |
+
"intermediate_size": 29568,
|
9 |
+
"num_attention_heads": 64,
|
10 |
+
"num_hidden_layers": 80,
|
11 |
+
"num_key_value_heads": 8,
|
12 |
+
"rms_norm_eps": 1e-06,
|
13 |
+
"rope_theta": 1000000.0,
|
14 |
+
"vocab_size": 152064,
|
15 |
+
"context_window_size": 32768,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"head_dim": 128,
|
19 |
+
"dtype": "float32",
|
20 |
+
"max_batch_size": 80
|
21 |
+
},
|
22 |
+
"vocab_size": 152064,
|
23 |
+
"context_window_size": 32768,
|
24 |
+
"sliding_window_size": -1,
|
25 |
+
"prefill_chunk_size": 2048,
|
26 |
+
"attention_sink_size": -1,
|
27 |
+
"tensor_parallel_shards": 1,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.05,
|
32 |
+
"top_p": 0.8,
|
33 |
+
"tokenizer_files": [
|
34 |
+
"tokenizer.json",
|
35 |
+
"vocab.json",
|
36 |
+
"merges.txt",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "chatml",
|
46 |
+
"system_template": "<|im_start|>system\n{system_message}",
|
47 |
+
"system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
|
48 |
+
"system_prefix_token_ids": null,
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "<|im_start|>user",
|
52 |
+
"assistant": "<|im_start|>assistant"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"<|im_end|>\n"
|
62 |
+
],
|
63 |
+
"role_content_sep": "\n",
|
64 |
+
"role_empty_sep": "\n",
|
65 |
+
"stop_str": [
|
66 |
+
"<|im_end|>"
|
67 |
+
],
|
68 |
+
"stop_token_ids": [
|
69 |
+
2
|
70 |
+
],
|
71 |
+
"function_string": "",
|
72 |
+
"use_function_calling": false
|
73 |
+
},
|
74 |
+
"pad_token_id": 151643,
|
75 |
+
"bos_token_id": 151643,
|
76 |
+
"eos_token_id": [
|
77 |
+
151645,
|
78 |
+
151643
|
79 |
+
]
|
80 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c46bd5bf0de46b5357872d9c6222cc0b0f962fdd76493e37d28d85c492ce123
|
3 |
+
size 622854144
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe3d613c3c574121ad99c498c1ce0657d2853cbde2a898e6444bc102f0d309c3
|
3 |
+
size 77856768
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18133e6e29427e6b1a3eb88e91f5b40d05fc0bd7dd2809f78f2bde8867db6aeb
|
3 |
+
size 33554432
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:331ee2db7d8fea2a931eb2c4fffa3b7a74fb09a6360254d5c61f62755bd641a0
|
3 |
+
size 30277632
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baa94a6b9af345cf235569dfe5cfed4c48bbd9b16683f6fea9820cb6e8d0412b
|
3 |
+
size 41943040
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8202474216f53146d1b1b205c658f6bbcc4efa622b52e27e700c295cde012e15
|
3 |
+
size 33554432
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f874a004c73ad5b2834cb7e166c4cfd6085c29b660f00f7ac78244723c4b587
|
3 |
+
size 41943040
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6e9b9a4c39cc6049c82f8abdc3174b5ab3b3c7fd6b245559e431694a63b4197
|
3 |
+
size 33554432
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d614c513cb393848222391e25a2b0fda1ab15300b3fe408ee40718f3bc1cdafe
|
3 |
+
size 29876224
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5486741d64943217ed0ac38fe3f36027bab3ccc2a32ff6769cfc968dfeb18e
|
3 |
+
size 121110528
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8db33e8c93008d1a3ae5315f8ca3db14086b7fc8575ccf83e92b471b10a9be36
|
3 |
+
size 242221056
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a49deed3c6f15cd1de2f89e559c19f97c840a29ed2c077a4420e7655bbe4343
|
3 |
+
size 30277632
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54046739894d2f50cb8a7202bcb79dee5faa2c1e5e4150d84f368c61526043b1
|
3 |
+
size 121110528
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62de2481f4eb57537dcec7d76986300e33b3e95c7f2d87d07588832586d7de7d
|
3 |
+
size 121110528
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a392a15ed4bbacc78027990676fef9dbd1a2c32fdd4919c78e4f9d6ec92c1c0b
|
3 |
+
size 19382272
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67c6f283a672e54195446b3258842097ef44319198f3460500682c3a33095bc8
|
3 |
+
size 242221056
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac3f015fb38bb5b4a44346c81ef7f5996df4cae3a02c89e928d030c175067089
|
3 |
+
size 30277632
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6ea17aec03ccc8ee50b58531fa05528c91ff7b4a8c438627c4f399fdcc583e8
|
3 |
+
size 41943040
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:086186291863945f630293ee4d6009f6be66bd09e06509ced8aa38f352ec8b88
|
3 |
+
size 33554432
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27700af9393489ed6df7c7795a2391e0d3122a7c2523833146b0f6016b3fb6f0
|
3 |
+
size 242221056
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b856de81b7fc7cfd9056836e7dde2538cce61ebf687f8cff8f30ffbbcf79fce6
|
3 |
+
size 30277632
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f542e72f3492d11782f6ee61b641e611f8db9fc39a259f6cd1574394b0c94fdf
|
3 |
+
size 41943040
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45f2e6bb6f6bb2392995673984552d6afe1a1b401f69680974da381ccde56ece
|
3 |
+
size 33554432
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd31f7efd5ce2bf510325a2121a75671109079f09359b33389998a218eefe93a
|
3 |
+
size 29876224
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6a30ec81ec18be23e3a95817ca050067343f217fddde6c4ac58713d0d07952c
|
3 |
+
size 24662016
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8495f0f9017ee662c9b2a91a3b6f088c1522e1b529f3d457cef6ec2ce927eb64
|
3 |
+
size 121110528
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fae380e5bc9e7fcbe6e74f7bbbcb72ad836d43b2fb388ca1ece30a0361cc1df4
|
3 |
+
size 121110528
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ed490aa71e4cbdb42701aa392253020c6aad3b83e751b0974c349ae4f34e861
|
3 |
+
size 19382272
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85696ed818f0720e7759d3e4140fcaabbc79a901ce48c833007e3d32e1656909
|
3 |
+
size 242221056
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2dcf17487a82b1299fbc297fb27d6f58ab0e3bdc3a06357ce96b76e16c3f6729
|
3 |
+
size 30277632
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dfd08d7d74288ffc1615b682b419d7bdbb510ebb874cbdf0697a25a6d519b4c
|
3 |
+
size 41943040
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d4306f934e0e4764fe5c2e9244cf4d264a33158de66e2c81692403680e21959
|
3 |
+
size 33554432
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f546d24c883f23473e59e881560407ebd1c5d70f0ad4d659fda029f67b70da0
|
3 |
+
size 242221056
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cc24fc39047cd43204704a856dd27e1cffcd19eaf0bc72eef2954c767400745
|
3 |
+
size 30277632
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27324501bffd01e4ac31075412221cd7eda14296c049728448eef6301dd243e5
|
3 |
+
size 41943040
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9102de3d43111042e5a8eac60e99818c14818acc692de3aaf1469e3b33dd533c
|
3 |
+
size 121110528
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edc853050de5f2562b1a93b2dfcb62c539492da28e7481ad6155c0203c6ef8f2
|
3 |
+
size 33554432
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:893ce500a5e8bc1e383ea2b229b45782d8efae2e2ec5092485c34b0cfa6470a7
|
3 |
+
size 29876224
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b67e3383d58778a972f253764572286ad8649d91bfe31a4ed797be4beaaaf598
|
3 |
+
size 121110528
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f8a60c611ecaa9f59960e5d8481850dfbccc38d3eeb4a3afc31c5f368412978
|
3 |
+
size 121110528
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f392ed0e64b528bf864e5ce50d8dc1aeab0b24d3744426ef7ef516dbeddfcd1c
|
3 |
+
size 19382272
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d88d46f6df289edb6b63ac5d4815badb13e8c2fac291a69bfab7ecf47c1675d1
|
3 |
+
size 242221056
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fbc88d461972d22c59015c7863c4f54b696bc53ee90225edb195856699d1901
|
3 |
+
size 30277632
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87dc6991b5a899ffed6cd9d38299cfe3f00034d71144ed7555075270bcd1c1e6
|
3 |
+
size 41943040
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bb2c279f3616b07a89f09b474f8d6110d6fc01d56515876697b0901d2d7ce00
|
3 |
+
size 33554432
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:711097d8350dd274a25149652186c7cf6d10c6ca027545b69d92513b789e7285
|
3 |
+
size 121110528
|