Initial commit
Browse files- logs.txt +0 -0
- mlc-chat-config.json +38 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_6.bin +3 -0
- params_shard_7.bin +3 -0
- params_shard_8.bin +3 -0
- params_shard_9.bin +3 -0
- tokenizer.json +0 -0
- tokenizer_config.json +7 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_bigcode",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"n_embd": 2048,
|
6 |
+
"n_inner": 8192,
|
7 |
+
"n_head": 16,
|
8 |
+
"n_layer": 24,
|
9 |
+
"n_positions": 2048,
|
10 |
+
"layer_norm_epsilon": 1e-05,
|
11 |
+
"vocab_size": 49280,
|
12 |
+
"context_window_size": 2048,
|
13 |
+
"prefill_chunk_size": 2048,
|
14 |
+
"tensor_parallel_shards": 1
|
15 |
+
},
|
16 |
+
"vocab_size": 49280,
|
17 |
+
"context_window_size": 2048,
|
18 |
+
"sliding_window_size": -1,
|
19 |
+
"prefill_chunk_size": 2048,
|
20 |
+
"attention_sink_size": -1,
|
21 |
+
"tensor_parallel_shards": 1,
|
22 |
+
"max_batch_size": 80,
|
23 |
+
"mean_gen_len": 128,
|
24 |
+
"max_gen_len": 512,
|
25 |
+
"shift_fill_factor": 0.3,
|
26 |
+
"temperature": 0.7,
|
27 |
+
"repetition_penalty": 1.0,
|
28 |
+
"top_p": 0.95,
|
29 |
+
"conv_template": "LM",
|
30 |
+
"pad_token_id": 0,
|
31 |
+
"bos_token_id": 49152,
|
32 |
+
"eos_token_id": 49152,
|
33 |
+
"tokenizer_files": [
|
34 |
+
"tokenizer.json",
|
35 |
+
"tokenizer_config.json"
|
36 |
+
],
|
37 |
+
"version": "0.1.0"
|
38 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce7995d9e534983ab9b65004c4318781ba9e311102fcc86179da9d58d9feffd5
|
3 |
+
size 50462720
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83cf067f6c2c858ce3604399c1220502d3ba27434b2c2eee301de6b3dc0f801e
|
3 |
+
size 32608768
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf66b232fff92a887b9d54b32da3bb75c5a957eef47e94760165690b76ec9051
|
3 |
+
size 33382912
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59508ae8cb05e91551775f48b255f7ea4fd6892c38815d8877b4612693b29ffb
|
3 |
+
size 28963840
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebd57037b92b52e60e5551870ec06bfd370199bf1958f94565fbce308f8e4310
|
3 |
+
size 33387008
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3db402af190044c6b7b224e07c697d269f138edc15e2de5ebb341a94e8211e90
|
3 |
+
size 33382912
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb9f733959677751d0b14b97a5dd367e561e07f289fbed47b7d3fe4f2b15989b
|
3 |
+
size 28963840
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3f3799ad8f298e33776e4aa13f4d9f8ecf4fa5e6b3927b8d956254497609d3b
|
3 |
+
size 33387008
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8baf7a9908e43f9bc6b4bd21c34bf2580dd82251a19d4c8e12ce76af10d95a8
|
3 |
+
size 33382912
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7923021d31f53e8c473d7b4c8a032114a4af04f63971f741ad5ab5a6a4c4e69f
|
3 |
+
size 28963840
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed636998cd0148e32633cfe58df8727bfc7524e671667c3239942053318d8a29
|
3 |
+
size 33387008
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce7995d9e534983ab9b65004c4318781ba9e311102fcc86179da9d58d9feffd5
|
3 |
+
size 50462720
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c5f972884d0859f6e2185839a2feaee9eff24c50d0885411978c4bfc8503fd7
|
3 |
+
size 28963840
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:029b0b62b97c55d431a678777922f8ec724d0d919243db8bea3d175567823c3c
|
3 |
+
size 15757312
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d613688203f70ed5b33397db9c204ebb075352447c7f76e5840cdbab88a20e71
|
3 |
+
size 33387008
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86e4bfe130e1571eda3dad7bdeba230f8ea19b87155f4f1fed8dc4a16b4d1b4d
|
3 |
+
size 33382912
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f728b6357c765cea53ec069e109584622bcc8be83f0abc960960e3cacf5d3a8c
|
3 |
+
size 28963840
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d6c6c9e66343863c967ca30480ea37a45d687409399f0903dd9a33b7b59fe35
|
3 |
+
size 33387008
|
params_shard_7.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f27289922b6326e51deb53e352be5542abc203bb5cb4e805ea58e6a6125bf7e3
|
3 |
+
size 33382912
|
params_shard_8.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0b7d40d4cba8274c910f908f8e539f333c90fb35a0212c858d55c549763ece5
|
3 |
+
size 28963840
|
params_shard_9.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a99d2d53c0ad156a7c934c33325944226942a19f6cb91a6d8248a91aab188d7
|
3 |
+
size 33387008
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"errors": "replace",
|
3 |
+
"tokenizer_class": "GPT2TokenizerFast",
|
4 |
+
"bos_token": "<|endoftext|>",
|
5 |
+
"eos_token": "<|endoftext|>",
|
6 |
+
"model_max_length": 2048
|
7 |
+
}
|