upload model
Browse files
- merges.txt +0 -0
- mlc-chat-config.json +68 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_6.bin +3 -0
- params_shard_7.bin +3 -0
- params_shard_8.bin +3 -0
- params_shard_9.bin +3 -0
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,68 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q4f16_0",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 14336,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-5,
|
10 |
+
"vocab_size": 102400,
|
11 |
+
"position_embedding_base": 500000.0,
|
12 |
+
"context_window_size": 2048,
|
13 |
+
"prefill_chunk_size": 2048,
|
14 |
+
"num_key_value_heads": 8,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 102400,
|
20 |
+
"context_window_size": 2048,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 2048,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "exaone",
|
35 |
+
"system_template": "[|system|]{system_message}[|endofturn|]",
|
36 |
+
"system_message": "You are EXAONE model from LG AI Research, a helpful assistant.",
|
37 |
+
"system_prefix_token_ids": [1],
|
38 |
+
"add_role_after_system_message": false,
|
39 |
+
"roles": {
|
40 |
+
"user": "[|user|]",
|
41 |
+
"assistant": "[|assistant|]"
|
42 |
+
},
|
43 |
+
"role_templates": {
|
44 |
+
"user": "{user_message}",
|
45 |
+
"assistant": "{assistant_message}",
|
46 |
+
"tool": "{tool_message}"
|
47 |
+
},
|
48 |
+
"messages": [],
|
49 |
+
"seps": ["\n"],
|
50 |
+
"role_content_sep": "",
|
51 |
+
"role_empty_sep": "\n",
|
52 |
+
"stop_str": ["[|endofturn|]"],
|
53 |
+
"stop_token_ids": [361],
|
54 |
+
"function_string": "",
|
55 |
+
"use_function_calling": false,
|
56 |
+
"image_token_index": -1
|
57 |
+
},
|
58 |
+
"pad_token_id": 0,
|
59 |
+
"bos_token_id": 1,
|
60 |
+
"eos_token_id": 361,
|
61 |
+
"tokenizer_files": [
|
62 |
+
"tokenizer.json",
|
63 |
+
"vocab.json",
|
64 |
+
"merges.txt",
|
65 |
+
"tokenizer_config.json"
|
66 |
+
],
|
67 |
+
"version": "0.1.0"
|
68 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2ab8f84cb0d0aff870ee76ca69bc55e6a532ebc76b4324c03b5ec6ac0a0ba2c
|
3 |
+
size 209715200
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6a477800dbccdfc7f992d43ff4281678f85dc6cdfb601ff2d1e0ce36554645d
|
3 |
+
size 209715200
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1dd0f546d3cbb6ad7e38e7d398789b1a3afd96f597aa14854b5634459c8f9da
|
3 |
+
size 29360128
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd2f872279a879461a1a6624819df8185573b9f89fb8b72e918f0724529cd1d1
|
3 |
+
size 58720256
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c921a9e62808a371d1d228c00547c9246d7c91fd03ab734c1d544d890eeda7f
|
3 |
+
size 33046528
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eca700ecbff35a47f0d2b86bf61affdfe424a47f6987a5cf331240cb720d54ef
|
3 |
+
size 29360128
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:978cd4518873638c416b971c098bdfa21c55f7044b42b121219ec997702f6c53
|
3 |
+
size 58720256
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67a30ddbaa31121c9cbca65f93d3fa6645100602227a4141ce0a5a9690d1ef93
|
3 |
+
size 22036480
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a80d760bf783792d3758b88a70c9c24cc2e87041198331f7d528605d2961fdd8
|
3 |
+
size 29360128
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51bbdacdd392917761bec1c8ba24e2ba185a26237145685a6db4a5e94ff1e331
|
3 |
+
size 58720256
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9af445411dd7baa3cab43d2fa45bc359da32b5644a418ebf25a204d6329420d
|
3 |
+
size 27271168
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c71ac6bd113716f814182bc290a84c9c25e7139c31d0213164422cbf0a5b1574
|
3 |
+
size 29360128
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20b6dc549de1e984d4491c4af98d7db36b8992ac04dac6fc2eb742e8d5272afb
|
3 |
+
size 26214400
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c084afc0960b260d98ef76fa9e03ccfa6eb749c90d1008447a7f02b31a9424f
|
3 |
+
size 30949376
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b313d6f2f9946cd31b3afff165536d10597b3b84098f093aa02f183b4dd1dec
|
3 |
+
size 58720256
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eebf206f8beebb69995fde8927a1f0220a48e249a207d3b80a372c085599701d
|
3 |
+
size 25174016
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3aabd35c50eb9aec0d99c2ba2de9b07ddd578a14515002faa8daee67762463a
|
3 |
+
size 29360128
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7672e0726f4183149a65d1a4b13459f3d02986cb7cac23302767661295597cba
|
3 |
+
size 58720256
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd3aec0889ebfe24f041648c5601cd5d35e084b6473d63ba0f08a669fe0dc831
|
3 |
+
size 33046528
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9935be239f1862067f0c313368659d78e53b901b042cb5214e1d3694955a2c13
|
3 |
+
size 29360128
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71263e45591d8e5666a5c40caa7ac5d7e20584b53b4c253f91682e051f8f3422
|
3 |
+
size 58720256
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4efd984eb4ea0f1174f500559b74e561e98ae2fa33df7cb4276201eba751c456
|
3 |
+
size 22036480
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6ab93cfe9668a6ffe4b46dee078f0aee2634344ac00896fc527241b9539a063
|
3 |
+
size 29360128
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cfedcf8aa8a02241e4245cd6b7c8cce4667ca86055fd5936f20608ef363970d
|
3 |
+
size 29360128
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5307ebe0a798e9c2b9face0959946fdd1d3728a8edcc88ee017bbbadae2c20f
|
3 |
+
size 58720256
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9dcd921537512de48295a5ef3a9f9a45cb8a4f9f9c859fdb0221f872fe3a892a
|
3 |
+
size 58720256
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e148cae473c3d1a07fb78a723a7372706c878886f0d47e115001a477a4ff228
|
3 |
+
size 29892608
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cba414fb4793fd72d0aca5d1e7110ffd4659667a395a4dc95f9f9d0fba2eda42
|
3 |
+
size 29360128
|
params_shard_7.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bca94926d3a27a95091c33cd5fd247823bf0e57b47464efaa1643dac7d8a8a27
|
3 |
+
size 30949376
|
params_shard_8.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3eb185d7cbd0cd1420aab7deca3646950c1e666e5998df06628035bc5bef2860
|
3 |
+
size 58720256
|
params_shard_9.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:077259ecc87870b5a3069c688e15576fc7cec92164db592dd6ee0d3b0f3e70ff
|
3 |
+
size 25174016
|