Duplicate from ChenMnZ/Llama-2-13b-chat-omniquant-w3a16g128asym
Browse filesCo-authored-by: Mengzhao Chen <[email protected]>
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +36 -0
- Llama-2-13b-chat-omniquant-w3a16g128asym-cuda.so +3 -0
- mod_cache_before_build.pkl +3 -0
- params/mlc-chat-config.json +18 -0
- params/ndarray-cache.json +0 -0
- params/params_shard_0.bin +3 -0
- params/params_shard_1.bin +3 -0
- params/params_shard_10.bin +3 -0
- params/params_shard_100.bin +3 -0
- params/params_shard_101.bin +3 -0
- params/params_shard_102.bin +3 -0
- params/params_shard_103.bin +3 -0
- params/params_shard_104.bin +3 -0
- params/params_shard_105.bin +3 -0
- params/params_shard_106.bin +3 -0
- params/params_shard_107.bin +3 -0
- params/params_shard_108.bin +3 -0
- params/params_shard_109.bin +3 -0
- params/params_shard_11.bin +3 -0
- params/params_shard_110.bin +3 -0
- params/params_shard_111.bin +3 -0
- params/params_shard_112.bin +3 -0
- params/params_shard_113.bin +3 -0
- params/params_shard_114.bin +3 -0
- params/params_shard_115.bin +3 -0
- params/params_shard_116.bin +3 -0
- params/params_shard_117.bin +3 -0
- params/params_shard_118.bin +3 -0
- params/params_shard_119.bin +3 -0
- params/params_shard_12.bin +3 -0
- params/params_shard_120.bin +3 -0
- params/params_shard_121.bin +3 -0
- params/params_shard_122.bin +3 -0
- params/params_shard_123.bin +3 -0
- params/params_shard_124.bin +3 -0
- params/params_shard_125.bin +3 -0
- params/params_shard_126.bin +3 -0
- params/params_shard_127.bin +3 -0
- params/params_shard_128.bin +3 -0
- params/params_shard_129.bin +3 -0
- params/params_shard_13.bin +3 -0
- params/params_shard_130.bin +3 -0
- params/params_shard_131.bin +3 -0
- params/params_shard_132.bin +3 -0
- params/params_shard_133.bin +3 -0
- params/params_shard_134.bin +3 -0
- params/params_shard_135.bin +3 -0
- params/params_shard_136.bin +3 -0
- params/params_shard_137.bin +3 -0
- params/params_shard_138.bin +3 -0
.gitattributes
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
*.7z filter=lfs diff=lfs merge=lfs -text
|
2 |
+
*.arrow filter=lfs diff=lfs merge=lfs -text
|
3 |
+
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
+
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
+
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
+
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
+
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
+
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
+
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
+
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
+
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
+
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
+
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
+
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
+
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
+
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
+
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
+
*.so filter=lfs diff=lfs merge=lfs -text
|
23 |
+
*.pt filter=lfs diff=lfs merge=lfs -text
|
24 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
25 |
+
*.rar filter=lfs diff=lfs merge=lfs -text
|
26 |
+
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
27 |
+
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
28 |
+
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
29 |
+
*.tar filter=lfs diff=lfs merge=lfs -text
|
30 |
+
*.tflite filter=lfs diff=lfs merge=lfs -text
|
31 |
+
*.tgz filter=lfs diff=lfs merge=lfs -text
|
32 |
+
*.wasm filter=lfs diff=lfs merge=lfs -text
|
33 |
+
*.xz filter=lfs diff=lfs merge=lfs -text
|
34 |
+
*.zip filter=lfs diff=lfs merge=lfs -text
|
35 |
+
*.zst filter=lfs diff=lfs merge=lfs -text
|
36 |
+
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
Llama-2-13b-chat-omniquant-w3a16g128asym-cuda.so
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17045fa2d500f8696ab9bddf9548bd786a82436ce072359f37e4ab1500d0dbed
|
3 |
+
size 22643752
|
mod_cache_before_build.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abd18a0c6ce594e5c43aac85b225cb4fcbffe4951262c5221090713a021f0a41
|
3 |
+
size 37565116
|
params/mlc-chat-config.json
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_lib": "Llama-2-13b-chat-omniquant-w3a16g128asym",
|
3 |
+
"local_id": "Llama-2-13b-chat-omniquant-w3a16g128asym",
|
4 |
+
"conv_template": "llama-2",
|
5 |
+
"temperature": 0.7,
|
6 |
+
"repetition_penalty": 1.0,
|
7 |
+
"top_p": 0.95,
|
8 |
+
"mean_gen_len": 128,
|
9 |
+
"max_gen_len": 512,
|
10 |
+
"shift_fill_factor": 0.3,
|
11 |
+
"tokenizer_files": [
|
12 |
+
"tokenizer.model",
|
13 |
+
"tokenizer.json"
|
14 |
+
],
|
15 |
+
"model_category": "llama",
|
16 |
+
"model_name": "Llama-2-13b-chat-omniquant",
|
17 |
+
"vocab_size": 32000
|
18 |
+
}
|
params/ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params/params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeb8c2d8a4ba799831bc7f2feed6bac6fb242a6d26632fa2502a091e83596e44
|
3 |
+
size 327680000
|
params/params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dee239ceed33cb76b56ae440d76168dcd927a7b9ea206d1b9ed65f2e13c7f9dd
|
3 |
+
size 32686080
|
params/params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:052e39bcc9928677d0cc309b8aa7eadee05e81e3c4956a15e8e64147c0d58cfd
|
3 |
+
size 28303360
|
params/params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2b1b8de7d4a5bb2a4cbe673d491f52633314b7adaa4aebb596c7b86acaca9e6
|
3 |
+
size 25108480
|
params/params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abfaffc7d0b44821060fab95dc388fcbf24b97b1f44bf84c75646c2601dfcc9d
|
3 |
+
size 56623104
|
params/params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9310568dc306c19430d38d0249c6ec89a6b1dcc8493ef0276cd9e63e4729f802
|
3 |
+
size 28303360
|
params/params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36a5d5049e307ae70fe49989ba1b57c1aa1f78d2479974301b1215b898a7b7f1
|
3 |
+
size 31457280
|
params/params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb84205a295ca29e3eff094ed94b6d9f48aa80c0d186eba335a44c611d8dab59
|
3 |
+
size 56623104
|
params/params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ead65ed64be3a901243f10ce39ce27ecf06cdeec2a7f767b1f6707656b6625ec
|
3 |
+
size 31723520
|
params/params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46418342fc87197c07794afd1f5dc3a8a3bddd888312aa1347f9d453fa28c665
|
3 |
+
size 32727040
|
params/params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80b56ee85f4f49d1fea7c47b5c3daee815ded876584837dd50d0ce4a4d118842
|
3 |
+
size 31457280
|
params/params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5792fc88610671136685b796ccfadc39267cc4c5f9fd9a353372506170f1dc3f
|
3 |
+
size 56623104
|
params/params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ee4f60529ec8bff6686a6cd72e7a37b0153e032f57441bc0f0ecdcecde5a539
|
3 |
+
size 28303360
|
params/params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69ecf3f4c45d5c5a248078a0f7fd5a7e49b9d6c4581a00a2bca3de0a22d68880
|
3 |
+
size 31457280
|
params/params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36ed472bf3d1b97a336445dcd9f62140cccacd73dce89ff0269adc2567b52958
|
3 |
+
size 31457280
|
params/params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e79a7edec8f45f2c70cff8850679abdd4fe66027717cf1c8f6ee327454eac5d
|
3 |
+
size 25108480
|
params/params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c21db2fe3318ac4992c1d820ec6cd93dce7e3b678b805816eaee9c890a6d297
|
3 |
+
size 56623104
|
params/params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1aa2222dad121d79f1d9ad6432f7685306a52a9f39c72ddb04f072e44596d946
|
3 |
+
size 28303360
|
params/params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8492dcfc58a3c20ff16bbf4153c08b75f13565b607fb9bdb18a26808384f286d
|
3 |
+
size 31457280
|
params/params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:298c832e68dd63678cfa23deb334a769ab6cce8aeeacee8e167fc67966c57dee
|
3 |
+
size 56623104
|
params/params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:916360be4370d753dbb52c2c07970e310347229bd03d3864bf4f350d164acac6
|
3 |
+
size 31723520
|
params/params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad6076fdab29377a927be0ded4ff5b763b4a01e9c2163c22f60722f74e3b0813
|
3 |
+
size 32727040
|
params/params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbd56722fbb46f928fc361a8bdcf82f7a4fd0112504600783fa3c50f8afff1af
|
3 |
+
size 31457280
|
params/params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5fa00f4bded110ae3aa9909f207d5ea3488e529773474523984e4a5ec15f44f
|
3 |
+
size 56623104
|
params/params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83d77b5cfca65ae2d3ba9e43f199f655c247317736a5fef7e5585da2cb93d638
|
3 |
+
size 25108480
|
params/params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7229da5d157879d7a01c5b5429c7a7e29232f75731aa7cd8ca7aebd50c6d0e5
|
3 |
+
size 28303360
|
params/params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6c8972b75b220b4edd32091fd44a71893c59ee7c18b4426d02255cc372a6e72
|
3 |
+
size 31457280
|
params/params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d296ae814c2bc415d1c9cc7faa79d56a2cfb62eacd16604c40f9d00045e626c3
|
3 |
+
size 25108480
|
params/params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49ab51f0e97133c88a2c0b572e4673057474687c79ce3b0583f07cea02f14211
|
3 |
+
size 56623104
|
params/params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbe7ee343768a91f19d2fb54ada8339049648406c86d4b6a58b819cec5622718
|
3 |
+
size 28303360
|
params/params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb12390cdffc7b562190e40c82bd6f5fa07d4da06993950062777fe04d42bead
|
3 |
+
size 31457280
|
params/params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:004655e81c96aa4167ac6e42ad135737e97d327e8b06744355c97b153c6f904b
|
3 |
+
size 56623104
|
params/params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f211bc96a16914bb6e07ad27dbe9fddbf51e00d2fb883b43c7b9c436cac7746
|
3 |
+
size 31723520
|
params/params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17ddb4b592d38323cb1f24746c8c6b663bf9d03f2ee11b276ea6aa0a5ae70a22
|
3 |
+
size 32727040
|
params/params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b89c7689ae5a84a66a3becfbbfe7f39d827e67ffe5995d42047c9f0f0451203
|
3 |
+
size 31457280
|
params/params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a05af784b8df6c465084a5a0c82620b6706148a07325a6d1aac633ed45b5495
|
3 |
+
size 56623104
|
params/params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99d03939a6596b95c87b28260e1a6ec37cfe4c87d515ff7004a2b76a6ca7ce2c
|
3 |
+
size 56623104
|
params/params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00415db5d6720af2e2fdf09d7646f1d9258a6cdc786263d8a06fc2c35bb1de84
|
3 |
+
size 28303360
|
params/params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d57ed4c29751598fe4998619c004fdd6732a787c946dae80ca27ec6174680fc
|
3 |
+
size 31457280
|
params/params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be08535bf6839db3641cf783ea14a520e14243e2bff71bd4adddae8dcee87e57
|
3 |
+
size 25108480
|
params/params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f8cf8078688669a48bd1aaf98589ba24b4fca5a57b0c46e6f302cba72f57f38
|
3 |
+
size 56623104
|
params/params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d17097f3411096dc053819e3a9c98b2c5e612c36dcf52a9c5131862afeea606
|
3 |
+
size 28303360
|
params/params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9012a2d524678ae8a1e3a333cc439f38a2208c2900da851ddf7e3e5ef22087e9
|
3 |
+
size 31457280
|
params/params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35f0f3303aa5a73a0e261d900303afc66582f9cb80365aeb713c437ffdfe8d67
|
3 |
+
size 56623104
|
params/params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:805ad0f0738d10ceb9aeeff60c709b3abcb70aedee0a0299a54b6f1cb7d26f65
|
3 |
+
size 31723520
|