kaushiknp ChenMnZ committed on
Commit
5e74d2a
0 Parent(s):

Duplicate from ChenMnZ/Llama-2-13b-chat-omniquant-w3a16g128asym

Browse files

Co-authored-by: Mengzhao Chen <[email protected]>

This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +36 -0
  2. Llama-2-13b-chat-omniquant-w3a16g128asym-cuda.so +3 -0
  3. mod_cache_before_build.pkl +3 -0
  4. params/mlc-chat-config.json +18 -0
  5. params/ndarray-cache.json +0 -0
  6. params/params_shard_0.bin +3 -0
  7. params/params_shard_1.bin +3 -0
  8. params/params_shard_10.bin +3 -0
  9. params/params_shard_100.bin +3 -0
  10. params/params_shard_101.bin +3 -0
  11. params/params_shard_102.bin +3 -0
  12. params/params_shard_103.bin +3 -0
  13. params/params_shard_104.bin +3 -0
  14. params/params_shard_105.bin +3 -0
  15. params/params_shard_106.bin +3 -0
  16. params/params_shard_107.bin +3 -0
  17. params/params_shard_108.bin +3 -0
  18. params/params_shard_109.bin +3 -0
  19. params/params_shard_11.bin +3 -0
  20. params/params_shard_110.bin +3 -0
  21. params/params_shard_111.bin +3 -0
  22. params/params_shard_112.bin +3 -0
  23. params/params_shard_113.bin +3 -0
  24. params/params_shard_114.bin +3 -0
  25. params/params_shard_115.bin +3 -0
  26. params/params_shard_116.bin +3 -0
  27. params/params_shard_117.bin +3 -0
  28. params/params_shard_118.bin +3 -0
  29. params/params_shard_119.bin +3 -0
  30. params/params_shard_12.bin +3 -0
  31. params/params_shard_120.bin +3 -0
  32. params/params_shard_121.bin +3 -0
  33. params/params_shard_122.bin +3 -0
  34. params/params_shard_123.bin +3 -0
  35. params/params_shard_124.bin +3 -0
  36. params/params_shard_125.bin +3 -0
  37. params/params_shard_126.bin +3 -0
  38. params/params_shard_127.bin +3 -0
  39. params/params_shard_128.bin +3 -0
  40. params/params_shard_129.bin +3 -0
  41. params/params_shard_13.bin +3 -0
  42. params/params_shard_130.bin +3 -0
  43. params/params_shard_131.bin +3 -0
  44. params/params_shard_132.bin +3 -0
  45. params/params_shard_133.bin +3 -0
  46. params/params_shard_134.bin +3 -0
  47. params/params_shard_135.bin +3 -0
  48. params/params_shard_136.bin +3 -0
  49. params/params_shard_137.bin +3 -0
  50. params/params_shard_138.bin +3 -0
.gitattributes ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.so filter=lfs diff=lfs merge=lfs -text
23
+ *.pt filter=lfs diff=lfs merge=lfs -text
24
+ *.pth filter=lfs diff=lfs merge=lfs -text
25
+ *.rar filter=lfs diff=lfs merge=lfs -text
26
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
27
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
29
+ *.tar filter=lfs diff=lfs merge=lfs -text
30
+ *.tflite filter=lfs diff=lfs merge=lfs -text
31
+ *.tgz filter=lfs diff=lfs merge=lfs -text
32
+ *.wasm filter=lfs diff=lfs merge=lfs -text
33
+ *.xz filter=lfs diff=lfs merge=lfs -text
34
+ *.zip filter=lfs diff=lfs merge=lfs -text
35
+ *.zst filter=lfs diff=lfs merge=lfs -text
36
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
Llama-2-13b-chat-omniquant-w3a16g128asym-cuda.so ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17045fa2d500f8696ab9bddf9548bd786a82436ce072359f37e4ab1500d0dbed
3
+ size 22643752
mod_cache_before_build.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abd18a0c6ce594e5c43aac85b225cb4fcbffe4951262c5221090713a021f0a41
3
+ size 37565116
params/mlc-chat-config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_lib": "Llama-2-13b-chat-omniquant-w3a16g128asym",
3
+ "local_id": "Llama-2-13b-chat-omniquant-w3a16g128asym",
4
+ "conv_template": "llama-2",
5
+ "temperature": 0.7,
6
+ "repetition_penalty": 1.0,
7
+ "top_p": 0.95,
8
+ "mean_gen_len": 128,
9
+ "max_gen_len": 512,
10
+ "shift_fill_factor": 0.3,
11
+ "tokenizer_files": [
12
+ "tokenizer.model",
13
+ "tokenizer.json"
14
+ ],
15
+ "model_category": "llama",
16
+ "model_name": "Llama-2-13b-chat-omniquant",
17
+ "vocab_size": 32000
18
+ }
params/ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params/params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeb8c2d8a4ba799831bc7f2feed6bac6fb242a6d26632fa2502a091e83596e44
3
+ size 327680000
params/params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dee239ceed33cb76b56ae440d76168dcd927a7b9ea206d1b9ed65f2e13c7f9dd
3
+ size 32686080
params/params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052e39bcc9928677d0cc309b8aa7eadee05e81e3c4956a15e8e64147c0d58cfd
3
+ size 28303360
params/params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2b1b8de7d4a5bb2a4cbe673d491f52633314b7adaa4aebb596c7b86acaca9e6
3
+ size 25108480
params/params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abfaffc7d0b44821060fab95dc388fcbf24b97b1f44bf84c75646c2601dfcc9d
3
+ size 56623104
params/params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9310568dc306c19430d38d0249c6ec89a6b1dcc8493ef0276cd9e63e4729f802
3
+ size 28303360
params/params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36a5d5049e307ae70fe49989ba1b57c1aa1f78d2479974301b1215b898a7b7f1
3
+ size 31457280
params/params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb84205a295ca29e3eff094ed94b6d9f48aa80c0d186eba335a44c611d8dab59
3
+ size 56623104
params/params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ead65ed64be3a901243f10ce39ce27ecf06cdeec2a7f767b1f6707656b6625ec
3
+ size 31723520
params/params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46418342fc87197c07794afd1f5dc3a8a3bddd888312aa1347f9d453fa28c665
3
+ size 32727040
params/params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80b56ee85f4f49d1fea7c47b5c3daee815ded876584837dd50d0ce4a4d118842
3
+ size 31457280
params/params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5792fc88610671136685b796ccfadc39267cc4c5f9fd9a353372506170f1dc3f
3
+ size 56623104
params/params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ee4f60529ec8bff6686a6cd72e7a37b0153e032f57441bc0f0ecdcecde5a539
3
+ size 28303360
params/params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69ecf3f4c45d5c5a248078a0f7fd5a7e49b9d6c4581a00a2bca3de0a22d68880
3
+ size 31457280
params/params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36ed472bf3d1b97a336445dcd9f62140cccacd73dce89ff0269adc2567b52958
3
+ size 31457280
params/params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e79a7edec8f45f2c70cff8850679abdd4fe66027717cf1c8f6ee327454eac5d
3
+ size 25108480
params/params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c21db2fe3318ac4992c1d820ec6cd93dce7e3b678b805816eaee9c890a6d297
3
+ size 56623104
params/params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1aa2222dad121d79f1d9ad6432f7685306a52a9f39c72ddb04f072e44596d946
3
+ size 28303360
params/params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8492dcfc58a3c20ff16bbf4153c08b75f13565b607fb9bdb18a26808384f286d
3
+ size 31457280
params/params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:298c832e68dd63678cfa23deb334a769ab6cce8aeeacee8e167fc67966c57dee
3
+ size 56623104
params/params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:916360be4370d753dbb52c2c07970e310347229bd03d3864bf4f350d164acac6
3
+ size 31723520
params/params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad6076fdab29377a927be0ded4ff5b763b4a01e9c2163c22f60722f74e3b0813
3
+ size 32727040
params/params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbd56722fbb46f928fc361a8bdcf82f7a4fd0112504600783fa3c50f8afff1af
3
+ size 31457280
params/params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5fa00f4bded110ae3aa9909f207d5ea3488e529773474523984e4a5ec15f44f
3
+ size 56623104
params/params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83d77b5cfca65ae2d3ba9e43f199f655c247317736a5fef7e5585da2cb93d638
3
+ size 25108480
params/params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7229da5d157879d7a01c5b5429c7a7e29232f75731aa7cd8ca7aebd50c6d0e5
3
+ size 28303360
params/params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c8972b75b220b4edd32091fd44a71893c59ee7c18b4426d02255cc372a6e72
3
+ size 31457280
params/params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d296ae814c2bc415d1c9cc7faa79d56a2cfb62eacd16604c40f9d00045e626c3
3
+ size 25108480
params/params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49ab51f0e97133c88a2c0b572e4673057474687c79ce3b0583f07cea02f14211
3
+ size 56623104
params/params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbe7ee343768a91f19d2fb54ada8339049648406c86d4b6a58b819cec5622718
3
+ size 28303360
params/params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb12390cdffc7b562190e40c82bd6f5fa07d4da06993950062777fe04d42bead
3
+ size 31457280
params/params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:004655e81c96aa4167ac6e42ad135737e97d327e8b06744355c97b153c6f904b
3
+ size 56623104
params/params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f211bc96a16914bb6e07ad27dbe9fddbf51e00d2fb883b43c7b9c436cac7746
3
+ size 31723520
params/params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17ddb4b592d38323cb1f24746c8c6b663bf9d03f2ee11b276ea6aa0a5ae70a22
3
+ size 32727040
params/params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b89c7689ae5a84a66a3becfbbfe7f39d827e67ffe5995d42047c9f0f0451203
3
+ size 31457280
params/params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a05af784b8df6c465084a5a0c82620b6706148a07325a6d1aac633ed45b5495
3
+ size 56623104
params/params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99d03939a6596b95c87b28260e1a6ec37cfe4c87d515ff7004a2b76a6ca7ce2c
3
+ size 56623104
params/params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00415db5d6720af2e2fdf09d7646f1d9258a6cdc786263d8a06fc2c35bb1de84
3
+ size 28303360
params/params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d57ed4c29751598fe4998619c004fdd6732a787c946dae80ca27ec6174680fc
3
+ size 31457280
params/params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be08535bf6839db3641cf783ea14a520e14243e2bff71bd4adddae8dcee87e57
3
+ size 25108480
params/params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f8cf8078688669a48bd1aaf98589ba24b4fca5a57b0c46e6f302cba72f57f38
3
+ size 56623104
params/params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d17097f3411096dc053819e3a9c98b2c5e612c36dcf52a9c5131862afeea606
3
+ size 28303360
params/params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9012a2d524678ae8a1e3a333cc439f38a2208c2900da851ddf7e3e5ef22087e9
3
+ size 31457280
params/params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f0f3303aa5a73a0e261d900303afc66582f9cb80365aeb713c437ffdfe8d67
3
+ size 56623104
params/params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:805ad0f0738d10ceb9aeeff60c709b3abcb70aedee0a0299a54b6f1cb7d26f65
3
+ size 31723520