vignesh-spericorn committed on
Commit
3ba3ad5
·
verified ·
1 Parent(s): 26d2c34

Quantized Llama-3.1-8B-Instruct model for Android.

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Llama-3.1-8B-Instruct-q4f16_1-android.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d10431147255f8376e61690640aac09838106caa2fc90e8f3527ed9dea4f6eb
3
+ size 485771
mlc-chat-config.json ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "llama",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_size": 4096,
7
+ "intermediate_size": 14336,
8
+ "num_attention_heads": 32,
9
+ "num_hidden_layers": 32,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 128256,
12
+ "tie_word_embeddings": false,
13
+ "position_embedding_base": 500000.0,
14
+ "rope_scaling": {
15
+ "factor": 8.0,
16
+ "low_freq_factor": 1.0,
17
+ "high_freq_factor": 4.0,
18
+ "original_max_position_embeddings": 8192,
19
+ "rope_type": "llama3"
20
+ },
21
+ "context_window_size": 16384,
22
+ "prefill_chunk_size": 2048,
23
+ "num_key_value_heads": 8,
24
+ "head_dim": 128,
25
+ "tensor_parallel_shards": 1,
26
+ "pipeline_parallel_stages": 1,
27
+ "max_batch_size": 80
28
+ },
29
+ "vocab_size": 128256,
30
+ "context_window_size": 16384,
31
+ "sliding_window_size": -1,
32
+ "prefill_chunk_size": 2048,
33
+ "attention_sink_size": -1,
34
+ "tensor_parallel_shards": 1,
35
+ "pipeline_parallel_stages": 1,
36
+ "temperature": 0.6,
37
+ "presence_penalty": 0.0,
38
+ "frequency_penalty": 0.0,
39
+ "repetition_penalty": 1.0,
40
+ "top_p": 0.9,
41
+ "tokenizer_files": [
42
+ "tokenizer.json",
43
+ "tokenizer_config.json"
44
+ ],
45
+ "tokenizer_info": {
46
+ "token_postproc_method": "byte_level",
47
+ "prepend_space_in_encode": false,
48
+ "strip_space_in_decode": false
49
+ },
50
+ "conv_template": {
51
+ "name": "llama-3",
52
+ "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
53
+ "system_message": "You are a helpful, respectful and honest assistant.",
54
+ "system_prefix_token_ids": [
55
+ 128000
56
+ ],
57
+ "add_role_after_system_message": true,
58
+ "roles": {
59
+ "user": "<|start_header_id|>user",
60
+ "assistant": "<|start_header_id|>assistant"
61
+ },
62
+ "role_templates": {
63
+ "user": "{user_message}",
64
+ "assistant": "{assistant_message}",
65
+ "tool": "{tool_message}"
66
+ },
67
+ "messages": [],
68
+ "seps": [
69
+ "<|eot_id|>"
70
+ ],
71
+ "role_content_sep": "<|end_header_id|>\n\n",
72
+ "role_empty_sep": "<|end_header_id|>\n\n",
73
+ "stop_str": [
74
+ "<|end_of_text|>",
75
+ "<|eot_id|>"
76
+ ],
77
+ "stop_token_ids": [
78
+ 128001,
79
+ 128009
80
+ ],
81
+ "function_string": "",
82
+ "use_function_calling": false
83
+ },
84
+ "pad_token_id": 0,
85
+ "bos_token_id": 128000,
86
+ "eos_token_id": [
87
+ 128001,
88
+ 128008,
89
+ 128009
90
+ ]
91
+ }
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30e0c9df09008d26d6637efc22a3820e0f9c0cad52726b0283c148688e712e79
3
+ size 262668288
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b839780d7d6d3a0fa2e56de9ccb1317f9effbf732e961b1413eef6c714fa42f8
3
+ size 29360128
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52bc3179bce3a922c7e1772499d6373e977a6ceaee740c0ad4a2130346be4190
3
+ size 33046528
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93398ab90303c104be503570f3a2018c174f5311e65f8217c688df0b676477f5
3
+ size 29360128
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2576b3e76c54eacd2f42ecb58c56051ebcc3b1187f38f375428406d96bddd08
3
+ size 58720256
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2007301affaba92c8b57b60b377d37ab49031bbcc4e14534780d601d08f901e0
3
+ size 22036480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7168ca5da715e4f8857140384d1e1ce68d9d435b18655caecfaa6abfb0acc1fa
3
+ size 29360128
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db3787cb3af04af21eae064a06c93d435f8456ef557c0236feea5f684efbc06d
3
+ size 58720256
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04d0dae4558d60088df05a874cbc2aaf1ca32a56446d7148af881da9f30d6ac8
3
+ size 27271168
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe0a9ca1458c39ad3845075baf59ebe2b15421e33fb172f5c34d0312adf49b74
3
+ size 29360128
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9add55c60969390a50d2b54fdf088112e1b8fa8560a217d17a9e17b05422d25c
3
+ size 30949376
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1ba4db5736e0d31030cade7a6f9c80cc2617f932dc25ba1946d408fd74589d2
3
+ size 58720256
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46a01095032dc8e6fce9f2b5628799d1bd2cf715ea1db5c2780ab599e0b45578
3
+ size 32841728
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3190e67f9bb4087dd0085e00e9bac98187ccdd32a1338377184582ee33648c74
3
+ size 25174016
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae8658bc05408acad38a66d98d77b067026a1e7e750535a72ed5fd85eca76a0e
3
+ size 29360128
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9170002181b9752c559efc29d128266b7fcb4c0f3f22b91d8c7ba03c431e7e28
3
+ size 58720256
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:526c5e5d253a2a0695570586ffa9dbf57508390c620f837ee421788f7cae0e3a
3
+ size 33046528
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d86414512665c749c3fe522106b7c328222b0e007befbc2afa33ca74036a3230
3
+ size 29360128
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:968a9243afecacdb822e4d26999356954f74a6ce34067b894738deb08acc2d8e
3
+ size 58720256
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71ab195c5d2eecdb9f95ab39bf0e3301d5244a1837312ee5b8dfd84bac60e54f
3
+ size 22036480
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:350aaf137cd4eea43bd7b14637350fadab029b207bffc22e0ca21fe0de7016ce
3
+ size 29360128
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6ea8b80c0c4ddaeb8699c2cc667dd8875a7a6fe391e0e5f40d3ab55d69986da
3
+ size 58720256
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29b8d81e771bd6f0edb792d7734e10ffe4eb6e94ea99682f99dbbe715b8d433f
3
+ size 27271168
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4758f2510398d0d62c59ad356d4168503d612b15c10bfeed77ddf1a7fb7e864
3
+ size 262668288
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:266037dd30cd51f5c40d6f793033e8f18d094a94c469485542ad06837def40b1
3
+ size 29360128
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7a99571b6a88007e4a5cbfc52995345e19a6cf8d68ab8e5714c61662ec61f7f
3
+ size 30949376
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549c7a05a875b880ed2549dfb6af0606d46b27399dc7e61b6bf0cde37a466815
3
+ size 58720256
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af4750940312b615a33d9fa2b375d57eeaeb3ceb5dbfec789b6f69645c7108b4
3
+ size 25174016
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84d8036ae5fb674c1f6ce4ccbd2f2c03ebb1fa47e91f44eb0834bb6eb64184e1
3
+ size 29360128
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a7844be721048b8f69ff638778cd72730cf04be348131a06172c98d1d1b59d
3
+ size 58720256
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a5a04e5bfa29dc0c61638b9bbd27f884508343f7208a9163cf53112ea09b1d3
3
+ size 33046528
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7712451348bcbfed70b2dcc8818d20f95d90c525ab256cdaceac4d26f914e8ea
3
+ size 29360128
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3df3852df27eabaa3016b751b54ab317a00bd7904987ffa048c36fdf99f0cf
3
+ size 58720256
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12831f974dba4fd2993406669437196469e4cb2e4a865955511bc2bd862440a7
3
+ size 22036480
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93686dc4245e85f12cc20b2679458614c2ed2ca33383eeb650984c4116f62401
3
+ size 32833536
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e1a230dd906d2aa9c18f36c835806d57d2370313f43a2c9b12995d4436b0e57
3
+ size 29360128
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30873de097b49faf3a8b9d80295c5433ba66518cc4b67055a96065685da4ad30
3
+ size 58720256
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e49913bc3cffb9eccac7a877228f731788414606e9a4bc07313bacacafb18d88
3
+ size 27271168
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1aa0a5a9ad7f49422986d22b5079da97552420ff7f0eb0a1957ad5f94bbe5253
3
+ size 29360128
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e01ca1b9f7295fe6c65fba87f84e2a29f3405085f67ae95bb466e16a30d41806
3
+ size 30949376
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f65276051e49f60120002688826683827385981e954be78c0c754653b32df733
3
+ size 58720256
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14886dc2b22de5d5aad178a9510b14f5d2d8cd1b7bf401dffec6ea4287f04064
3
+ size 25174016
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7419bf0b33f82107a26b5644604822a9f746a193f74a9201f65c1880bb1be26d
3
+ size 29360128
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e43d7babb35294e524cad4e37069341f0cb72c98b5ead736bd590aaa9e12afbc
3
+ size 58720256
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd9b16e879c40a046315e107e26bab8df07394f2cde4adaf51a5606feb964004
3
+ size 33046528
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb5fd175492192eba07857acc8277a7e186821c6678b5870fca96f51ec4e6841
3
+ size 33054720
params_shard_50.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38a781aba767ce6dd17ea437d36a9501f02157df4e855eafd0d69ff8a061ab22
3
+ size 29360128
params_shard_51.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1615bec0c9fc502a330d22a6891897211e706d26fc181d07aa470b631a8394e
3
+ size 58720256