vignesh-spericorn committed on
Commit
e3eecf3
·
verified ·
1 Parent(s): e0281bd

Quantized Llama-3-8B-Instruct model for Android.

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Llama-3-8B-Instruct-q4f16_1-android.tar ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:468c2d596eba75863af3cdc4860c644c7f79918ec35f9f239df27d76821d63e6
3
+ size 477047
mlc-chat-config.json ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "llama",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_size": 4096,
7
+ "intermediate_size": 14336,
8
+ "num_attention_heads": 32,
9
+ "num_hidden_layers": 32,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 128256,
12
+ "tie_word_embeddings": false,
13
+ "position_embedding_base": 500000.0,
14
+ "rope_scaling": null,
15
+ "context_window_size": 8192,
16
+ "prefill_chunk_size": 1024,
17
+ "num_key_value_heads": 8,
18
+ "head_dim": 128,
19
+ "tensor_parallel_shards": 1,
20
+ "pipeline_parallel_stages": 1,
21
+ "max_batch_size": 80
22
+ },
23
+ "vocab_size": 128256,
24
+ "context_window_size": 8192,
25
+ "sliding_window_size": -1,
26
+ "prefill_chunk_size": 1024,
27
+ "attention_sink_size": -1,
28
+ "tensor_parallel_shards": 1,
29
+ "pipeline_parallel_stages": 1,
30
+ "temperature": 0.6,
31
+ "presence_penalty": 0.0,
32
+ "frequency_penalty": 0.0,
33
+ "repetition_penalty": 1.0,
34
+ "top_p": 0.9,
35
+ "tokenizer_files": [
36
+ "tokenizer.json",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_level",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "llama-3",
46
+ "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
47
+ "system_message": "You are a helpful, respectful and honest assistant.",
48
+ "system_prefix_token_ids": [
49
+ 128000
50
+ ],
51
+ "add_role_after_system_message": true,
52
+ "roles": {
53
+ "user": "<|start_header_id|>user",
54
+ "assistant": "<|start_header_id|>assistant"
55
+ },
56
+ "role_templates": {
57
+ "user": "{user_message}",
58
+ "assistant": "{assistant_message}",
59
+ "tool": "{tool_message}"
60
+ },
61
+ "messages": [],
62
+ "seps": [
63
+ "<|eot_id|>"
64
+ ],
65
+ "role_content_sep": "<|end_header_id|>\n\n",
66
+ "role_empty_sep": "<|end_header_id|>\n\n",
67
+ "stop_str": [
68
+ "<|end_of_text|>",
69
+ "<|eot_id|>"
70
+ ],
71
+ "stop_token_ids": [
72
+ 128001,
73
+ 128009
74
+ ],
75
+ "function_string": "",
76
+ "use_function_calling": false
77
+ },
78
+ "pad_token_id": 0,
79
+ "bos_token_id": 128000,
80
+ "eos_token_id": [
81
+ 128001,
82
+ 128009
83
+ ]
84
+ }
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2ed37d77cd108bf6f4ae44b752deb6d9ff230cab0d1dd6e498a7afc24733099
3
+ size 262668288
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c45006b20e9cbbf1941a106dbddd5b043a24a4484cc15f7dca444031d5e59ada
3
+ size 29360128
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92423d1e470526664d2cdd09bcf9111d813fea4cf22223636b05c2d9229a1618
3
+ size 33046528
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c745443ff322319bd8120fb43169e40167159e9dc96047b544015e601114522d
3
+ size 29360128
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddcb0155d652d7dcbdf83af1c8da095c66a2e94f30a755c7889cfc7456e30485
3
+ size 58720256
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee8a779df967099cc3684157d4c68badd7a4df554ee7ae57f7249cde1180c77e
3
+ size 22036480
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:028dcb0f5706b25a6173bf9cb2ebd4aa833f04a3bb6c0756415f63afdad91833
3
+ size 29360128
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6434d2b1cedfb96b5105758c697fafcc2380e41c29350ca1d5942f64ec7a005e
3
+ size 58720256
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:687c80c5494efe7efa0288ef9d3ffb44c1eedc8558c151da9b84d0a6f4eff583
3
+ size 27271168
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54126705bc9a09bb3310855a4ecd3d5e57c5d94b3facf877a1a400c21e871ef6
3
+ size 29360128
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e05bfa4a2c5d0bc93573a75ecd287a4938b83ee4af669fe5e9e0d3c43146bc2
3
+ size 30949376
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30130ce7c89c60aa54c00c167ca8962411178a59c24207f0ad00bfb863404fab
3
+ size 58720256
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63962a1a538ff2ecc296c6d07ff461247cfe1fa28950a97a7779dd80c4bb4d1e
3
+ size 32841728
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f655c2bf134b5b9a85f6247651ef076f624d8165b8f531e6aaa52cde8395c603
3
+ size 25174016
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bc9128b9f3c5abca94c4e13619347a1f36f539e7795552cbdbf437055e0cd9f
3
+ size 29360128
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fa3a2a4c7742eb08bc6b8b8e17d78dfeb2ec1d6490e1a16add6925ca4e79009
3
+ size 58720256
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d90de65f027fb1fc916f02ff73b55ae84e036fcf2f35fc5407ef25da61c20931
3
+ size 33046528
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36605734cb52b92aa8635262f13b15d82610da79722877194557d69b37e6463a
3
+ size 29360128
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc13fb93d3054955f68a3840818dd74ee39941c682d45e4ddcaceeca46d9b9f3
3
+ size 58720256
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab76e5856b186751326e893e227802986deaa8151329a3d2a5ba35a9e2d84b1b
3
+ size 22036480
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6597b2a99b385cb36d77a387f3a035eec1e0a2c53de017c8db246c2774d0471f
3
+ size 29360128
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f9787abf533597067187590595ca737771f089ecabe53ef76770b37e8f58f18
3
+ size 58720256
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa3a9e9df3c533bdcafa8819381d0bb3efc67d277177349cf6cafbfa84af8fca
3
+ size 27271168
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d34f1fcb18350c4f89329f1db8ae657b37ae48926dfaf8a9aa25d98c26f9a03
3
+ size 262668288
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b59ffd98eb25881c21bbc6b0843cccf12d3f98a08fe26f1030c93812131cf4f
3
+ size 29360128
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c50b2f9ff6744c1cadedb37ee0ad1c7f800ad3f607fb76003b127377b75d72d
3
+ size 30949376
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7d78304a26c4164b72a5d71450c21979e711fb88ea963e142d34165f33deb9b
3
+ size 58720256
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3223acb25be3c6f301ea8f88e2c4d0f07c6f49c65faae047984e9805cb9486fc
3
+ size 25174016
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3051a8f94165689c4cfc0c05563c9b02e351f7667d0da97f123a2ee405d38dc6
3
+ size 29360128
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de466d5e972ee871cea39086fff82049da244b471a136af264af64c4279cceb4
3
+ size 58720256
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a192ac9f10be719ca8780c989693583b894c84817205189d3b0d69f4db96f27
3
+ size 33046528
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f23031f20e901678c3188e63e5e09ced63d4395c8c34ae87b22cbb349fa3a72d
3
+ size 29360128
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b9dc05e957ab2f7df4b5699231ad6b8a0cf5e8919ee749ee11debbbd9ae18e
3
+ size 58720256
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef42d957681f632ec441cf7ddf8374c7394d6d29685a1c683624a457a4caced7
3
+ size 22036480
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2328a9e043f74b15f0843a8b02637a4b1b6e5925809c2dc53dd131aeefdc2958
3
+ size 32833536
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c1a32e5f9d72ec6a3a6e03bd929c5a0d8d3c5cca4dbc33e2234476532477e7f
3
+ size 29360128
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c925ab081cb0f0e5171b6a4111eb469e3268b5b62352e461f5f00af2093c00ed
3
+ size 58720256
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bc9760e7e0b84d91c4a674d29cf59a3f96f12a4f010190381f4e8ed08e86bca
3
+ size 27271168
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfae6aaee7745e8173fa56a0c6215cae83c01965552c0df972252bc7e190ec0a
3
+ size 29360128
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:918cf3dcea91beffd39225a5150ae89b4436558224d8dc7f5100c55770f45c0c
3
+ size 30949376
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dc0ca0b511de2388e20d5f72167ed747378f33fcfcedacca43ad5eec3bcb9db
3
+ size 58720256
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a92a6f8b7e040d97d542c7abe8c53eae25f9d474f0d1c0f51f55559e71989793
3
+ size 25174016
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4dc8c5169ca64950b8e2d836811e8a5e839d8dec1782507c5f6f4b7cb59a137
3
+ size 29360128
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ee03a62715c12b3762a8fa1ebad16d5f45bb770c8e961f24ecaf29000d3fc34
3
+ size 58720256
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91552281ad4b0958fab076436b134a0b83501dc67cb302996bc1b277c7625dc9
3
+ size 33046528
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ace01f913511f79d5795ab41f53a6d98bbd2cbd3aa5f33131bd7d9721a0ba5a5
3
+ size 33054720
params_shard_50.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:120c9cc985228f3d2df78dbfa93c107521526897c1ff51e9539d084343cd40c2
3
+ size 29360128
params_shard_51.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fc37d82901d34c2dd1cbc777d22ff8bc8772947a1986b79685f1b8e5d339e46
3
+ size 58720256