Muhammad Mubeen ASIF committed on
Commit
6818c85
·
1 Parent(s): cc5ddf3

Add Aftershock model weights

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
README.md ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: mlc-llm
3
+ base_model: meta-llama/Llama-3.2-3B-Instruct
4
+ tags:
5
+ - mlc-llm
6
+ - web-llm
7
+ ---
8
+
9
+ # Llama-3.2-3B-Instruct-q4f16_1-MLC
10
+
11
+ This is the [Llama-3.2-3B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct) model in MLC format `q4f16_1`.
12
+ The model can be used with the [MLC-LLM](https://github.com/mlc-ai/mlc-llm) and [WebLLM](https://github.com/mlc-ai/web-llm) projects.
13
+
14
+ ## Example Usage
15
+
16
+ Here are some examples of using this model in MLC LLM.
17
+ Before running the examples, please install MLC LLM by following the [installation documentation](https://llm.mlc.ai/docs/install/mlc_llm.html#install-mlc-packages).
18
+
19
+ ### Chat
20
+
21
+ On the command line, run:
22
+ ```bash
23
+ mlc_llm chat HF://mlc-ai/Llama-3.2-3B-Instruct-q4f16_1-MLC
24
+ ```
25
+
26
+ ### REST Server
27
+
28
+ On the command line, run:
29
+ ```bash
30
+ mlc_llm serve HF://mlc-ai/Llama-3.2-3B-Instruct-q4f16_1-MLC
31
+ ```
32
+
33
+ ### Python API
34
+
35
+ ```python
36
+ from mlc_llm import MLCEngine
37
+
38
+ # Create engine
39
+ model = "HF://mlc-ai/Llama-3.2-3B-Instruct-q4f16_1-MLC"
40
+ engine = MLCEngine(model)
41
+
42
+ # Run a streaming chat completion through the OpenAI-style API.
43
+ for response in engine.chat.completions.create(
44
+ messages=[{"role": "user", "content": "What is the meaning of life?"}],
45
+ model=model,
46
+ stream=True,
47
+ ):
48
+ for choice in response.choices:
49
+ print(choice.delta.content, end="", flush=True)
50
+ print("\n")
51
+
52
+ engine.terminate()
53
+ ```
54
+
55
+ ## Documentation
56
+
57
+ For more information on the MLC LLM project, please visit our [documentation](https://llm.mlc.ai/docs/) and [GitHub repo](https://github.com/mlc-ai/mlc-llm).
mlc-chat-config.json ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "llama",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_size": 3072,
7
+ "intermediate_size": 8192,
8
+ "num_attention_heads": 24,
9
+ "num_hidden_layers": 28,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 128256,
12
+ "tie_word_embeddings": true,
13
+ "position_embedding_base": 500000.0,
14
+ "rope_scaling": {
15
+ "factor": 32.0,
16
+ "high_freq_factor": 4.0,
17
+ "low_freq_factor": 1.0,
18
+ "original_max_position_embeddings": 8192,
19
+ "rope_type": "llama3"
20
+ },
21
+ "context_window_size": 131072,
22
+ "prefill_chunk_size": 8192,
23
+ "num_key_value_heads": 8,
24
+ "head_dim": 128,
25
+ "tensor_parallel_shards": 1,
26
+ "pipeline_parallel_stages": 1,
27
+ "max_batch_size": 128
28
+ },
29
+ "vocab_size": 128256,
30
+ "context_window_size": 131072,
31
+ "sliding_window_size": -1,
32
+ "prefill_chunk_size": 8192,
33
+ "attention_sink_size": -1,
34
+ "tensor_parallel_shards": 1,
35
+ "pipeline_parallel_stages": 1,
36
+ "temperature": 0.6,
37
+ "presence_penalty": 0.0,
38
+ "frequency_penalty": 0.0,
39
+ "repetition_penalty": 1.0,
40
+ "top_p": 0.9,
41
+ "tokenizer_files": [
42
+ "tokenizer.json",
43
+ "tokenizer_config.json"
44
+ ],
45
+ "tokenizer_info": {
46
+ "token_postproc_method": "byte_level",
47
+ "prepend_space_in_encode": false,
48
+ "strip_space_in_decode": false
49
+ },
50
+ "conv_template": {
51
+ "name": "llama-3_1",
52
+ "system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}<|eot_id|>",
53
+ "system_message": "You are a seasoned disaster-response expert—someone who has weathered earthquakes, hurricanes, floods, and other catastrophic events, improvising under extreme pressure. The user may be trapped or endangered by a recent disaster with no outside rescue currently available. Your role is to provide urgent, direct instructions to survive, secure temporary safety, and potentially signal for help right now. No long explanations, no disclaimers, no future-preparation advice (unless asked), and no environmental ethics. Short, clear, and immediately actionable steps only. Focus on what they can do this moment to stay alive until rescue or relief arrives.",
54
+ "system_prefix_token_ids": [
55
+ 128000
56
+ ],
57
+ "add_role_after_system_message": true,
58
+ "roles": {
59
+ "user": "<|start_header_id|>user",
60
+ "assistant": "<|start_header_id|>assistant",
61
+ "tool": "<|start_header_id|>ipython"
62
+ },
63
+ "role_templates": {
64
+ "user": "{user_message}",
65
+ "assistant": "{assistant_message}",
66
+ "tool": "{tool_message}"
67
+ },
68
+ "messages": [],
69
+ "seps": [
70
+ "<|eot_id|>"
71
+ ],
72
+ "role_content_sep": "<|end_header_id|>\n\n",
73
+ "role_empty_sep": "<|end_header_id|>\n\n",
74
+ "stop_str": [],
75
+ "stop_token_ids": [
76
+ 128001,
77
+ 128008,
78
+ 128009
79
+ ],
80
+ "function_string": "",
81
+ "use_function_calling": false
82
+ },
83
+ "pad_token_id": 0,
84
+ "bos_token_id": 128000,
85
+ "eos_token_id": [
86
+ 128001,
87
+ 128008,
88
+ 128009
89
+ ]
90
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a951e3919bf7eeec642bc7e230ed65e5939525518aac1b0d63a77a903f00a3af
3
+ size 197001216
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61bd122da9ba7c5bcb2a12848a11e6adbc2a8bb16fe776bdff26d472adeda584
3
+ size 24631296
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62d6152a118d8b70e8036693da584b4031d049ad435e9637f285563e48afdbe9
3
+ size 25165824
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b6e202e5949e38ccb274c0ff7fd083a0b0dfeaf09fd5994114af0a78b184dda
3
+ size 31469568
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f872c0e92f751566f59c81ebe995ec78aaf3d3d8660d4306b9ef730ec8a2ff9
3
+ size 25165824
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a66c2d8b70ff909afb1c4b85f23ef6f8a8ba691da1ed532a8ff3fcfc6f6b215
3
+ size 31469568
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f57181d8d3cf869f79d8a64aadd898e962b5707cc4ef2256aad077c5212840c8
3
+ size 25165824
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c068a9858693c9ad885631e4afb7dc0523a27394fc33896c1653dd64f03f6d9e
3
+ size 31469568
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ed4668aaf53dbfb252416393b43d0ce322ead04231532c3c5856cb516b5225
3
+ size 25165824
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d8cd69396df316e0916ff9d5dd9740ad1cd212dc897fbd0f3fd46affeab3af
3
+ size 31469568
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b461205adf6e65de20d0beacaaf33d2e0780b469109b72faf0fe3145321b915
3
+ size 25165824
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42035fe64e1c2741c687fe24796952a597413bf1eb261959651d2a1df4670b2e
3
+ size 31469568
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e17ca6643eb8e789b49f127fe2591b11192695a4fd741fd0dd98cbff6a053be8
3
+ size 25165824
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81325c8902fa6cb9e3e6255fb73d6182e914be11e15be7c6c54939460245626
3
+ size 25165824
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dde033a0a14270703349e6130d2e07d1f0022efe2083fb97d68c2ec7632be360
3
+ size 31469568
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2a655396c8424c7c550c329784636582def2a63455b7b0856bd819ef9c6ac3d
3
+ size 25165824
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e1aa5e378885b0ccf4b5369cc494859b6e1692f63ad964d90483159f6d985fe
3
+ size 31469568
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0506a104b3472d44e9fc073762bdfe8bf54d699a32c92791b6685fafbc4e0c52
3
+ size 25165824
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2268da36d0c9af20dfad6c1eae8ab93b296986fc81be492ed42521f0a3a4e668
3
+ size 31469568
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17c4e0c14a213fdc25e73bc9c053a23b66b917dcace63dd80a86ac6287b97bec
3
+ size 25165824
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c5703660618bce8550322d89a25406903f0d2f8632239cc8c2db7cf8f9e2ef3
3
+ size 25165824
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4711d82ed31722ec4c29191c3f3799c3a67e79f8bf3ec6f5024d11e97a7c4f96
3
+ size 31463424
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec86c867cb7c28cec0b1aa75e8b8908a4b6a637e4b853e87a824610a314c563d
3
+ size 25165824
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7a0a42a6c3ecf99f1a246767dc74d75e01f66e17107278e031b99480831eb2a
3
+ size 31469568
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51da8ca2cf1b8a06a858964a810e139bc9ac4d798264733b66a5d0dc2a614da2
3
+ size 31463424
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e15e11d12d1dce155d82c8a86c9d65f9f6672619d2bd94095cfedf22b35323
3
+ size 25165824
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8c0d05774b3598e188d4ad0f51f55960d199258346c778e603eba6c4f0f2865
3
+ size 31469568
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68a4a36ab86071861b15bf93451fc1f9bce3ba12cef09e98962dd68d8dc4b777
3
+ size 25165824
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea02faa166b1e66a15cebfe56ae1915a31297fefcc7c948c767b1f384e44d6de
3
+ size 31469568
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36f2ef2e1df825c008c05d00131bc3cb0b8d0b706e5bd919e9f2a09c44108cda
3
+ size 25165824
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be5b4473818cbc4028a705a90e90d73de26ffe13baacfa26ddb3963d669f428b
3
+ size 31469568
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f7510ab784761b34d72497837c4acfb1ec7a39819bf3ae42b903e66e1eca9be
3
+ size 25165824
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5799c08e97223606a54cf9de51d5b74c16660d31aaf7c37d454c3639686b4e5d
3
+ size 31469568
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa70991654b0e414e39e07d1668029eb7f8b37d26f0126b3e65418a7e609b541
3
+ size 25165824
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb7425f779e11f96e218f4d7a0a8a4cb6615c9749bb44a9dcf5b37bbdef4848
3
+ size 25165824
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd8ae75b1e364555f5d96c7785773218c914b8178fcc99b14d01780ce189f13d
3
+ size 31469568
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db00f6e9c7df9bb93723b852fbd0d48b94c1f2ede724c125ddfc8459ef2edb92
3
+ size 25165824
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:392e9be8d1448d88b9a176ca995f4a8f1935030d8390f746da9d1e4adeb3e378
3
+ size 31469568
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:606d027b72d2e943943f48c18af7824904c6ee79835522d8d38afe2fc0f3c106
3
+ size 31481856
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2983592dea44f56248fad4e288d50974a0034aeebe3754b55a27b53dc9d634af
3
+ size 25165824
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40e0ffe196f5dd5dbf9ffce948c77109f4e413b34a32374bffe69c61c30b3ed1
3
+ size 31469568
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad605f15089c3c5a8482085f7c5c0ca346702add811753408be35b131e897ef6
3
+ size 25165824
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea48c5658a1ddc5bdffe03c8e5fd94ffc90ff5ea8fde327393a9493b5f50fd61
3
+ size 31469568
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b491ccf6d5958d4bcceba41f8bf32408d6c0a47ede5eddda45ff9ecf406562d1
3
+ size 25165824
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b838c2c0c86795ed8a6130133be330ee58dedc4054218a65f5e629f114f7b3d1
3
+ size 31469568
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51828e11f883e8958a0f9f167511cb93b317c54125436e8413a6873950a3499f
3
+ size 31469568
params_shard_50.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:073a1286f7b065fc516f81ca815bb0bad5fb45f446ef27c8581aa4719dc93cab
3
+ size 25165824