Upload folder using huggingface_hub
Browse files- README.md +13 -3
- config.json +8 -0
- embeddings_bf16.bin +3 -0
- llm.mnn +3 -0
- llm.mnn.json +3 -0
- llm.mnn.weight +3 -0
- llm_config.json +14 -0
- tokenizer.txt +0 -0
README.md
CHANGED
@@ -1,3 +1,13 @@
|
|
1 |
-
---
|
2 |
-
license: apache-2.0
|
3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
language:
|
4 |
+
- en
|
5 |
+
pipeline_tag: text-generation
|
6 |
+
tags:
|
7 |
+
- chat
|
8 |
+
---
|
9 |
+
# Qwen2.5-0.5B-Instruct-MNN
|
10 |
+
|
11 |
+
## Introduction
|
12 |
+
|
13 |
+
This model is a 4-bit quantized MNN model exported from Qwen2.5-0.5B-Instruct using [llm-export](https://github.com/wangzhaode/llm-export).
|
config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"llm_model": "llm.mnn",
|
3 |
+
"llm_weight": "llm.mnn.weight",
|
4 |
+
"backend_type": "cpu",
|
5 |
+
"thread_num": 4,
|
6 |
+
"precision": "low",
|
7 |
+
"memory": "low"
|
8 |
+
}
|
embeddings_bf16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e96b0df6d274768cbb7e72404011853d23349999b658dc2f4dfb3c431ea223f
|
3 |
+
size 272269312
|
llm.mnn
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:480da511e603bd82f8d4af4e1f778ad72baadf8307f3585465ad9a94daca1a88
|
3 |
+
size 566264
|
llm.mnn.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:245ce4289f456dcb371a8f8deabf75c3c4ee75f34b19e0d9723ba09b2fbacf8c
|
3 |
+
size 2808932
|
llm.mnn.weight
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ed0f4dcdd31dca15fcb548d2fc8b63b0014031fbd5f627508435726f90c75da
|
3 |
+
size 277967498
|
llm_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"hidden_size": 896,
|
3 |
+
"layer_nums": 24,
|
4 |
+
"attention_mask": "float",
|
5 |
+
"key_value_shape": [
|
6 |
+
2,
|
7 |
+
1,
|
8 |
+
0,
|
9 |
+
2,
|
10 |
+
64
|
11 |
+
],
|
12 |
+
"prompt_template": "<|im_start|>user\n%s<|im_end|>\n<|im_start|>assistant\n",
|
13 |
+
"is_visual": false
|
14 |
+
}
|
tokenizer.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|