Upload folder using huggingface_hub
Browse files
- README.md +6 -6
- config.json +1 -1
- mergekit_config.yml +2 -2
- model-00001-of-00001.safetensors +1 -1
README.md
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
---
|
2 |
base_model:
|
3 |
-
- autoprogrammer/Llama-3.2-1B-Instruct-sw
|
4 |
-
- autoprogrammer/Llama-3.2-1B-Instruct-be
|
5 |
- autoprogrammer/Llama-3.2-1B-Instruct-zh
|
|
|
|
|
6 |
library_name: transformers
|
7 |
tags:
|
8 |
- mergekit
|
@@ -16,13 +16,13 @@ This is a merge of pre-trained language models created using [mergekit](https://
|
|
16 |
## Merge Details
|
17 |
### Merge Method
|
18 |
|
19 |
-
This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge method using [autoprogrammer/Llama-3.2-1B-Instruct-be](https://huggingface.co/autoprogrammer/Llama-3.2-1B-Instruct-be) as a base.
|
20 |
|
21 |
### Models Merged
|
22 |
|
23 |
The following models were included in the merge:
|
24 |
-
* [autoprogrammer/Llama-3.2-1B-Instruct-sw](https://huggingface.co/autoprogrammer/Llama-3.2-1B-Instruct-sw)
|
25 |
* [autoprogrammer/Llama-3.2-1B-Instruct-zh](https://huggingface.co/autoprogrammer/Llama-3.2-1B-Instruct-zh)
|
|
|
26 |
|
27 |
### Configuration
|
28 |
|
@@ -30,7 +30,7 @@ The following YAML configuration was used to produce this model:
|
|
30 |
|
31 |
```yaml
|
32 |
models:
|
33 |
-
- model: autoprogrammer/Llama-3.2-1B-Instruct-be
|
34 |
- model: autoprogrammer/Llama-3.2-1B-Instruct-sw
|
35 |
parameters:
|
36 |
density: 1.0
|
@@ -40,7 +40,7 @@ models:
|
|
40 |
density: 1.0
|
41 |
weight: 1.0
|
42 |
merge_method: ties
|
43 |
-
base_model: autoprogrammer/Llama-3.2-1B-Instruct-be
|
44 |
parameters:
|
45 |
normalize: true
|
46 |
dtype: float16
|
|
|
1 |
---
|
2 |
base_model:
|
|
|
|
|
3 |
- autoprogrammer/Llama-3.2-1B-Instruct-zh
|
4 |
+
- autoprogrammer/Llama-3.2-1B-Instruct-sw
|
5 |
+
- autoprogrammer/Llama-3.2-1B-Instruct-th
|
6 |
library_name: transformers
|
7 |
tags:
|
8 |
- mergekit
|
|
|
16 |
## Merge Details
|
17 |
### Merge Method
|
18 |
|
19 |
+
This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge method using [autoprogrammer/Llama-3.2-1B-Instruct-th](https://huggingface.co/autoprogrammer/Llama-3.2-1B-Instruct-th) as a base.
|
20 |
|
21 |
### Models Merged
|
22 |
|
23 |
The following models were included in the merge:
|
|
|
24 |
* [autoprogrammer/Llama-3.2-1B-Instruct-zh](https://huggingface.co/autoprogrammer/Llama-3.2-1B-Instruct-zh)
|
25 |
+
* [autoprogrammer/Llama-3.2-1B-Instruct-sw](https://huggingface.co/autoprogrammer/Llama-3.2-1B-Instruct-sw)
|
26 |
|
27 |
### Configuration
|
28 |
|
|
|
30 |
|
31 |
```yaml
|
32 |
models:
|
33 |
+
- model: autoprogrammer/Llama-3.2-1B-Instruct-th
|
34 |
- model: autoprogrammer/Llama-3.2-1B-Instruct-sw
|
35 |
parameters:
|
36 |
density: 1.0
|
|
|
40 |
density: 1.0
|
41 |
weight: 1.0
|
42 |
merge_method: ties
|
43 |
+
base_model: autoprogrammer/Llama-3.2-1B-Instruct-th
|
44 |
parameters:
|
45 |
normalize: true
|
46 |
dtype: float16
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "autoprogrammer/Llama-3.2-1B-Instruct-be",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "autoprogrammer/Llama-3.2-1B-Instruct-th",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
mergekit_config.yml
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
models:
|
2 |
-
- model: autoprogrammer/Llama-3.2-1B-Instruct-be
|
3 |
- model: autoprogrammer/Llama-3.2-1B-Instruct-sw
|
4 |
parameters:
|
5 |
density: 1.0
|
@@ -9,7 +9,7 @@ models:
|
|
9 |
density: 1.0
|
10 |
weight: 1.0
|
11 |
merge_method: ties
|
12 |
-
base_model: autoprogrammer/Llama-3.2-1B-Instruct-be
|
13 |
parameters:
|
14 |
normalize: true
|
15 |
dtype: float16
|
|
|
1 |
models:
|
2 |
+
- model: autoprogrammer/Llama-3.2-1B-Instruct-th
|
3 |
- model: autoprogrammer/Llama-3.2-1B-Instruct-sw
|
4 |
parameters:
|
5 |
density: 1.0
|
|
|
9 |
density: 1.0
|
10 |
weight: 1.0
|
11 |
merge_method: ties
|
12 |
+
base_model: autoprogrammer/Llama-3.2-1B-Instruct-th
|
13 |
parameters:
|
14 |
normalize: true
|
15 |
dtype: float16
|
model-00001-of-00001.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2471645464
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd70beb576bd1a82e796d16a10c58771d08343f3c123df9ad7b10c2ffc1a00cd
|
3 |
size 2471645464
|