Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +17 -0
- added_tokens.json +3 -0
- config.json +30 -0
- mergekit_config.yml +30 -0
- merges.txt +0 -0
- model-00001-of-00082.safetensors +3 -0
- model-00002-of-00082.safetensors +3 -0
- model-00003-of-00082.safetensors +3 -0
- model-00004-of-00082.safetensors +3 -0
- model-00005-of-00082.safetensors +3 -0
- model-00006-of-00082.safetensors +3 -0
- model-00007-of-00082.safetensors +3 -0
- model-00008-of-00082.safetensors +3 -0
- model-00009-of-00082.safetensors +3 -0
- model-00010-of-00082.safetensors +3 -0
- model-00011-of-00082.safetensors +3 -0
- model-00012-of-00082.safetensors +3 -0
- model-00013-of-00082.safetensors +3 -0
- model-00014-of-00082.safetensors +3 -0
- model-00015-of-00082.safetensors +3 -0
- model-00016-of-00082.safetensors +3 -0
- model-00017-of-00082.safetensors +3 -0
- model-00018-of-00082.safetensors +3 -0
- model-00019-of-00082.safetensors +3 -0
- model-00020-of-00082.safetensors +3 -0
- model-00021-of-00082.safetensors +3 -0
- model-00022-of-00082.safetensors +3 -0
- model-00023-of-00082.safetensors +3 -0
- model-00024-of-00082.safetensors +3 -0
- model-00025-of-00082.safetensors +3 -0
- model-00026-of-00082.safetensors +3 -0
- model-00027-of-00082.safetensors +3 -0
- model-00028-of-00082.safetensors +3 -0
- model-00029-of-00082.safetensors +3 -0
- model-00030-of-00082.safetensors +3 -0
- model-00031-of-00082.safetensors +3 -0
- model-00032-of-00082.safetensors +3 -0
- model-00033-of-00082.safetensors +3 -0
- model-00034-of-00082.safetensors +3 -0
- model-00035-of-00082.safetensors +3 -0
- model-00036-of-00082.safetensors +3 -0
- model-00037-of-00082.safetensors +3 -0
- model-00038-of-00082.safetensors +3 -0
- model-00039-of-00082.safetensors +3 -0
- model-00040-of-00082.safetensors +3 -0
- model-00041-of-00082.safetensors +3 -0
- model-00042-of-00082.safetensors +3 -0
- model-00043-of-00082.safetensors +3 -0
- model-00044-of-00082.safetensors +3 -0
- model-00045-of-00082.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- merge
|
5 |
+
- mergekit
|
6 |
+
- lazymergekit
|
7 |
+
- migtissera/Tess-72B-v1.5b
|
8 |
+
- davidkim205/Rhea-72b-v0.5
|
9 |
+
---
|
10 |
+
|
11 |
+
# TW3-JRGL-v4
|
12 |
+
|
13 |
+
TW3-JRGL-v4 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
|
14 |
+
* [migtissera/Tess-72B-v1.5b](https://huggingface.co/migtissera/Tess-72B-v1.5b)
|
15 |
+
* [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
|
16 |
+
|
17 |
+
## 🧩 Configuration
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[PAD]": 151851
|
3 |
+
}
|
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "migtissera/Tess-72B-v1.5b",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128245,
|
9 |
+
"eos_token_id": 128247,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 24576,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 64,
|
19 |
+
"pad_token_id": 151643,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-06,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 1000000,
|
24 |
+
"seq_length": 32768,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.39.3",
|
28 |
+
"use_cache": false,
|
29 |
+
"vocab_size": 152064
|
30 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: migtissera/Tess-72B-v1.5b
|
2 |
+
dtype: bfloat16
|
3 |
+
merge_method: slerp
|
4 |
+
parameters:
|
5 |
+
t:
|
6 |
+
- filter: self_attn
|
7 |
+
value:
|
8 |
+
- 0
|
9 |
+
- 0.5
|
10 |
+
- 0.3
|
11 |
+
- 0.7
|
12 |
+
- 1
|
13 |
+
- filter: mlp
|
14 |
+
value:
|
15 |
+
- 1
|
16 |
+
- 0.5
|
17 |
+
- 0.7
|
18 |
+
- 0.3
|
19 |
+
- 0
|
20 |
+
- value: 0.5
|
21 |
+
slices:
|
22 |
+
- sources:
|
23 |
+
- layer_range:
|
24 |
+
- 0
|
25 |
+
- 80
|
26 |
+
model: migtissera/Tess-72B-v1.5b
|
27 |
+
- layer_range:
|
28 |
+
- 0
|
29 |
+
- 80
|
30 |
+
model: davidkim205/Rhea-72b-v0.5
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b076fba39171b1f315254c357286e41f81c082572bc4aaf947e96cd92b5f58fb
|
3 |
+
size 1879164616
|
model-00002-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf66cecfbbf417ba05714ad6aaa6297be5626f111344f1ea02afe616bf0919d8
|
3 |
+
size 402703024
|
model-00003-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a43130851c7ad8e89a98e9efe296ded2bde233d177d5ae3ccd92e44e3a5a9df
|
3 |
+
size 2491416720
|
model-00004-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cffdb823c4185c67998755c21e53ac79aa37062e828f14279cac897be85d142
|
3 |
+
size 1879164616
|
model-00005-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f972250550d8270ce1505d3dc57484bdb9b8ecf439c64a628ff0b9eba9b38cc3
|
3 |
+
size 1879164608
|
model-00006-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7652acaaf081e4f05a1035426f9d5c7b886edffd15c4eca346c65ed3bdbd3cfd
|
3 |
+
size 1610646216
|
model-00007-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa26f86c541b957a56815b8c1dc0036831574876af51b3ede7885bdaa6884ac6
|
3 |
+
size 1744930280
|
model-00008-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28c1c7aaf672a137595dc53a3978d34f341ad80ff51930b72c1a7402cd3c39f0
|
3 |
+
size 1744930280
|
model-00009-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4142891839942a500e1eb509aca4d14510c37f22742dbc78e5b1ab831759bac0
|
3 |
+
size 1879131376
|
model-00010-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f66787cf9bfd4405016ded7cf99e7a6c19e8c7572a8277df2b3bad291be988ee
|
3 |
+
size 1879148128
|
model-00011-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a47ec7685d2b05e11071901d6744e5a23b6eeb24966437e7168910336f202c3
|
3 |
+
size 1879164616
|
model-00012-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a81d18b0e16ac4576045099d5e447e835f365b3f9cbd52b3edef9037b0c5911b
|
3 |
+
size 1610712664
|
model-00013-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f8bd9531bb00829755c5adf289694c5c2c75f801dd3c254f78e1371c3eee51d
|
3 |
+
size 1744930288
|
model-00014-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a18bcadedbf0f6da21672c623d5e84228ea43f56074845f1f6048cd3b19fd280
|
3 |
+
size 1879214112
|
model-00015-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e64783f011149fc6889ac4da2258ac7b0da9bd6fa72f8e07a60c033f46f08fa0
|
3 |
+
size 1879148136
|
model-00016-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cb2937f6beb04956dc805e2c4b4d13a70501418c499644d9022df7b67d8211f
|
3 |
+
size 1879164632
|
model-00017-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebd65edb71bf5ea57b27ff626e96f1856441a16936779f1882a91dda06e3691a
|
3 |
+
size 1610695936
|
model-00018-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28df20056453843e2a20fef4722a71581c1d5c1ce97ce212195248709de6ffb2
|
3 |
+
size 1744930288
|
model-00019-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a12d96df5f8b9f996df4e49b04efe1ba4c79f96aab28971ae78ffe71c9a50c6
|
3 |
+
size 1744930288
|
model-00020-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e68482fadbb7ddafb7cc48d7c87b1ba04ef57a13b1d6d7f10a7620364cac7f4d
|
3 |
+
size 1610646216
|
model-00021-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f55fd252981c4b4496994a35e69c308dd81709f4240428166e83c82ee0a05192
|
3 |
+
size 1744930288
|
model-00022-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2ee36362167c098f85dca3f951242aaf16ca364aabb3b1a5cea6e22441aca8
|
3 |
+
size 1744930288
|
model-00023-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7ddc843e86e21322a91e45c46c436ddba7e9a1bd291792a02d6184fb96990ae
|
3 |
+
size 1879181112
|
model-00024-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34c925f1746b58160b1b33030054d50c55460f94c13286fcc667cf47d942ac96
|
3 |
+
size 1879148128
|
model-00025-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9974d20698c08ce4e59f40d83048020aec42069754f1127ba4bb045a7f96d95b
|
3 |
+
size 1744930280
|
model-00026-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bdab875af7115c5b444675c77f6639b789c34ee708b65e429fe8a4b41dae4b3
|
3 |
+
size 1744897296
|
model-00027-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7453aa485829f08c09f2215d5dcb2dacfdc82742f42e7d9ccbae462bf5da5407
|
3 |
+
size 1744930288
|
model-00028-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5a5e4e1b4f60a00b83ea65fd4df51f62afe6db0e45849b4750b43244e29b175
|
3 |
+
size 1879247336
|
model-00029-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0462f41dfea71d13337091296f71ef885a284aca61a975dac368701522018131
|
3 |
+
size 1744930280
|
model-00030-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63db7e907803c4a9841bce9b73219dcf8e9e493943b94daaf398b8bc01f222f2
|
3 |
+
size 1744930280
|
model-00031-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d606c8c96ae446716cdbba966778947fc8afd16f764ebe6c9c378e8ec1c45ef1
|
3 |
+
size 1879114896
|
model-00032-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aa7f0d92104f3d7fa7effa45e9d5eabb129ab8b651b5128d0d4575b93764e5d
|
3 |
+
size 1744930288
|
model-00033-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:883ecfd3bc0118fc3fa2686ed604193d1a0b489596512cf115721a0a74bf3382
|
3 |
+
size 1744930288
|
model-00034-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ec762ed683af045c83f1b183965046c2dda2254280f64b6d2ed2dda23feeac1
|
3 |
+
size 1879147896
|
model-00035-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abfa943d8ace0a21f18214bb37afe4cb3ab69933e678983a0082ed417c331c7d
|
3 |
+
size 1879164632
|
model-00036-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffccaa5bca70ffcfa339fdc80a779f8369e0d6075ed037732a12d8411cd050be
|
3 |
+
size 1610695944
|
model-00037-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7611617dee33c0d85a5f8d8104ffeb0108297d492cf3de36997fbfa7cc00c6e
|
3 |
+
size 1744897296
|
model-00038-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a11eafc0f96c785a2bc8ac952c7d81ec9b2251cbe32d98fc04a90aee3879dfc7
|
3 |
+
size 1744930288
|
model-00039-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4351ec87134658eda01e4799ea8108a40a5dd2c49cf38d3dc699f16f1e78537
|
3 |
+
size 1879181112
|
model-00040-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9c5cfa84f58955bd5029f0f416656f22f4b1bd264e62ea5eabc0c96859d0a8c
|
3 |
+
size 1879148136
|
model-00041-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43a56ae6bdf87b5d23a58a76650f8a7d93515e77099d739f698747e8dd01f070
|
3 |
+
size 1879164632
|
model-00042-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d221cf041935f6cfbc8210d5f0bcd6ea156106944f521adc08491e31e37c093f
|
3 |
+
size 1879164624
|
model-00043-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a55dda9830fc1b8f66a77905f88a39f33a244b30b53fb8be48c963ad58e15ef2
|
3 |
+
size 1744930288
|
model-00044-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f6dc79cf95ac4569b8c983ee85b1a3b488db6b8e7e8419e1256081cc27e05dc
|
3 |
+
size 1879214112
|
model-00045-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:909734628ea75aae199d55c6bfab6e5cb5b9eb4d7e4c9d289a4c8b469caf1b5c
|
3 |
+
size 1879148128
|