allknowingroger
committed on
Commit
•
92d0e9b
1
Parent(s):
47a58a3
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- README.md +38 -0
- added_tokens.json +5 -0
- config.json +29 -0
- mergekit_config.yml +8 -0
- merges.txt +0 -0
- model-00001-of-00067.safetensors +3 -0
- model-00002-of-00067.safetensors +3 -0
- model-00003-of-00067.safetensors +3 -0
- model-00004-of-00067.safetensors +3 -0
- model-00005-of-00067.safetensors +3 -0
- model-00006-of-00067.safetensors +3 -0
- model-00007-of-00067.safetensors +3 -0
- model-00008-of-00067.safetensors +3 -0
- model-00009-of-00067.safetensors +3 -0
- model-00010-of-00067.safetensors +3 -0
- model-00011-of-00067.safetensors +3 -0
- model-00012-of-00067.safetensors +3 -0
- model-00013-of-00067.safetensors +3 -0
- model-00014-of-00067.safetensors +3 -0
- model-00015-of-00067.safetensors +3 -0
- model-00016-of-00067.safetensors +3 -0
- model-00017-of-00067.safetensors +3 -0
- model-00018-of-00067.safetensors +3 -0
- model-00019-of-00067.safetensors +3 -0
- model-00020-of-00067.safetensors +3 -0
- model-00021-of-00067.safetensors +3 -0
- model-00022-of-00067.safetensors +3 -0
- model-00023-of-00067.safetensors +3 -0
- model-00024-of-00067.safetensors +3 -0
- model-00025-of-00067.safetensors +3 -0
- model-00026-of-00067.safetensors +3 -0
- model-00027-of-00067.safetensors +3 -0
- model-00028-of-00067.safetensors +3 -0
- model-00029-of-00067.safetensors +3 -0
- model-00030-of-00067.safetensors +3 -0
- model-00031-of-00067.safetensors +3 -0
- model-00032-of-00067.safetensors +3 -0
- model-00033-of-00067.safetensors +3 -0
- model-00034-of-00067.safetensors +3 -0
- model-00035-of-00067.safetensors +3 -0
- model-00036-of-00067.safetensors +3 -0
- model-00037-of-00067.safetensors +3 -0
- model-00038-of-00067.safetensors +3 -0
- model-00039-of-00067.safetensors +3 -0
- model-00040-of-00067.safetensors +3 -0
- model-00041-of-00067.safetensors +3 -0
- model-00042-of-00067.safetensors +3 -0
- model-00043-of-00067.safetensors +3 -0
- model-00044-of-00067.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model:
|
3 |
+
- dnhkng/RYS-XLarge
|
4 |
+
library_name: transformers
|
5 |
+
tags:
|
6 |
+
- mergekit
|
7 |
+
- merge
|
8 |
+
|
9 |
+
---
|
10 |
+
# merge
|
11 |
+
|
12 |
+
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
13 |
+
|
14 |
+
## Merge Details
|
15 |
+
### Merge Method
|
16 |
+
|
17 |
+
This model was merged using the SLERP merge method.
|
18 |
+
|
19 |
+
### Models Merged
|
20 |
+
|
21 |
+
The following models were included in the merge:
|
22 |
+
* [dnhkng/RYS-XLarge](https://huggingface.co/dnhkng/RYS-XLarge)
|
23 |
+
|
24 |
+
### Configuration
|
25 |
+
|
26 |
+
The following YAML configuration was used to produce this model:
|
27 |
+
|
28 |
+
```yaml
|
29 |
+
models:
|
30 |
+
- model: dnhkng/RYS-XLarge
|
31 |
+
- model: dnhkng/RYS-XLarge
|
32 |
+
merge_method: slerp
|
33 |
+
base_model: dnhkng/RYS-XLarge
|
34 |
+
dtype: float32
|
35 |
+
parameters:
|
36 |
+
t: [0, 0.5, 1, 0.5, 0] # inverted-V curve across layers: t=0 (base_model) at the input & output ends, t=1 (the other listed model) in the middle; both entries here are dnhkng/RYS-XLarge
|
37 |
+
|
38 |
+
```
|
added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|endoftext|>": 151643,
|
3 |
+
"<|im_end|>": 151645,
|
4 |
+
"<|im_start|>": 151644
|
5 |
+
}
|
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "dnhkng/RYS-XLarge",
|
3 |
+
"architectures": [
|
4 |
+
"Qwen2ForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"eos_token_id": 151645,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8192,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 29568,
|
13 |
+
"max_position_embeddings": 32768,
|
14 |
+
"max_window_layers": 80,
|
15 |
+
"model_type": "qwen2",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 86,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"rms_norm_eps": 1e-06,
|
20 |
+
"rope_scaling": null,
|
21 |
+
"rope_theta": 1000000.0,
|
22 |
+
"sliding_window": null,
|
23 |
+
"tie_word_embeddings": false,
|
24 |
+
"torch_dtype": "float32",
|
25 |
+
"transformers_version": "4.45.1",
|
26 |
+
"use_cache": true,
|
27 |
+
"use_sliding_window": false,
|
28 |
+
"vocab_size": 151646
|
29 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
models:
|
2 |
+
- model: dnhkng/RYS-XLarge
|
3 |
+
- model: dnhkng/RYS-XLarge
|
4 |
+
merge_method: slerp
|
5 |
+
base_model: dnhkng/RYS-XLarge
|
6 |
+
dtype: float32
|
7 |
+
parameters:
|
8 |
+
t: [0, 0.5, 1, 0.5, 0] # inverted-V curve across layers: t=0 (base_model) at the input & output ends, t=1 (the other listed model) in the middle; both entries here are dnhkng/RYS-XLarge
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd8750203b7bcbf73618d3ded41abdc194f65eb92cbad236acab842a187b5cb
|
3 |
+
size 4969136256
|
model-00002-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d291d8cbed14d98a958946ffafba43e204e2f2bf1be460798f8aafc080d1614
|
3 |
+
size 4969169144
|
model-00003-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d2c4c8fa91881bb501b342a999ac3f22e55c3e9c19f07504a4dce50812f851d
|
3 |
+
size 4479624672
|
model-00004-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e47c87936d1c47ba254cc87a70df5125f85a5c2849228da246f7b4c9ba6cf6d6
|
3 |
+
size 4479624680
|
model-00005-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:759f140e1e4f19b9c715b1d8819b95ecca5306d9d378956fb59198f561a804dc
|
3 |
+
size 4781684776
|
model-00006-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fcb47b8ba325c41e1df39b1cd06c1d8ac1449482a1e7bf2d56a347152dbcafe
|
3 |
+
size 4781651888
|
model-00007-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1d25dc2011ab96aa9ec5c9bbd3259818e0acea38b07348a7325d714d2e1a6bf
|
3 |
+
size 4479624688
|
model-00008-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffb28e091cc377a363badfd1518d905b078565c473ec1030647063d217dacd1e
|
3 |
+
size 4781684776
|
model-00009-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c785c40669a7d23901e231f5894a5d6fdc1b960161ae3b8df0a04ce8929c016d
|
3 |
+
size 4781651888
|
model-00010-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da079f13bd921122de9355c11f3ec48b3b009ca463043bef713968a15240ae15
|
3 |
+
size 4479624688
|
model-00011-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10154b18f5ec52fb30e5a8296c7c4db0b9d6ffc9c78e6ad78f07865a8e0ab389
|
3 |
+
size 4781684776
|
model-00012-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e71e64073b1869214af02b5ad9dd7af395b8647498bd751185e87d36ecf1921e
|
3 |
+
size 4781651880
|
model-00013-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02e7b18ea0226793c42e1ba85f85d836e34cfb9d1bf1051409cbb569fba35150
|
3 |
+
size 4479624688
|
model-00014-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38ef519826c1cf02890ba5f584edadd4a7a48a8531a614735e6ad1a41e62710f
|
3 |
+
size 4781684776
|
model-00015-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5dcc63022522be7f39b48233b05251e44e457c8371ede143151e31f736ac8f4
|
3 |
+
size 4781651888
|
model-00016-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a51661fa303cb05e97ec705c85ee78fe21c47efa0540bbb06c2d9145889ad5e
|
3 |
+
size 4479624688
|
model-00017-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e824f7f003e04d9b84f16b01ba762a37785a6f1bc709d8b8a50d1c3e8f2f1689
|
3 |
+
size 4781684776
|
model-00018-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78a0117deefcc24b86705bd8b60f958c65b2bd37a82d557a68104d2081e5fd44
|
3 |
+
size 4781651888
|
model-00019-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d03bbec59aafb9c8145ab4d73a68228eda6fa8aff5ca6ea560c98780cd6d700
|
3 |
+
size 4479624688
|
model-00020-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3139b557b9fa8209446d7aace61244071c76e320d165cc039047442f808edd64
|
3 |
+
size 4781684768
|
model-00021-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03dd2214092600d72ae62907ee3de74dad4ef31e111417a3ab82f879b276d164
|
3 |
+
size 4781651888
|
model-00022-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:987beb77905343e9b7cc38b97f06711ffd1f9aa02348463e8ea3426a20fbcb3b
|
3 |
+
size 4479624688
|
model-00023-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98b4346dc11aaba8315e320eae0c4ac525af79d29d5b8f902dfabcb2df81482a
|
3 |
+
size 4781684776
|
model-00024-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e0147122eecb64427646d3ba658b8d22b7b691d3f2260090544360aa9347c59
|
3 |
+
size 4781651888
|
model-00025-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4e711b598caeec14a4388ee9d7321226713289d5bcb9a9ac98a492a43d4de4d
|
3 |
+
size 4479624688
|
model-00026-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0233a5e475a0eec8d427e2d6f8015b94a2e1b729de96ac7fba38c2645481de89
|
3 |
+
size 4781684776
|
model-00027-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98ff430ea90afc77f7e9d671e498cc84f3564579acae55f67b7caa0ef75b9703
|
3 |
+
size 4781651888
|
model-00028-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:854ce86bc868348dfc287a9a8c7b29ff9e5348b5d36371b11eaf931dc843d5c0
|
3 |
+
size 4479624688
|
model-00029-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5a48d7f7fdbbb18abc2b3066ca438ef1d3742479ba81f30ec2fe91cdd83da89
|
3 |
+
size 4781684768
|
model-00030-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c89eecd9250febf0d89c9bee7a7e21f2e9e77155ff5eb2d57e8f3a6cafb3b54d
|
3 |
+
size 4781651888
|
model-00031-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5ea81ac35939257ed491b8c989fc34ba3e14135802641a472b447ad7010ccee
|
3 |
+
size 4479624688
|
model-00032-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:568ee9fba502a0d3cb5c9f8a95d617f9992cffea8b33c5ef0bbddaa60d7f72e0
|
3 |
+
size 4781684776
|
model-00033-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bdcfa87c31053b3b20f1df9c02be82ff0f3c71c9b21084756df815b4a58b633
|
3 |
+
size 4781651888
|
model-00034-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebdbf639443fcb2a2f839794f40f506f7a81c9d288a8296acb374b8e8941d8f7
|
3 |
+
size 4479624688
|
model-00035-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94994af66a94c578823f0243de5a6c662436252613efaec6cf8c6d577d6e6381
|
3 |
+
size 4781684776
|
model-00036-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5331aa70339ee825f65652ac1576891d2c97e290e4ccae162db779edfcc732bf
|
3 |
+
size 4781651888
|
model-00037-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76533b032978d1b2fb5f62d6fb1df70af1beeb9b9f121755f62cd4adf2257e74
|
3 |
+
size 4479624680
|
model-00038-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17c79131836d60911735ab77fd5eba36b765d6c4baa74259144c941939ab9881
|
3 |
+
size 4781684776
|
model-00039-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d739c458c123338e0cadbaa31dfa8465a9be2f623d401f86c3decebf3bd7516
|
3 |
+
size 4781651888
|
model-00040-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff92609ecadf6e01720e9ecc436d9a8219ac278d1a88696ad90c70014bf89075
|
3 |
+
size 4479624688
|
model-00041-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcc736f059a0e7c7f2139b8ac6d1a36ee78184db230dacb6d47fad4392a9b8e6
|
3 |
+
size 4781684776
|
model-00042-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:758aa8cdb71bcf76752b639435214e8e8edfa3c94ab856ad26a136729e3247c0
|
3 |
+
size 4781651888
|
model-00043-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b66d322fc06086314fadf4ed0d9a906965e743beafc283fcb9c8859ba59ab7bd
|
3 |
+
size 4479624688
|
model-00044-of-00067.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:031fb5cc270778018fd95a58bd207225b489b71e3ed4eeb1d1766df0bf62512b
|
3 |
+
size 4781684776
|