Upload 5 files
Browse files- .gitattributes +1 -0
- AETEG6110A00KPFHTKMZVNG5C0.jpeg +3 -0
- Playtime_Logo.webp +0 -0
- README.md +174 -0
- non-lore-README-cn.md +50 -0
- non-lore-README.md +50 -0
.gitattributes
CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
37 |
+
AETEG6110A00KPFHTKMZVNG5C0.jpeg filter=lfs diff=lfs merge=lfs -text
|
AETEG6110A00KPFHTKMZVNG5C0.jpeg
ADDED
![]() |
Git LFS Details
|
Playtime_Logo.webp
ADDED
![]() |
README.md
ADDED
@@ -0,0 +1,174 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: other
|
3 |
+
license_name: mrl
|
4 |
+
language:
|
5 |
+
- en
|
6 |
+
- zh
|
7 |
+
base_model:
|
8 |
+
- mistralai/Ministral-8B-Instruct-2410
|
9 |
+
library_name: transformers
|
10 |
+
tags:
|
11 |
+
- axolotl
|
12 |
+
- roleplay
|
13 |
+
- conversational
|
14 |
+
- chat
|
15 |
+
---
|
16 |
+
|
17 |
+
<style>
|
18 |
+
main {
|
19 |
+
--creep-bg: #0f0f0f;
|
20 |
+
--blood-rust: #5e2e28;
|
21 |
+
--faded-white: #e8e8e8;
|
22 |
+
background: var(--creep-bg);
|
23 |
+
border-radius: 10px;
|
24 |
+
}
|
25 |
+
main, details {
|
26 |
+
display: flex;
|
27 |
+
flex-direction: column;
|
28 |
+
align-items: center;
|
29 |
+
padding: 15px;
|
30 |
+
overflow-x: scroll;
|
31 |
+
scrollbar-width: none;
|
32 |
+
}
|
33 |
+
.warning-box {
|
34 |
+
background: #2d1a1a;
|
35 |
+
border: 1px solid var(--blood-rust);
|
36 |
+
padding: 15px;
|
37 |
+
margin: 20px 0;
|
38 |
+
position: relative;
|
39 |
+
overflow: hidden;
|
40 |
+
}
|
41 |
+
.warning-box::before {
|
42 |
+
content: '';
|
43 |
+
position: absolute;
|
44 |
+
top: 0;
|
45 |
+
left: -10%;
|
46 |
+
width: 120%;
|
47 |
+
height: 100%;
|
48 |
+
background: linear-gradient(90deg, transparent 0%, #ff000020 50%, transparent 100%);
|
49 |
+
animation: scan 4s infinite linear;
|
50 |
+
}
|
51 |
+
.content-block {
|
52 |
+
background: #1a1a1a;
|
53 |
+
border: 1px solid #333;
|
54 |
+
border-radius: 4px;
|
55 |
+
padding: 20px;
|
56 |
+
margin: 15px 0;
|
57 |
+
box-shadow: 0 2px 8px rgba(0,0,0,0.3);
|
58 |
+
position: relative;
|
59 |
+
}
|
60 |
+
code {
|
61 |
+
background: #000;
|
62 |
+
color: #f8f8f8;
|
63 |
+
padding: 4px 6px;
|
64 |
+
border-radius: 3px;
|
65 |
+
font-family: monospace;
|
66 |
+
border: 1px solid #333;
|
67 |
+
}
|
68 |
+
.spoiler-text {
|
69 |
+
background: linear-gradient(45deg, #ff3b3b, #ff6b6b);
|
70 |
+
-webkit-background-clip: text;
|
71 |
+
color: transparent;
|
72 |
+
text-shadow: 0 0 12px rgba(255,59,59,0.5);
|
73 |
+
animation: glitch 1s infinite steps(2);
|
74 |
+
}
|
75 |
+
img {
|
76 |
+
max-width: min(90vw, 400px);
|
77 |
+
border-radius: 6px;
|
78 |
+
filter: brightness(0.95) contrast(1.1);
|
79 |
+
}
|
80 |
+
@media (max-width: 768px) {
|
81 |
+
main {
|
82 |
+
padding: 10px;
|
83 |
+
}
|
84 |
+
.content-block {
|
85 |
+
padding: 15px;
|
86 |
+
margin: 10px 0;
|
87 |
+
}
|
88 |
+
details[open] {
|
89 |
+
padding-bottom: 20px;
|
90 |
+
}
|
91 |
+
}
|
92 |
+
@keyframes glitch {
|
93 |
+
0% { transform: translateX(0); }
|
94 |
+
25% { transform: translateX(-1px); }
|
95 |
+
50% { transform: translateX(1px); }
|
96 |
+
75% { transform: translateX(-1px); }
|
97 |
+
100% { transform: translateX(0); }
|
98 |
+
}
|
99 |
+
@keyframes scan {
|
100 |
+
0% { transform: translateX(-20%); }
|
101 |
+
100% { transform: translateX(120%); }
|
102 |
+
}
|
103 |
+
</style>
|
104 |
+
|
105 |
+
<main>
|
106 |
+
<img src="Playtime_Logo.webp" alt="Playtime Co. logo" style="transform: rotate(-1deg); box-shadow: 0 4px 20px rgba(0,0,0,0.4);">
|
107 |
+
|
108 |
+
<div style="font-family: system-ui, -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, Oxygen, Ubuntu, Cantarell, sans-serif; line-height: 1.6; max-width: 800px; margin: 0 auto; color: var(--faded-white);">
|
109 |
+
|
110 |
+
<section style="margin-bottom: 30px;">
|
111 |
+
<p style="font-size: 1.1rem; background: #1a1a1a; padding: 20px; border-radius: 6px; border: 1px solid #333; position: relative;">
|
112 |
+
<span style="font-weight: 600; color: #d44d4d;">We here at Playtime Co.</span> are excited to welcome you to our QA staff! As a signatory of the Employee Confidentiality Agreement, you are required to keep all information regarding the company and our research confidential.
|
113 |
+
</p>
|
114 |
+
|
115 |
+
<p style="font-style: italic; color: #888; text-align: center; margin: 25px 0; text-shadow: 0 1px 3px rgba(0,0,0,0.5);">
|
116 |
+
With that out of the way...
|
117 |
+
</p>
|
118 |
+
</section>
|
119 |
+
|
120 |
+
<details>
|
121 |
+
<summary style="font-size: 1.6rem; cursor: pointer; padding: 15px; background: #2d1a1a; color: white; border-radius: 4px; border: 1px solid #442222; transition: 0.2s;">
|
122 |
+
<span class="spoiler-text">A̶͇͊r̵͎̭͗͛e̶̯̘̋ ̵̤͖̄̕y̶̩̎o̵̡̿u̴̙̅͂ ̵̖̋r̷̮͖̓ě̵̪̹̈́a̸̠̅d̵͖̖̔̋ẙ̷͙̃ ̷̮͖̋̈́t̴͉̅́ȍ̴̹̞ ̵̖̜̈́p̵͕̑̀ľ̵̥̓ȁ̷͔̩̇y̷̞͊̿ ̸͍̺̀͝w̶͙͈̑i̷̡͗̾t̸͎͒̐ḩ̸̳̓ ̴̮̺̇ȗ̴̢͈̉ş̷͖̔̒?̵̝̺́</span>
|
123 |
+
</summary>
|
124 |
+
|
125 |
+
<div style="margin-top: 25px;">
|
126 |
+
<h1 style="color: #d44d4d; border-bottom: 2px solid #442222; padding-bottom: 8px; text-shadow: 0 2px 4px rgba(0,0,0,0.3);">Welcome to the Bigger Bodies Initiative</h1>
|
127 |
+
|
128 |
+
<div style="text-align: center; margin: 25px 0;">
|
129 |
+
<img src="AETEG6110A00KPFHTKMZVNG5C0.jpeg" alt="Catnap" style="max-height: 70vh; border: 2px solid #442222; box-shadow: 0 8px 30px rgba(0,0,0,0.4); transition: 0.3s filter;" onmouseover="this.style.filter='grayscale(80%)'" onmouseout="this.style.filter='none'">
|
130 |
+
</div>
|
131 |
+
|
132 |
+
<h2 style="color: #b33d3d; margin-top: 0; text-transform: uppercase; letter-spacing: 2px;">Experiment 8B</h2>
|
133 |
+
|
134 |
+
<div class="content-block">
|
135 |
+
<h3 style="color: #d44d4d; margin-top: 0;">Use cases</h3>
|
136 |
+
<p>
|
137 |
+
This model was designed for exceptional skill in roleplaying, both with adults and children, for our patent pending Playtime Playground. It seems to have succeeded.
|
138 |
+
</p>
|
139 |
+
|
140 |
+
<h3 style="color: #d44d4d;">Supported Languages</h3>
|
141 |
+
<ul style="list-style-type: '▸ '; padding-left: 25px;">
|
142 |
+
<li style="padding: 5px 0;">Native-quality English</li>
|
143 |
+
<li style="padding: 5px 0;">Mediocre Chinese (further research needed)</li>
|
144 |
+
</ul>
|
145 |
+
</div>
|
146 |
+
|
147 |
+
<div class="content-block">
|
148 |
+
<h3 style="color: #d44d4d; margin-top: 0;">Usage (chat template)</h3>
|
149 |
+
<pre style="background: #000; color: #f8f8f8; padding: 15px; border-radius: 4px; border: 1px solid #333; overflow-x: auto; white-space: pre-wrap; word-break: break-word;">
|
150 |
+
&lt;s&gt;[SYSTEM_PROMPT]What to roleplay as[/SYSTEM_PROMPT][INST]User: xxx[/INST]ASSISTANT: yyy&lt;/s&gt;</pre>
|
151 |
+
</div>
|
152 |
+
|
153 |
+
<!-- Testing logs would go here if we had any -->
|
154 |
+
|
155 |
+
<div class="warning-box">
|
156 |
+
<h4 style="color: #ff4d4d; margin: 0 0 10px 0;">⚠️ WARNING</h4>
|
157 |
+
<p style="margin: 0;">While Experiment 8B has shown exceptional performance, researchers must maintain safety protocols. Standard containment procedures apply.</p>
|
158 |
+
</div>
|
159 |
+
</div>
|
160 |
+
</details>
|
161 |
+
|
162 |
+
<details style="margin-top: 20px;">
|
163 |
+
<summary style="font-weight: 600; color: #888; cursor: pointer;">Disclaimers</summary>
|
164 |
+
<div style="background: #1a1a1a; padding: 15px; margin-top: 10px; border-radius: 4px; border: 1px solid #333;">
|
165 |
+
Playtime Co., Poppy Playtime, Catnap, and all related properties are trademarks of Mob Entertainment LLC. Not affiliated with or endorsed by Mob Entertainment.
|
166 |
+
</div>
|
167 |
+
</details>
|
168 |
+
|
169 |
+
<div style="display: flex; justify-content: center;">
|
170 |
+
<a href="https://huggingface.co/allura-org/Bigger-Body-8b/blob/main/non-lore-README.md" style="font-weight: 600; color: #888; background: #1a1a1a; padding: 15px; margin-top: 10px; border-radius: 4px; border: 1px solid #333; text-decoration: none; text-align: center;">Go to regular model card</a>
|
171 |
+
</div>
|
172 |
+
|
173 |
+
</div>
|
174 |
+
</main>
|
non-lore-README-cn.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[English](./non-lore-README.md) | [简体中文](./non-lore-README-cn.md)
|
2 |
+
|
3 |
+
# Bigger Body 8b
|
4 |
+
![image/png](s3://crabby-images/67d11/67d11c7461cad0a3816967748b30ecc788119344)
|
5 |
+
基于Ministral Instruct 2410的角色扮演导向伪全微调模型
|
6 |
+
Ink系列的精神续作
|
7 |
+
|
8 |
+
## 数据集
|
9 |
+
Bigger Body(内部仍称为Ink v2.1)的数据混合配方堪称"黑暗料理",比初代Ink混合配方更令人发指。
|
10 |
+
|
11 |
+
<details>
|
12 |
+
<summary>(公开)原始数据集</summary>
|
13 |
+
|
14 |
+
<ul>
|
15 |
+
<li><a href="https://huggingface.co/datasets/Fizzarolli/limarp-processed">Fizzarolli/limarp-processed</a></li>
|
16 |
+
<li><a href="https://huggingface.co/datasets/Norquinal/OpenCAI">Norquinal/OpenCAI</a> - <code>two_users</code> 拆分集</li>
|
17 |
+
<li><a href="https://huggingface.co/datasets/allura-org/Celeste1.x-data-mixture">allura-org/Celeste1.x-data-mixture</a></li>
|
18 |
+
<li><a href="https://huggingface.co/datasets/mapsila/PIPPA-ShareGPT-formatted-named">mapsila/PIPPA-ShareGPT-formatted-named</a></li>
|
19 |
+
<li><a href="https://huggingface.co/datasets/allenai/tulu-3-sft-personas-instruction-following">allenai/tulu-3-sft-personas-instruction-following</a></li>
|
20 |
+
<li><a href="https://huggingface.co/datasets/readmehay/medical-01-reasoning-SFT-json">readmehay/medical-01-reasoning-SFT-json</a></li>
|
21 |
+
<li><a href="https://huggingface.co/datasets/LooksJuicy/ruozhiba">LooksJuicy/ruozhiba</a></li>
|
22 |
+
<li><a href="https://huggingface.co/datasets/shibing624/roleplay-zh-sharegpt-gpt4-data">shibing624/roleplay-zh-sharegpt-gpt4-data</a></li>
|
23 |
+
<li><a href="https://huggingface.co/datasets/CausalLM/Retrieval-SFT-Chat">CausalLM/Retrieval-SFT-Chat</a></li>
|
24 |
+
<li><a href="https://huggingface.co/datasets/ToastyPigeon/fujin-filtered-instruct">ToastyPigeon/fujin-filtered-instruct</a></li>
|
25 |
+
</ul>
|
26 |
+
</details>
|
27 |
+
|
28 |
+
## 量化版本
|
29 |
+
待补充!
|
30 |
+
|
31 |
+
## 推荐配置
|
32 |
+
对话模板:Mistral *v7-tekken*(注意不是v3-tekken!!主要区别是v7版有特定的`[SYSTEM_PROMPT]`和`[/SYSTEM_PROMPT]`标签)
|
33 |
+
推荐采样器(非绝对最优,请自行尝试):
|
34 |
+
- 我完全没头绪。请自行探索。
|
35 |
+
|
36 |
+
## 超参数
|
37 |
+
### 通用配置
|
38 |
+
- 训练轮次 = 2
|
39 |
+
- 学习率 = 2e-6
|
40 |
+
- 学习率调度器 = 余弦退火
|
41 |
+
- 优化器 = [Apollo-mini](https://github.com/zhuhanqing/APOLLO)
|
42 |
+
- 优化目标模块 = `all_linear`
|
43 |
+
- 有效批次大小 = 16
|
44 |
+
- 权重衰减 = 0.01
|
45 |
+
- 预热步数 = 50
|
46 |
+
- 总训练步数 = 920
|
47 |
+
|
48 |
+
## 致谢
|
49 |
+
衷心感谢所有数据集创建者的贡献
|
50 |
+
特别鸣谢Allura成员们的测试支持与精神鼓励 爱你们 /柏拉图式
|
non-lore-README.md
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[English](./non-lore-README.md) | [简体中文](./non-lore-README-cn.md)
|
2 |
+
|
3 |
+
# Bigger Body 8b
|
4 |
+
![image/png](s3://crabby-images/67d11/67d11c7461cad0a3816967748b30ecc788119344)
|
5 |
+
A roleplay-focused pseudo full-finetune of Ministral Instruct 2410.
|
6 |
+
The successor to the Ink series.
|
7 |
+
|
8 |
+
## Dataset
|
9 |
+
The Bigger Body (referred to as Ink v2.1, because that's still the internal name) mix is absolutely disgusting. It's even more cursed than the original Ink mix.
|
10 |
+
|
11 |
+
<details>
|
12 |
+
<summary>(Public) Original Datasets</summary>
|
13 |
+
|
14 |
+
<ul>
|
15 |
+
<li><a href="https://huggingface.co/datasets/Fizzarolli/limarp-processed">Fizzarolli/limarp-processed</a></li>
|
16 |
+
<li><a href="https://huggingface.co/datasets/Norquinal/OpenCAI">Norquinal/OpenCAI</a> - <code>two_users</code> split</li>
|
17 |
+
<li><a href="https://huggingface.co/datasets/allura-org/Celeste1.x-data-mixture">allura-org/Celeste1.x-data-mixture</a></li>
|
18 |
+
<li><a href="https://huggingface.co/datasets/mapsila/PIPPA-ShareGPT-formatted-named">mapsila/PIPPA-ShareGPT-formatted-named</a></li>
|
19 |
+
<li><a href="https://huggingface.co/datasets/allenai/tulu-3-sft-personas-instruction-following">allenai/tulu-3-sft-personas-instruction-following</a></li>
|
20 |
+
<li><a href="https://huggingface.co/datasets/readmehay/medical-01-reasoning-SFT-json">readmehay/medical-01-reasoning-SFT-json</a></li>
|
21 |
+
<li><a href="https://huggingface.co/datasets/LooksJuicy/ruozhiba">LooksJuicy/ruozhiba</a></li>
|
22 |
+
<li><a href="https://huggingface.co/datasets/shibing624/roleplay-zh-sharegpt-gpt4-data">shibing624/roleplay-zh-sharegpt-gpt4-data</a></li>
|
23 |
+
<li><a href="https://huggingface.co/datasets/CausalLM/Retrieval-SFT-Chat">CausalLM/Retrieval-SFT-Chat</a></li>
|
24 |
+
<li><a href="https://huggingface.co/datasets/ToastyPigeon/fujin-filtered-instruct">ToastyPigeon/fujin-filtered-instruct</a></li>
|
25 |
+
</ul>
|
26 |
+
</details>
|
27 |
+
|
28 |
+
## Quants
|
29 |
+
TODO!
|
30 |
+
|
31 |
+
## Recommended Settings
|
32 |
+
Chat template: Mistral *v7-tekken* (NOT v3-tekken !!!! the main difference is that v7 has specific `[SYSTEM_PROMPT]` and `[/SYSTEM_PROMPT]` tags)
|
33 |
+
Recommended samplers (not the be-all-end-all, try some on your own!):
|
34 |
+
- I have literally no idea. You're on your own.
|
35 |
+
|
36 |
+
## Hyperparams
|
37 |
+
### General
|
38 |
+
- Epochs = 2
|
39 |
+
- LR = 2e-6
|
40 |
+
- LR Scheduler = Cosine
|
41 |
+
- Optimizer = [Apollo-mini](https://github.com/zhuhanqing/APOLLO)
|
42 |
+
- Optimizer target modules = `all_linear`
|
43 |
+
- Effective batch size = 16
|
44 |
+
- Weight Decay = 0.01
|
45 |
+
- Warmup steps = 50
|
46 |
+
- Total steps = 920
|
47 |
+
|
48 |
+
## Credits
|
49 |
+
Humongous thanks to the people who created the data.
|
50 |
+
Big thanks to all Allura members for testing and emotional support ilya /platonic
|