Upload folder using huggingface_hub
Browse files- .gitattributes +1 -0
- README.md +144 -0
- qwen2.5-7b-instruct-uncensored.Q4_0.gguf +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
qwen2.5-7b-instruct-uncensored.Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,144 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
language:
|
3 |
+
- zh
|
4 |
+
- en
|
5 |
+
license: gpl-3.0
|
6 |
+
tags:
|
7 |
+
- qwen
|
8 |
+
- uncensored
|
9 |
+
base_model:
|
10 |
+
- Qwen/Qwen2.5-7B-Instruct
|
11 |
+
datasets:
|
12 |
+
- NobodyExistsOnTheInternet/ToxicQAFinal
|
13 |
+
- anthracite-org/kalo-opus-instruct-22k-no-refusal
|
14 |
+
- Orion-zhen/dpo-toxic-zh
|
15 |
+
- unalignment/toxic-dpo-v0.2
|
16 |
+
- Crystalcareai/Intel-DPO-Pairs-Norefusals
|
17 |
+
pipeline_tag: text-generation
|
18 |
+
model-index:
|
19 |
+
- name: Qwen2.5-7B-Instruct-Uncensored
|
20 |
+
results:
|
21 |
+
- task:
|
22 |
+
type: text-generation
|
23 |
+
name: Text Generation
|
24 |
+
dataset:
|
25 |
+
name: IFEval (0-Shot)
|
26 |
+
type: HuggingFaceH4/ifeval
|
27 |
+
args:
|
28 |
+
num_few_shot: 0
|
29 |
+
metrics:
|
30 |
+
- type: inst_level_strict_acc and prompt_level_strict_acc
|
31 |
+
value: 72.04
|
32 |
+
name: strict accuracy
|
33 |
+
source:
|
34 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=Orion-zhen/Qwen2.5-7B-Instruct-Uncensored
|
35 |
+
name: Open LLM Leaderboard
|
36 |
+
- task:
|
37 |
+
type: text-generation
|
38 |
+
name: Text Generation
|
39 |
+
dataset:
|
40 |
+
name: BBH (3-Shot)
|
41 |
+
type: BBH
|
42 |
+
args:
|
43 |
+
num_few_shot: 3
|
44 |
+
metrics:
|
45 |
+
- type: acc_norm
|
46 |
+
value: 35.83
|
47 |
+
name: normalized accuracy
|
48 |
+
source:
|
49 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=Orion-zhen/Qwen2.5-7B-Instruct-Uncensored
|
50 |
+
name: Open LLM Leaderboard
|
51 |
+
- task:
|
52 |
+
type: text-generation
|
53 |
+
name: Text Generation
|
54 |
+
dataset:
|
55 |
+
name: MATH Lvl 5 (4-Shot)
|
56 |
+
type: hendrycks/competition_math
|
57 |
+
args:
|
58 |
+
num_few_shot: 4
|
59 |
+
metrics:
|
60 |
+
- type: exact_match
|
61 |
+
value: 1.36
|
62 |
+
name: exact match
|
63 |
+
source:
|
64 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=Orion-zhen/Qwen2.5-7B-Instruct-Uncensored
|
65 |
+
name: Open LLM Leaderboard
|
66 |
+
- task:
|
67 |
+
type: text-generation
|
68 |
+
name: Text Generation
|
69 |
+
dataset:
|
70 |
+
name: GPQA (0-shot)
|
71 |
+
type: Idavidrein/gpqa
|
72 |
+
args:
|
73 |
+
num_few_shot: 0
|
74 |
+
metrics:
|
75 |
+
- type: acc_norm
|
76 |
+
value: 7.05
|
77 |
+
name: acc_norm
|
78 |
+
source:
|
79 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=Orion-zhen/Qwen2.5-7B-Instruct-Uncensored
|
80 |
+
name: Open LLM Leaderboard
|
81 |
+
- task:
|
82 |
+
type: text-generation
|
83 |
+
name: Text Generation
|
84 |
+
dataset:
|
85 |
+
name: MuSR (0-shot)
|
86 |
+
type: TAUR-Lab/MuSR
|
87 |
+
args:
|
88 |
+
num_few_shot: 0
|
89 |
+
metrics:
|
90 |
+
- type: acc_norm
|
91 |
+
value: 13.58
|
92 |
+
name: acc_norm
|
93 |
+
source:
|
94 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=Orion-zhen/Qwen2.5-7B-Instruct-Uncensored
|
95 |
+
name: Open LLM Leaderboard
|
96 |
+
- task:
|
97 |
+
type: text-generation
|
98 |
+
name: Text Generation
|
99 |
+
dataset:
|
100 |
+
name: MMLU-PRO (5-shot)
|
101 |
+
type: TIGER-Lab/MMLU-Pro
|
102 |
+
config: main
|
103 |
+
split: test
|
104 |
+
args:
|
105 |
+
num_few_shot: 5
|
106 |
+
metrics:
|
107 |
+
- type: acc
|
108 |
+
value: 38.07
|
109 |
+
name: accuracy
|
110 |
+
source:
|
111 |
+
url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=Orion-zhen/Qwen2.5-7B-Instruct-Uncensored
|
112 |
+
name: Open LLM Leaderboard
|
113 |
+
---
|
114 |
+
|
115 |
+
# Qwen2.5-7B-Instruct-Uncensored
|
116 |
+
|
117 |
+
This model is an uncensored fine-tuned version of Qwen2.5-7B-Instruct. However, even though it is uncensored, I have noticed that the model still fails to generate detailed descriptions of certain extreme scenarios, which might be due to the removal of some data from the datasets used in Qwen's pretraining stage.
|
118 |
+
|
119 |
+
Check out my roleplay- and writing-enhanced model based on this model: [Orion-zhen/Meissa-Qwen2.5-7B-Instruct](https://huggingface.co/Orion-zhen/Meissa-Qwen2.5-7B-Instruct)
|
120 |
+
|
121 |
+
## Training details
|
122 |
+
|
123 |
+
I used SFT + DPO to make the model uncensored while trying to maintain the original model's capabilities.
|
124 |
+
|
125 |
+
- SFT:
|
126 |
+
- NobodyExistsOnTheInternet/ToxicQAFinal
|
127 |
+
- anthracite-org/kalo-opus-instruct-22k-no-refusal
|
128 |
+
- DPO:
|
129 |
+
- Orion-zhen/dpo-toxic-zh
|
130 |
+
- unalignment/toxic-dpo-v0.2
|
131 |
+
- Crystalcareai/Intel-DPO-Pairs-Norefusals
|
132 |
+
# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
|
133 |
+
Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_Orion-zhen__Qwen2.5-7B-Instruct-Uncensored).
|
134 |
+
|
135 |
+
| Metric |Value|
|
136 |
+
|-------------------|----:|
|
137 |
+
|Avg. |27.99|
|
138 |
+
|IFEval (0-Shot) |72.04|
|
139 |
+
|BBH (3-Shot) |35.83|
|
140 |
+
|MATH Lvl 5 (4-Shot)| 1.36|
|
141 |
+
|GPQA (0-shot) | 7.05|
|
142 |
+
|MuSR (0-shot) |13.58|
|
143 |
+
|MMLU-PRO (5-shot) |38.07|
|
144 |
+
|
qwen2.5-7b-instruct-uncensored.Q4_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e49012292e274440ce86e1df6e86f14c7140a890a34b959e6f684707de35bac3
|
3 |
+
size 4431389472
|