CultriX committed on
Commit
b21e4a0
1 Parent(s): 753a3a8

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +15 -7
README.md CHANGED
@@ -26,7 +26,8 @@ model-index:
26
  value: 52.35
27
  name: strict accuracy
28
  source:
29
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
 
30
  name: Open LLM Leaderboard
31
  - task:
32
  type: text-generation
@@ -41,7 +42,8 @@ model-index:
41
  value: 50.64
42
  name: normalized accuracy
43
  source:
44
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
 
45
  name: Open LLM Leaderboard
46
  - task:
47
  type: text-generation
@@ -56,7 +58,8 @@ model-index:
56
  value: 30.06
57
  name: exact match
58
  source:
59
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
 
60
  name: Open LLM Leaderboard
61
  - task:
62
  type: text-generation
@@ -71,7 +74,8 @@ model-index:
71
  value: 19.13
72
  name: acc_norm
73
  source:
74
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
 
75
  name: Open LLM Leaderboard
76
  - task:
77
  type: text-generation
@@ -86,7 +90,8 @@ model-index:
86
  value: 18.25
87
  name: acc_norm
88
  source:
89
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
 
90
  name: Open LLM Leaderboard
91
  - task:
92
  type: text-generation
@@ -103,8 +108,11 @@ model-index:
103
  value: 49.15
104
  name: accuracy
105
  source:
106
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
 
107
  name: Open LLM Leaderboard
 
 
108
  ---
109
  # merge
110
 
@@ -156,4 +164,4 @@ Detailed results can be found [here](https://huggingface.co/datasets/open-llm-le
156
  | MATH Lvl 5 (4-Shot)| 27.34 |
157
  | GPQA (0-shot) | 17.23 |
158
  | MuSR (0-shot) | 18.74 |
159
- | MMLU-PRO (5-shot) | 49.12 |
 
26
  value: 52.35
27
  name: strict accuracy
28
  source:
29
+ url: >-
30
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
31
  name: Open LLM Leaderboard
32
  - task:
33
  type: text-generation
 
42
  value: 50.64
43
  name: normalized accuracy
44
  source:
45
+ url: >-
46
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
47
  name: Open LLM Leaderboard
48
  - task:
49
  type: text-generation
 
58
  value: 30.06
59
  name: exact match
60
  source:
61
+ url: >-
62
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
63
  name: Open LLM Leaderboard
64
  - task:
65
  type: text-generation
 
74
  value: 19.13
75
  name: acc_norm
76
  source:
77
+ url: >-
78
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
79
  name: Open LLM Leaderboard
80
  - task:
81
  type: text-generation
 
90
  value: 18.25
91
  name: acc_norm
92
  source:
93
+ url: >-
94
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
95
  name: Open LLM Leaderboard
96
  - task:
97
  type: text-generation
 
108
  value: 49.15
109
  name: accuracy
110
  source:
111
+ url: >-
112
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MegaMerge-pt2
113
  name: Open LLM Leaderboard
114
+ metrics:
115
+ - accuracy
116
  ---
117
  # merge
118
 
 
164
  | MATH Lvl 5 (4-Shot)| 27.34 |
165
  | GPQA (0-shot) | 17.23 |
166
  | MuSR (0-shot) | 18.74 |
167
+ | MMLU-PRO (5-shot) | 49.12 |