Update README.md
Browse files
README.md
CHANGED
@@ -134,10 +134,11 @@ We rely on [lm-evaluation-harness](https://github.com/EleutherAI/lm-evaluation-h
|
|
134 |
| mmlu | 80.71 | 80.67 |
|
135 |
| bbh | 37.49 | 38.01 |
|
136 |
| **Multilingual** | | |
|
137 |
-
|
|
138 |
| **Math** | | |
|
139 |
| gpqa_main_zeroshot | 41.96 | 42.63 |
|
140 |
-
| **Overall** |
|
|
|
141 |
|
142 |
<details>
|
143 |
<summary> Reproduce Model Quality Results </summary>
|
|
|
134 |
| mmlu | 80.71 | 80.67 |
|
135 |
| bbh | 37.49 | 38.01 |
|
136 |
| **Multilingual** | | |
|
137 |
+
| mgsm_en_cot_es | 58.4 | 52.0 |
|
138 |
| **Math** | | |
|
139 |
| gpqa_main_zeroshot | 41.96 | 42.63 |
|
140 |
+
| **Overall** | 54.64 | 53.33 |
|
141 |
+
|
142 |
|
143 |
<details>
|
144 |
<summary> Reproduce Model Quality Results </summary>
|