Update README.md
Browse files
README.md
CHANGED
@@ -173,7 +173,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-8da4w --t
|
|
173 |
| | Phi-4 mini-Ins | phi4-mini-8da4w |
|
174 |
| **Popular aggregated benchmark** | | |
|
175 |
| mmlu (0-shot) | 66.73 | 63.11 |
|
176 |
-
| mmlu_pro (5-shot) |
|
177 |
| **Reasoning** | | |
|
178 |
| arc_challenge | 56.91 | 55.12 |
|
179 |
| gpqa_main_zeroshot | 30.13 | 29.02 |
|
@@ -188,7 +188,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-8da4w --t
|
|
188 |
| **Math** | | |
|
189 |
| gsm8k (5-shot) | 81.88 | 70.43 |
|
190 |
| mathqa (0-shot) | 42.31 | 41.57 |
|
191 |
-
| **Overall** | 55.
|
192 |
|
193 |
|
194 |
# Exporting to ExecuTorch
|
|
|
173 |
| | Phi-4 mini-Ins | phi4-mini-8da4w |
|
174 |
| **Popular aggregated benchmark** | | |
|
175 |
| mmlu (0-shot) | 66.73 | 63.11 |
|
176 |
+
| mmlu_pro (5-shot) | 46.43 | 35.31 |
|
177 |
| **Reasoning** | | |
|
178 |
| arc_challenge | 56.91 | 55.12 |
|
179 |
| gpqa_main_zeroshot | 30.13 | 29.02 |
|
|
|
188 |
| **Math** | | |
|
189 |
| gsm8k (5-shot) | 81.88 | 70.43 |
|
190 |
| mathqa (0-shot) | 42.31 | 41.57 |
|
191 |
+
| **Overall** | 55.35 | 52.38 |
|
192 |
|
193 |
|
194 |
# Exporting to ExecuTorch
|