jerryzh168 committed on
Commit
31b7eb3
·
verified ·
1 Parent(s): 3b07e48

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -173,7 +173,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-8da4w --t
173
  | | Phi-4 mini-Ins | phi4-mini-8da4w|
174
  | **Popular aggregated benchmark** | | |
175
  | mmlu (0 shot) | 66.73 | 63.11 |
176
- | mmlu_pro (5-shot) | 44.71 | 35.31 |
177
  | **Reasoning** | | |
178
  | arc_challenge | 56.91 | 55.12 |
179
  | gpqa_main_zeroshot | 30.13 | 29.02 |
@@ -188,7 +188,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-8da4w --t
188
  | **Math** | | |
189
  | gsm8k (5-shot) | 81.88 | 70.43 |
190
  | Mathqa (0-shot) | 42.31 | 41.57 |
191
- | **Overall** | 55.21 | 52.38 |
192
 
193
 
194
  # Exporting to ExecuTorch
 
173
  | | Phi-4 mini-Ins | phi4-mini-8da4w|
174
  | **Popular aggregated benchmark** | | |
175
  | mmlu (0 shot) | 66.73 | 63.11 |
176
+ | mmlu_pro (5-shot) | 46.43 | 35.31 |
177
  | **Reasoning** | | |
178
  | arc_challenge | 56.91 | 55.12 |
179
  | gpqa_main_zeroshot | 30.13 | 29.02 |
 
188
  | **Math** | | |
189
  | gsm8k (5-shot) | 81.88 | 70.43 |
190
  | Mathqa (0-shot) | 42.31 | 41.57 |
191
+ | **Overall** | 55.35 | 52.38 |
192
 
193
 
194
  # Exporting to ExecuTorch