Update README.md
Browse files
README.md
CHANGED
|
@@ -173,7 +173,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-8da4w --t
|
|
| 173 |
| | Phi-4 mini-Ins | phi4-mini-8da4w|
|
| 174 |
| **Popular aggregated benchmark** | | |
|
| 175 |
| mmlu (0-shot) | 66.73 | 63.11 |
|
| 176 |
-
| mmlu_pro (5-shot) |
|
| 177 |
| **Reasoning** | | |
|
| 178 |
| arc_challenge | 56.91 | 55.12 |
|
| 179 |
| gpqa_main_zeroshot | 30.13 | 29.02 |
|
|
@@ -188,7 +188,7 @@ lm_eval --model hf --model_args pretrained=pytorch/Phi-4-mini-instruct-8da4w --t
|
|
| 188 |
| **Math** | | |
|
| 189 |
| gsm8k (5-shot) | 81.88 | 70.43 |
|
| 190 |
| mathqa (0-shot) | 42.31 | 41.57 |
|
| 191 |
-
| **Overall** | 55.
|
| 192 |
|
| 193 |
|
| 194 |
# Exporting to ExecuTorch
|
|
|
|
| 173 |
| | Phi-4 mini-Ins | phi4-mini-8da4w|
|
| 174 |
| **Popular aggregated benchmark** | | |
|
| 175 |
| mmlu (0-shot) | 66.73 | 63.11 |
|
| 176 |
+
| mmlu_pro (5-shot) | 46.43 | 35.31 |
|
| 177 |
| **Reasoning** | | |
|
| 178 |
| arc_challenge | 56.91 | 55.12 |
|
| 179 |
| gpqa_main_zeroshot | 30.13 | 29.02 |
|
|
|
|
| 188 |
| **Math** | | |
|
| 189 |
| gsm8k (5-shot) | 81.88 | 70.43 |
|
| 190 |
| mathqa (0-shot) | 42.31 | 41.57 |
|
| 191 |
+
| **Overall** | 55.35 | 52.38 |
|
| 192 |
|
| 193 |
|
| 194 |
# Exporting to ExecuTorch
|