Update README.md
Browse files
README.md
CHANGED
@@ -215,7 +215,7 @@ lm_eval --model hf --model_args pretrained=$MODEL --tasks hellaswag --device cud
|
|
215 |
| **Math** | | |
|
216 |
| gpqa_main_zeroshot | 35.71 | 32.14 |
|
217 |
| gsm8k | 87.79 | 86.28 |
|
218 |
-
| leaderboard_math_hard
|
219 |
| **Overall** | 60.02 | 56.33 |
|
220 |
|
221 |
|
|
|
215 |
| **Math** | | |
|
216 |
| gpqa_main_zeroshot | 35.71 | 32.14 |
|
217 |
| gsm8k | 87.79 | 86.28 |
|
218 |
+
| leaderboard_math_hard (v3) | 53.7 | 46.83 |
|
219 |
| **Overall** | 60.02 | 56.33 |
|
220 |
|
221 |
|