Update README.md
Browse files
README.md
CHANGED
|
@@ -192,9 +192,9 @@ lm_eval --model hf --model_args pretrained=pytorch/Qwen3-4B-8da4w --tasks mmlu -
|
|
| 192 |
| bbh | 74.86 | 67.47 |
|
| 193 |
| **Reasoning** | | |
|
| 194 |
| gpqa_main_zeroshot | 33.93 | 31.03 |
|
| 195 |
-
| mgsm_en_cot_en | 30.40 | 29.20 |
|
| 196 |
| **Multilingual** | | |
|
| 197 |
| m_mmlu | 50.41 | 47.13 |
|
|
|
|
| 198 |
| **Math** | | |
|
| 199 |
| gsm8k | 84.76 | 82.87 |
|
| 200 |
| leaderboard_math_hard | 62.83 | 53.30 |
|
|
|
|
| 192 |
| bbh | 74.86 | 67.47 |
|
| 193 |
| **Reasoning** | | |
|
| 194 |
| gpqa_main_zeroshot | 33.93 | 31.03 |
|
|
|
|
| 195 |
| **Multilingual** | | |
|
| 196 |
| m_mmlu | 50.41 | 47.13 |
|
| 197 |
+
| mgsm_en_cot_en | 30.40 | 29.20 |
|
| 198 |
| **Math** | | |
|
| 199 |
| gsm8k | 84.76 | 82.87 |
|
| 200 |
| leaderboard_math_hard | 62.83 | 53.30 |
|