Update README.md
Browse files
README.md
CHANGED
@@ -192,9 +192,9 @@ lm_eval --model hf --model_args pretrained=pytorch/Qwen3-4B-8da4w --tasks mmlu -
|
|
192 |
| bbh | 74.86 | 67.47 |
|
193 |
| **Reasoning** | | |
|
194 |
| gpqa_main_zeroshot | 33.93 | 31.03 |
|
195 |
-
| mgsm_en_cot_en | 30.40 | 29.20 |
|
196 |
| **Multilingual** | | |
|
197 |
| m_mmlu | 50.41 | 47.13 |
|
|
|
198 |
| **Math** | | |
|
199 |
| gsm8k | 84.76 | 82.87 |
|
200 |
| leaderboard_math_hard | 62.83 | 53.30 |
|
|
|
192 |
| bbh | 74.86 | 67.47 |
|
193 |
| **Reasoning** | | |
|
194 |
| gpqa_main_zeroshot | 33.93 | 31.03 |
|
|
|
195 |
| **Multilingual** | | |
|
196 |
| m_mmlu | 50.41 | 47.13 |
|
197 |
+
| mgsm_en_cot_en | 30.40 | 29.20 |
|
198 |
| **Math** | | |
|
199 |
| gsm8k | 84.76 | 82.87 |
|
200 |
| leaderboard_math_hard | 62.83 | 53.30 |
|