Update README.md
Browse files
README.md
CHANGED
|
@@ -208,10 +208,10 @@ lm_eval --model hf --model_args pretrained=$MODEL --tasks hellaswag --device cud
|
|
| 208 |
| **General** | | |
|
| 209 |
| mmlu | 73.04 | 70.4 |
|
| 210 |
| mmlu_pro | 53.81 | 52.79 |
|
| 211 |
-
| bbh | 79.33 | 74.92
|
| 212 |
| **Multilingual** | | |
|
| 213 |
| mgsm_en_cot_en | 39.6 | 33.2 |
|
| 214 |
-
| m_mmlu (avg) | 57.17 |
|
| 215 |
| **Math** | | |
|
| 216 |
| gpqa_main_zeroshot | 35.71 | 32.14 |
|
| 217 |
| gsm8k | 87.79 | 86.28 |
|
|
|
|
| 208 |
| **General** | | |
|
| 209 |
| mmlu | 73.04 | 70.4 |
|
| 210 |
| mmlu_pro | 53.81 | 52.79 |
|
| 211 |
+
| bbh | 79.33 | 74.92 |
|
| 212 |
| **Multilingual** | | |
|
| 213 |
| mgsm_en_cot_en | 39.6 | 33.2 |
|
| 214 |
+
| m_mmlu (avg) | 57.17 | 54.06 |
|
| 215 |
| **Math** | | |
|
| 216 |
| gpqa_main_zeroshot | 35.71 | 32.14 |
|
| 217 |
| gsm8k | 87.79 | 86.28 |
|