jerryzh168 committed on
Commit
4c468f5
·
verified ·
1 Parent(s): d76bac0

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -208,10 +208,10 @@ lm_eval --model hf --model_args pretrained=$MODEL --tasks hellaswag --device cud
208
  | **General** | | |
209
  | mmlu | 73.04 | 70.4 |
210
  | mmlu_pro | 53.81 | 52.79 |
211
- | bbh | 79.33 | 74.92 |
212
  | **Multilingual** | | |
213
  | mgsm_en_cot_en | 39.6 | 33.2 |
214
- | m_mmlu (avg) | 57.17 | WIP |
215
  | **Math** | | |
216
  | gpqa_main_zeroshot | 35.71 | 32.14 |
217
  | gsm8k | 87.79 | 86.28 |
 
208
  | **General** | | |
209
  | mmlu | 73.04 | 70.4 |
210
  | mmlu_pro | 53.81 | 52.79 |
211
+ | bbh | 79.33 | 74.92 |
212
  | **Multilingual** | | |
213
  | mgsm_en_cot_en | 39.6 | 33.2 |
214
+ | m_mmlu (avg) | 57.17 | 54.06 |
215
  | **Math** | | |
216
  | gpqa_main_zeroshot | 35.71 | 32.14 |
217
  | gsm8k | 87.79 | 86.28 |