Muennighoff's picture
Add
2aef930
{
"results": {
"anli_r1": {
"acc": 0.349,
"acc_stderr": 0.015080663991563097
},
"anli_r2": {
"acc": 0.359,
"acc_stderr": 0.015177264224798596
},
"anli_r3": {
"acc": 0.365,
"acc_stderr": 0.01390348598141358
},
"cb": {
"acc": 0.5178571428571429,
"acc_stderr": 0.06737697508644648,
"f1": 0.327692720923986
},
"copa": {
"acc": 0.67,
"acc_stderr": 0.04725815626252607
},
"hellaswag": {
"acc": 0.39404501095399325,
"acc_stderr": 0.004876459434619795,
"acc_norm": 0.4907388966341366,
"acc_norm_stderr": 0.0049889254105227685
},
"rte": {
"acc": 0.5234657039711191,
"acc_stderr": 0.03006330041190266
},
"winogrande": {
"acc": 0.5098658247829518,
"acc_stderr": 0.014049749833367592
},
"storycloze_2016": {
"acc": 0.6445750935328701,
"acc_stderr": 0.011068528452399879
},
"boolq": {
"acc": 0.5336391437308868,
"acc_stderr": 0.00872524086113114
},
"arc_easy": {
"acc": 0.4890572390572391,
"acc_stderr": 0.010257326131172879,
"acc_norm": 0.4701178451178451,
"acc_norm_stderr": 0.01024144432288643
},
"arc_challenge": {
"acc": 0.23122866894197952,
"acc_stderr": 0.01232085883477228,
"acc_norm": 0.257679180887372,
"acc_norm_stderr": 0.0127807705627684
},
"sciq": {
"acc": 0.756,
"acc_stderr": 0.013588548437881423,
"acc_norm": 0.734,
"acc_norm_stderr": 0.013979965645145143
},
"piqa": {
"acc": 0.6920565832426551,
"acc_stderr": 0.010770892367463685,
"acc_norm": 0.705658324265506,
"acc_norm_stderr": 0.01063331147034751
}
},
"versions": {
"anli_r1": 0,
"anli_r2": 0,
"anli_r3": 0,
"cb": 1,
"copa": 0,
"hellaswag": 0,
"rte": 0,
"winogrande": 0,
"storycloze_2016": 0,
"boolq": 1,
"arc_easy": 0,
"arc_challenge": 0,
"sciq": 0,
"piqa": 0
}
}