{ "results": { "anli_r1": { "acc": 0.323, "acc_stderr": 0.014794927843348633 }, "anli_r2": { "acc": 0.364, "acc_stderr": 0.015222868840522024 }, "anli_r3": { "acc": 0.3375, "acc_stderr": 0.013655897185463655 }, "cb": { "acc": 0.5178571428571429, "acc_stderr": 0.06737697508644648, "f1": 0.3525733525733525 }, "copa": { "acc": 0.65, "acc_stderr": 0.047937248544110196 }, "hellaswag": { "acc": 0.3941445927106154, "acc_stderr": 0.004876674814874709, "acc_norm": 0.48645688109938257, "acc_norm_stderr": 0.004987950663406552 }, "rte": { "acc": 0.51985559566787, "acc_stderr": 0.030072723167317177 }, "winogrande": { "acc": 0.5138121546961326, "acc_stderr": 0.014047122916440412 }, "storycloze_2016": { "acc": 0.6424371993586317, "acc_stderr": 0.011083341168827792 }, "boolq": { "acc": 0.5, "acc_stderr": 0.008745054976398168 }, "arc_easy": { "acc": 0.5071548821548821, "acc_stderr": 0.01025873302244637, "acc_norm": 0.4650673400673401, "acc_norm_stderr": 0.010234713052723658 }, "arc_challenge": { "acc": 0.23976109215017063, "acc_stderr": 0.012476304127453947, "acc_norm": 0.257679180887372, "acc_norm_stderr": 0.0127807705627684 }, "sciq": { "acc": 0.735, "acc_stderr": 0.013963164754809946, "acc_norm": 0.705, "acc_norm_stderr": 0.014428554438445517 }, "piqa": { "acc": 0.7023939064200218, "acc_stderr": 0.010667353792388213, "acc_norm": 0.7002176278563657, "acc_norm_stderr": 0.01068968696713809 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }