{ "results": { "anli_r1": { "acc": 0.329, "acc_stderr": 0.014865395385928364 }, "anli_r2": { "acc": 0.338, "acc_stderr": 0.014965960710224487 }, "anli_r3": { "acc": 0.3325, "acc_stderr": 0.013605417345710528 }, "cb": { "acc": 0.5535714285714286, "acc_stderr": 0.06703189227942395, "f1": 0.3502252252252252 }, "copa": { "acc": 0.68, "acc_stderr": 0.04688261722621505 }, "hellaswag": { "acc": 0.3595897231627166, "acc_stderr": 0.004788994060654276, "acc_norm": 0.44911372236606256, "acc_norm_stderr": 0.004963872936857938 }, "rte": { "acc": 0.4657039711191336, "acc_stderr": 0.030025579819366426 }, "winogrande": { "acc": 0.5224940805051302, "acc_stderr": 0.014038257824059876 }, "storycloze_2016": { "acc": 0.6365579903794762, "acc_stderr": 0.011122841442059708 }, "boolq": { "acc": 0.5577981651376147, "acc_stderr": 0.00868643052611449 }, "arc_easy": { "acc": 0.5433501683501684, "acc_stderr": 0.010221149650118182, "acc_norm": 0.523989898989899, "acc_norm_stderr": 0.010247967392742688 }, "arc_challenge": { "acc": 0.22525597269624573, "acc_stderr": 0.012207839995407309, "acc_norm": 0.25853242320819114, "acc_norm_stderr": 0.012794553754288673 }, "sciq": { "acc": 0.895, "acc_stderr": 0.009698921026024968, "acc_norm": 0.898, "acc_norm_stderr": 0.00957536880165389 }, "piqa": { "acc": 0.7083786724700761, "acc_stderr": 0.01060444152742879, "acc_norm": 0.7007616974972797, "acc_norm_stderr": 0.010684130673134581 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }