{ "results": { "anli_r1": { "acc": 0.308, "acc_stderr": 0.014606483127342763 }, "anli_r2": { "acc": 0.353, "acc_stderr": 0.015120172605483696 }, "anli_r3": { "acc": 0.3375, "acc_stderr": 0.013655897185463653 }, "cb": { "acc": 0.4642857142857143, "acc_stderr": 0.06724777654937658, "f1": 0.316548463356974 }, "copa": { "acc": 0.61, "acc_stderr": 0.04902071300001975 }, "hellaswag": { "acc": 0.2929695279824736, "acc_stderr": 0.004541944342035901, "acc_norm": 0.31866162119099783, "acc_norm_stderr": 0.00465005215009441 }, "rte": { "acc": 0.47653429602888087, "acc_stderr": 0.030063300411902652 }, "winogrande": { "acc": 0.5011838989739542, "acc_stderr": 0.014052446290529012 }, "storycloze_2016": { "acc": 0.5836451095670764, "acc_stderr": 0.011399490926937005 }, "boolq": { "acc": 0.4776758409785933, "acc_stderr": 0.00873633411558504 }, "arc_easy": { "acc": 0.42634680134680136, "acc_stderr": 0.010147858603835139, "acc_norm": 0.3926767676767677, "acc_norm_stderr": 0.010020646555538686 }, "arc_challenge": { "acc": 0.18344709897610922, "acc_stderr": 0.011310170179554543, "acc_norm": 0.22696245733788395, "acc_norm_stderr": 0.012240491536132879 }, "sciq": { "acc": 0.73, "acc_stderr": 0.014046255632633915, "acc_norm": 0.677, "acc_norm_stderr": 0.014794927843348633 }, "piqa": { "acc": 0.6349292709466812, "acc_stderr": 0.011233021830554829, "acc_norm": 0.6251360174102285, "acc_norm_stderr": 0.011294565805619019 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }