{ "results": { "anli_r1": { "acc": 0.324, "acc_stderr": 0.014806864733738859 }, "anli_r2": { "acc": 0.338, "acc_stderr": 0.014965960710224482 }, "anli_r3": { "acc": 0.3416666666666667, "acc_stderr": 0.013696658778002519 }, "cb": { "acc": 0.42857142857142855, "acc_stderr": 0.06672848092813058, "f1": 0.22212270488132557 }, "copa": { "acc": 0.74, "acc_stderr": 0.044084400227680794 }, "hellaswag": { "acc": 0.48446524596693885, "acc_stderr": 0.004987372476207027, "acc_norm": 0.6316470822545309, "acc_norm_stderr": 0.004813719952829966 }, "rte": { "acc": 0.5126353790613718, "acc_stderr": 0.030086851767188564 }, "winogrande": { "acc": 0.5951065509076559, "acc_stderr": 0.01379592700312494 }, "storycloze_2016": { "acc": 0.711918760021379, "acc_stderr": 0.010472537019822575 }, "boolq": { "acc": 0.5571865443425077, "acc_stderr": 0.008687668766930827 }, "arc_easy": { "acc": 0.6031144781144782, "acc_stderr": 0.010039236800583206, "acc_norm": 0.5353535353535354, "acc_norm_stderr": 0.01023410454341143 }, "arc_challenge": { "acc": 0.2841296928327645, "acc_stderr": 0.013179442447653886, "acc_norm": 0.3003412969283277, "acc_norm_stderr": 0.013395909309957007 }, "sciq": { "acc": 0.858, "acc_stderr": 0.011043457699378237, "acc_norm": 0.766, "acc_norm_stderr": 0.01339490288966001 }, "piqa": { "acc": 0.7627856365614799, "acc_stderr": 0.009924694933586373, "acc_norm": 0.7682263329706203, "acc_norm_stderr": 0.009845143772794052 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }