{ "results": { "anli_r1": { "acc": 0.343, "acc_stderr": 0.015019206922356951 }, "anli_r2": { "acc": 0.35, "acc_stderr": 0.015090650341444231 }, "anli_r3": { "acc": 0.3516666666666667, "acc_stderr": 0.013789711695404794 }, "cb": { "acc": 0.35714285714285715, "acc_stderr": 0.06460957383809221, "f1": 0.3445134575569358 }, "copa": { "acc": 0.79, "acc_stderr": 0.04093601807403326 }, "hellaswag": { "acc": 0.4389563831905995, "acc_stderr": 0.004952454721934793, "acc_norm": 0.5718980282812188, "acc_norm_stderr": 0.0049379243267425755 }, "rte": { "acc": 0.5126353790613718, "acc_stderr": 0.030086851767188564 }, "winogrande": { "acc": 0.5698500394632992, "acc_stderr": 0.013914685094716694 }, "storycloze_2016": { "acc": 0.7156600748262961, "acc_stderr": 0.01043161412866525 }, "boolq": { "acc": 0.5039755351681957, "acc_stderr": 0.008744778542942208 }, "arc_easy": { "acc": 0.5778619528619529, "acc_stderr": 0.010134620524592271, "acc_norm": 0.5509259259259259, "acc_norm_stderr": 0.010206428316323365 }, "arc_challenge": { "acc": 0.25170648464163825, "acc_stderr": 0.012682496334042963, "acc_norm": 0.2841296928327645, "acc_norm_stderr": 0.013179442447653886 }, "sciq": { "acc": 0.865, "acc_stderr": 0.010811655372416053, "acc_norm": 0.845, "acc_norm_stderr": 0.01145015747079946 }, "piqa": { "acc": 0.7421109902067464, "acc_stderr": 0.010206956662056255, "acc_norm": 0.7529923830250272, "acc_norm_stderr": 0.010062268140772625 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }