{ "results": { "anli_r1": { "acc": 0.336, "acc_stderr": 0.014944140233795025 }, "anli_r2": { "acc": 0.352, "acc_stderr": 0.01511040450564867 }, "anli_r3": { "acc": 0.3383333333333333, "acc_stderr": 0.013664144006618266 }, "cb": { "acc": 0.5178571428571429, "acc_stderr": 0.06737697508644645, "f1": 0.3362023995826813 }, "copa": { "acc": 0.6, "acc_stderr": 0.049236596391733084 }, "hellaswag": { "acc": 0.29645488946425014, "acc_stderr": 0.004557606227194286, "acc_norm": 0.3234415455088628, "acc_norm_stderr": 0.004668335725410298 }, "rte": { "acc": 0.49458483754512633, "acc_stderr": 0.030094698123239966 }, "winogrande": { "acc": 0.4877663772691397, "acc_stderr": 0.01404827882040562 }, "storycloze_2016": { "acc": 0.5788348476750401, "acc_stderr": 0.011417808278216117 }, "boolq": { "acc": 0.44434250764525995, "acc_stderr": 0.00869070599067338 }, "arc_easy": { "acc": 0.42845117845117847, "acc_stderr": 0.010154195733990975, "acc_norm": 0.3930976430976431, "acc_norm_stderr": 0.010022540618945312 }, "arc_challenge": { "acc": 0.1962457337883959, "acc_stderr": 0.01160601988141629, "acc_norm": 0.22781569965870307, "acc_norm_stderr": 0.012256708602326905 }, "sciq": { "acc": 0.719, "acc_stderr": 0.014221154708434929, "acc_norm": 0.686, "acc_norm_stderr": 0.014683991951087967 }, "piqa": { "acc": 0.6273122959738846, "acc_stderr": 0.01128131833289774, "acc_norm": 0.6169749727965179, "acc_norm_stderr": 0.01134208170908285 } }, "versions": { "anli_r1": 0, "anli_r2": 0, "anli_r3": 0, "cb": 1, "copa": 0, "hellaswag": 0, "rte": 0, "winogrande": 0, "storycloze_2016": 0, "boolq": 1, "arc_easy": 0, "arc_challenge": 0, "sciq": 0, "piqa": 0 } }