|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.354, |
|
"acc_stderr": 0.015129868238451772 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.336, |
|
"acc_stderr": 0.014944140233795016 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.3475, |
|
"acc_stderr": 0.013751753243291854 |
|
}, |
|
"cb": { |
|
"acc": 0.48214285714285715, |
|
"acc_stderr": 0.0673769750864465, |
|
"f1": 0.2828828828828829 |
|
}, |
|
"copa": { |
|
"acc": 0.82, |
|
"acc_stderr": 0.038612291966536955 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.4772953594901414, |
|
"acc_stderr": 0.004984634285101618, |
|
"acc_norm": 0.6366261700856403, |
|
"acc_norm_stderr": 0.00479988224849481 |
|
}, |
|
"rte": { |
|
"acc": 0.5595667870036101, |
|
"acc_stderr": 0.029882123363118726 |
|
}, |
|
"winogrande": { |
|
"acc": 0.6093133385951065, |
|
"acc_stderr": 0.013712536036556667 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.7274184927846071, |
|
"acc_stderr": 0.010297209765351286 |
|
}, |
|
"boolq": { |
|
"acc": 0.6345565749235474, |
|
"acc_stderr": 0.008422437370062704 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.648989898989899, |
|
"acc_stderr": 0.009793703885101045, |
|
"acc_norm": 0.6199494949494949, |
|
"acc_norm_stderr": 0.009960175831493126 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.2909556313993174, |
|
"acc_stderr": 0.01327307786590758, |
|
"acc_norm": 0.3225255972696246, |
|
"acc_norm_stderr": 0.01365998089427737 |
|
}, |
|
"sciq": { |
|
"acc": 0.92, |
|
"acc_stderr": 0.008583336977753653, |
|
"acc_norm": 0.916, |
|
"acc_norm_stderr": 0.00877616208949112 |
|
}, |
|
"piqa": { |
|
"acc": 0.7568008705114254, |
|
"acc_stderr": 0.010009611953858922, |
|
"acc_norm": 0.766050054406964, |
|
"acc_norm_stderr": 0.009877236895137437 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |