|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.317, |
|
"acc_stderr": 0.014721675438880227 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.33, |
|
"acc_stderr": 0.014876872027456736 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.34, |
|
"acc_stderr": 0.013680495725767796 |
|
}, |
|
"cb": { |
|
"acc": 0.4642857142857143, |
|
"acc_stderr": 0.06724777654937658, |
|
"f1": 0.3299319727891156 |
|
}, |
|
"copa": { |
|
"acc": 0.72, |
|
"acc_stderr": 0.04512608598542127 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.45289782911770565, |
|
"acc_stderr": 0.0049675912675574, |
|
"acc_norm": 0.6038637721569409, |
|
"acc_norm_stderr": 0.004880937933163293 |
|
}, |
|
"rte": { |
|
"acc": 0.49458483754512633, |
|
"acc_stderr": 0.030094698123239966 |
|
}, |
|
"winogrande": { |
|
"acc": 0.5824782951854776, |
|
"acc_stderr": 0.01385997826444025 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.7049706039551042, |
|
"acc_stderr": 0.010546232606962287 |
|
}, |
|
"boolq": { |
|
"acc": 0.5834862385321101, |
|
"acc_stderr": 0.008622288020674008 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.6313131313131313, |
|
"acc_stderr": 0.009899640855681038, |
|
"acc_norm": 0.6077441077441077, |
|
"acc_norm_stderr": 0.010018744689650043 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.30204778156996587, |
|
"acc_stderr": 0.013417519144716422, |
|
"acc_norm": 0.3302047781569966, |
|
"acc_norm_stderr": 0.013743085603760431 |
|
}, |
|
"sciq": { |
|
"acc": 0.908, |
|
"acc_stderr": 0.009144376393151103, |
|
"acc_norm": 0.914, |
|
"acc_norm_stderr": 0.008870325962594766 |
|
}, |
|
"piqa": { |
|
"acc": 0.7442872687704026, |
|
"acc_stderr": 0.010178690109459862, |
|
"acc_norm": 0.7524483133841132, |
|
"acc_norm_stderr": 0.010069703966857114 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |