|
{ |
|
"results": { |
|
"anli_r1": { |
|
"acc": 0.327, |
|
"acc_stderr": 0.014842213153411249 |
|
}, |
|
"anli_r2": { |
|
"acc": 0.346, |
|
"acc_stderr": 0.015050266127564441 |
|
}, |
|
"anli_r3": { |
|
"acc": 0.325, |
|
"acc_stderr": 0.013526454480351018 |
|
}, |
|
"cb": { |
|
"acc": 0.375, |
|
"acc_stderr": 0.06527912098338669, |
|
"f1": 0.2151416122004357 |
|
}, |
|
"copa": { |
|
"acc": 0.74, |
|
"acc_stderr": 0.04408440022768077 |
|
}, |
|
"hellaswag": { |
|
"acc": 0.39494124676359293, |
|
"acc_stderr": 0.00487839022659172, |
|
"acc_norm": 0.483469428400717, |
|
"acc_norm_stderr": 0.004987053652540279 |
|
}, |
|
"rte": { |
|
"acc": 0.4657039711191336, |
|
"acc_stderr": 0.030025579819366426 |
|
}, |
|
"winogrande": { |
|
"acc": 0.49329123914759276, |
|
"acc_stderr": 0.014051220692330342 |
|
}, |
|
"storycloze_2016": { |
|
"acc": 0.649919828968466, |
|
"acc_stderr": 0.011030440255782963 |
|
}, |
|
"boolq": { |
|
"acc": 0.4883792048929664, |
|
"acc_stderr": 0.008742692742551265 |
|
}, |
|
"arc_easy": { |
|
"acc": 0.494949494949495, |
|
"acc_stderr": 0.010259260102565858, |
|
"acc_norm": 0.4515993265993266, |
|
"acc_norm_stderr": 0.010211600726405215 |
|
}, |
|
"arc_challenge": { |
|
"acc": 0.23464163822525597, |
|
"acc_stderr": 0.012383873560768675, |
|
"acc_norm": 0.2593856655290102, |
|
"acc_norm_stderr": 0.012808273573927094 |
|
}, |
|
"sciq": { |
|
"acc": 0.69, |
|
"acc_stderr": 0.014632638658632893, |
|
"acc_norm": 0.633, |
|
"acc_norm_stderr": 0.015249378464171756 |
|
}, |
|
"piqa": { |
|
"acc": 0.6931447225244831, |
|
"acc_stderr": 0.010760295070580359, |
|
"acc_norm": 0.6893362350380848, |
|
"acc_norm_stderr": 0.01079707893372768 |
|
} |
|
}, |
|
"versions": { |
|
"anli_r1": 0, |
|
"anli_r2": 0, |
|
"anli_r3": 0, |
|
"cb": 1, |
|
"copa": 0, |
|
"hellaswag": 0, |
|
"rte": 0, |
|
"winogrande": 0, |
|
"storycloze_2016": 0, |
|
"boolq": 1, |
|
"arc_easy": 0, |
|
"arc_challenge": 0, |
|
"sciq": 0, |
|
"piqa": 0 |
|
} |
|
} |