File size: 1,061 Bytes
71f6ad1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 |
task,metric,value,err,version
anli_r1,acc,0.33,0.01487687202745673,0
anli_r2,acc,0.337,0.014955087918653612,0
anli_r3,acc,0.3416666666666667,0.013696658778002512,0
arc_challenge,acc,0.24232081911262798,0.012521593295800115,0
arc_challenge,acc_norm,0.27559726962457337,0.013057169655761838,0
arc_easy,acc,0.5012626262626263,0.010259750807991068,0
arc_easy,acc_norm,0.502104377104377,0.010259692651537035,0
boolq,acc,0.5443425076452599,0.00871059702108126,1
cb,acc,0.5357142857142857,0.06724777654937658,1
cb,f1,0.3263888888888889,,1
copa,acc,0.7,0.046056618647183814,0
hellaswag,acc,0.39822744473212507,0.004885323175701676,0
hellaswag,acc_norm,0.4894443337980482,0.004988669343786957,0
piqa,acc,0.676822633297062,0.01091197412428213,0
piqa,acc_norm,0.6833514689880305,0.010853160531978484,0
rte,acc,0.44404332129963897,0.029907396333795994,0
sciq,acc,0.749,0.01371813351688892,0
sciq,acc_norm,0.74,0.013877773329774166,0
storycloze_2016,acc,0.6419027258150721,0.011087006809925712,0
winogrande,acc,0.5130228887134964,0.014047718393997667,0
|