|
{ |
|
"STSBenchmark": { |
|
"train": { |
|
"pearson": [ |
|
0.7675016313639117, |
|
0.0 |
|
], |
|
"spearman": [ |
|
0.7404488937353225, |
|
0.0 |
|
], |
|
"nsamples": 5749 |
|
}, |
|
"dev": { |
|
"pearson": [ |
|
0.7658521041744508, |
|
1.4020329449305176e-289 |
|
], |
|
"spearman": [ |
|
0.7730453513050343, |
|
2.066561283121993e-298 |
|
], |
|
"nsamples": 1500 |
|
}, |
|
"test": { |
|
"pearson": [ |
|
0.7623056519318484, |
|
1.8448021245198884e-262 |
|
], |
|
"spearman": [ |
|
0.7572290027800557, |
|
5.3120116722114526e-257 |
|
], |
|
"nsamples": 1379 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7647570029076096, |
|
"mean": 0.7652197958234037, |
|
"wmean": 0.7663843913985655 |
|
}, |
|
"spearman": { |
|
"all": 0.7534738635333297, |
|
"mean": 0.7569077492734708, |
|
"wmean": 0.7487978108339844 |
|
} |
|
} |
|
}, |
|
"SICKRelatedness": { |
|
"train": { |
|
"pearson": [ |
|
0.7707517065205873, |
|
0.0 |
|
], |
|
"spearman": [ |
|
0.6949522587450165, |
|
0.0 |
|
], |
|
"nsamples": 4500 |
|
}, |
|
"dev": { |
|
"pearson": [ |
|
0.778349180191507, |
|
9.711324138536703e-103 |
|
], |
|
"spearman": [ |
|
0.7176593438481393, |
|
2.743332620783351e-80 |
|
], |
|
"nsamples": 500 |
|
}, |
|
"test": { |
|
"pearson": [ |
|
0.7642987657770804, |
|
0.0 |
|
], |
|
"spearman": [ |
|
0.6847455515560564, |
|
0.0 |
|
], |
|
"nsamples": 4927 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7678373187987577, |
|
"mean": 0.7711332174963915, |
|
"wmean": 0.7679316297393041 |
|
}, |
|
"spearman": { |
|
"all": 0.6909477744903625, |
|
"mean": 0.6991190513830707, |
|
"wmean": 0.6910301368785469 |
|
} |
|
} |
|
}, |
|
"MR": { |
|
"devacc": 81.19, |
|
"acc": 80.75, |
|
"ndev": 10662, |
|
"ntest": 10662 |
|
}, |
|
"CR": { |
|
"devacc": 87.12, |
|
"acc": 86.73, |
|
"ndev": 3775, |
|
"ntest": 3775 |
|
}, |
|
"SUBJ": { |
|
"devacc": 95.61, |
|
"acc": 95.29, |
|
"ndev": 10000, |
|
"ntest": 10000 |
|
}, |
|
"MPQA": { |
|
"devacc": 89.04, |
|
"acc": 88.61, |
|
"ndev": 10606, |
|
"ntest": 10606 |
|
}, |
|
"SST2": { |
|
"devacc": 85.21, |
|
"acc": 85.61, |
|
"ndev": 872, |
|
"ntest": 1821 |
|
}, |
|
"TREC": { |
|
"devacc": 80.69, |
|
"acc": 86.8, |
|
"ndev": 5452, |
|
"ntest": 500 |
|
}, |
|
"MRPC": { |
|
"devacc": 71.69, |
|
"acc": 70.32, |
|
"f1": 79.57, |
|
"ndev": 4076, |
|
"ntest": 1725 |
|
}, |
|
"STS12": { |
|
"MSRpar": { |
|
"pearson": [ |
|
0.4514113169306324, |
|
6.251817668045887e-39 |
|
], |
|
"spearman": [ |
|
0.4499549654577979, |
|
1.1613312893486279e-38 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"MSRvid": { |
|
"pearson": [ |
|
0.8599559900295872, |
|
1.0643859926359198e-220 |
|
], |
|
"spearman": [ |
|
0.8649974875962446, |
|
3.229629761923383e-226 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"SMTeuroparl": { |
|
"pearson": [ |
|
0.4931333562119396, |
|
1.6812261260529903e-29 |
|
], |
|
"spearman": [ |
|
0.6128103790153274, |
|
1.1381831791276455e-48 |
|
], |
|
"nsamples": 459 |
|
}, |
|
"surprise.OnWN": { |
|
"pearson": [ |
|
0.7365214189654901, |
|
3.947242882144461e-129 |
|
], |
|
"spearman": [ |
|
0.683719802480883, |
|
1.910512439440496e-104 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"surprise.SMTnews": { |
|
"pearson": [ |
|
0.6084967943558258, |
|
8.882847362372895e-42 |
|
], |
|
"spearman": [ |
|
0.6324009475046439, |
|
5.9238371155257115e-46 |
|
], |
|
"nsamples": 399 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.6090786981125251, |
|
"mean": 0.629903775298695, |
|
"wmean": 0.6451270836208292 |
|
}, |
|
"spearman": { |
|
"all": 0.5915463354166586, |
|
"mean": 0.6487767164109794, |
|
"wmean": 0.6539936080030831 |
|
} |
|
} |
|
}, |
|
"STS13": { |
|
"FNWN": { |
|
"pearson": [ |
|
0.5827724320641434, |
|
1.399853624093483e-18 |
|
], |
|
"spearman": [ |
|
0.6243224304995846, |
|
8.1205413287147755e-22 |
|
], |
|
"nsamples": 189 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.782141211640678, |
|
7.962032809197313e-156 |
|
], |
|
"spearman": [ |
|
0.7864730688106963, |
|
1.0734436155388987e-158 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"OnWN": { |
|
"pearson": [ |
|
0.7763285115488442, |
|
3.939259823816713e-114 |
|
], |
|
"spearman": [ |
|
0.7706743357210359, |
|
1.7455185991511694e-111 |
|
], |
|
"nsamples": 561 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7269930269261002, |
|
"mean": 0.7137473850845552, |
|
"wmean": 0.7548467955796887 |
|
}, |
|
"spearman": { |
|
"all": 0.7392805868780532, |
|
"mean": 0.7271566116771057, |
|
"wmean": 0.7601333622079632 |
|
} |
|
} |
|
}, |
|
"STS14": { |
|
"deft-forum": { |
|
"pearson": [ |
|
0.5228897751421426, |
|
6.073682402382636e-33 |
|
], |
|
"spearman": [ |
|
0.5053330319071232, |
|
1.532862819818703e-30 |
|
], |
|
"nsamples": 450 |
|
}, |
|
"deft-news": { |
|
"pearson": [ |
|
0.7680069983657648, |
|
1.2852042740473546e-59 |
|
], |
|
"spearman": [ |
|
0.7189884605027314, |
|
5.271976030712246e-49 |
|
], |
|
"nsamples": 300 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.7541282525177266, |
|
9.793324818317855e-139 |
|
], |
|
"spearman": [ |
|
0.7184718603499471, |
|
4.702376618230486e-120 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"images": { |
|
"pearson": [ |
|
0.8478349220740108, |
|
2.8453760358482384e-208 |
|
], |
|
"spearman": [ |
|
0.8081484798616755, |
|
3.9047867377054607e-174 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"OnWN": { |
|
"pearson": [ |
|
0.8215837025605404, |
|
9.871899662708195e-185 |
|
], |
|
"spearman": [ |
|
0.8279072975227956, |
|
4.92735009919912e-190 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"tweet-news": { |
|
"pearson": [ |
|
0.7317126218269044, |
|
1.2202543536716308e-126 |
|
], |
|
"spearman": [ |
|
0.6520317484632859, |
|
5.3026345548268765e-92 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7189696594882792, |
|
"mean": 0.7410260454145149, |
|
"wmean": 0.7552392326821546 |
|
}, |
|
"spearman": { |
|
"all": 0.670800547509326, |
|
"mean": 0.7051468131012597, |
|
"wmean": 0.7194709179086142 |
|
} |
|
} |
|
}, |
|
"STS15": { |
|
"answers-forums": { |
|
"pearson": [ |
|
0.7262407045308339, |
|
1.1025031075653589e-62 |
|
], |
|
"spearman": [ |
|
0.7275038094083748, |
|
5.324790051370908e-63 |
|
], |
|
"nsamples": 375 |
|
}, |
|
"answers-students": { |
|
"pearson": [ |
|
0.6978521677757564, |
|
1.6036590447498983e-110 |
|
], |
|
"spearman": [ |
|
0.7024365108998977, |
|
1.4353461268590496e-112 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"belief": { |
|
"pearson": [ |
|
0.7839138106441258, |
|
3.235687910099277e-79 |
|
], |
|
"spearman": [ |
|
0.79336254174086, |
|
2.047534842473332e-82 |
|
], |
|
"nsamples": 375 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.8124656869189333, |
|
1.9047661503782033e-177 |
|
], |
|
"spearman": [ |
|
0.8124179763234277, |
|
2.0744785143960583e-177 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"images": { |
|
"pearson": [ |
|
0.8731830765774482, |
|
1.1398312421407709e-235 |
|
], |
|
"spearman": [ |
|
0.8795017881810903, |
|
1.9914488519259588e-243 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7827019127153672, |
|
"mean": 0.7787310892894196, |
|
"wmean": 0.7846445472149044 |
|
}, |
|
"spearman": { |
|
"all": 0.790296617367925, |
|
"mean": 0.7830445253107301, |
|
"wmean": 0.7886973627447582 |
|
} |
|
} |
|
}, |
|
"STS16": { |
|
"answer-answer": { |
|
"pearson": [ |
|
0.7325081931498698, |
|
5.607126931548686e-44 |
|
], |
|
"spearman": [ |
|
0.7313808706110454, |
|
8.788498983014453e-44 |
|
], |
|
"nsamples": 254 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.7702918518354713, |
|
3.5986232616752304e-50 |
|
], |
|
"spearman": [ |
|
0.7838189633800285, |
|
5.030858666324319e-53 |
|
], |
|
"nsamples": 249 |
|
}, |
|
"plagiarism": { |
|
"pearson": [ |
|
0.8193777086614761, |
|
5.14320199251657e-57 |
|
], |
|
"spearman": [ |
|
0.8274487763356487, |
|
4.601518050831221e-59 |
|
], |
|
"nsamples": 230 |
|
}, |
|
"postediting": { |
|
"pearson": [ |
|
0.8373109699109689, |
|
2.1202879642927884e-65 |
|
], |
|
"spearman": [ |
|
0.8554383865248261, |
|
4.218785247850647e-71 |
|
], |
|
"nsamples": 244 |
|
}, |
|
"question-question": { |
|
"pearson": [ |
|
0.7703959894794563, |
|
2.4658565942110764e-42 |
|
], |
|
"spearman": [ |
|
0.7772827176027448, |
|
1.5625377662687375e-43 |
|
], |
|
"nsamples": 209 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7784793728977035, |
|
"mean": 0.7859769426074485, |
|
"wmean": 0.785525517385094 |
|
}, |
|
"spearman": { |
|
"all": 0.7906179855205325, |
|
"mean": 0.7950739428908588, |
|
"wmean": 0.7946323236636283 |
|
} |
|
} |
|
}, |
|
"eval_senteval-STS12": 0.5915463354166586, |
|
"eval_senteval-STS13": 0.7392805868780532, |
|
"eval_senteval-STS14": 0.670800547509326, |
|
"eval_senteval-STS15": 0.790296617367925, |
|
"eval_senteval-STS16": 0.7906179855205325, |
|
"eval_senteval-STSBenchmark": 0.7534738635333297, |
|
"eval_senteval-SICKRelatedness": 0.6909477744903625, |
|
"eval_senteval-avg_sts_7": 0.7181376729594552, |
|
"eval_senteval-MR": 81.19, |
|
"eval_senteval-CR": 87.12, |
|
"eval_senteval-SUBJ": 95.61, |
|
"eval_senteval-MPQA": 89.04, |
|
"eval_senteval-SST2": 85.21, |
|
"eval_senteval-TREC": 80.69, |
|
"eval_senteval-MRPC": 71.69, |
|
"eval_senteval-avg_transfer": 84.36428571428571 |
|
} |
|
|