memray's picture
Upload 130 files
e840ac8
{
"STSBenchmark": {
"train": {
"pearson": [
0.759143306453737,
0.0
],
"spearman": [
0.732317209733238,
0.0
],
"nsamples": 5749
},
"dev": {
"pearson": [
0.7746081783379711,
2.2556430824992415e-300
],
"spearman": [
0.7800424504336374,
2.5466091811087085e-307
],
"nsamples": 1500
},
"test": {
"pearson": [
0.7580850707783013,
6.51859239939566e-258
],
"spearman": [
0.7560754511600052,
8.850873074119353e-256
],
"nsamples": 1379
},
"all": {
"pearson": {
"all": 0.7620304519086235,
"mean": 0.7639455185233365,
"wmean": 0.7616627780381048
},
"spearman": {
"all": 0.7488342650348635,
"mean": 0.7561450371089601,
"wmean": 0.7444116088962087
}
}
},
"SICKRelatedness": {
"train": {
"pearson": [
0.7660762263543586,
0.0
],
"spearman": [
0.6943387839868075,
0.0
],
"nsamples": 4500
},
"dev": {
"pearson": [
0.7787463535407387,
6.565381473913046e-103
],
"spearman": [
0.724076491124677,
2.2464753888818782e-82
],
"nsamples": 500
},
"test": {
"pearson": [
0.7585953923013815,
0.0
],
"spearman": [
0.6847050750070173,
0.0
],
"nsamples": 4927
},
"all": {
"pearson": {
"all": 0.7629449380408607,
"mean": 0.7678059907321595,
"wmean": 0.7630014801283258
},
"spearman": {
"all": 0.6909722716792152,
"mean": 0.7010401167061673,
"wmean": 0.6910551705512789
}
}
},
"MR": {
"devacc": 81.13,
"acc": 80.72,
"ndev": 10662,
"ntest": 10662
},
"CR": {
"devacc": 87.1,
"acc": 85.35,
"ndev": 3775,
"ntest": 3775
},
"SUBJ": {
"devacc": 95.37,
"acc": 94.83,
"ndev": 10000,
"ntest": 10000
},
"MPQA": {
"devacc": 88.87,
"acc": 88.84,
"ndev": 10606,
"ntest": 10606
},
"SST2": {
"devacc": 83.72,
"acc": 84.84,
"ndev": 872,
"ntest": 1821
},
"TREC": {
"devacc": 79.31,
"acc": 85.4,
"ndev": 5452,
"ntest": 500
},
"MRPC": {
"devacc": 71.32,
"acc": 68.93,
"f1": 78.8,
"ndev": 4076,
"ntest": 1725
},
"STS12": {
"MSRpar": {
"pearson": [
0.4802609709856894,
1.5548549952823705e-44
],
"spearman": [
0.4768543559246008,
7.614791350529852e-44
],
"nsamples": 750
},
"MSRvid": {
"pearson": [
0.8263319209416204,
1.080221265522035e-188
],
"spearman": [
0.8252791857619619,
8.356577398931468e-188
],
"nsamples": 750
},
"SMTeuroparl": {
"pearson": [
0.5184489923467462,
6.1406360676578446e-33
],
"spearman": [
0.6230131131079721,
1.0590062591812851e-50
],
"nsamples": 459
},
"surprise.OnWN": {
"pearson": [
0.7315874470125636,
1.414322871092147e-126
],
"spearman": [
0.6731301571473148,
4.0960228359103546e-100
],
"nsamples": 750
},
"surprise.SMTnews": {
"pearson": [
0.6259156885670977,
8.739441951714742e-45
],
"spearman": [
0.6148988213247114,
7.33074623929432e-43
],
"nsamples": 399
},
"all": {
"pearson": {
"all": 0.623383289827507,
"mean": 0.6365090039707434,
"wmean": 0.6487592346944445
},
"spearman": {
"all": 0.606079829047924,
"mean": 0.6426351266533122,
"wmean": 0.6476047048746869
}
}
},
"STS13": {
"FNWN": {
"pearson": [
0.5661863937046698,
2.0580012282455086e-17
],
"spearman": [
0.5912700246061035,
3.3253838782016723e-19
],
"nsamples": 189
},
"headlines": {
"pearson": [
0.7825601400543155,
4.2299360961974125e-156
],
"spearman": [
0.7841745697183816,
3.6476628073513e-157
],
"nsamples": 750
},
"OnWN": {
"pearson": [
0.794529783804957,
3.311330886766186e-123
],
"spearman": [
0.7834024923042585,
1.4890472209808275e-117
],
"nsamples": 561
},
"all": {
"pearson": {
"all": 0.7471361547131256,
"mean": 0.7144254391879808,
"wmean": 0.7597736947770001
},
"spearman": {
"all": 0.7564536182897523,
"mean": 0.7196156955429145,
"wmean": 0.7595798400813525
}
}
},
"STS14": {
"deft-forum": {
"pearson": [
0.5270887834584671,
1.541470939768766e-33
],
"spearman": [
0.5112851401228272,
2.4363986591055635e-31
],
"nsamples": 450
},
"deft-news": {
"pearson": [
0.7735386895034391,
5.576824423082716e-61
],
"spearman": [
0.721172124183031,
1.986170265393856e-49
],
"nsamples": 300
},
"headlines": {
"pearson": [
0.7545133819317689,
5.912159102599232e-139
],
"spearman": [
0.7126401838119187,
2.8437071308486684e-117
],
"nsamples": 750
},
"images": {
"pearson": [
0.8323456329452497,
6.921690784176308e-194
],
"spearman": [
0.7937433816131229,
1.1474485172111374e-163
],
"nsamples": 750
},
"OnWN": {
"pearson": [
0.8297923551143387,
1.175057263022769e-191
],
"spearman": [
0.826236205234858,
1.3018028294306147e-188
],
"nsamples": 750
},
"tweet-news": {
"pearson": [
0.7558799639584549,
9.788201645414497e-140
],
"spearman": [
0.6845652322701915,
8.460582099195036e-105
],
"nsamples": 750
},
"all": {
"pearson": {
"all": 0.7159862351857734,
"mean": 0.7455264678186196,
"wmean": 0.7596400159652537
},
"spearman": {
"all": 0.6704800621775756,
"mean": 0.7082737112059916,
"wmean": 0.7224849873354
}
}
},
"STS15": {
"answers-forums": {
"pearson": [
0.7317275686935678,
4.532297271121567e-64
],
"spearman": [
0.7407727747177331,
1.972401483293033e-66
],
"nsamples": 375
},
"answers-students": {
"pearson": [
0.7050737483230498,
9.136794973091405e-114
],
"spearman": [
0.7064217578173171,
2.2091874983666628e-114
],
"nsamples": 750
},
"belief": {
"pearson": [
0.783394736380794,
4.7974747142716894e-79
],
"spearman": [
0.7998064345059992,
1.0770053295383067e-84
],
"nsamples": 375
},
"headlines": {
"pearson": [
0.813583787598092,
2.5592603175894345e-178
],
"spearman": [
0.8095733522782433,
3.220682833365799e-175
],
"nsamples": 750
},
"images": {
"pearson": [
0.8641888241232765,
2.5653257492197874e-225
],
"spearman": [
0.869236692916196,
4.9395933314044357e-231
],
"nsamples": 750
},
"all": {
"pearson": {
"all": 0.7901758719755425,
"mean": 0.779593733023756,
"wmean": 0.7851018781453998
},
"spearman": {
"all": 0.7993930145058169,
"mean": 0.7851622024470977,
"wmean": 0.7888803519059057
}
}
},
"STS16": {
"answer-answer": {
"pearson": [
0.732325384111771,
6.031948033432114e-44
],
"spearman": [
0.7331760524557248,
4.2918539327373104e-44
],
"nsamples": 254
},
"headlines": {
"pearson": [
0.7751129917838497,
3.6445698860447696e-51
],
"spearman": [
0.7759120405190852,
2.4798809912199763e-51
],
"nsamples": 249
},
"plagiarism": {
"pearson": [
0.8073018229023751,
3.908432651513822e-54
],
"spearman": [
0.8201128848961844,
3.380055386535779e-57
],
"nsamples": 230
},
"postediting": {
"pearson": [
0.8262293698872258,
2.999128754083028e-62
],
"spearman": [
0.8467835716176686,
2.7503849185111653e-68
],
"nsamples": 244
},
"question-question": {
"pearson": [
0.7751346076550414,
3.733475629577834e-43
],
"spearman": [
0.7850104595896853,
6.270227463768292e-45
],
"nsamples": 209
},
"all": {
"pearson": {
"all": 0.7817024776005017,
"mean": 0.7832208352680526,
"wmean": 0.7827118895771512
},
"spearman": {
"all": 0.7931904794778135,
"mean": 0.7921990018156697,
"wmean": 0.7915153089950118
}
}
},
"eval_senteval-STS12": 0.606079829047924,
"eval_senteval-STS13": 0.7564536182897523,
"eval_senteval-STS14": 0.6704800621775756,
"eval_senteval-STS15": 0.7993930145058169,
"eval_senteval-STS16": 0.7931904794778135,
"eval_senteval-STSBenchmark": 0.7488342650348635,
"eval_senteval-SICKRelatedness": 0.6909722716792152,
"eval_senteval-avg_sts_7": 0.7236290771732802,
"eval_senteval-MR": 81.13,
"eval_senteval-CR": 87.1,
"eval_senteval-SUBJ": 95.37,
"eval_senteval-MPQA": 88.87,
"eval_senteval-SST2": 83.72,
"eval_senteval-TREC": 79.31,
"eval_senteval-MRPC": 71.32,
"eval_senteval-avg_transfer": 83.83142857142856
}