|
{ |
|
"STSBenchmark": { |
|
"train": { |
|
"pearson": [ |
|
0.7671625496286432, |
|
0.0 |
|
], |
|
"spearman": [ |
|
0.7407051823403011, |
|
0.0 |
|
], |
|
"nsamples": 5749 |
|
}, |
|
"dev": { |
|
"pearson": [ |
|
0.7813083270941137, |
|
5.741719519093736e-309 |
|
], |
|
"spearman": [ |
|
0.7888860081302335, |
|
4.6194e-319 |
|
], |
|
"nsamples": 1500 |
|
}, |
|
"test": { |
|
"pearson": [ |
|
0.7624448096598531, |
|
1.3012886054724166e-262 |
|
], |
|
"spearman": [ |
|
0.7602771570534436, |
|
2.908594263406545e-260 |
|
], |
|
"nsamples": 1379 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7695053681260078, |
|
"mean": 0.7703052287942033, |
|
"wmean": 0.7688678002986993 |
|
}, |
|
"spearman": { |
|
"all": 0.7564014032837215, |
|
"mean": 0.7632894491746595, |
|
"wmean": 0.7522097015584654 |
|
} |
|
} |
|
}, |
|
"SICKRelatedness": { |
|
"train": { |
|
"pearson": [ |
|
0.7772208691267224, |
|
0.0 |
|
], |
|
"spearman": [ |
|
0.6978066630711928, |
|
0.0 |
|
], |
|
"nsamples": 4500 |
|
}, |
|
"dev": { |
|
"pearson": [ |
|
0.7909750341980787, |
|
2.5296588439552555e-108 |
|
], |
|
"spearman": [ |
|
0.7277741174377886, |
|
1.3244056458147093e-83 |
|
], |
|
"nsamples": 500 |
|
}, |
|
"test": { |
|
"pearson": [ |
|
0.771314072761317, |
|
0.0 |
|
], |
|
"spearman": [ |
|
0.6895861583188468, |
|
0.0 |
|
], |
|
"nsamples": 4927 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7749070438706636, |
|
"mean": 0.7798366586953728, |
|
"wmean": 0.7749819547360027 |
|
}, |
|
"spearman": { |
|
"all": 0.6952695805138401, |
|
"mean": 0.7050556462759427, |
|
"wmean": 0.6952360274580659 |
|
} |
|
} |
|
}, |
|
"MR": { |
|
"devacc": 80.83, |
|
"acc": 80.73, |
|
"ndev": 10662, |
|
"ntest": 10662 |
|
}, |
|
"CR": { |
|
"devacc": 88.1, |
|
"acc": 86.04, |
|
"ndev": 3775, |
|
"ntest": 3775 |
|
}, |
|
"SUBJ": { |
|
"devacc": 95.32, |
|
"acc": 94.97, |
|
"ndev": 10000, |
|
"ntest": 10000 |
|
}, |
|
"MPQA": { |
|
"devacc": 89.04, |
|
"acc": 88.84, |
|
"ndev": 10606, |
|
"ntest": 10606 |
|
}, |
|
"SST2": { |
|
"devacc": 84.06, |
|
"acc": 85.45, |
|
"ndev": 872, |
|
"ntest": 1821 |
|
}, |
|
"TREC": { |
|
"devacc": 81.07, |
|
"acc": 88.0, |
|
"ndev": 5452, |
|
"ntest": 500 |
|
}, |
|
"MRPC": { |
|
"devacc": 70.68, |
|
"acc": 69.28, |
|
"f1": 80.87, |
|
"ndev": 4076, |
|
"ntest": 1725 |
|
}, |
|
"STS12": { |
|
"MSRpar": { |
|
"pearson": [ |
|
0.44444679689851435, |
|
1.1761912553301756e-37 |
|
], |
|
"spearman": [ |
|
0.44300447101923845, |
|
2.1416387542051887e-37 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"MSRvid": { |
|
"pearson": [ |
|
0.8646599853522132, |
|
7.68208333670891e-226 |
|
], |
|
"spearman": [ |
|
0.8699014177629724, |
|
8.381559996022476e-232 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"SMTeuroparl": { |
|
"pearson": [ |
|
0.47046175638197285, |
|
1.1740073098461771e-26 |
|
], |
|
"spearman": [ |
|
0.6114586792865501, |
|
2.0882913296724147e-48 |
|
], |
|
"nsamples": 459 |
|
}, |
|
"surprise.OnWN": { |
|
"pearson": [ |
|
0.7178639582155328, |
|
9.237684853571945e-120 |
|
], |
|
"spearman": [ |
|
0.6658532948970585, |
|
3.0576891351321453e-97 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"surprise.SMTnews": { |
|
"pearson": [ |
|
0.611621280135737, |
|
2.647843518922555e-42 |
|
], |
|
"spearman": [ |
|
0.6250107076256665, |
|
1.2659259057241255e-44 |
|
], |
|
"nsamples": 399 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.6378431863774492, |
|
"mean": 0.6218107553967942, |
|
"wmean": 0.6371322047307528 |
|
}, |
|
"spearman": { |
|
"all": 0.6163833612367604, |
|
"mean": 0.6430457141182971, |
|
"wmean": 0.6480399594255531 |
|
} |
|
} |
|
}, |
|
"STS13": { |
|
"FNWN": { |
|
"pearson": [ |
|
0.5562805069869132, |
|
9.550380482948488e-17 |
|
], |
|
"spearman": [ |
|
0.5837123125601075, |
|
1.19655468411138e-18 |
|
], |
|
"nsamples": 189 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.7823638193897661, |
|
5.690320525335935e-156 |
|
], |
|
"spearman": [ |
|
0.7917891963332858, |
|
2.60264998377283e-162 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"OnWN": { |
|
"pearson": [ |
|
0.7816458183409305, |
|
1.083315842299476e-116 |
|
], |
|
"spearman": [ |
|
0.7796359177798075, |
|
1.0258079303272485e-115 |
|
], |
|
"nsamples": 561 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7255022107614845, |
|
"mean": 0.7067633815725367, |
|
"wmean": 0.7536087896347422 |
|
}, |
|
"spearman": { |
|
"all": 0.7419430794508367, |
|
"mean": 0.7183791422244002, |
|
"wmean": 0.7610261827988645 |
|
} |
|
} |
|
}, |
|
"STS14": { |
|
"deft-forum": { |
|
"pearson": [ |
|
0.5089575374073992, |
|
5.023172357070916e-31 |
|
], |
|
"spearman": [ |
|
0.4963233135417476, |
|
2.317944450085771e-29 |
|
], |
|
"nsamples": 450 |
|
}, |
|
"deft-news": { |
|
"pearson": [ |
|
0.7651252415822635, |
|
6.366264844550544e-59 |
|
], |
|
"spearman": [ |
|
0.7127419493226671, |
|
8.180911780133503e-48 |
|
], |
|
"nsamples": 300 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.749244660243113, |
|
5.438116092767328e-136 |
|
], |
|
"spearman": [ |
|
0.7099163551457461, |
|
5.362434306324602e-116 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"images": { |
|
"pearson": [ |
|
0.8463923099739724, |
|
7.255366412502392e-207 |
|
], |
|
"spearman": [ |
|
0.8037324760119565, |
|
7.818229780597217e-171 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"OnWN": { |
|
"pearson": [ |
|
0.8194865773850172, |
|
5.086803489175948e-183 |
|
], |
|
"spearman": [ |
|
0.8214740885641392, |
|
1.2146288498994132e-184 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"tweet-news": { |
|
"pearson": [ |
|
0.7298695292458673, |
|
1.0631684722321918e-125 |
|
], |
|
"spearman": [ |
|
0.6599928354527725, |
|
5.5057855924436005e-95 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7165932905627189, |
|
"mean": 0.7365126426396054, |
|
"wmean": 0.7512835391850631 |
|
}, |
|
"spearman": { |
|
"all": 0.6677462039090557, |
|
"mean": 0.7006968363398381, |
|
"wmean": 0.7156013046057461 |
|
} |
|
} |
|
}, |
|
"STS15": { |
|
"answers-forums": { |
|
"pearson": [ |
|
0.7110270112832033, |
|
5.18878369534419e-59 |
|
], |
|
"spearman": [ |
|
0.7180037029082824, |
|
1.1507346620419953e-60 |
|
], |
|
"nsamples": 375 |
|
}, |
|
"answers-students": { |
|
"pearson": [ |
|
0.685403182699777, |
|
3.763475670820268e-105 |
|
], |
|
"spearman": [ |
|
0.6892806170636011, |
|
8.551548507203923e-107 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"belief": { |
|
"pearson": [ |
|
0.7406221526966811, |
|
2.1633293082135999e-66 |
|
], |
|
"spearman": [ |
|
0.7616812212998276, |
|
2.7456783665122726e-72 |
|
], |
|
"nsamples": 375 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.8065884284038872, |
|
5.856919545907542e-173 |
|
], |
|
"spearman": [ |
|
0.8065628750527286, |
|
6.121300087095471e-173 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"images": { |
|
"pearson": [ |
|
0.8734727058865335, |
|
5.133694173289855e-236 |
|
], |
|
"spearman": [ |
|
0.8800760762065849, |
|
3.7371804165528405e-244 |
|
], |
|
"nsamples": 750 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7786729190560969, |
|
"mean": 0.7634226961940165, |
|
"wmean": 0.7728222247450349 |
|
}, |
|
"spearman": { |
|
"all": 0.7899640319998164, |
|
"mean": 0.7711208985062049, |
|
"wmean": 0.7789405076067425 |
|
} |
|
} |
|
}, |
|
"STS16": { |
|
"answer-answer": { |
|
"pearson": [ |
|
0.6932635451048339, |
|
1.0228592987318116e-37 |
|
], |
|
"spearman": [ |
|
0.7021547155024479, |
|
4.8011478191297344e-39 |
|
], |
|
"nsamples": 254 |
|
}, |
|
"headlines": { |
|
"pearson": [ |
|
0.7691218196080909, |
|
6.220546451256778e-50 |
|
], |
|
"spearman": [ |
|
0.779843578127762, |
|
3.643403874299668e-52 |
|
], |
|
"nsamples": 249 |
|
}, |
|
"plagiarism": { |
|
"pearson": [ |
|
0.8038816275257141, |
|
2.350047547816728e-53 |
|
], |
|
"spearman": [ |
|
0.8153039508029369, |
|
5.088887617848758e-56 |
|
], |
|
"nsamples": 230 |
|
}, |
|
"postediting": { |
|
"pearson": [ |
|
0.8113538363870572, |
|
2.3510310736845822e-58 |
|
], |
|
"spearman": [ |
|
0.8303201531350315, |
|
2.1906668671246972e-63 |
|
], |
|
"nsamples": 244 |
|
}, |
|
"question-question": { |
|
"pearson": [ |
|
0.7802351353605056, |
|
4.64479928094145e-44 |
|
], |
|
"spearman": [ |
|
0.7884164498209355, |
|
1.4564689988934998e-45 |
|
], |
|
"nsamples": 209 |
|
}, |
|
"all": { |
|
"pearson": { |
|
"all": 0.7704350276676698, |
|
"mean": 0.7715711927972403, |
|
"wmean": 0.7702635136920273 |
|
}, |
|
"spearman": { |
|
"all": 0.7846388532549995, |
|
"mean": 0.7832077694778227, |
|
"wmean": 0.7819775824229623 |
|
} |
|
} |
|
}, |
|
"eval_senteval-STS12": 0.6163833612367604, |
|
"eval_senteval-STS13": 0.7419430794508367, |
|
"eval_senteval-STS14": 0.6677462039090557, |
|
"eval_senteval-STS15": 0.7899640319998164, |
|
"eval_senteval-STS16": 0.7846388532549995, |
|
"eval_senteval-STSBenchmark": 0.7564014032837215, |
|
"eval_senteval-SICKRelatedness": 0.6952695805138401, |
|
"eval_senteval-avg_sts_7": 0.7217637876641472, |
|
"eval_senteval-MR": 80.83, |
|
"eval_senteval-CR": 88.1, |
|
"eval_senteval-SUBJ": 95.32, |
|
"eval_senteval-MPQA": 89.04, |
|
"eval_senteval-SST2": 84.06, |
|
"eval_senteval-TREC": 81.07, |
|
"eval_senteval-MRPC": 70.68, |
|
"eval_senteval-avg_transfer": 84.15714285714287 |
|
} |
|
|