memray's picture
Upload 130 files
444729b
{
"STSBenchmark": {
"train": {
"pearson": [
0.7868313677903059,
0.0
],
"spearman": [
0.7533061602723176,
0.0
],
"nsamples": 5749
},
"dev": {
"pearson": [
0.8010234738701788,
0.0
],
"spearman": [
0.8010173901569266,
0.0
],
"nsamples": 1500
},
"test": {
"pearson": [
0.7766524771374954,
1.1662374252806932e-278
],
"spearman": [
0.7638460069862814,
3.8220116833205965e-264
],
"nsamples": 1379
},
"all": {
"pearson": {
"all": 0.7882517084559206,
"mean": 0.7881691062659933,
"wmean": 0.7876718254757005
},
"spearman": {
"all": 0.7668425138024548,
"mean": 0.7727231858051752,
"wmean": 0.7632854478761041
}
}
},
"SICKRelatedness": {
"train": {
"pearson": [
0.7853064744370001,
0.0
],
"spearman": [
0.7045889188784015,
0.0
],
"nsamples": 4500
},
"dev": {
"pearson": [
0.7952406911697713,
2.6811654216760936e-110
],
"spearman": [
0.7309801454276812,
1.0951577254305346e-84
],
"nsamples": 500
},
"test": {
"pearson": [
0.7794843403240526,
0.0
],
"spearman": [
0.6977349592492605,
0.0
],
"nsamples": 4927
},
"all": {
"pearson": {
"all": 0.7828650051750712,
"mean": 0.7866771686436079,
"wmean": 0.7829171779317007
},
"spearman": {
"all": 0.7025121676824595,
"mean": 0.7111013411851145,
"wmean": 0.702516404944873
}
}
},
"MR": {
"devacc": 81.09,
"acc": 80.59,
"ndev": 10662,
"ntest": 10662
},
"CR": {
"devacc": 87.01,
"acc": 86.6,
"ndev": 3775,
"ntest": 3775
},
"SUBJ": {
"devacc": 95.34,
"acc": 95.02,
"ndev": 10000,
"ntest": 10000
},
"MPQA": {
"devacc": 88.89,
"acc": 88.99,
"ndev": 10606,
"ntest": 10606
},
"SST2": {
"devacc": 84.06,
"acc": 84.95,
"ndev": 872,
"ntest": 1821
},
"TREC": {
"devacc": 82.7,
"acc": 87.2,
"ndev": 5452,
"ntest": 500
},
"MRPC": {
"devacc": 70.8,
"acc": 68.81,
"f1": 76.97,
"ndev": 4076,
"ntest": 1725
},
"STS12": {
"MSRpar": {
"pearson": [
0.4506656429961876,
8.587667122234213e-39
],
"spearman": [
0.4537783738578545,
2.270328303306969e-39
],
"nsamples": 750
},
"MSRvid": {
"pearson": [
0.8735316429807825,
4.363488536726283e-236
],
"spearman": [
0.8745116790315722,
2.8887254873277706e-237
],
"nsamples": 750
},
"SMTeuroparl": {
"pearson": [
0.5276646768590786,
2.9080130640693665e-34
],
"spearman": [
0.6225349369600102,
1.3236704498055218e-50
],
"nsamples": 459
},
"surprise.OnWN": {
"pearson": [
0.7340552729415586,
7.588168789192366e-128
],
"spearman": [
0.6862387036955726,
1.6734444180335097e-105
],
"nsamples": 750
},
"surprise.SMTnews": {
"pearson": [
0.6554833920285361,
2.382715639542081e-50
],
"spearman": [
0.6338572026855626,
3.2084519789805647e-46
],
"nsamples": 399
},
"all": {
"pearson": {
"all": 0.667994262204242,
"mean": 0.6482801255612287,
"wmean": 0.6587597745452379
},
"spearman": {
"all": 0.6198695741812278,
"mean": 0.6541841792461144,
"wmean": 0.659443091175976
}
}
},
"STS13": {
"FNWN": {
"pearson": [
0.570828218970704,
9.847987645161228e-18
],
"spearman": [
0.6046232001507675,
3.1840503190651897e-20
],
"nsamples": 189
},
"headlines": {
"pearson": [
0.7995020825200164,
9.500980524179015e-168
],
"spearman": [
0.8125460785135767,
1.649528631120915e-177
],
"nsamples": 750
},
"OnWN": {
"pearson": [
0.7844322816916485,
4.612357080156043e-118
],
"spearman": [
0.7801367000550998,
5.871872377147612e-116
],
"nsamples": 561
},
"all": {
"pearson": {
"all": 0.7407620228952401,
"mean": 0.718254194394123,
"wmean": 0.7650530702029934
},
"spearman": {
"all": 0.7458274512781141,
"mean": 0.7324353262398148,
"wmean": 0.7742266882963925
}
}
},
"STS14": {
"deft-forum": {
"pearson": [
0.5631321216962222,
5.210192672663357e-39
],
"spearman": [
0.5511772152789268,
4.031968923211026e-37
],
"nsamples": 450
},
"deft-news": {
"pearson": [
0.7692532638001923,
6.387272025432673e-60
],
"spearman": [
0.7225821241233733,
1.0522226454927607e-49
],
"nsamples": 300
},
"headlines": {
"pearson": [
0.7685532605008147,
3.1092413652073723e-147
],
"spearman": [
0.72597520728351,
9.721513948491652e-124
],
"nsamples": 750
},
"images": {
"pearson": [
0.8353848860067018,
1.3687751285353585e-196
],
"spearman": [
0.8008852796417836,
9.492757773828998e-169
],
"nsamples": 750
},
"OnWN": {
"pearson": [
0.8314850837955547,
3.9440310563877586e-193
],
"spearman": [
0.8316458764161619,
2.851406716141642e-193
],
"nsamples": 750
},
"tweet-news": {
"pearson": [
0.7778758524787571,
4.607989885863323e-153
],
"spearman": [
0.6958906739489547,
1.1738361486418922e-109
],
"nsamples": 750
},
"all": {
"pearson": {
"all": 0.73992310716163,
"mean": 0.7576140780463737,
"wmean": 0.7717759322639277
},
"spearman": {
"all": 0.6864467990669687,
"mean": 0.7213593961154516,
"wmean": 0.734827243221423
}
}
},
"STS15": {
"answers-forums": {
"pearson": [
0.7391296029963142,
5.385805927099778e-66
],
"spearman": [
0.7409312029744309,
1.789609179402688e-66
],
"nsamples": 375
},
"answers-students": {
"pearson": [
0.7026326622651042,
1.1706959560110963e-112
],
"spearman": [
0.7107886172788801,
2.1014876744572312e-116
],
"nsamples": 750
},
"belief": {
"pearson": [
0.8006281964159404,
5.439878843301103e-85
],
"spearman": [
0.8172868949869829,
2.543177483321865e-91
],
"nsamples": 375
},
"headlines": {
"pearson": [
0.8172091326355518,
3.472486751097505e-181
],
"spearman": [
0.8158723780481846,
4.030205865269612e-180
],
"nsamples": 750
},
"images": {
"pearson": [
0.8784869743544939,
3.750940760878824e-242
],
"spearman": [
0.8806887757856461,
6.211464354884257e-245
],
"nsamples": 750
},
"all": {
"pearson": {
"all": 0.7913051772787048,
"mean": 0.787617313733481,
"wmean": 0.7920519172403193
},
"spearman": {
"all": 0.7986117512115241,
"mean": 0.7931135738148248,
"wmean": 0.7966147050233544
}
}
},
"STS16": {
"answer-answer": {
"pearson": [
0.7177168935513755,
1.7118144003107402e-41
],
"spearman": [
0.7132893030185777,
8.841119832138394e-41
],
"nsamples": 254
},
"headlines": {
"pearson": [
0.7910112149047425,
1.2553390356155912e-54
],
"spearman": [
0.8059772680734066,
3.561704789876049e-58
],
"nsamples": 249
},
"plagiarism": {
"pearson": [
0.8146246368802861,
7.416724178775043e-56
],
"spearman": [
0.8287733749128491,
2.0728091350119785e-59
],
"nsamples": 230
},
"postediting": {
"pearson": [
0.8358664674126319,
5.627683437146896e-65
],
"spearman": [
0.8514410852739017,
8.855209165489321e-70
],
"nsamples": 244
},
"question-question": {
"pearson": [
0.7757563825820808,
2.9043591729136265e-43
],
"spearman": [
0.7882765418102572,
1.5472955880308416e-45
],
"nsamples": 209
},
"all": {
"pearson": {
"all": 0.7727412422624585,
"mean": 0.7869951190662233,
"wmean": 0.7864334333593027
},
"spearman": {
"all": 0.7823935956761426,
"mean": 0.7975515146177985,
"wmean": 0.7967817209039866
}
}
},
"eval_senteval-STS12": 0.6198695741812278,
"eval_senteval-STS13": 0.7458274512781141,
"eval_senteval-STS14": 0.6864467990669687,
"eval_senteval-STS15": 0.7986117512115241,
"eval_senteval-STS16": 0.7823935956761426,
"eval_senteval-STSBenchmark": 0.7668425138024548,
"eval_senteval-SICKRelatedness": 0.7025121676824595,
"eval_senteval-avg_sts_7": 0.7289291218426988,
"eval_senteval-MR": 81.09,
"eval_senteval-CR": 87.01,
"eval_senteval-SUBJ": 95.34,
"eval_senteval-MPQA": 88.89,
"eval_senteval-SST2": 84.06,
"eval_senteval-TREC": 82.7,
"eval_senteval-MRPC": 70.8,
"eval_senteval-avg_transfer": 84.27
}