Muennighoff commited on
Commit
aa91968
1 Parent(s): 41063e3

Add MTEB eval

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. {eval → evaluation/beir}/beir.json +0 -0
  2. evaluation/mteb/AmazonCounterfactualClassification.json +16 -0
  3. evaluation/mteb/AmazonPolarityClassification.json +14 -0
  4. evaluation/mteb/AmazonReviewsClassification.json +14 -0
  5. evaluation/mteb/ArguAna.json +37 -0
  6. evaluation/mteb/ArxivClusteringP2P.json +9 -0
  7. evaluation/mteb/ArxivClusteringS2S.json +9 -0
  8. evaluation/mteb/AskUbuntuDupQuestions.json +9 -0
  9. evaluation/mteb/BIOSSES.json +19 -0
  10. evaluation/mteb/Banking77Classification.json +12 -0
  11. evaluation/mteb/BiorxivClusteringP2P.json +9 -0
  12. evaluation/mteb/BiorxivClusteringS2S.json +9 -0
  13. evaluation/mteb/CQADupstackAndroidRetrieval.json +37 -0
  14. evaluation/mteb/CQADupstackEnglishRetrieval.json +37 -0
  15. evaluation/mteb/CQADupstackGamingRetrieval.json +37 -0
  16. evaluation/mteb/CQADupstackGisRetrieval.json +37 -0
  17. evaluation/mteb/CQADupstackMathematicaRetrieval.json +37 -0
  18. evaluation/mteb/CQADupstackPhysicsRetrieval.json +37 -0
  19. evaluation/mteb/CQADupstackProgrammersRetrieval.json +37 -0
  20. evaluation/mteb/CQADupstackRetrieval.json +1 -0
  21. evaluation/mteb/CQADupstackStatsRetrieval.json +37 -0
  22. evaluation/mteb/CQADupstackTexRetrieval.json +37 -0
  23. evaluation/mteb/CQADupstackUnixRetrieval.json +37 -0
  24. evaluation/mteb/CQADupstackWebmastersRetrieval.json +37 -0
  25. evaluation/mteb/CQADupstackWordpressRetrieval.json +37 -0
  26. evaluation/mteb/ClimateFEVER.json +37 -0
  27. evaluation/mteb/DBPedia.json +37 -0
  28. evaluation/mteb/EmotionClassification.json +12 -0
  29. evaluation/mteb/FEVER.json +37 -0
  30. evaluation/mteb/FiQA2018.json +37 -0
  31. evaluation/mteb/HotpotQA.json +37 -0
  32. evaluation/mteb/ImdbClassification.json +14 -0
  33. evaluation/mteb/MSMARCO.json +37 -0
  34. evaluation/mteb/MTOPDomainClassification.json +14 -0
  35. evaluation/mteb/MTOPIntentClassification.json +14 -0
  36. evaluation/mteb/MassiveIntentClassification.json +14 -0
  37. evaluation/mteb/MassiveScenarioClassification.json +14 -0
  38. evaluation/mteb/MedrxivClusteringP2P.json +9 -0
  39. evaluation/mteb/MedrxivClusteringS2S.json +9 -0
  40. evaluation/mteb/NFCorpus.json +37 -0
  41. evaluation/mteb/NQ.json +37 -0
  42. evaluation/mteb/QuoraRetrieval.json +37 -0
  43. evaluation/mteb/RedditClustering.json +9 -0
  44. evaluation/mteb/RedditClusteringP2P.json +9 -0
  45. evaluation/mteb/SCIDOCS.json +37 -0
  46. evaluation/mteb/SGPT-2.7B-weightedmean-msmarco-specb-bitfit_results.csv +354 -0
  47. evaluation/mteb/SICK-R.json +19 -0
  48. evaluation/mteb/STS12.json +19 -0
  49. evaluation/mteb/STS13.json +19 -0
  50. evaluation/mteb/STS14.json +19 -0
{eval → evaluation/beir}/beir.json RENAMED
File without changes
evaluation/mteb/AmazonCounterfactualClassification.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.6756716417910448,
7
+ "accuracy_stderr": 0.035149491395717075,
8
+ "ap": 0.3075574629595259,
9
+ "ap_stderr": 0.022378514563472136,
10
+ "f1": 0.6180512130185866,
11
+ "f1_stderr": 0.027752667739340424,
12
+ "main_score": 0.6756716417910448
13
+ },
14
+ "evaluation_time": 33.75
15
+ }
16
+ }
evaluation/mteb/AmazonPolarityClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.71439575,
6
+ "accuracy_stderr": 0.04118535930779893,
7
+ "ap": 0.6591341330532453,
8
+ "ap_stderr": 0.039567766080541335,
9
+ "evaluation_time": 15193.17,
10
+ "f1": 0.7090561852619555,
11
+ "f1_stderr": 0.04610604328985526,
12
+ "main_score": 0.71439575
13
+ }
14
+ }
evaluation/mteb/AmazonReviewsClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.35748,
7
+ "accuracy_stderr": 0.017313624692709504,
8
+ "f1": 0.35485762871863474,
9
+ "f1_stderr": 0.016676501915976406,
10
+ "main_score": 0.35748
11
+ },
12
+ "evaluation_time": 125.24
13
+ }
14
+ }
evaluation/mteb/ArguAna.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 254.16,
6
+ "map_at_1": 0.2596,
7
+ "map_at_10": 0.41619,
8
+ "map_at_100": 0.42673,
9
+ "map_at_1000": 0.42684,
10
+ "map_at_3": 0.36569,
11
+ "map_at_5": 0.39397,
12
+ "mrr_at_1": 0.26316,
13
+ "mrr_at_10": 0.41772,
14
+ "mrr_at_100": 0.4282,
15
+ "mrr_at_1000": 0.4283,
16
+ "mrr_at_3": 0.36724,
17
+ "mrr_at_5": 0.39529,
18
+ "ndcg_at_1": 0.2596,
19
+ "ndcg_at_10": 0.50491,
20
+ "ndcg_at_100": 0.54865,
21
+ "ndcg_at_1000": 0.55107,
22
+ "ndcg_at_3": 0.40053,
23
+ "ndcg_at_5": 0.45134,
24
+ "precision_at_1": 0.2596,
25
+ "precision_at_10": 0.07895,
26
+ "precision_at_100": 0.00978,
27
+ "precision_at_1000": 0.001,
28
+ "precision_at_3": 0.16714,
29
+ "precision_at_5": 0.12489,
30
+ "recall_at_1": 0.2596,
31
+ "recall_at_10": 0.78947,
32
+ "recall_at_100": 0.97795,
33
+ "recall_at_1000": 0.99644,
34
+ "recall_at_3": 0.50142,
35
+ "recall_at_5": 0.62447
36
+ }
37
+ }
evaluation/mteb/ArxivClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 57365.88,
6
+ "v_measure": 0.44721257146422017,
7
+ "v_measure_std": 0.135218958073186
8
+ }
9
+ }
evaluation/mteb/ArxivClusteringS2S.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 6983.79,
6
+ "v_measure": 0.35081451519142065,
7
+ "v_measure_std": 0.14064701566219873
8
+ }
9
+ }
evaluation/mteb/AskUbuntuDupQuestions.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 56.03,
6
+ "map": 0.5963466199039206,
7
+ "mrr": 0.736813525040672
8
+ }
9
+ }
evaluation/mteb/BIOSSES.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.8742754550496836,
7
+ "spearman": 0.8484289705838665
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.8559331970450859,
11
+ "spearman": 0.858525586184271
12
+ },
13
+ "evaluation_time": 6.0,
14
+ "manhattan": {
15
+ "pearson": 0.8541233134466698,
16
+ "spearman": 0.8552303303767403
17
+ }
18
+ }
19
+ }
evaluation/mteb/Banking77Classification.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.8321753246753246,
6
+ "accuracy_stderr": 0.008047037149251285,
7
+ "evaluation_time": 109.45,
8
+ "f1": 0.8315394543120915,
9
+ "f1_stderr": 0.008443343664861741,
10
+ "main_score": 0.8321753246753246
11
+ }
12
+ }
evaluation/mteb/BiorxivClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 6657.01,
6
+ "v_measure": 0.3441414219680629,
7
+ "v_measure_std": 0.010243021348181702
8
+ }
9
+ }
evaluation/mteb/BiorxivClusteringS2S.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 843.62,
6
+ "v_measure": 0.30533275862270026,
7
+ "v_measure_std": 0.011135486000086606
8
+ }
9
+ }
evaluation/mteb/CQADupstackAndroidRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1118.91,
6
+ "map_at_1": 0.30809,
7
+ "map_at_10": 0.40617,
8
+ "map_at_100": 0.41895,
9
+ "map_at_1000": 0.42025,
10
+ "map_at_3": 0.37,
11
+ "map_at_5": 0.38993,
12
+ "mrr_at_1": 0.37482,
13
+ "mrr_at_10": 0.46497,
14
+ "mrr_at_100": 0.47144,
15
+ "mrr_at_1000": 0.47189,
16
+ "mrr_at_3": 0.43705,
17
+ "mrr_at_5": 0.45193,
18
+ "ndcg_at_1": 0.37482,
19
+ "ndcg_at_10": 0.46688,
20
+ "ndcg_at_100": 0.51726,
21
+ "ndcg_at_1000": 0.53825,
22
+ "ndcg_at_3": 0.41242,
23
+ "ndcg_at_5": 0.43657,
24
+ "precision_at_1": 0.37482,
25
+ "precision_at_10": 0.08827,
26
+ "precision_at_100": 0.01393,
27
+ "precision_at_1000": 0.00186,
28
+ "precision_at_3": 0.19361,
29
+ "precision_at_5": 0.14106,
30
+ "recall_at_1": 0.30809,
31
+ "recall_at_10": 0.5847,
32
+ "recall_at_100": 0.80519,
33
+ "recall_at_1000": 0.93809,
34
+ "recall_at_3": 0.42462,
35
+ "recall_at_5": 0.49385
36
+ }
37
+ }
evaluation/mteb/CQADupstackEnglishRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1732.23,
6
+ "map_at_1": 0.26962,
7
+ "map_at_10": 0.3693,
8
+ "map_at_100": 0.38102,
9
+ "map_at_1000": 0.3822,
10
+ "map_at_3": 0.34065,
11
+ "map_at_5": 0.3572,
12
+ "mrr_at_1": 0.33567,
13
+ "mrr_at_10": 0.42269,
14
+ "mrr_at_100": 0.4299,
15
+ "mrr_at_1000": 0.43033,
16
+ "mrr_at_3": 0.40064,
17
+ "mrr_at_5": 0.41258,
18
+ "ndcg_at_1": 0.33567,
19
+ "ndcg_at_10": 0.42405,
20
+ "ndcg_at_100": 0.46847,
21
+ "ndcg_at_1000": 0.48951,
22
+ "ndcg_at_3": 0.38312,
23
+ "ndcg_at_5": 0.40242,
24
+ "precision_at_1": 0.33567,
25
+ "precision_at_10": 0.08032,
26
+ "precision_at_100": 0.01295,
27
+ "precision_at_1000": 0.00176,
28
+ "precision_at_3": 0.18662,
29
+ "precision_at_5": 0.13299,
30
+ "recall_at_1": 0.26962,
31
+ "recall_at_10": 0.52489,
32
+ "recall_at_100": 0.71635,
33
+ "recall_at_1000": 0.85141,
34
+ "recall_at_3": 0.4028,
35
+ "recall_at_5": 0.45757
36
+ }
37
+ }
evaluation/mteb/CQADupstackGamingRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1830.25,
6
+ "map_at_1": 0.36318,
7
+ "map_at_10": 0.4797,
8
+ "map_at_100": 0.49003,
9
+ "map_at_1000": 0.49066,
10
+ "map_at_3": 0.45031,
11
+ "map_at_5": 0.46633,
12
+ "mrr_at_1": 0.41505,
13
+ "mrr_at_10": 0.51431,
14
+ "mrr_at_100": 0.52129,
15
+ "mrr_at_1000": 0.52161,
16
+ "mrr_at_3": 0.48934,
17
+ "mrr_at_5": 0.5042,
18
+ "ndcg_at_1": 0.41505,
19
+ "ndcg_at_10": 0.53676,
20
+ "ndcg_at_100": 0.57867,
21
+ "ndcg_at_1000": 0.59166,
22
+ "ndcg_at_3": 0.48516,
23
+ "ndcg_at_5": 0.50984,
24
+ "precision_at_1": 0.41505,
25
+ "precision_at_10": 0.08608,
26
+ "precision_at_100": 0.01156,
27
+ "precision_at_1000": 0.00133,
28
+ "precision_at_3": 0.21463,
29
+ "precision_at_5": 0.14721,
30
+ "recall_at_1": 0.36318,
31
+ "recall_at_10": 0.67066,
32
+ "recall_at_100": 0.8534,
33
+ "recall_at_1000": 0.94491,
34
+ "recall_at_3": 0.53216,
35
+ "recall_at_5": 0.59214
36
+ }
37
+ }
evaluation/mteb/CQADupstackGisRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 2522.93,
6
+ "map_at_1": 0.22167,
7
+ "map_at_10": 0.29544,
8
+ "map_at_100": 0.30579,
9
+ "map_at_1000": 0.3067,
10
+ "map_at_3": 0.26982,
11
+ "map_at_5": 0.28474,
12
+ "mrr_at_1": 0.24068,
13
+ "mrr_at_10": 0.31237,
14
+ "mrr_at_100": 0.32222,
15
+ "mrr_at_1000": 0.32292,
16
+ "mrr_at_3": 0.28776,
17
+ "mrr_at_5": 0.30234,
18
+ "ndcg_at_1": 0.24068,
19
+ "ndcg_at_10": 0.33973,
20
+ "ndcg_at_100": 0.39135,
21
+ "ndcg_at_1000": 0.41444,
22
+ "ndcg_at_3": 0.29018,
23
+ "ndcg_at_5": 0.31559,
24
+ "precision_at_1": 0.24068,
25
+ "precision_at_10": 0.05299,
26
+ "precision_at_100": 0.00823,
27
+ "precision_at_1000": 0.00106,
28
+ "precision_at_3": 0.12166,
29
+ "precision_at_5": 0.08768,
30
+ "recall_at_1": 0.22167,
31
+ "recall_at_10": 0.46115,
32
+ "recall_at_100": 0.69867,
33
+ "recall_at_1000": 0.87234,
34
+ "recall_at_3": 0.32798,
35
+ "recall_at_5": 0.38951
36
+ }
37
+ }
evaluation/mteb/CQADupstackMathematicaRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1350.85,
6
+ "map_at_1": 0.12033,
7
+ "map_at_10": 0.19314,
8
+ "map_at_100": 0.20562,
9
+ "map_at_1000": 0.20695,
10
+ "map_at_3": 0.16946,
11
+ "map_at_5": 0.18077,
12
+ "mrr_at_1": 0.14801,
13
+ "mrr_at_10": 0.2274,
14
+ "mrr_at_100": 0.23876,
15
+ "mrr_at_1000": 0.23949,
16
+ "mrr_at_3": 0.20211,
17
+ "mrr_at_5": 0.21573,
18
+ "ndcg_at_1": 0.14801,
19
+ "ndcg_at_10": 0.24038,
20
+ "ndcg_at_100": 0.30186,
21
+ "ndcg_at_1000": 0.33321,
22
+ "ndcg_at_3": 0.19431,
23
+ "ndcg_at_5": 0.2134,
24
+ "precision_at_1": 0.14801,
25
+ "precision_at_10": 0.04776,
26
+ "precision_at_100": 0.00897,
27
+ "precision_at_1000": 0.00133,
28
+ "precision_at_3": 0.0966,
29
+ "precision_at_5": 0.07239,
30
+ "recall_at_1": 0.12033,
31
+ "recall_at_10": 0.35098,
32
+ "recall_at_100": 0.62175,
33
+ "recall_at_1000": 0.84171,
34
+ "recall_at_3": 0.2261,
35
+ "recall_at_5": 0.27279
36
+ }
37
+ }
evaluation/mteb/CQADupstackPhysicsRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 2467.52,
6
+ "map_at_1": 0.26651,
7
+ "map_at_10": 0.36901,
8
+ "map_at_100": 0.38249,
9
+ "map_at_1000": 0.38361,
10
+ "map_at_3": 0.33891,
11
+ "map_at_5": 0.35439,
12
+ "mrr_at_1": 0.32724,
13
+ "mrr_at_10": 0.42504,
14
+ "mrr_at_100": 0.43392,
15
+ "mrr_at_1000": 0.43436,
16
+ "mrr_at_3": 0.3999,
17
+ "mrr_at_5": 0.41347,
18
+ "ndcg_at_1": 0.32724,
19
+ "ndcg_at_10": 0.43007,
20
+ "ndcg_at_100": 0.48601,
21
+ "ndcg_at_1000": 0.50697,
22
+ "ndcg_at_3": 0.3799,
23
+ "ndcg_at_5": 0.40084,
24
+ "precision_at_1": 0.32724,
25
+ "precision_at_10": 0.07873,
26
+ "precision_at_100": 0.01247,
27
+ "precision_at_1000": 0.00162,
28
+ "precision_at_3": 0.18062,
29
+ "precision_at_5": 0.12666,
30
+ "recall_at_1": 0.26651,
31
+ "recall_at_10": 0.55674,
32
+ "recall_at_100": 0.78904,
33
+ "recall_at_1000": 0.92558,
34
+ "recall_at_3": 0.4136,
35
+ "recall_at_5": 0.46984
36
+ }
37
+ }
evaluation/mteb/CQADupstackProgrammersRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 2301.71,
6
+ "map_at_1": 0.22589,
7
+ "map_at_10": 0.32244,
8
+ "map_at_100": 0.3346,
9
+ "map_at_1000": 0.33593,
10
+ "map_at_3": 0.2921,
11
+ "map_at_5": 0.3102,
12
+ "mrr_at_1": 0.28425,
13
+ "mrr_at_10": 0.37282,
14
+ "mrr_at_100": 0.38187,
15
+ "mrr_at_1000": 0.38248,
16
+ "mrr_at_3": 0.34684,
17
+ "mrr_at_5": 0.36123,
18
+ "ndcg_at_1": 0.28425,
19
+ "ndcg_at_10": 0.37942,
20
+ "ndcg_at_100": 0.43443,
21
+ "ndcg_at_1000": 0.45996,
22
+ "ndcg_at_3": 0.32874,
23
+ "ndcg_at_5": 0.35325,
24
+ "precision_at_1": 0.28425,
25
+ "precision_at_10": 0.071,
26
+ "precision_at_100": 0.01166,
27
+ "precision_at_1000": 0.00158,
28
+ "precision_at_3": 0.1602,
29
+ "precision_at_5": 0.11644,
30
+ "recall_at_1": 0.22589,
31
+ "recall_at_10": 0.5004,
32
+ "recall_at_100": 0.73973,
33
+ "recall_at_1000": 0.91128,
34
+ "recall_at_3": 0.35883,
35
+ "recall_at_5": 0.42188
36
+ }
37
+ }
evaluation/mteb/CQADupstackRetrieval.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"dataset_version": null, "mteb_version": "0.0.2", "test": {"evaluation_time": 3522.66, "map_at_1": 0.23190833333333336, "map_at_10": 0.31504916666666666, "map_at_100": 0.32649083333333334, "map_at_1000": 0.3277075, "map_at_3": 0.2882575, "map_at_5": 0.302755, "mrr_at_1": 0.27427499999999994, "mrr_at_10": 0.35364833333333334, "mrr_at_100": 0.36234416666666663, "mrr_at_1000": 0.36297583333333333, "mrr_at_3": 0.3297966666666667, "mrr_at_5": 0.34294583333333334, "ndcg_at_1": 0.27427499999999994, "ndcg_at_10": 0.3653358333333333, "ndcg_at_100": 0.4164508333333333, "ndcg_at_1000": 0.4414499999999999, "ndcg_at_3": 0.3188908333333333, "ndcg_at_5": 0.33984333333333333, "precision_at_1": 0.27427499999999994, "precision_at_10": 0.06481083333333333, "precision_at_100": 0.010610833333333333, "precision_at_1000": 0.0014691666666666666, "precision_at_3": 0.1465675, "precision_at_5": 0.10493583333333333, "recall_at_1": 0.23190833333333336, "recall_at_10": 0.4765175, "recall_at_100": 0.7041016666666666, "recall_at_1000": 0.8782708333333332, "recall_at_3": 0.34637583333333327, "recall_at_5": 0.4005008333333333}}
evaluation/mteb/CQADupstackStatsRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3154.61,
6
+ "map_at_1": 0.20409,
7
+ "map_at_10": 0.26794,
8
+ "map_at_100": 0.27682,
9
+ "map_at_1000": 0.27783,
10
+ "map_at_3": 0.24461,
11
+ "map_at_5": 0.25668,
12
+ "mrr_at_1": 0.22853,
13
+ "mrr_at_10": 0.29296,
14
+ "mrr_at_100": 0.30103,
15
+ "mrr_at_1000": 0.30179,
16
+ "mrr_at_3": 0.27173,
17
+ "mrr_at_5": 0.28223,
18
+ "ndcg_at_1": 0.22853,
19
+ "ndcg_at_10": 0.31007,
20
+ "ndcg_at_100": 0.35581,
21
+ "ndcg_at_1000": 0.38147,
22
+ "ndcg_at_3": 0.26591,
23
+ "ndcg_at_5": 0.2843,
24
+ "precision_at_1": 0.22853,
25
+ "precision_at_10": 0.05031,
26
+ "precision_at_100": 0.00794,
27
+ "precision_at_1000": 0.0011,
28
+ "precision_at_3": 0.11401,
29
+ "precision_at_5": 0.0816,
30
+ "recall_at_1": 0.20409,
31
+ "recall_at_10": 0.41766,
32
+ "recall_at_100": 0.62964,
33
+ "recall_at_1000": 0.81682,
34
+ "recall_at_3": 0.29281,
35
+ "recall_at_5": 0.3383
36
+ }
37
+ }
evaluation/mteb/CQADupstackTexRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 5341.04,
6
+ "map_at_1": 0.14549,
7
+ "map_at_10": 0.20315,
8
+ "map_at_100": 0.21301,
9
+ "map_at_1000": 0.21425,
10
+ "map_at_3": 0.18132,
11
+ "map_at_5": 0.19429,
12
+ "mrr_at_1": 0.1786,
13
+ "mrr_at_10": 0.23861,
14
+ "mrr_at_100": 0.24737,
15
+ "mrr_at_1000": 0.2482,
16
+ "mrr_at_3": 0.21685,
17
+ "mrr_at_5": 0.23008,
18
+ "ndcg_at_1": 0.1786,
19
+ "ndcg_at_10": 0.24396,
20
+ "ndcg_at_100": 0.29328,
21
+ "ndcg_at_1000": 0.32486,
22
+ "ndcg_at_3": 0.20375,
23
+ "ndcg_at_5": 0.22411,
24
+ "precision_at_1": 0.1786,
25
+ "precision_at_10": 0.0447,
26
+ "precision_at_100": 0.0081,
27
+ "precision_at_1000": 0.00125,
28
+ "precision_at_3": 0.09475,
29
+ "precision_at_5": 0.07171,
30
+ "recall_at_1": 0.14549,
31
+ "recall_at_10": 0.33365,
32
+ "recall_at_100": 0.55797,
33
+ "recall_at_1000": 0.78632,
34
+ "recall_at_3": 0.22229,
35
+ "recall_at_5": 0.27339
36
+ }
37
+ }
evaluation/mteb/CQADupstackUnixRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3320.59,
6
+ "map_at_1": 0.23286,
7
+ "map_at_10": 0.30728,
8
+ "map_at_100": 0.3184,
9
+ "map_at_1000": 0.31953,
10
+ "map_at_3": 0.28302,
11
+ "map_at_5": 0.29615,
12
+ "mrr_at_1": 0.27239,
13
+ "mrr_at_10": 0.34408,
14
+ "mrr_at_100": 0.35335,
15
+ "mrr_at_1000": 0.35405,
16
+ "mrr_at_3": 0.32152,
17
+ "mrr_at_5": 0.33355,
18
+ "ndcg_at_1": 0.27239,
19
+ "ndcg_at_10": 0.35324,
20
+ "ndcg_at_100": 0.40866,
21
+ "ndcg_at_1000": 0.43584,
22
+ "ndcg_at_3": 0.30899,
23
+ "ndcg_at_5": 0.32813,
24
+ "precision_at_1": 0.27239,
25
+ "precision_at_10": 0.05896,
26
+ "precision_at_100": 0.00979,
27
+ "precision_at_1000": 0.00133,
28
+ "precision_at_3": 0.13713,
29
+ "precision_at_5": 0.09683,
30
+ "recall_at_1": 0.23286,
31
+ "recall_at_10": 0.45711,
32
+ "recall_at_100": 0.70611,
33
+ "recall_at_1000": 0.90029,
34
+ "recall_at_3": 0.33615,
35
+ "recall_at_5": 0.3841
36
+ }
37
+ }
evaluation/mteb/CQADupstackWebmastersRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1047.0,
6
+ "map_at_1": 0.23962,
7
+ "map_at_10": 0.31943,
8
+ "map_at_100": 0.33384,
9
+ "map_at_1000": 0.33611,
10
+ "map_at_3": 0.29243,
11
+ "map_at_5": 0.30446,
12
+ "mrr_at_1": 0.28458,
13
+ "mrr_at_10": 0.36157,
14
+ "mrr_at_100": 0.37093,
15
+ "mrr_at_1000": 0.37163,
16
+ "mrr_at_3": 0.3386,
17
+ "mrr_at_5": 0.35086,
18
+ "ndcg_at_1": 0.28458,
19
+ "ndcg_at_10": 0.37201,
20
+ "ndcg_at_100": 0.42591,
21
+ "ndcg_at_1000": 0.45539,
22
+ "ndcg_at_3": 0.32889,
23
+ "ndcg_at_5": 0.34483,
24
+ "precision_at_1": 0.28458,
25
+ "precision_at_10": 0.07332,
26
+ "precision_at_100": 0.01437,
27
+ "precision_at_1000": 0.00233,
28
+ "precision_at_3": 0.15547,
29
+ "precision_at_5": 0.11146,
30
+ "recall_at_1": 0.23962,
31
+ "recall_at_10": 0.46751,
32
+ "recall_at_100": 0.71626,
33
+ "recall_at_1000": 0.90939,
34
+ "recall_at_3": 0.34138,
35
+ "recall_at_5": 0.38673
36
+ }
37
+ }
evaluation/mteb/CQADupstackWordpressRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3522.66,
6
+ "map_at_1": 0.18555,
7
+ "map_at_10": 0.24759,
8
+ "map_at_100": 0.25732,
9
+ "map_at_1000": 0.25847,
10
+ "map_at_3": 0.22646,
11
+ "map_at_5": 0.23792,
12
+ "mrr_at_1": 0.20148,
13
+ "mrr_at_10": 0.26696,
14
+ "mrr_at_100": 0.27605,
15
+ "mrr_at_1000": 0.27696,
16
+ "mrr_at_3": 0.24522,
17
+ "mrr_at_5": 0.25715,
18
+ "ndcg_at_1": 0.20148,
19
+ "ndcg_at_10": 0.28746,
20
+ "ndcg_at_100": 0.3357,
21
+ "ndcg_at_1000": 0.36584,
22
+ "ndcg_at_3": 0.24532,
23
+ "ndcg_at_5": 0.26484,
24
+ "precision_at_1": 0.20148,
25
+ "precision_at_10": 0.04529,
26
+ "precision_at_100": 0.00736,
27
+ "precision_at_1000": 0.00108,
28
+ "precision_at_3": 0.10351,
29
+ "precision_at_5": 0.0732,
30
+ "recall_at_1": 0.18555,
31
+ "recall_at_10": 0.39276,
32
+ "recall_at_100": 0.61511,
33
+ "recall_at_1000": 0.84111,
34
+ "recall_at_3": 0.27779,
35
+ "recall_at_5": 0.32591
36
+ }
37
+ }
evaluation/mteb/ClimateFEVER.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 30738.76,
6
+ "map_at_1": 0.10367,
7
+ "map_at_10": 0.18954,
8
+ "map_at_100": 0.20675,
9
+ "map_at_1000": 0.20868,
10
+ "map_at_3": 0.15486,
11
+ "map_at_5": 0.17347,
12
+ "mrr_at_1": 0.23257,
13
+ "mrr_at_10": 0.35419,
14
+ "mrr_at_100": 0.36361,
15
+ "mrr_at_1000": 0.36403,
16
+ "mrr_at_3": 0.31748,
17
+ "mrr_at_5": 0.34077,
18
+ "ndcg_at_1": 0.23257,
19
+ "ndcg_at_10": 0.2711,
20
+ "ndcg_at_100": 0.33981,
21
+ "ndcg_at_1000": 0.37444,
22
+ "ndcg_at_3": 0.21472,
23
+ "ndcg_at_5": 0.23769,
24
+ "precision_at_1": 0.23257,
25
+ "precision_at_10": 0.08704,
26
+ "precision_at_100": 0.01606,
27
+ "precision_at_1000": 0.00225,
28
+ "precision_at_3": 0.16287,
29
+ "precision_at_5": 0.13068,
30
+ "recall_at_1": 0.10367,
31
+ "recall_at_10": 0.33706,
32
+ "recall_at_100": 0.57375,
33
+ "recall_at_1000": 0.7679,
34
+ "recall_at_3": 0.2018,
35
+ "recall_at_5": 0.26215
36
+ }
37
+ }
evaluation/mteb/DBPedia.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 21716.72,
6
+ "map_at_1": 0.08246,
7
+ "map_at_10": 0.15979,
8
+ "map_at_100": 0.21025,
9
+ "map_at_1000": 0.2219,
10
+ "map_at_3": 0.11997,
11
+ "map_at_5": 0.13697,
12
+ "mrr_at_1": 0.6075,
13
+ "mrr_at_10": 0.68701,
14
+ "mrr_at_100": 0.691,
15
+ "mrr_at_1000": 0.69111,
16
+ "mrr_at_3": 0.66583,
17
+ "mrr_at_5": 0.67871,
18
+ "ndcg_at_1": 0.4975,
19
+ "ndcg_at_10": 0.34702,
20
+ "ndcg_at_100": 0.37607,
21
+ "ndcg_at_1000": 0.44322,
22
+ "ndcg_at_3": 0.39555,
23
+ "ndcg_at_5": 0.36684,
24
+ "precision_at_1": 0.6075,
25
+ "precision_at_10": 0.26625,
26
+ "precision_at_100": 0.0797,
27
+ "precision_at_1000": 0.01678,
28
+ "precision_at_3": 0.41833,
29
+ "precision_at_5": 0.345,
30
+ "recall_at_1": 0.08246,
31
+ "recall_at_10": 0.20968,
32
+ "recall_at_100": 0.42065,
33
+ "recall_at_1000": 0.63671,
34
+ "recall_at_3": 0.13039,
35
+ "recall_at_5": 0.16042
36
+ }
37
+ }
evaluation/mteb/EmotionClassification.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.49215,
6
+ "accuracy_stderr": 0.0188680285138644,
7
+ "evaluation_time": 46.17,
8
+ "f1": 0.44859524511637555,
9
+ "f1_stderr": 0.012754862698341127,
10
+ "main_score": 0.49215
11
+ }
12
+ }
evaluation/mteb/FEVER.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 32873.8,
6
+ "map_at_1": 0.56769,
7
+ "map_at_10": 0.67302,
8
+ "map_at_100": 0.67692,
9
+ "map_at_1000": 0.67712,
10
+ "map_at_3": 0.65346,
11
+ "map_at_5": 0.66574,
12
+ "mrr_at_1": 0.61371,
13
+ "mrr_at_10": 0.71875,
14
+ "mrr_at_100": 0.72195,
15
+ "mrr_at_1000": 0.72206,
16
+ "mrr_at_3": 0.7004,
17
+ "mrr_at_5": 0.71224,
18
+ "ndcg_at_1": 0.61371,
19
+ "ndcg_at_10": 0.72731,
20
+ "ndcg_at_100": 0.74468,
21
+ "ndcg_at_1000": 0.74916,
22
+ "ndcg_at_3": 0.69077,
23
+ "ndcg_at_5": 0.71111,
24
+ "precision_at_1": 0.61371,
25
+ "precision_at_10": 0.09326,
26
+ "precision_at_100": 0.0103,
27
+ "precision_at_1000": 0.00108,
28
+ "precision_at_3": 0.27303,
29
+ "precision_at_5": 0.17525,
30
+ "recall_at_1": 0.56769,
31
+ "recall_at_10": 0.8506,
32
+ "recall_at_100": 0.92767,
33
+ "recall_at_1000": 0.95933,
34
+ "recall_at_3": 0.75131,
35
+ "recall_at_5": 0.8017
36
+ }
37
+ }
evaluation/mteb/FiQA2018.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 506.29,
6
+ "map_at_1": 0.15753,
7
+ "map_at_10": 0.25876,
8
+ "map_at_100": 0.27415,
9
+ "map_at_1000": 0.27591,
10
+ "map_at_3": 0.2217,
11
+ "map_at_5": 0.24236,
12
+ "mrr_at_1": 0.31019,
13
+ "mrr_at_10": 0.39977,
14
+ "mrr_at_100": 0.40789,
15
+ "mrr_at_1000": 0.40832,
16
+ "mrr_at_3": 0.37088,
17
+ "mrr_at_5": 0.38655,
18
+ "ndcg_at_1": 0.31019,
19
+ "ndcg_at_10": 0.33286,
20
+ "ndcg_at_100": 0.39529,
21
+ "ndcg_at_1000": 0.42934,
22
+ "ndcg_at_3": 0.2929,
23
+ "ndcg_at_5": 0.30615,
24
+ "precision_at_1": 0.31019,
25
+ "precision_at_10": 0.09383,
26
+ "precision_at_100": 0.01602,
27
+ "precision_at_1000": 0.00222,
28
+ "precision_at_3": 0.19753,
29
+ "precision_at_5": 0.14815,
30
+ "recall_at_1": 0.15753,
31
+ "recall_at_10": 0.40896,
32
+ "recall_at_100": 0.64443,
33
+ "recall_at_1000": 0.85218,
34
+ "recall_at_3": 0.26526,
35
+ "recall_at_5": 0.32453
36
+ }
37
+ }
evaluation/mteb/HotpotQA.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 24496.84,
6
+ "map_at_1": 0.32154,
7
+ "map_at_10": 0.43651,
8
+ "map_at_100": 0.4441,
9
+ "map_at_1000": 0.44487,
10
+ "map_at_3": 0.41239,
11
+ "map_at_5": 0.42659,
12
+ "mrr_at_1": 0.64308,
13
+ "mrr_at_10": 0.71225,
14
+ "mrr_at_100": 0.7157,
15
+ "mrr_at_1000": 0.71591,
16
+ "mrr_at_3": 0.6995,
17
+ "mrr_at_5": 0.70738,
18
+ "ndcg_at_1": 0.64308,
19
+ "ndcg_at_10": 0.52835,
20
+ "ndcg_at_100": 0.55841,
21
+ "ndcg_at_1000": 0.57484,
22
+ "ndcg_at_3": 0.49014,
23
+ "ndcg_at_5": 0.51016,
24
+ "precision_at_1": 0.64308,
25
+ "precision_at_10": 0.1077,
26
+ "precision_at_100": 0.01315,
27
+ "precision_at_1000": 0.00153,
28
+ "precision_at_3": 0.30223,
29
+ "precision_at_5": 0.19716,
30
+ "recall_at_1": 0.32154,
31
+ "recall_at_10": 0.53849,
32
+ "recall_at_100": 0.6576,
33
+ "recall_at_1000": 0.76705,
34
+ "recall_at_3": 0.45334,
35
+ "recall_at_5": 0.49291
36
+ }
37
+ }
evaluation/mteb/ImdbClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "accuracy": 0.635316,
6
+ "accuracy_stderr": 0.04211004041793359,
7
+ "ap": 0.5890084300359825,
8
+ "ap_stderr": 0.03111656030669087,
9
+ "evaluation_time": 1823.15,
10
+ "f1": 0.6335727889030892,
11
+ "f1_stderr": 0.04298181731027657,
12
+ "main_score": 0.635316
13
+ }
14
+ }
evaluation/mteb/MSMARCO.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "validation": {
5
+ "evaluation_time": 43129.71,
6
+ "map_at_1": 0.20566,
7
+ "map_at_10": 0.32229,
8
+ "map_at_100": 0.33445,
9
+ "map_at_1000": 0.33501,
10
+ "map_at_3": 0.28504,
11
+ "map_at_5": 0.30681,
12
+ "mrr_at_1": 0.21218,
13
+ "mrr_at_10": 0.32816,
14
+ "mrr_at_100": 0.33986,
15
+ "mrr_at_1000": 0.34035,
16
+ "mrr_at_3": 0.2915,
17
+ "mrr_at_5": 0.3129,
18
+ "ndcg_at_1": 0.21218,
19
+ "ndcg_at_10": 0.38832,
20
+ "ndcg_at_100": 0.44743,
21
+ "ndcg_at_1000": 0.46138,
22
+ "ndcg_at_3": 0.31232,
23
+ "ndcg_at_5": 0.351,
24
+ "precision_at_1": 0.21218,
25
+ "precision_at_10": 0.06186,
26
+ "precision_at_100": 0.00914,
27
+ "precision_at_1000": 0.00103,
28
+ "precision_at_3": 0.13314,
29
+ "precision_at_5": 0.09943,
30
+ "recall_at_1": 0.20566,
31
+ "recall_at_10": 0.59192,
32
+ "recall_at_100": 0.86626,
33
+ "recall_at_1000": 0.97283,
34
+ "recall_at_3": 0.38492,
35
+ "recall_at_5": 0.4776
36
+ }
37
+ }
evaluation/mteb/MTOPDomainClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.9256269949840401,
7
+ "accuracy_stderr": 0.0038850782151341893,
8
+ "f1": 0.921020975473988,
9
+ "f1_stderr": 0.0044060167819252195,
10
+ "main_score": 0.9256269949840401
11
+ },
12
+ "evaluation_time": 45.61
13
+ }
14
+ }
evaluation/mteb/MTOPIntentClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.7184678522571819,
7
+ "accuracy_stderr": 0.01111163093063421,
8
+ "f1": 0.5365271934859202,
9
+ "f1_stderr": 0.010588821247395342,
10
+ "main_score": 0.7184678522571819
11
+ },
12
+ "evaluation_time": 122.63
13
+ }
14
+ }
evaluation/mteb/MassiveIntentClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.6900806993947546,
7
+ "accuracy_stderr": 0.012602822825246073,
8
+ "f1": 0.6741429618885515,
9
+ "f1_stderr": 0.011707310656187842,
10
+ "main_score": 0.6900806993947546
11
+ },
12
+ "evaluation_time": 72.53
13
+ }
14
+ }
evaluation/mteb/MassiveScenarioClassification.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "en": {
6
+ "accuracy": 0.7590114324142568,
7
+ "accuracy_stderr": 0.010656499030857346,
8
+ "f1": 0.7625183590651454,
9
+ "f1_stderr": 0.010649247943952904,
10
+ "main_score": 0.7590114324142568
11
+ },
12
+ "evaluation_time": 41.51
13
+ }
14
+ }
evaluation/mteb/MedrxivClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 3336.04,
6
+ "v_measure": 0.31350109978273394,
7
+ "v_measure_std": 0.015425381126297112
8
+ }
9
+ }
evaluation/mteb/MedrxivClusteringS2S.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 492.85,
6
+ "v_measure": 0.2876892369576733,
7
+ "v_measure_std": 0.01586647571955603
8
+ }
9
+ }
evaluation/mteb/NFCorpus.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 168.77,
6
+ "map_at_1": 0.05604,
7
+ "map_at_10": 0.1238,
8
+ "map_at_100": 0.15791,
9
+ "map_at_1000": 0.17327,
10
+ "map_at_3": 0.0915,
11
+ "map_at_5": 0.10599,
12
+ "mrr_at_1": 0.45201,
13
+ "mrr_at_10": 0.53374,
14
+ "mrr_at_100": 0.54089,
15
+ "mrr_at_1000": 0.54123,
16
+ "mrr_at_3": 0.51445,
17
+ "mrr_at_5": 0.5259,
18
+ "ndcg_at_1": 0.42879,
19
+ "ndcg_at_10": 0.33891,
20
+ "ndcg_at_100": 0.31392,
21
+ "ndcg_at_1000": 0.4036,
22
+ "ndcg_at_3": 0.39076,
23
+ "ndcg_at_5": 0.37047,
24
+ "precision_at_1": 0.44582,
25
+ "precision_at_10": 0.25294,
26
+ "precision_at_100": 0.08285,
27
+ "precision_at_1000": 0.02148,
28
+ "precision_at_3": 0.3612,
29
+ "precision_at_5": 0.3195,
30
+ "recall_at_1": 0.05604,
31
+ "recall_at_10": 0.16239,
32
+ "recall_at_100": 0.3216,
33
+ "recall_at_1000": 0.64513,
34
+ "recall_at_3": 0.10406,
35
+ "recall_at_5": 0.12685
36
+ }
37
+ }
evaluation/mteb/NQ.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 15471.98,
6
+ "map_at_1": 0.25881,
7
+ "map_at_10": 0.39501,
8
+ "map_at_100": 0.40615,
9
+ "map_at_1000": 0.40661,
10
+ "map_at_3": 0.35559,
11
+ "map_at_5": 0.37773,
12
+ "mrr_at_1": 0.29229,
13
+ "mrr_at_10": 0.41956,
14
+ "mrr_at_100": 0.4286,
15
+ "mrr_at_1000": 0.42893,
16
+ "mrr_at_3": 0.38562,
17
+ "mrr_at_5": 0.40542,
18
+ "ndcg_at_1": 0.292,
19
+ "ndcg_at_10": 0.46703,
20
+ "ndcg_at_100": 0.51644,
21
+ "ndcg_at_1000": 0.52771,
22
+ "ndcg_at_3": 0.39142,
23
+ "ndcg_at_5": 0.42892,
24
+ "precision_at_1": 0.292,
25
+ "precision_at_10": 0.0792,
26
+ "precision_at_100": 0.01066,
27
+ "precision_at_1000": 0.00117,
28
+ "precision_at_3": 0.18105,
29
+ "precision_at_5": 0.13036,
30
+ "recall_at_1": 0.25881,
31
+ "recall_at_10": 0.66266,
32
+ "recall_at_100": 0.88116,
33
+ "recall_at_1000": 0.96582,
34
+ "recall_at_3": 0.46526,
35
+ "recall_at_5": 0.55154
36
+ }
37
+ }
evaluation/mteb/QuoraRetrieval.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 1285.77,
6
+ "map_at_1": 0.67553,
7
+ "map_at_10": 0.8134,
8
+ "map_at_100": 0.82002,
9
+ "map_at_1000": 0.82027,
10
+ "map_at_3": 0.78281,
11
+ "map_at_5": 0.80149,
12
+ "mrr_at_1": 0.7772,
13
+ "mrr_at_10": 0.84733,
14
+ "mrr_at_100": 0.84878,
15
+ "mrr_at_1000": 0.84879,
16
+ "mrr_at_3": 0.83587,
17
+ "mrr_at_5": 0.84326,
18
+ "ndcg_at_1": 0.7775,
19
+ "ndcg_at_10": 0.85603,
20
+ "ndcg_at_100": 0.87069,
21
+ "ndcg_at_1000": 0.8725,
22
+ "ndcg_at_3": 0.82303,
23
+ "ndcg_at_5": 0.84037,
24
+ "precision_at_1": 0.7775,
25
+ "precision_at_10": 0.1304,
26
+ "precision_at_100": 0.01507,
27
+ "precision_at_1000": 0.00156,
28
+ "precision_at_3": 0.35903,
29
+ "precision_at_5": 0.23738,
30
+ "recall_at_1": 0.67553,
31
+ "recall_at_10": 0.93903,
32
+ "recall_at_100": 0.99062,
33
+ "recall_at_1000": 0.99935,
34
+ "recall_at_3": 0.84581,
35
+ "recall_at_5": 0.89316
36
+ }
37
+ }
evaluation/mteb/RedditClustering.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 6540.34,
6
+ "v_measure": 0.46468877112302354,
7
+ "v_measure_std": 0.059743532887098036
8
+ }
9
+ }
evaluation/mteb/RedditClusteringP2P.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 26567.79,
6
+ "v_measure": 0.5416687629824692,
7
+ "v_measure_std": 0.11955619105267504
8
+ }
9
+ }
evaluation/mteb/SCIDOCS.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "evaluation_time": 338.56,
6
+ "map_at_1": 0.04053,
7
+ "map_at_10": 0.09694,
8
+ "map_at_100": 0.11387,
9
+ "map_at_1000": 0.11654,
10
+ "map_at_3": 0.07053,
11
+ "map_at_5": 0.08439,
12
+ "mrr_at_1": 0.199,
13
+ "mrr_at_10": 0.29359,
14
+ "mrr_at_100": 0.30484,
15
+ "mrr_at_1000": 0.30553,
16
+ "mrr_at_3": 0.262,
17
+ "mrr_at_5": 0.28115,
18
+ "ndcg_at_1": 0.199,
19
+ "ndcg_at_10": 0.16575,
20
+ "ndcg_at_100": 0.23655,
21
+ "ndcg_at_1000": 0.28853,
22
+ "ndcg_at_3": 0.15848,
23
+ "ndcg_at_5": 0.14026,
24
+ "precision_at_1": 0.199,
25
+ "precision_at_10": 0.0845,
26
+ "precision_at_100": 0.01872,
27
+ "precision_at_1000": 0.00313,
28
+ "precision_at_3": 0.14667,
29
+ "precision_at_5": 0.1232,
30
+ "recall_at_1": 0.04053,
31
+ "recall_at_10": 0.1717,
32
+ "recall_at_100": 0.38025,
33
+ "recall_at_1000": 0.63572,
34
+ "recall_at_3": 0.08903,
35
+ "recall_at_5": 0.12477
36
+ }
37
+ }
evaluation/mteb/SGPT-2.7B-weightedmean-msmarco-specb-bitfit_results.csv ADDED
@@ -0,0 +1,354 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,task,dataset,language,metric,value
2
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,BitextMining,BUCC,,f1,
3
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,BitextMining,Tatoeba,,f1,
4
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en,accuracy,0.6756716417910448
5
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
6
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,de,accuracy,
7
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
8
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,en-ext,accuracy,
9
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
10
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonCounterfactualClassification,ja,accuracy,
11
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonPolarityClassification,en,accuracy,0.71439575
12
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,en,accuracy,0.35748
13
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
14
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,de,accuracy,
15
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
16
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,es,accuracy,
17
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
18
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,fr,accuracy,
19
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
20
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,ja,accuracy,
21
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
22
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,AmazonReviewsClassification,zh,accuracy,
23
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,Banking77Classification,en,accuracy,0.8321753246753246
24
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,EmotionClassification,en,accuracy,0.49215
25
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,ImdbClassification,en,accuracy,0.635316
26
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
27
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,af,accuracy,
28
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
29
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,am,accuracy,
30
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
31
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ar,accuracy,
32
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
33
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,az,accuracy,
34
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
35
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,bn,accuracy,
36
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
37
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,cy,accuracy,
38
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
39
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,da,accuracy,
40
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
41
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,de,accuracy,
42
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
43
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,el,accuracy,
44
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,en,accuracy,0.6900806993947546
45
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
46
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,es,accuracy,
47
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
48
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fa,accuracy,
49
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
50
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fi,accuracy,
51
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
52
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,fr,accuracy,
53
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
54
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,he,accuracy,
55
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
56
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hi,accuracy,
57
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
58
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hu,accuracy,
59
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
60
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,hy,accuracy,
61
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
62
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,id,accuracy,
63
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
64
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,is,accuracy,
65
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
66
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,it,accuracy,
67
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
68
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ja,accuracy,
69
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
70
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,jv,accuracy,
71
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
72
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ka,accuracy,
73
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
74
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,km,accuracy,
75
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
76
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,kn,accuracy,
77
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
78
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ko,accuracy,
79
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
80
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,lv,accuracy,
81
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
82
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ml,accuracy,
83
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
84
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,mn,accuracy,
85
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
86
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ms,accuracy,
87
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
88
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,my,accuracy,
89
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
90
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nb,accuracy,
91
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
92
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,nl,accuracy,
93
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
94
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pl,accuracy,
95
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
96
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,pt,accuracy,
97
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
98
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ro,accuracy,
99
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
100
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ru,accuracy,
101
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
102
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sl,accuracy,
103
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
104
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sq,accuracy,
105
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
106
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sv,accuracy,
107
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
108
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,sw,accuracy,
109
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
110
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ta,accuracy,
111
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
112
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,te,accuracy,
113
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
114
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,th,accuracy,
115
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
116
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tl,accuracy,
117
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
118
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,tr,accuracy,
119
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
120
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,ur,accuracy,
121
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
122
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,vi,accuracy,
123
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
124
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-CN,accuracy,
125
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
126
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveIntentClassification,zh-TW,accuracy,
127
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
128
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,af,accuracy,
129
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
130
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,am,accuracy,
131
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
132
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ar,accuracy,
133
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
134
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,az,accuracy,
135
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
136
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,bn,accuracy,
137
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
138
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,cy,accuracy,
139
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
140
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,da,accuracy,
141
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
142
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,de,accuracy,
143
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
144
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,el,accuracy,
145
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,en,accuracy,0.7590114324142568
146
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
147
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,es,accuracy,
148
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
149
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fa,accuracy,
150
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
151
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fi,accuracy,
152
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
153
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,fr,accuracy,
154
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
155
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,he,accuracy,
156
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
157
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hi,accuracy,
158
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
159
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hu,accuracy,
160
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
161
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,hy,accuracy,
162
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
163
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,id,accuracy,
164
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
165
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,is,accuracy,
166
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
167
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,it,accuracy,
168
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
169
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ja,accuracy,
170
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
171
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,jv,accuracy,
172
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
173
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ka,accuracy,
174
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
175
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,km,accuracy,
176
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
177
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,kn,accuracy,
178
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
179
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ko,accuracy,
180
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
181
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,lv,accuracy,
182
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
183
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ml,accuracy,
184
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
185
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,mn,accuracy,
186
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
187
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ms,accuracy,
188
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
189
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,my,accuracy,
190
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
191
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nb,accuracy,
192
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
193
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,nl,accuracy,
194
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
195
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pl,accuracy,
196
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
197
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,pt,accuracy,
198
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
199
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ro,accuracy,
200
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
201
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ru,accuracy,
202
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
203
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sl,accuracy,
204
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
205
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sq,accuracy,
206
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
207
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sv,accuracy,
208
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
209
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,sw,accuracy,
210
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
211
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ta,accuracy,
212
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
213
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,te,accuracy,
214
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
215
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,th,accuracy,
216
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
217
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tl,accuracy,
218
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
219
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,tr,accuracy,
220
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
221
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,ur,accuracy,
222
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
223
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,vi,accuracy,
224
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
225
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-CN,accuracy,
226
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
227
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MassiveScenarioClassification,zh-TW,accuracy,
228
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,en,accuracy,0.9256269949840401
229
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
230
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,de,accuracy,
231
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
232
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,es,accuracy,
233
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
234
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,fr,accuracy,
235
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
236
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,hi,accuracy,
237
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
238
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPDomainClassification,th,accuracy,
239
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,en,accuracy,0.7184678522571819
240
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
241
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,de,accuracy,
242
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
243
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,es,accuracy,
244
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
245
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,fr,accuracy,
246
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
247
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,hi,accuracy,
248
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
249
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,MTOPIntentClassification,th,accuracy,
250
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,ToxicConversationsClassification,en,accuracy,0.6884080000000001
251
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,TweetSentimentExtractionClassification,en,accuracy,0.5668647425014148
252
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringP2P,en,v_measure,0.44721257146422017
253
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,ArxivClusteringS2S,en,v_measure,0.35081451519142065
254
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringP2P,en,v_measure,0.3441414219680629
255
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,BiorxivClusteringS2S,en,v_measure,0.30533275862270026
256
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringP2P,en,v_measure,0.31350109978273394
257
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,MedrxivClusteringS2S,en,v_measure,0.2876892369576733
258
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClustering,en,v_measure,0.46468877112302354
259
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,RedditClusteringP2P,en,v_measure,0.5416687629824692
260
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClustering,en,v_measure,0.5919409867397648
261
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,StackExchangeClusteringP2P,en,v_measure,0.32574403257811496
262
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,TwentyNewsgroupsClustering,en,v_measure,0.408911707239219
263
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,SprintDuplicateQuestions,en,ap,0.9347124923047998
264
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterSemEval2015,en,ap,0.6368133990830133
265
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,TwitterURLCorpus,en,ap,0.8480240716354543
266
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,AskUbuntuDupQuestions,en,map,0.5963466199039206
267
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,MindSmallReranking,,map,
268
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,SciDocsRR,en,map,0.7771580844366375
269
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Reranking,StackOverflowDupQuestions,en,map,0.4961186384154483
270
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,ArguAna,en,ndcg_at_10,0.50491
271
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,ClimateFEVER,en,ndcg_at_10,0.2711
272
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,CQADupstackRetrieval,en,ndcg_at_10,0.3653358333333333
273
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,DBPedia,en,ndcg_at_10,0.34702
274
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,FEVER,en,ndcg_at_10,0.72731
275
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,FiQA2018,en,ndcg_at_10,0.33286
276
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,HotpotQA,en,ndcg_at_10,0.52835
277
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,MSMARCO,en,ndcg_at_10,0.38832
278
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,NFCorpus,en,ndcg_at_10,0.33891
279
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,NQ,en,ndcg_at_10,0.46703
280
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,QuoraRetrieval,en,ndcg_at_10,0.85603
281
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,SCIDOCS,en,ndcg_at_10,0.16575
282
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,SciFact,en,ndcg_at_10,0.70165
283
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,Touche2020,en,ndcg_at_10,0.2344
284
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,TRECCOVID,en,ndcg_at_10,0.7517
285
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,BIOSSES,en,cosine_spearman,0.8484289705838665
286
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,SICK-R,en,cosine_spearman,0.6819926431966059
287
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS12,en,cosine_spearman,0.6699390786191646
288
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS13,en,cosine_spearman,0.7757623085766706
289
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS14,en,cosine_spearman,0.7278258293483495
290
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS15,en,cosine_spearman,0.8261707296911949
291
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS16,en,cosine_spearman,0.8009839524406284
292
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
293
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ko-ko,cosine_spearman,
294
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
295
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,ar-ar,cosine_spearman,
296
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
297
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-ar,cosine_spearman,
298
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
299
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-de,cosine_spearman,
300
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-en,cosine_spearman,0.8725017540413703
301
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
302
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,en-tr,cosine_spearman,
303
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
304
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-en,cosine_spearman,
305
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
306
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,es-es,cosine_spearman,
307
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
308
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,fr-en,cosine_spearman,
309
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
310
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,it-en,cosine_spearman,
311
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
312
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS17,nl-en,cosine_spearman,
313
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,en,cosine_spearman,0.687486910762485
314
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
315
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de,cosine_spearman,
316
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
317
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es,cosine_spearman,
318
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
319
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl,cosine_spearman,
320
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
321
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,tr,cosine_spearman,
322
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
323
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ar,cosine_spearman,
324
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
325
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,ru,cosine_spearman,
326
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
327
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh,cosine_spearman,
328
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
329
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr,cosine_spearman,
330
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
331
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-en,cosine_spearman,
332
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
333
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-en,cosine_spearman,
334
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
335
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,it,cosine_spearman,
336
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
337
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,pl-en,cosine_spearman,
338
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
339
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,zh-en,cosine_spearman,
340
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
341
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,es-it,cosine_spearman,
342
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
343
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-fr,cosine_spearman,
344
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
345
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,de-pl,cosine_spearman,
346
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
347
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STS22,fr-pl,cosine_spearman,
348
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,STSBenchmark,en,cosine_spearman,0.7920585637461047
349
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Summarization,SummEval,en,cosine_spearman,0.27870478281195465
350
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Classification,average,en,accuracy,0.6713040365015015
351
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Clustering,average,en,v_measure,0.39833144224085476
352
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,PairClassification,average,en,ap,0.8065166543410891
353
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,Retrieval,average,en,ndcg_at_10,0.4653783888888888
354
+ SGPT-2.7B-weightedmean-msmarco-specb-bitfit,STS,average,en,cosine_spearman,0.768315074100644
evaluation/mteb/SICK-R.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7775487485196769,
7
+ "spearman": 0.6819926431966059
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.7169016204991725,
11
+ "spearman": 0.6698099673026834
12
+ },
13
+ "evaluation_time": 106.65,
14
+ "manhattan": {
15
+ "pearson": 0.7162994072488664,
16
+ "spearman": 0.6703435950744577
17
+ }
18
+ }
19
+ }
evaluation/mteb/STS12.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7591051402657887,
7
+ "spearman": 0.6699390786191646
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.7154128036454578,
11
+ "spearman": 0.6925605675649068
12
+ },
13
+ "evaluation_time": 49.4,
14
+ "manhattan": {
15
+ "pearson": 0.7160981030780171,
16
+ "spearman": 0.6927513670128046
17
+ }
18
+ }
19
+ }
evaluation/mteb/STS13.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7723835466417793,
7
+ "spearman": 0.7757623085766706
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.775090992200725,
11
+ "spearman": 0.7788601688144924
12
+ },
13
+ "evaluation_time": 21.2,
14
+ "manhattan": {
15
+ "pearson": 0.7739045060647423,
16
+ "spearman": 0.7777552718279098
17
+ }
18
+ }
19
+ }
evaluation/mteb/STS14.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_version": null,
3
+ "mteb_version": "0.0.2",
4
+ "test": {
5
+ "cos_sim": {
6
+ "pearson": 0.7791692485139602,
7
+ "spearman": 0.7278258293483495
8
+ },
9
+ "euclidean": {
10
+ "pearson": 0.7464773017077789,
11
+ "spearman": 0.7181662299104619
12
+ },
13
+ "evaluation_time": 52.55,
14
+ "manhattan": {
15
+ "pearson": 0.7471043337995533,
16
+ "spearman": 0.7183960860845646
17
+ }
18
+ }
19
+ }