all-mpnet-base-v2 / README.md

Muennighoff

Add MTEB

f965a9b almost 2 years ago

preview code

raw

history blame

No virus

66.7 kB

	---
	pipeline_tag: sentence-similarity
	tags:
	- sentence-transformers
	- feature-extraction
	- sentence-similarity
	- mteb
	language: en
	license: apache-2.0
	datasets:
	- s2orc
	- flax-sentence-embeddings/stackexchange_xml
	- MS Marco
	- gooaq
	- yahoo_answers_topics
	- code_search_net
	- search_qa
	- eli5
	- snli
	- multi_nli
	- wikihow
	- natural_questions
	- trivia_qa
	- embedding-data/sentence-compression
	- embedding-data/flickr30k-captions
	- embedding-data/altlex
	- embedding-data/simple-wiki
	- embedding-data/QQP
	- embedding-data/SPECTER
	- embedding-data/PAQ_pairs
	- embedding-data/WikiAnswers
	model-index:
	- name: all-mpnet-base-v2
	results:
	- task:
	type: Classification
	dataset:
	type: mteb/amazon_counterfactual
	name: MTEB AmazonCounterfactualClassification (en)
	config: en
	split: test
	revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
	metrics:
	- type: accuracy
	value: 65.26865671641791
	- type: ap
	value: 28.47453420428918
	- type: f1
	value: 59.3470101009448
	- task:
	type: Classification
	dataset:
	type: mteb/amazon_polarity
	name: MTEB AmazonPolarityClassification
	config: default
	split: test
	revision: 80714f8dcf8cefc218ef4f8c5a966dd83f75a0e1
	metrics:
	- type: accuracy
	value: 67.13145
	- type: ap
	value: 61.842060778903786
	- type: f1
	value: 66.79987305640383
	- task:
	type: Classification
	dataset:
	type: mteb/amazon_reviews_multi
	name: MTEB AmazonReviewsClassification (en)
	config: en
	split: test
	revision: c379a6705fec24a2493fa68e011692605f44e119
	metrics:
	- type: accuracy
	value: 31.920000000000005
	- type: f1
	value: 31.2465193896153
	- task:
	type: Retrieval
	dataset:
	type: arguana
	name: MTEB ArguAna
	config: default
	split: test
	revision: 5b3e3697907184a9b77a3c99ee9ea1a9cbb1e4e3
	metrics:
	- type: map_at_1
	value: 23.186
	- type: map_at_10
	value: 37.692
	- type: map_at_100
	value: 38.986
	- type: map_at_1000
	value: 38.991
	- type: map_at_3
	value: 32.622
	- type: map_at_5
	value: 35.004999999999995
	- type: ndcg_at_1
	value: 23.186
	- type: ndcg_at_10
	value: 46.521
	- type: ndcg_at_100
	value: 51.954
	- type: ndcg_at_1000
	value: 52.087
	- type: ndcg_at_3
	value: 35.849
	- type: ndcg_at_5
	value: 40.12
	- type: precision_at_1
	value: 23.186
	- type: precision_at_10
	value: 7.510999999999999
	- type: precision_at_100
	value: 0.9860000000000001
	- type: precision_at_1000
	value: 0.1
	- type: precision_at_3
	value: 15.078
	- type: precision_at_5
	value: 11.110000000000001
	- type: recall_at_1
	value: 23.186
	- type: recall_at_10
	value: 75.107
	- type: recall_at_100
	value: 98.649
	- type: recall_at_1000
	value: 99.644
	- type: recall_at_3
	value: 45.235
	- type: recall_at_5
	value: 55.547999999999995
	- task:
	type: Clustering
	dataset:
	type: mteb/arxiv-clustering-p2p
	name: MTEB ArxivClusteringP2P
	config: default
	split: test
	revision: 0bbdb47bcbe3a90093699aefeed338a0f28a7ee8
	metrics:
	- type: v_measure
	value: 48.37886340922374
	- task:
	type: Clustering
	dataset:
	type: mteb/arxiv-clustering-s2s
	name: MTEB ArxivClusteringS2S
	config: default
	split: test
	revision: b73bd54100e5abfa6e3a23dcafb46fe4d2438dc3
	metrics:
	- type: v_measure
	value: 39.72488615315985
	- task:
	type: Reranking
	dataset:
	type: mteb/askubuntudupquestions-reranking
	name: MTEB AskUbuntuDupQuestions
	config: default
	split: test
	revision: 4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c
	metrics:
	- type: map
	value: 65.85199009344481
	- type: mrr
	value: 78.47700391329201
	- task:
	type: STS
	dataset:
	type: mteb/biosses-sts
	name: MTEB BIOSSES
	config: default
	split: test
	revision: 9ee918f184421b6bd48b78f6c714d86546106103
	metrics:
	- type: cos_sim_pearson
	value: 84.47737119217858
	- type: cos_sim_spearman
	value: 80.43195317854409
	- type: euclidean_pearson
	value: 82.20496332547978
	- type: euclidean_spearman
	value: 80.43195317854409
	- type: manhattan_pearson
	value: 81.4836610720397
	- type: manhattan_spearman
	value: 79.65904400101908
	- task:
	type: Classification
	dataset:
	type: mteb/banking77
	name: MTEB Banking77Classification
	config: default
	split: test
	revision: 44fa15921b4c889113cc5df03dd4901b49161ab7
	metrics:
	- type: accuracy
	value: 81.8603896103896
	- type: f1
	value: 81.28027245637479
	- task:
	type: Clustering
	dataset:
	type: mteb/biorxiv-clustering-p2p
	name: MTEB BiorxivClusteringP2P
	config: default
	split: test
	revision: 11d0121201d1f1f280e8cc8f3d98fb9c4d9f9c55
	metrics:
	- type: v_measure
	value: 39.616605133625185
	- task:
	type: Clustering
	dataset:
	type: mteb/biorxiv-clustering-s2s
	name: MTEB BiorxivClusteringS2S
	config: default
	split: test
	revision: c0fab014e1bcb8d3a5e31b2088972a1e01547dc1
	metrics:
	- type: v_measure
	value: 35.02442407186902
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackAndroidRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 36.036
	- type: map_at_10
	value: 49.302
	- type: map_at_100
	value: 50.956
	- type: map_at_1000
	value: 51.080000000000005
	- type: map_at_3
	value: 45.237
	- type: map_at_5
	value: 47.353
	- type: ndcg_at_1
	value: 45.207
	- type: ndcg_at_10
	value: 56.485
	- type: ndcg_at_100
	value: 61.413
	- type: ndcg_at_1000
	value: 62.870000000000005
	- type: ndcg_at_3
	value: 51.346000000000004
	- type: ndcg_at_5
	value: 53.486
	- type: precision_at_1
	value: 45.207
	- type: precision_at_10
	value: 11.144
	- type: precision_at_100
	value: 1.735
	- type: precision_at_1000
	value: 0.22100000000000003
	- type: precision_at_3
	value: 24.94
	- type: precision_at_5
	value: 17.997
	- type: recall_at_1
	value: 36.036
	- type: recall_at_10
	value: 69.191
	- type: recall_at_100
	value: 89.423
	- type: recall_at_1000
	value: 98.425
	- type: recall_at_3
	value: 53.849999999999994
	- type: recall_at_5
	value: 60.107
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackEnglishRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 32.92
	- type: map_at_10
	value: 45.739999999999995
	- type: map_at_100
	value: 47.309
	- type: map_at_1000
	value: 47.443000000000005
	- type: map_at_3
	value: 42.154
	- type: map_at_5
	value: 44.207
	- type: ndcg_at_1
	value: 42.229
	- type: ndcg_at_10
	value: 52.288999999999994
	- type: ndcg_at_100
	value: 57.04900000000001
	- type: ndcg_at_1000
	value: 58.788
	- type: ndcg_at_3
	value: 47.531
	- type: ndcg_at_5
	value: 49.861
	- type: precision_at_1
	value: 42.229
	- type: precision_at_10
	value: 10.299
	- type: precision_at_100
	value: 1.68
	- type: precision_at_1000
	value: 0.213
	- type: precision_at_3
	value: 23.673
	- type: precision_at_5
	value: 17.006
	- type: recall_at_1
	value: 32.92
	- type: recall_at_10
	value: 63.865
	- type: recall_at_100
	value: 84.06700000000001
	- type: recall_at_1000
	value: 94.536
	- type: recall_at_3
	value: 49.643
	- type: recall_at_5
	value: 56.119
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackGamingRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 40.695
	- type: map_at_10
	value: 53.787
	- type: map_at_100
	value: 54.778000000000006
	- type: map_at_1000
	value: 54.827000000000005
	- type: map_at_3
	value: 50.151999999999994
	- type: map_at_5
	value: 52.207
	- type: ndcg_at_1
	value: 46.52
	- type: ndcg_at_10
	value: 60.026
	- type: ndcg_at_100
	value: 63.81099999999999
	- type: ndcg_at_1000
	value: 64.741
	- type: ndcg_at_3
	value: 53.83
	- type: ndcg_at_5
	value: 56.928999999999995
	- type: precision_at_1
	value: 46.52
	- type: precision_at_10
	value: 9.754999999999999
	- type: precision_at_100
	value: 1.2670000000000001
	- type: precision_at_1000
	value: 0.13799999999999998
	- type: precision_at_3
	value: 24.096
	- type: precision_at_5
	value: 16.689999999999998
	- type: recall_at_1
	value: 40.695
	- type: recall_at_10
	value: 75.181
	- type: recall_at_100
	value: 91.479
	- type: recall_at_1000
	value: 98.06899999999999
	- type: recall_at_3
	value: 58.707
	- type: recall_at_5
	value: 66.295
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackGisRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 29.024
	- type: map_at_10
	value: 38.438
	- type: map_at_100
	value: 39.576
	- type: map_at_1000
	value: 39.645
	- type: map_at_3
	value: 34.827999999999996
	- type: map_at_5
	value: 36.947
	- type: ndcg_at_1
	value: 31.299
	- type: ndcg_at_10
	value: 44.268
	- type: ndcg_at_100
	value: 49.507
	- type: ndcg_at_1000
	value: 51.205999999999996
	- type: ndcg_at_3
	value: 37.248999999999995
	- type: ndcg_at_5
	value: 40.861999999999995
	- type: precision_at_1
	value: 31.299
	- type: precision_at_10
	value: 6.949
	- type: precision_at_100
	value: 1.012
	- type: precision_at_1000
	value: 0.11900000000000001
	- type: precision_at_3
	value: 15.518
	- type: precision_at_5
	value: 11.366999999999999
	- type: recall_at_1
	value: 29.024
	- type: recall_at_10
	value: 60.404
	- type: recall_at_100
	value: 83.729
	- type: recall_at_1000
	value: 96.439
	- type: recall_at_3
	value: 41.65
	- type: recall_at_5
	value: 50.263999999999996
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackMathematicaRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 17.774
	- type: map_at_10
	value: 28.099
	- type: map_at_100
	value: 29.603
	- type: map_at_1000
	value: 29.709999999999997
	- type: map_at_3
	value: 25.036
	- type: map_at_5
	value: 26.657999999999998
	- type: ndcg_at_1
	value: 22.139
	- type: ndcg_at_10
	value: 34.205999999999996
	- type: ndcg_at_100
	value: 40.844
	- type: ndcg_at_1000
	value: 43.144
	- type: ndcg_at_3
	value: 28.732999999999997
	- type: ndcg_at_5
	value: 31.252000000000002
	- type: precision_at_1
	value: 22.139
	- type: precision_at_10
	value: 6.567
	- type: precision_at_100
	value: 1.147
	- type: precision_at_1000
	value: 0.146
	- type: precision_at_3
	value: 14.386
	- type: precision_at_5
	value: 10.423
	- type: recall_at_1
	value: 17.774
	- type: recall_at_10
	value: 48.32
	- type: recall_at_100
	value: 76.373
	- type: recall_at_1000
	value: 92.559
	- type: recall_at_3
	value: 33.478
	- type: recall_at_5
	value: 39.872
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackPhysicsRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 31.885
	- type: map_at_10
	value: 44.289
	- type: map_at_100
	value: 45.757999999999996
	- type: map_at_1000
	value: 45.86
	- type: map_at_3
	value: 40.459
	- type: map_at_5
	value: 42.662
	- type: ndcg_at_1
	value: 39.75
	- type: ndcg_at_10
	value: 50.975
	- type: ndcg_at_100
	value: 56.528999999999996
	- type: ndcg_at_1000
	value: 58.06099999999999
	- type: ndcg_at_3
	value: 45.327
	- type: ndcg_at_5
	value: 48.041
	- type: precision_at_1
	value: 39.75
	- type: precision_at_10
	value: 9.557
	- type: precision_at_100
	value: 1.469
	- type: precision_at_1000
	value: 0.17700000000000002
	- type: precision_at_3
	value: 22.073
	- type: precision_at_5
	value: 15.765
	- type: recall_at_1
	value: 31.885
	- type: recall_at_10
	value: 64.649
	- type: recall_at_100
	value: 87.702
	- type: recall_at_1000
	value: 97.327
	- type: recall_at_3
	value: 48.61
	- type: recall_at_5
	value: 55.882
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackProgrammersRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 26.454
	- type: map_at_10
	value: 37.756
	- type: map_at_100
	value: 39.225
	- type: map_at_1000
	value: 39.332
	- type: map_at_3
	value: 34.115
	- type: map_at_5
	value: 35.942
	- type: ndcg_at_1
	value: 32.42
	- type: ndcg_at_10
	value: 44.165
	- type: ndcg_at_100
	value: 50.202000000000005
	- type: ndcg_at_1000
	value: 52.188
	- type: ndcg_at_3
	value: 38.381
	- type: ndcg_at_5
	value: 40.849000000000004
	- type: precision_at_1
	value: 32.42
	- type: precision_at_10
	value: 8.482000000000001
	- type: precision_at_100
	value: 1.332
	- type: precision_at_1000
	value: 0.169
	- type: precision_at_3
	value: 18.683
	- type: precision_at_5
	value: 13.539000000000001
	- type: recall_at_1
	value: 26.454
	- type: recall_at_10
	value: 57.937000000000005
	- type: recall_at_100
	value: 83.76
	- type: recall_at_1000
	value: 96.82600000000001
	- type: recall_at_3
	value: 41.842
	- type: recall_at_5
	value: 48.285
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 27.743666666666666
	- type: map_at_10
	value: 38.75416666666667
	- type: map_at_100
	value: 40.133250000000004
	- type: map_at_1000
	value: 40.24616666666667
	- type: map_at_3
	value: 35.267250000000004
	- type: map_at_5
	value: 37.132749999999994
	- type: ndcg_at_1
	value: 33.14358333333333
	- type: ndcg_at_10
	value: 44.95916666666667
	- type: ndcg_at_100
	value: 50.46375
	- type: ndcg_at_1000
	value: 52.35508333333334
	- type: ndcg_at_3
	value: 39.17883333333334
	- type: ndcg_at_5
	value: 41.79724999999999
	- type: precision_at_1
	value: 33.14358333333333
	- type: precision_at_10
	value: 8.201083333333333
	- type: precision_at_100
	value: 1.3085
	- type: precision_at_1000
	value: 0.1665833333333333
	- type: precision_at_3
	value: 18.405583333333333
	- type: precision_at_5
	value: 13.233166666666666
	- type: recall_at_1
	value: 27.743666666666666
	- type: recall_at_10
	value: 58.91866666666667
	- type: recall_at_100
	value: 82.76216666666666
	- type: recall_at_1000
	value: 95.56883333333333
	- type: recall_at_3
	value: 42.86925
	- type: recall_at_5
	value: 49.553333333333335
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackStatsRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 25.244
	- type: map_at_10
	value: 33.464
	- type: map_at_100
	value: 34.633
	- type: map_at_1000
	value: 34.721999999999994
	- type: map_at_3
	value: 30.784
	- type: map_at_5
	value: 32.183
	- type: ndcg_at_1
	value: 28.681
	- type: ndcg_at_10
	value: 38.149
	- type: ndcg_at_100
	value: 43.856
	- type: ndcg_at_1000
	value: 46.026
	- type: ndcg_at_3
	value: 33.318
	- type: ndcg_at_5
	value: 35.454
	- type: precision_at_1
	value: 28.681
	- type: precision_at_10
	value: 6.304
	- type: precision_at_100
	value: 0.992
	- type: precision_at_1000
	value: 0.125
	- type: precision_at_3
	value: 14.673
	- type: precision_at_5
	value: 10.245
	- type: recall_at_1
	value: 25.244
	- type: recall_at_10
	value: 49.711
	- type: recall_at_100
	value: 75.928
	- type: recall_at_1000
	value: 91.79899999999999
	- type: recall_at_3
	value: 36.325
	- type: recall_at_5
	value: 41.752
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackTexRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 18.857
	- type: map_at_10
	value: 27.794
	- type: map_at_100
	value: 29.186
	- type: map_at_1000
	value: 29.323
	- type: map_at_3
	value: 24.779
	- type: map_at_5
	value: 26.459
	- type: ndcg_at_1
	value: 23.227999999999998
	- type: ndcg_at_10
	value: 33.353
	- type: ndcg_at_100
	value: 39.598
	- type: ndcg_at_1000
	value: 42.268
	- type: ndcg_at_3
	value: 28.054000000000002
	- type: ndcg_at_5
	value: 30.566
	- type: precision_at_1
	value: 23.227999999999998
	- type: precision_at_10
	value: 6.397
	- type: precision_at_100
	value: 1.129
	- type: precision_at_1000
	value: 0.155
	- type: precision_at_3
	value: 13.616
	- type: precision_at_5
	value: 10.116999999999999
	- type: recall_at_1
	value: 18.857
	- type: recall_at_10
	value: 45.797
	- type: recall_at_100
	value: 73.615
	- type: recall_at_1000
	value: 91.959
	- type: recall_at_3
	value: 31.129
	- type: recall_at_5
	value: 37.565
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackUnixRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 27.486
	- type: map_at_10
	value: 39.164
	- type: map_at_100
	value: 40.543
	- type: map_at_1000
	value: 40.636
	- type: map_at_3
	value: 35.52
	- type: map_at_5
	value: 37.355
	- type: ndcg_at_1
	value: 32.275999999999996
	- type: ndcg_at_10
	value: 45.414
	- type: ndcg_at_100
	value: 51.254
	- type: ndcg_at_1000
	value: 53.044000000000004
	- type: ndcg_at_3
	value: 39.324999999999996
	- type: ndcg_at_5
	value: 41.835
	- type: precision_at_1
	value: 32.275999999999996
	- type: precision_at_10
	value: 8.144
	- type: precision_at_100
	value: 1.237
	- type: precision_at_1000
	value: 0.15
	- type: precision_at_3
	value: 18.501
	- type: precision_at_5
	value: 13.134
	- type: recall_at_1
	value: 27.486
	- type: recall_at_10
	value: 60.449
	- type: recall_at_100
	value: 85.176
	- type: recall_at_1000
	value: 97.087
	- type: recall_at_3
	value: 43.59
	- type: recall_at_5
	value: 50.08899999999999
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackWebmastersRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 26.207
	- type: map_at_10
	value: 37.255
	- type: map_at_100
	value: 39.043
	- type: map_at_1000
	value: 39.273
	- type: map_at_3
	value: 33.487
	- type: map_at_5
	value: 35.441
	- type: ndcg_at_1
	value: 31.423000000000002
	- type: ndcg_at_10
	value: 44.235
	- type: ndcg_at_100
	value: 50.49
	- type: ndcg_at_1000
	value: 52.283
	- type: ndcg_at_3
	value: 37.602000000000004
	- type: ndcg_at_5
	value: 40.518
	- type: precision_at_1
	value: 31.423000000000002
	- type: precision_at_10
	value: 8.715
	- type: precision_at_100
	value: 1.7590000000000001
	- type: precision_at_1000
	value: 0.257
	- type: precision_at_3
	value: 17.523
	- type: precision_at_5
	value: 13.161999999999999
	- type: recall_at_1
	value: 26.207
	- type: recall_at_10
	value: 59.17099999999999
	- type: recall_at_100
	value: 86.166
	- type: recall_at_1000
	value: 96.54700000000001
	- type: recall_at_3
	value: 41.18
	- type: recall_at_5
	value: 48.083999999999996
	- task:
	type: Retrieval
	dataset:
	type: BeIR/cqadupstack
	name: MTEB CQADupstackWordpressRetrieval
	config: default
	split: test
	revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
	metrics:
	- type: map_at_1
	value: 20.342
	- type: map_at_10
	value: 29.962
	- type: map_at_100
	value: 30.989
	- type: map_at_1000
	value: 31.102999999999998
	- type: map_at_3
	value: 26.656000000000002
	- type: map_at_5
	value: 28.179
	- type: ndcg_at_1
	value: 22.551
	- type: ndcg_at_10
	value: 35.945
	- type: ndcg_at_100
	value: 41.012
	- type: ndcg_at_1000
	value: 43.641999999999996
	- type: ndcg_at_3
	value: 29.45
	- type: ndcg_at_5
	value: 31.913999999999998
	- type: precision_at_1
	value: 22.551
	- type: precision_at_10
	value: 6.1
	- type: precision_at_100
	value: 0.943
	- type: precision_at_1000
	value: 0.129
	- type: precision_at_3
	value: 13.184999999999999
	- type: precision_at_5
	value: 9.353
	- type: recall_at_1
	value: 20.342
	- type: recall_at_10
	value: 52.349000000000004
	- type: recall_at_100
	value: 75.728
	- type: recall_at_1000
	value: 95.253
	- type: recall_at_3
	value: 34.427
	- type: recall_at_5
	value: 40.326
	- task:
	type: Retrieval
	dataset:
	type: climate-fever
	name: MTEB ClimateFEVER
	config: default
	split: test
	revision: 392b78eb68c07badcd7c2cd8f39af108375dfcce
	metrics:
	- type: map_at_1
	value: 7.71
	- type: map_at_10
	value: 14.81
	- type: map_at_100
	value: 16.536
	- type: map_at_1000
	value: 16.744999999999997
	- type: map_at_3
	value: 12.109
	- type: map_at_5
	value: 13.613
	- type: ndcg_at_1
	value: 18.046
	- type: ndcg_at_10
	value: 21.971
	- type: ndcg_at_100
	value: 29.468
	- type: ndcg_at_1000
	value: 33.428999999999995
	- type: ndcg_at_3
	value: 17.227999999999998
	- type: ndcg_at_5
	value: 19.189999999999998
	- type: precision_at_1
	value: 18.046
	- type: precision_at_10
	value: 7.192
	- type: precision_at_100
	value: 1.51
	- type: precision_at_1000
	value: 0.22499999999999998
	- type: precision_at_3
	value: 13.312
	- type: precision_at_5
	value: 10.775
	- type: recall_at_1
	value: 7.71
	- type: recall_at_10
	value: 27.908
	- type: recall_at_100
	value: 54.452
	- type: recall_at_1000
	value: 76.764
	- type: recall_at_3
	value: 16.64
	- type: recall_at_5
	value: 21.631
	- task:
	type: Retrieval
	dataset:
	type: dbpedia-entity
	name: MTEB DBPedia
	config: default
	split: test
	revision: f097057d03ed98220bc7309ddb10b71a54d667d6
	metrics:
	- type: map_at_1
	value: 6.8180000000000005
	- type: map_at_10
	value: 14.591000000000001
	- type: map_at_100
	value: 19.855999999999998
	- type: map_at_1000
	value: 21.178
	- type: map_at_3
	value: 10.345
	- type: map_at_5
	value: 12.367
	- type: ndcg_at_1
	value: 39.25
	- type: ndcg_at_10
	value: 32.088
	- type: ndcg_at_100
	value: 36.019
	- type: ndcg_at_1000
	value: 43.649
	- type: ndcg_at_3
	value: 35.132999999999996
	- type: ndcg_at_5
	value: 33.777
	- type: precision_at_1
	value: 49.5
	- type: precision_at_10
	value: 25.624999999999996
	- type: precision_at_100
	value: 8.043
	- type: precision_at_1000
	value: 1.7409999999999999
	- type: precision_at_3
	value: 38.417
	- type: precision_at_5
	value: 33.2
	- type: recall_at_1
	value: 6.8180000000000005
	- type: recall_at_10
	value: 20.399
	- type: recall_at_100
	value: 42.8
	- type: recall_at_1000
	value: 68.081
	- type: recall_at_3
	value: 11.928999999999998
	- type: recall_at_5
	value: 15.348999999999998
	- task:
	type: Classification
	dataset:
	type: mteb/emotion
	name: MTEB EmotionClassification
	config: default
	split: test
	revision: 829147f8f75a25f005913200eb5ed41fae320aa1
	metrics:
	- type: accuracy
	value: 39.725
	- type: f1
	value: 35.19385687310605
	- task:
	type: Retrieval
	dataset:
	type: fever
	name: MTEB FEVER
	config: default
	split: test
	revision: 1429cf27e393599b8b359b9b72c666f96b2525f9
	metrics:
	- type: map_at_1
	value: 31.901000000000003
	- type: map_at_10
	value: 44.156
	- type: map_at_100
	value: 44.901
	- type: map_at_1000
	value: 44.939
	- type: map_at_3
	value: 41.008
	- type: map_at_5
	value: 42.969
	- type: ndcg_at_1
	value: 34.263
	- type: ndcg_at_10
	value: 50.863
	- type: ndcg_at_100
	value: 54.336
	- type: ndcg_at_1000
	value: 55.297
	- type: ndcg_at_3
	value: 44.644
	- type: ndcg_at_5
	value: 48.075
	- type: precision_at_1
	value: 34.263
	- type: precision_at_10
	value: 7.542999999999999
	- type: precision_at_100
	value: 0.9400000000000001
	- type: precision_at_1000
	value: 0.104
	- type: precision_at_3
	value: 18.912000000000003
	- type: precision_at_5
	value: 13.177
	- type: recall_at_1
	value: 31.901000000000003
	- type: recall_at_10
	value: 68.872
	- type: recall_at_100
	value: 84.468
	- type: recall_at_1000
	value: 91.694
	- type: recall_at_3
	value: 52.272
	- type: recall_at_5
	value: 60.504999999999995
	- task:
	type: Retrieval
	dataset:
	type: fiqa
	name: MTEB FiQA2018
	config: default
	split: test
	revision: 41b686a7f28c59bcaaa5791efd47c67c8ebe28be
	metrics:
	- type: map_at_1
	value: 24.4
	- type: map_at_10
	value: 41.117
	- type: map_at_100
	value: 43.167
	- type: map_at_1000
	value: 43.323
	- type: map_at_3
	value: 35.744
	- type: map_at_5
	value: 38.708
	- type: ndcg_at_1
	value: 49.074
	- type: ndcg_at_10
	value: 49.963
	- type: ndcg_at_100
	value: 56.564
	- type: ndcg_at_1000
	value: 58.931999999999995
	- type: ndcg_at_3
	value: 45.489000000000004
	- type: ndcg_at_5
	value: 47.133
	- type: precision_at_1
	value: 49.074
	- type: precision_at_10
	value: 13.889000000000001
	- type: precision_at_100
	value: 2.091
	- type: precision_at_1000
	value: 0.251
	- type: precision_at_3
	value: 30.658
	- type: precision_at_5
	value: 22.593
	- type: recall_at_1
	value: 24.4
	- type: recall_at_10
	value: 58.111999999999995
	- type: recall_at_100
	value: 81.96900000000001
	- type: recall_at_1000
	value: 96.187
	- type: recall_at_3
	value: 41.661
	- type: recall_at_5
	value: 49.24
	- task:
	type: Retrieval
	dataset:
	type: hotpotqa
	name: MTEB HotpotQA
	config: default
	split: test
	revision: 766870b35a1b9ca65e67a0d1913899973551fc6c
	metrics:
	- type: map_at_1
	value: 22.262
	- type: map_at_10
	value: 31.266
	- type: map_at_100
	value: 32.202
	- type: map_at_1000
	value: 32.300000000000004
	- type: map_at_3
	value: 28.874
	- type: map_at_5
	value: 30.246000000000002
	- type: ndcg_at_1
	value: 44.524
	- type: ndcg_at_10
	value: 39.294000000000004
	- type: ndcg_at_100
	value: 43.296
	- type: ndcg_at_1000
	value: 45.561
	- type: ndcg_at_3
	value: 35.013
	- type: ndcg_at_5
	value: 37.177
	- type: precision_at_1
	value: 44.524
	- type: precision_at_10
	value: 8.52
	- type: precision_at_100
	value: 1.169
	- type: precision_at_1000
	value: 0.147
	- type: precision_at_3
	value: 22.003
	- type: precision_at_5
	value: 14.914
	- type: recall_at_1
	value: 22.262
	- type: recall_at_10
	value: 42.6
	- type: recall_at_100
	value: 58.46
	- type: recall_at_1000
	value: 73.565
	- type: recall_at_3
	value: 33.005
	- type: recall_at_5
	value: 37.286
	- task:
	type: Classification
	dataset:
	type: mteb/imdb
	name: MTEB ImdbClassification
	config: default
	split: test
	revision: 8d743909f834c38949e8323a8a6ce8721ea6c7f4
	metrics:
	- type: accuracy
	value: 70.7156
	- type: ap
	value: 64.89470531959896
	- type: f1
	value: 70.53051887683772
	- task:
	type: Retrieval
	dataset:
	type: msmarco
	name: MTEB MSMARCO
	config: default
	split: dev
	revision: e6838a846e2408f22cf5cc337ebc83e0bcf77849
	metrics:
	- type: map_at_1
	value: 21.174
	- type: map_at_10
	value: 33.0
	- type: map_at_100
	value: 34.178
	- type: map_at_1000
	value: 34.227000000000004
	- type: map_at_3
	value: 29.275000000000002
	- type: map_at_5
	value: 31.341
	- type: ndcg_at_1
	value: 21.776999999999997
	- type: ndcg_at_10
	value: 39.745999999999995
	- type: ndcg_at_100
	value: 45.488
	- type: ndcg_at_1000
	value: 46.733999999999995
	- type: ndcg_at_3
	value: 32.086
	- type: ndcg_at_5
	value: 35.792
	- type: precision_at_1
	value: 21.776999999999997
	- type: precision_at_10
	value: 6.324000000000001
	- type: precision_at_100
	value: 0.922
	- type: precision_at_1000
	value: 0.10300000000000001
	- type: precision_at_3
	value: 13.696
	- type: precision_at_5
	value: 10.100000000000001
	- type: recall_at_1
	value: 21.174
	- type: recall_at_10
	value: 60.488
	- type: recall_at_100
	value: 87.234
	- type: recall_at_1000
	value: 96.806
	- type: recall_at_3
	value: 39.582
	- type: recall_at_5
	value: 48.474000000000004
	- task:
	type: Classification
	dataset:
	type: mteb/mtop_domain
	name: MTEB MTOPDomainClassification (en)
	config: en
	split: test
	revision: a7e2a951126a26fc8c6a69f835f33a346ba259e3
	metrics:
	- type: accuracy
	value: 92.07934336525308
	- type: f1
	value: 91.93440027035814
	- task:
	type: Classification
	dataset:
	type: mteb/mtop_intent
	name: MTEB MTOPIntentClassification (en)
	config: en
	split: test
	revision: 6299947a7777084cc2d4b64235bf7190381ce755
	metrics:
	- type: accuracy
	value: 70.20975832193344
	- type: f1
	value: 48.571776628850074
	- task:
	type: Classification
	dataset:
	type: mteb/amazon_massive_intent
	name: MTEB MassiveIntentClassification (en)
	config: en
	split: test
	revision: 072a486a144adf7f4479a4a0dddb2152e161e1ea
	metrics:
	- type: accuracy
	value: 69.56624075319435
	- type: f1
	value: 67.64419185784621
	- task:
	type: Classification
	dataset:
	type: mteb/amazon_massive_scenario
	name: MTEB MassiveScenarioClassification (en)
	config: en
	split: test
	revision: 7d571f92784cd94a019292a1f45445077d0ef634
	metrics:
	- type: accuracy
	value: 76.01210490921318
	- type: f1
	value: 75.1934366365826
	- task:
	type: Clustering
	dataset:
	type: mteb/medrxiv-clustering-p2p
	name: MTEB MedrxivClusteringP2P
	config: default
	split: test
	revision: dcefc037ef84348e49b0d29109e891c01067226b
	metrics:
	- type: v_measure
	value: 35.58002813186373
	- task:
	type: Clustering
	dataset:
	type: mteb/medrxiv-clustering-s2s
	name: MTEB MedrxivClusteringS2S
	config: default
	split: test
	revision: 3cd0e71dfbe09d4de0f9e5ecba43e7ce280959dc
	metrics:
	- type: v_measure
	value: 32.872725562410444
	- task:
	type: Reranking
	dataset:
	type: mteb/mind_small
	name: MTEB MindSmallReranking
	config: default
	split: test
	revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
	metrics:
	- type: map
	value: 30.965343604861328
	- type: mrr
	value: 31.933710165863594
	- task:
	type: Retrieval
	dataset:
	type: nfcorpus
	name: MTEB NFCorpus
	config: default
	split: test
	revision: 7eb63cc0c1eb59324d709ebed25fcab851fa7610
	metrics:
	- type: map_at_1
	value: 4.938
	- type: map_at_10
	value: 12.034
	- type: map_at_100
	value: 15.675
	- type: map_at_1000
	value: 17.18
	- type: map_at_3
	value: 8.471
	- type: map_at_5
	value: 10.128
	- type: ndcg_at_1
	value: 40.402
	- type: ndcg_at_10
	value: 33.289
	- type: ndcg_at_100
	value: 31.496000000000002
	- type: ndcg_at_1000
	value: 40.453
	- type: ndcg_at_3
	value: 37.841
	- type: ndcg_at_5
	value: 36.215
	- type: precision_at_1
	value: 41.796
	- type: precision_at_10
	value: 25.294
	- type: precision_at_100
	value: 8.381
	- type: precision_at_1000
	value: 2.1260000000000003
	- type: precision_at_3
	value: 36.429
	- type: precision_at_5
	value: 32.446000000000005
	- type: recall_at_1
	value: 4.938
	- type: recall_at_10
	value: 16.637
	- type: recall_at_100
	value: 33.853
	- type: recall_at_1000
	value: 66.07
	- type: recall_at_3
	value: 9.818
	- type: recall_at_5
	value: 12.544
	- task:
	type: Retrieval
	dataset:
	type: nq
	name: MTEB NQ
	config: default
	split: test
	revision: 6062aefc120bfe8ece5897809fb2e53bfe0d128c
	metrics:
	- type: map_at_1
	value: 27.124
	- type: map_at_10
	value: 42.418
	- type: map_at_100
	value: 43.633
	- type: map_at_1000
	value: 43.66
	- type: map_at_3
	value: 37.766
	- type: map_at_5
	value: 40.482
	- type: ndcg_at_1
	value: 30.794
	- type: ndcg_at_10
	value: 50.449999999999996
	- type: ndcg_at_100
	value: 55.437999999999995
	- type: ndcg_at_1000
	value: 56.084
	- type: ndcg_at_3
	value: 41.678
	- type: ndcg_at_5
	value: 46.257
	- type: precision_at_1
	value: 30.794
	- type: precision_at_10
	value: 8.656
	- type: precision_at_100
	value: 1.141
	- type: precision_at_1000
	value: 0.12
	- type: precision_at_3
	value: 19.37
	- type: precision_at_5
	value: 14.218
	- type: recall_at_1
	value: 27.124
	- type: recall_at_10
	value: 72.545
	- type: recall_at_100
	value: 93.938
	- type: recall_at_1000
	value: 98.788
	- type: recall_at_3
	value: 49.802
	- type: recall_at_5
	value: 60.426
	- task:
	type: Retrieval
	dataset:
	type: quora
	name: MTEB QuoraRetrieval
	config: default
	split: test
	revision: 6205996560df11e3a3da9ab4f926788fc30a7db4
	metrics:
	- type: map_at_1
	value: 69.33500000000001
	- type: map_at_10
	value: 83.554
	- type: map_at_100
	value: 84.237
	- type: map_at_1000
	value: 84.251
	- type: map_at_3
	value: 80.456
	- type: map_at_5
	value: 82.395
	- type: ndcg_at_1
	value: 80.06
	- type: ndcg_at_10
	value: 87.46199999999999
	- type: ndcg_at_100
	value: 88.774
	- type: ndcg_at_1000
	value: 88.864
	- type: ndcg_at_3
	value: 84.437
	- type: ndcg_at_5
	value: 86.129
	- type: precision_at_1
	value: 80.06
	- type: precision_at_10
	value: 13.418
	- type: precision_at_100
	value: 1.536
	- type: precision_at_1000
	value: 0.157
	- type: precision_at_3
	value: 37.103
	- type: precision_at_5
	value: 24.522
	- type: recall_at_1
	value: 69.33500000000001
	- type: recall_at_10
	value: 95.03200000000001
	- type: recall_at_100
	value: 99.559
	- type: recall_at_1000
	value: 99.98700000000001
	- type: recall_at_3
	value: 86.404
	- type: recall_at_5
	value: 91.12400000000001
	- task:
	type: Clustering
	dataset:
	type: mteb/reddit-clustering
	name: MTEB RedditClustering
	config: default
	split: test
	revision: b2805658ae38990172679479369a78b86de8c390
	metrics:
	- type: v_measure
	value: 54.824256698437324
	- task:
	type: Clustering
	dataset:
	type: mteb/reddit-clustering-p2p
	name: MTEB RedditClusteringP2P
	config: default
	split: test
	revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
	metrics:
	- type: v_measure
	value: 56.768972678049366
	- task:
	type: Retrieval
	dataset:
	type: scidocs
	name: MTEB SCIDOCS
	config: default
	split: test
	revision: 5c59ef3e437a0a9651c8fe6fde943e7dce59fba5
	metrics:
	- type: map_at_1
	value: 5.192
	- type: map_at_10
	value: 14.426
	- type: map_at_100
	value: 17.18
	- type: map_at_1000
	value: 17.580000000000002
	- type: map_at_3
	value: 9.94
	- type: map_at_5
	value: 12.077
	- type: ndcg_at_1
	value: 25.5
	- type: ndcg_at_10
	value: 23.765
	- type: ndcg_at_100
	value: 33.664
	- type: ndcg_at_1000
	value: 39.481
	- type: ndcg_at_3
	value: 21.813
	- type: ndcg_at_5
	value: 19.285
	- type: precision_at_1
	value: 25.5
	- type: precision_at_10
	value: 12.690000000000001
	- type: precision_at_100
	value: 2.71
	- type: precision_at_1000
	value: 0.409
	- type: precision_at_3
	value: 20.732999999999997
	- type: precision_at_5
	value: 17.24
	- type: recall_at_1
	value: 5.192
	- type: recall_at_10
	value: 25.712000000000003
	- type: recall_at_100
	value: 54.99699999999999
	- type: recall_at_1000
	value: 82.97200000000001
	- type: recall_at_3
	value: 12.631999999999998
	- type: recall_at_5
	value: 17.497
	- task:
	type: STS
	dataset:
	type: mteb/sickr-sts
	name: MTEB SICK-R
	config: default
	split: test
	revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
	metrics:
	- type: cos_sim_pearson
	value: 84.00280838354293
	- type: cos_sim_spearman
	value: 80.5854192844009
	- type: euclidean_pearson
	value: 80.55974827073891
	- type: euclidean_spearman
	value: 80.58541460172292
	- type: manhattan_pearson
	value: 80.27294578437488
	- type: manhattan_spearman
	value: 80.33176193921884
	- task:
	type: STS
	dataset:
	type: mteb/sts12-sts
	name: MTEB STS12
	config: default
	split: test
	revision: fdf84275bb8ce4b49c971d02e84dd1abc677a50f
	metrics:
	- type: cos_sim_pearson
	value: 83.2801353818369
	- type: cos_sim_spearman
	value: 72.63427853822449
	- type: euclidean_pearson
	value: 79.01343235899544
	- type: euclidean_spearman
	value: 72.63178302036903
	- type: manhattan_pearson
	value: 78.65899981586094
	- type: manhattan_spearman
	value: 72.26646573268035
	- task:
	type: STS
	dataset:
	type: mteb/sts13-sts
	name: MTEB STS13
	config: default
	split: test
	revision: 1591bfcbe8c69d4bf7fe2a16e2451017832cafb9
	metrics:
	- type: cos_sim_pearson
	value: 83.20700572036095
	- type: cos_sim_spearman
	value: 83.48499016384896
	- type: euclidean_pearson
	value: 82.82555353364394
	- type: euclidean_spearman
	value: 83.48499008964005
	- type: manhattan_pearson
	value: 82.46034885462956
	- type: manhattan_spearman
	value: 83.09829447251937
	- task:
	type: STS
	dataset:
	type: mteb/sts14-sts
	name: MTEB STS14
	config: default
	split: test
	revision: e2125984e7df8b7871f6ae9949cf6b6795e7c54b
	metrics:
	- type: cos_sim_pearson
	value: 82.27113025749529
	- type: cos_sim_spearman
	value: 78.0001371342168
	- type: euclidean_pearson
	value: 80.62651938409732
	- type: euclidean_spearman
	value: 78.0001341029446
	- type: manhattan_pearson
	value: 80.25786381999085
	- type: manhattan_spearman
	value: 77.68750207429126
	- task:
	type: STS
	dataset:
	type: mteb/sts15-sts
	name: MTEB STS15
	config: default
	split: test
	revision: 1cd7298cac12a96a373b6a2f18738bb3e739a9b6
	metrics:
	- type: cos_sim_pearson
	value: 84.98824030948605
	- type: cos_sim_spearman
	value: 85.66275391649481
	- type: euclidean_pearson
	value: 84.88733530073506
	- type: euclidean_spearman
	value: 85.66275062257034
	- type: manhattan_pearson
	value: 84.70100813924223
	- type: manhattan_spearman
	value: 85.50318526944764
	- task:
	type: STS
	dataset:
	type: mteb/sts16-sts
	name: MTEB STS16
	config: default
	split: test
	revision: 360a0b2dff98700d09e634a01e1cc1624d3e42cd
	metrics:
	- type: cos_sim_pearson
	value: 78.82478639193744
	- type: cos_sim_spearman
	value: 80.03011315645662
	- type: euclidean_pearson
	value: 79.84794502236802
	- type: euclidean_spearman
	value: 80.03011258077692
	- type: manhattan_pearson
	value: 79.47012152325492
	- type: manhattan_spearman
	value: 79.60652985087651
	- task:
	type: STS
	dataset:
	type: mteb/sts17-crosslingual-sts
	name: MTEB STS17 (en-en)
	config: en-en
	split: test
	revision: 9fc37e8c632af1c87a3d23e685d49552a02582a0
	metrics:
	- type: cos_sim_pearson
	value: 90.90804154377126
	- type: cos_sim_spearman
	value: 90.59523263123734
	- type: euclidean_pearson
	value: 89.8466957775513
	- type: euclidean_spearman
	value: 90.59523263123734
	- type: manhattan_pearson
	value: 89.82268413033941
	- type: manhattan_spearman
	value: 90.68706496728889
	- task:
	type: STS
	dataset:
	type: mteb/sts22-crosslingual-sts
	name: MTEB STS22 (en)
	config: en
	split: test
	revision: 2de6ce8c1921b71a755b262c6b57fef195dd7906
	metrics:
	- type: cos_sim_pearson
	value: 66.78771571400975
	- type: cos_sim_spearman
	value: 67.94534221542501
	- type: euclidean_pearson
	value: 68.62534447097993
	- type: euclidean_spearman
	value: 67.94534221542501
	- type: manhattan_pearson
	value: 68.35916011329631
	- type: manhattan_spearman
	value: 67.58212723406085
	- task:
	type: STS
	dataset:
	type: mteb/stsbenchmark-sts
	name: MTEB STSBenchmark
	config: default
	split: test
	revision: 8913289635987208e6e7c72789e4be2fe94b6abd
	metrics:
	- type: cos_sim_pearson
	value: 84.03996099800993
	- type: cos_sim_spearman
	value: 83.421898505618
	- type: euclidean_pearson
	value: 83.78671249317563
	- type: euclidean_spearman
	value: 83.4219042133061
	- type: manhattan_pearson
	value: 83.44085827249334
	- type: manhattan_spearman
	value: 83.02901331535297
	- task:
	type: Reranking
	dataset:
	type: mteb/scidocs-reranking
	name: MTEB SciDocsRR
	config: default
	split: test
	revision: 56a6d0140cf6356659e2a7c1413286a774468d44
	metrics:
	- type: map
	value: 88.65396986895777
	- type: mrr
	value: 96.60209525405604
	- task:
	type: Retrieval
	dataset:
	type: scifact
	name: MTEB SciFact
	config: default
	split: test
	revision: a75ae049398addde9b70f6b268875f5cbce99089
	metrics:
	- type: map_at_1
	value: 51.456
	- type: map_at_10
	value: 60.827
	- type: map_at_100
	value: 61.595
	- type: map_at_1000
	value: 61.629999999999995
	- type: map_at_3
	value: 57.518
	- type: map_at_5
	value: 59.435
	- type: ndcg_at_1
	value: 53.333
	- type: ndcg_at_10
	value: 65.57
	- type: ndcg_at_100
	value: 68.911
	- type: ndcg_at_1000
	value: 69.65299999999999
	- type: ndcg_at_3
	value: 60.009
	- type: ndcg_at_5
	value: 62.803
	- type: precision_at_1
	value: 53.333
	- type: precision_at_10
	value: 8.933
	- type: precision_at_100
	value: 1.0699999999999998
	- type: precision_at_1000
	value: 0.11299999999999999
	- type: precision_at_3
	value: 23.333000000000002
	- type: precision_at_5
	value: 15.8
	- type: recall_at_1
	value: 51.456
	- type: recall_at_10
	value: 79.011
	- type: recall_at_100
	value: 94.167
	- type: recall_at_1000
	value: 99.667
	- type: recall_at_3
	value: 64.506
	- type: recall_at_5
	value: 71.211
	- task:
	type: PairClassification
	dataset:
	type: mteb/sprintduplicatequestions-pairclassification
	name: MTEB SprintDuplicateQuestions
	config: default
	split: test
	revision: 5a8256d0dff9c4bd3be3ba3e67e4e70173f802ea
	metrics:
	- type: cos_sim_accuracy
	value: 99.65940594059406
	- type: cos_sim_ap
	value: 90.1455141683116
	- type: cos_sim_f1
	value: 82.26044226044226
	- type: cos_sim_precision
	value: 80.8695652173913
	- type: cos_sim_recall
	value: 83.7
	- type: dot_accuracy
	value: 99.65940594059406
	- type: dot_ap
	value: 90.1455141683116
	- type: dot_f1
	value: 82.26044226044226
	- type: dot_precision
	value: 80.8695652173913
	- type: dot_recall
	value: 83.7
	- type: euclidean_accuracy
	value: 99.65940594059406
	- type: euclidean_ap
	value: 90.14551416831162
	- type: euclidean_f1
	value: 82.26044226044226
	- type: euclidean_precision
	value: 80.8695652173913
	- type: euclidean_recall
	value: 83.7
	- type: manhattan_accuracy
	value: 99.64950495049504
	- type: manhattan_ap
	value: 89.5492617367771
	- type: manhattan_f1
	value: 81.58280410356619
	- type: manhattan_precision
	value: 79.75167144221585
	- type: manhattan_recall
	value: 83.5
	- type: max_accuracy
	value: 99.65940594059406
	- type: max_ap
	value: 90.14551416831162
	- type: max_f1
	value: 82.26044226044226
	- task:
	type: Clustering
	dataset:
	type: mteb/stackexchange-clustering
	name: MTEB StackExchangeClustering
	config: default
	split: test
	revision: 70a89468f6dccacc6aa2b12a6eac54e74328f235
	metrics:
	- type: v_measure
	value: 53.80048409076929
	- task:
	type: Clustering
	dataset:
	type: mteb/stackexchange-clustering-p2p
	name: MTEB StackExchangeClusteringP2P
	config: default
	split: test
	revision: d88009ab563dd0b16cfaf4436abaf97fa3550cf0
	metrics:
	- type: v_measure
	value: 34.280269334397545
	- task:
	type: Reranking
	dataset:
	type: mteb/stackoverflowdupquestions-reranking
	name: MTEB StackOverflowDupQuestions
	config: default
	split: test
	revision: ef807ea29a75ec4f91b50fd4191cb4ee4589a9f9
	metrics:
	- type: map
	value: 51.97907654945493
	- type: mrr
	value: 52.82873376623376
	- task:
	type: Summarization
	dataset:
	type: mteb/summeval
	name: MTEB SummEval
	config: default
	split: test
	revision: 8753c2788d36c01fc6f05d03fe3f7268d63f9122
	metrics:
	- type: cos_sim_pearson
	value: 28.364293841556304
	- type: cos_sim_spearman
	value: 27.485869639926136
	- type: dot_pearson
	value: 28.364295910221145
	- type: dot_spearman
	value: 27.485869639926136
	- task:
	type: Retrieval
	dataset:
	type: trec-covid
	name: MTEB TRECCOVID
	config: default
	split: test
	revision: 2c8041b2c07a79b6f7ba8fe6acc72e5d9f92d217
	metrics:
	- type: map_at_1
	value: 0.19499999999999998
	- type: map_at_10
	value: 1.218
	- type: map_at_100
	value: 7.061000000000001
	- type: map_at_1000
	value: 19.735
	- type: map_at_3
	value: 0.46499999999999997
	- type: map_at_5
	value: 0.672
	- type: ndcg_at_1
	value: 60.0
	- type: ndcg_at_10
	value: 51.32600000000001
	- type: ndcg_at_100
	value: 41.74
	- type: ndcg_at_1000
	value: 43.221
	- type: ndcg_at_3
	value: 54.989
	- type: ndcg_at_5
	value: 52.905
	- type: precision_at_1
	value: 66.0
	- type: precision_at_10
	value: 55.60000000000001
	- type: precision_at_100
	value: 43.34
	- type: precision_at_1000
	value: 19.994
	- type: precision_at_3
	value: 59.333000000000006
	- type: precision_at_5
	value: 57.199999999999996
	- type: recall_at_1
	value: 0.19499999999999998
	- type: recall_at_10
	value: 1.473
	- type: recall_at_100
	value: 10.596
	- type: recall_at_1000
	value: 42.466
	- type: recall_at_3
	value: 0.49899999999999994
	- type: recall_at_5
	value: 0.76
	- task:
	type: Retrieval
	dataset:
	type: webis-touche2020
	name: MTEB Touche2020
	config: default
	split: test
	revision: 527b7d77e16e343303e68cb6af11d6e18b9f7b3b
	metrics:
	- type: map_at_1
	value: 1.997
	- type: map_at_10
	value: 7.5569999999999995
	- type: map_at_100
	value: 12.238
	- type: map_at_1000
	value: 13.773
	- type: map_at_3
	value: 4.334
	- type: map_at_5
	value: 5.5
	- type: ndcg_at_1
	value: 22.448999999999998
	- type: ndcg_at_10
	value: 19.933999999999997
	- type: ndcg_at_100
	value: 30.525999999999996
	- type: ndcg_at_1000
	value: 43.147999999999996
	- type: ndcg_at_3
	value: 22.283
	- type: ndcg_at_5
	value: 21.224
	- type: precision_at_1
	value: 24.490000000000002
	- type: precision_at_10
	value: 17.551
	- type: precision_at_100
	value: 6.4079999999999995
	- type: precision_at_1000
	value: 1.463
	- type: precision_at_3
	value: 23.128999999999998
	- type: precision_at_5
	value: 20.816000000000003
	- type: recall_at_1
	value: 1.997
	- type: recall_at_10
	value: 13.001999999999999
	- type: recall_at_100
	value: 40.98
	- type: recall_at_1000
	value: 79.40899999999999
	- type: recall_at_3
	value: 5.380999999999999
	- type: recall_at_5
	value: 7.721
	- task:
	type: Classification
	dataset:
	type: mteb/toxic_conversations_50k
	name: MTEB ToxicConversationsClassification
	config: default
	split: test
	revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
	metrics:
	- type: accuracy
	value: 60.861200000000004
	- type: ap
	value: 11.39641747026629
	- type: f1
	value: 47.80230380517065
	- task:
	type: Classification
	dataset:
	type: mteb/tweet_sentiment_extraction
	name: MTEB TweetSentimentExtractionClassification
	config: default
	split: test
	revision: 62146448f05be9e52a36b8ee9936447ea787eede
	metrics:
	- type: accuracy
	value: 55.464063384267114
	- type: f1
	value: 55.759039643764666
	- task:
	type: Clustering
	dataset:
	type: mteb/twentynewsgroups-clustering
	name: MTEB TwentyNewsgroupsClustering
	config: default
	split: test
	revision: 091a54f9a36281ce7d6590ec8c75dd485e7e01d4
	metrics:
	- type: v_measure
	value: 49.74455348083809
	- task:
	type: PairClassification
	dataset:
	type: mteb/twittersemeval2015-pairclassification
	name: MTEB TwitterSemEval2015
	config: default
	split: test
	revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
	metrics:
	- type: cos_sim_accuracy
	value: 86.07617571675507
	- type: cos_sim_ap
	value: 73.85398650568216
	- type: cos_sim_f1
	value: 68.50702798531087
	- type: cos_sim_precision
	value: 65.86316045775506
	- type: cos_sim_recall
	value: 71.37203166226914
	- type: dot_accuracy
	value: 86.07617571675507
	- type: dot_ap
	value: 73.85398346238429
	- type: dot_f1
	value: 68.50702798531087
	- type: dot_precision
	value: 65.86316045775506
	- type: dot_recall
	value: 71.37203166226914
	- type: euclidean_accuracy
	value: 86.07617571675507
	- type: euclidean_ap
	value: 73.85398625060357
	- type: euclidean_f1
	value: 68.50702798531087
	- type: euclidean_precision
	value: 65.86316045775506
	- type: euclidean_recall
	value: 71.37203166226914
	- type: manhattan_accuracy
	value: 85.98676759849795
	- type: manhattan_ap
	value: 73.86874126878737
	- type: manhattan_f1
	value: 68.55096559662361
	- type: manhattan_precision
	value: 66.51774633904195
	- type: manhattan_recall
	value: 70.71240105540898
	- type: max_accuracy
	value: 86.07617571675507
	- type: max_ap
	value: 73.86874126878737
	- type: max_f1
	value: 68.55096559662361
	- task:
	type: PairClassification
	dataset:
	type: mteb/twitterurlcorpus-pairclassification
	name: MTEB TwitterURLCorpus
	config: default
	split: test
	revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
	metrics:
	- type: cos_sim_accuracy
	value: 88.51631932316529
	- type: cos_sim_ap
	value: 85.10831084479727
	- type: cos_sim_f1
	value: 77.14563397129186
	- type: cos_sim_precision
	value: 74.9709386806161
	- type: cos_sim_recall
	value: 79.45026178010471
	- type: dot_accuracy
	value: 88.51631932316529
	- type: dot_ap
	value: 85.10831188797107
	- type: dot_f1
	value: 77.14563397129186
	- type: dot_precision
	value: 74.9709386806161
	- type: dot_recall
	value: 79.45026178010471
	- type: euclidean_accuracy
	value: 88.51631932316529
	- type: euclidean_ap
	value: 85.10829618408616
	- type: euclidean_f1
	value: 77.14563397129186
	- type: euclidean_precision
	value: 74.9709386806161
	- type: euclidean_recall
	value: 79.45026178010471
	- type: manhattan_accuracy
	value: 88.50467652423643
	- type: manhattan_ap
	value: 85.08329502055064
	- type: manhattan_f1
	value: 77.11157455683002
	- type: manhattan_precision
	value: 74.67541834968263
	- type: manhattan_recall
	value: 79.71204188481676
	- type: max_accuracy
	value: 88.51631932316529
	- type: max_ap
	value: 85.10831188797107
	- type: max_f1
	value: 77.14563397129186
	---


	# all-mpnet-base-v2
	This is a [sentence-transformers](https://www.SBERT.net) model: It maps sentences & paragraphs to a 768 dimensional dense vector space and can be used for tasks like clustering or semantic search.

	## Usage (Sentence-Transformers)
	Using this model becomes easy when you have [sentence-transformers](https://www.SBERT.net) installed:

	```
	pip install -U sentence-transformers
	```

	Then you can use the model like this:
	```python
	from sentence_transformers import SentenceTransformer
	sentences = ["This is an example sentence", "Each sentence is converted"]

	model = SentenceTransformer('sentence-transformers/all-mpnet-base-v2')
	embeddings = model.encode(sentences)
	print(embeddings)
	```

	## Usage (HuggingFace Transformers)
	Without [sentence-transformers](https://www.SBERT.net), you can use the model like this: First, you pass your input through the transformer model, then you have to apply the right pooling-operation on-top of the contextualized word embeddings.

	```python
	from transformers import AutoTokenizer, AutoModel
	import torch
	import torch.nn.functional as F

	#Mean Pooling - Take attention mask into account for correct averaging
	def mean_pooling(model_output, attention_mask):
	token_embeddings = model_output[0] #First element of model_output contains all token embeddings
	input_mask_expanded = attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
	return torch.sum(token_embeddings * input_mask_expanded, 1) / torch.clamp(input_mask_expanded.sum(1), min=1e-9)


	# Sentences we want sentence embeddings for
	sentences = ['This is an example sentence', 'Each sentence is converted']

	# Load model from HuggingFace Hub
	tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/all-mpnet-base-v2')
	model = AutoModel.from_pretrained('sentence-transformers/all-mpnet-base-v2')

	# Tokenize sentences
	encoded_input = tokenizer(sentences, padding=True, truncation=True, return_tensors='pt')

	# Compute token embeddings
	with torch.no_grad():
	model_output = model(**encoded_input)

	# Perform pooling
	sentence_embeddings = mean_pooling(model_output, encoded_input['attention_mask'])

	# Normalize embeddings
	sentence_embeddings = F.normalize(sentence_embeddings, p=2, dim=1)

	print("Sentence embeddings:")
	print(sentence_embeddings)
	```

	## Evaluation Results

	For an automated evaluation of this model, see MTEB: https://huggingface.co/spaces/mteb/leaderboard or the Sentence Embeddings Benchmark: [https://seb.sbert.net](https://seb.sbert.net?model_name=sentence-transformers/all-MiniLM-L12-v2)

	------

	## Background

	The project aims to train sentence embedding models on very large sentence level datasets using a self-supervised
	contrastive learning objective. We used the pretrained [`microsoft/mpnet-base`](https://huggingface.co/microsoft/mpnet-base) model and fine-tuned in on a
	1B sentence pairs dataset. We use a contrastive learning objective: given a sentence from the pair, the model should predict which out of a set of randomly sampled other sentences, was actually paired with it in our dataset.

	We developped this model during the
	[Community week using JAX/Flax for NLP & CV](https://discuss.huggingface.co/t/open-to-the-community-community-week-using-jax-flax-for-nlp-cv/7104),
	organized by Hugging Face. We developped this model as part of the project:
	[Train the Best Sentence Embedding Model Ever with 1B Training Pairs](https://discuss.huggingface.co/t/train-the-best-sentence-embedding-model-ever-with-1b-training-pairs/7354). We benefited from efficient hardware infrastructure to run the project: 7 TPUs v3-8, as well as intervention from Googles Flax, JAX, and Cloud team member about efficient deep learning frameworks.

	## Intended uses

	Our model is intented to be used as a sentence and short paragraph encoder. Given an input text, it ouptuts a vector which captures
	the semantic information. The sentence vector may be used for information retrieval, clustering or sentence similarity tasks.

	By default, input text longer than 384 word pieces is truncated.


	## Training procedure

	### Pre-training

	We use the pretrained [`microsoft/mpnet-base`](https://huggingface.co/microsoft/mpnet-base) model. Please refer to the model card for more detailed information about the pre-training procedure.

	### Fine-tuning

	We fine-tune the model using a contrastive objective. Formally, we compute the cosine similarity from each possible sentence pairs from the batch.
	We then apply the cross entropy loss by comparing with true pairs.

	#### Hyper parameters

	We trained ou model on a TPU v3-8. We train the model during 100k steps using a batch size of 1024 (128 per TPU core).
	We use a learning rate warm up of 500. The sequence length was limited to 128 tokens. We used the AdamW optimizer with
	a 2e-5 learning rate. The full training script is accessible in this current repository: `train_script.py`.

	#### Training data

	We use the concatenation from multiple datasets to fine-tune our model. The total number of sentence pairs is above 1 billion sentences.
	We sampled each dataset given a weighted probability which configuration is detailed in the `data_config.json` file.


	\| Dataset \| Paper \| Number of training tuples \|
	\|--------------------------------------------------------\|:----------------------------------------:\|:--------------------------:\|
	\| [Reddit comments (2015-2018)](https://github.com/PolyAI-LDN/conversational-datasets/tree/master/reddit) \| [paper](https://arxiv.org/abs/1904.06472) \| 726,484,430 \|
	\| [S2ORC](https://github.com/allenai/s2orc) Citation pairs (Abstracts) \| [paper](https://aclanthology.org/2020.acl-main.447/) \| 116,288,806 \|
	\| [WikiAnswers](https://github.com/afader/oqa#wikianswers-corpus) Duplicate question pairs \| [paper](https://doi.org/10.1145/2623330.2623677) \| 77,427,422 \|
	\| [PAQ](https://github.com/facebookresearch/PAQ) (Question, Answer) pairs \| [paper](https://arxiv.org/abs/2102.07033) \| 64,371,441 \|
	\| [S2ORC](https://github.com/allenai/s2orc) Citation pairs (Titles) \| [paper](https://aclanthology.org/2020.acl-main.447/) \| 52,603,982 \|
	\| [S2ORC](https://github.com/allenai/s2orc) (Title, Abstract) \| [paper](https://aclanthology.org/2020.acl-main.447/) \| 41,769,185 \|
	\| [Stack Exchange](https://huggingface.co/datasets/flax-sentence-embeddings/stackexchange_xml) (Title, Body) pairs \| - \| 25,316,456 \|
	\| [Stack Exchange](https://huggingface.co/datasets/flax-sentence-embeddings/stackexchange_xml) (Title+Body, Answer) pairs \| - \| 21,396,559 \|
	\| [Stack Exchange](https://huggingface.co/datasets/flax-sentence-embeddings/stackexchange_xml) (Title, Answer) pairs \| - \| 21,396,559 \|
	\| [MS MARCO](https://microsoft.github.io/msmarco/) triplets \| [paper](https://doi.org/10.1145/3404835.3462804) \| 9,144,553 \|
	\| [GOOAQ: Open Question Answering with Diverse Answer Types](https://github.com/allenai/gooaq) \| [paper](https://arxiv.org/pdf/2104.08727.pdf) \| 3,012,496 \|
	\| [Yahoo Answers](https://www.kaggle.com/soumikrakshit/yahoo-answers-dataset) (Title, Answer) \| [paper](https://proceedings.neurips.cc/paper/2015/hash/250cf8b51c773f3f8dc8b4be867a9a02-Abstract.html) \| 1,198,260 \|
	\| [Code Search](https://huggingface.co/datasets/code_search_net) \| - \| 1,151,414 \|
	\| [COCO](https://cocodataset.org/#home) Image captions \| [paper](https://link.springer.com/chapter/10.1007%2F978-3-319-10602-1_48) \| 828,395\|
	\| [SPECTER](https://github.com/allenai/specter) citation triplets \| [paper](https://doi.org/10.18653/v1/2020.acl-main.207) \| 684,100 \|
	\| [Yahoo Answers](https://www.kaggle.com/soumikrakshit/yahoo-answers-dataset) (Question, Answer) \| [paper](https://proceedings.neurips.cc/paper/2015/hash/250cf8b51c773f3f8dc8b4be867a9a02-Abstract.html) \| 681,164 \|
	\| [Yahoo Answers](https://www.kaggle.com/soumikrakshit/yahoo-answers-dataset) (Title, Question) \| [paper](https://proceedings.neurips.cc/paper/2015/hash/250cf8b51c773f3f8dc8b4be867a9a02-Abstract.html) \| 659,896 \|
	\| [SearchQA](https://huggingface.co/datasets/search_qa) \| [paper](https://arxiv.org/abs/1704.05179) \| 582,261 \|
	\| [Eli5](https://huggingface.co/datasets/eli5) \| [paper](https://doi.org/10.18653/v1/p19-1346) \| 325,475 \|
	\| [Flickr 30k](https://shannon.cs.illinois.edu/DenotationGraph/) \| [paper](https://transacl.org/ojs/index.php/tacl/article/view/229/33) \| 317,695 \|
	\| [Stack Exchange](https://huggingface.co/datasets/flax-sentence-embeddings/stackexchange_xml) Duplicate questions (titles) \| \| 304,525 \|
	\| AllNLI ([SNLI](https://nlp.stanford.edu/projects/snli/) and [MultiNLI](https://cims.nyu.edu/~sbowman/multinli/) \| [paper SNLI](https://doi.org/10.18653/v1/d15-1075), [paper MultiNLI](https://doi.org/10.18653/v1/n18-1101) \| 277,230 \|
	\| [Stack Exchange](https://huggingface.co/datasets/flax-sentence-embeddings/stackexchange_xml) Duplicate questions (bodies) \| \| 250,519 \|
	\| [Stack Exchange](https://huggingface.co/datasets/flax-sentence-embeddings/stackexchange_xml) Duplicate questions (titles+bodies) \| \| 250,460 \|
	\| [Sentence Compression](https://github.com/google-research-datasets/sentence-compression) \| [paper](https://www.aclweb.org/anthology/D13-1155/) \| 180,000 \|
	\| [Wikihow](https://github.com/pvl/wikihow_pairs_dataset) \| [paper](https://arxiv.org/abs/1810.09305) \| 128,542 \|
	\| [Altlex](https://github.com/chridey/altlex/) \| [paper](https://aclanthology.org/P16-1135.pdf) \| 112,696 \|
	\| [Quora Question Triplets](https://quoradata.quora.com/First-Quora-Dataset-Release-Question-Pairs) \| - \| 103,663 \|
	\| [Simple Wikipedia](https://cs.pomona.edu/~dkauchak/simplification/) \| [paper](https://www.aclweb.org/anthology/P11-2117/) \| 102,225 \|
	\| [Natural Questions (NQ)](https://ai.google.com/research/NaturalQuestions) \| [paper](https://transacl.org/ojs/index.php/tacl/article/view/1455) \| 100,231 \|
	\| [SQuAD2.0](https://rajpurkar.github.io/SQuAD-explorer/) \| [paper](https://aclanthology.org/P18-2124.pdf) \| 87,599 \|
	\| [TriviaQA](https://huggingface.co/datasets/trivia_qa) \| - \| 73,346 \|
	\| Total \| \| 1,170,060,424 \|