metadata

pipeline_tag: sentence-similarity
tags:
  - sentence-transformers
  - feature-extraction
  - sentence-similarity
  - mteb
language: en
license: apache-2.0
datasets:
  - s2orc
  - flax-sentence-embeddings/stackexchange_xml
  - MS Marco
  - gooaq
  - yahoo_answers_topics
  - code_search_net
  - search_qa
  - eli5
  - snli
  - multi_nli
  - wikihow
  - natural_questions
  - trivia_qa
  - embedding-data/sentence-compression
  - embedding-data/flickr30k-captions
  - embedding-data/altlex
  - embedding-data/simple-wiki
  - embedding-data/QQP
  - embedding-data/SPECTER
  - embedding-data/PAQ_pairs
  - embedding-data/WikiAnswers
model-index:
  - name: all-mpnet-base-v2
    results:
      - task:
          type: Classification
        dataset:
          type: mteb/amazon_counterfactual
          name: MTEB AmazonCounterfactualClassification (en)
          config: en
          split: test
          revision: 2d8a100785abf0ae21420d2a55b0c56e3e1ea996
        metrics:
          - type: accuracy
            value: 65.26865671641791
          - type: ap
            value: 28.47453420428918
          - type: f1
            value: 59.3470101009448
      - task:
          type: Classification
        dataset:
          type: mteb/amazon_polarity
          name: MTEB AmazonPolarityClassification
          config: default
          split: test
          revision: 80714f8dcf8cefc218ef4f8c5a966dd83f75a0e1
        metrics:
          - type: accuracy
            value: 67.13145
          - type: ap
            value: 61.842060778903786
          - type: f1
            value: 66.79987305640383
      - task:
          type: Classification
        dataset:
          type: mteb/amazon_reviews_multi
          name: MTEB AmazonReviewsClassification (en)
          config: en
          split: test
          revision: c379a6705fec24a2493fa68e011692605f44e119
        metrics:
          - type: accuracy
            value: 31.920000000000005
          - type: f1
            value: 31.2465193896153
      - task:
          type: Retrieval
        dataset:
          type: arguana
          name: MTEB ArguAna
          config: default
          split: test
          revision: 5b3e3697907184a9b77a3c99ee9ea1a9cbb1e4e3
        metrics:
          - type: map_at_1
            value: 23.186
          - type: map_at_10
            value: 37.692
          - type: map_at_100
            value: 38.986
          - type: map_at_1000
            value: 38.991
          - type: map_at_3
            value: 32.622
          - type: map_at_5
            value: 35.004999999999995
          - type: ndcg_at_1
            value: 23.186
          - type: ndcg_at_10
            value: 46.521
          - type: ndcg_at_100
            value: 51.954
          - type: ndcg_at_1000
            value: 52.087
          - type: ndcg_at_3
            value: 35.849
          - type: ndcg_at_5
            value: 40.12
          - type: precision_at_1
            value: 23.186
          - type: precision_at_10
            value: 7.510999999999999
          - type: precision_at_100
            value: 0.9860000000000001
          - type: precision_at_1000
            value: 0.1
          - type: precision_at_3
            value: 15.078
          - type: precision_at_5
            value: 11.110000000000001
          - type: recall_at_1
            value: 23.186
          - type: recall_at_10
            value: 75.107
          - type: recall_at_100
            value: 98.649
          - type: recall_at_1000
            value: 99.644
          - type: recall_at_3
            value: 45.235
          - type: recall_at_5
            value: 55.547999999999995
      - task:
          type: Clustering
        dataset:
          type: mteb/arxiv-clustering-p2p
          name: MTEB ArxivClusteringP2P
          config: default
          split: test
          revision: 0bbdb47bcbe3a90093699aefeed338a0f28a7ee8
        metrics:
          - type: v_measure
            value: 48.37886340922374
      - task:
          type: Clustering
        dataset:
          type: mteb/arxiv-clustering-s2s
          name: MTEB ArxivClusteringS2S
          config: default
          split: test
          revision: b73bd54100e5abfa6e3a23dcafb46fe4d2438dc3
        metrics:
          - type: v_measure
            value: 39.72488615315985
      - task:
          type: Reranking
        dataset:
          type: mteb/askubuntudupquestions-reranking
          name: MTEB AskUbuntuDupQuestions
          config: default
          split: test
          revision: 4d853f94cd57d85ec13805aeeac3ae3e5eb4c49c
        metrics:
          - type: map
            value: 65.85199009344481
          - type: mrr
            value: 78.47700391329201
      - task:
          type: STS
        dataset:
          type: mteb/biosses-sts
          name: MTEB BIOSSES
          config: default
          split: test
          revision: 9ee918f184421b6bd48b78f6c714d86546106103
        metrics:
          - type: cos_sim_pearson
            value: 84.47737119217858
          - type: cos_sim_spearman
            value: 80.43195317854409
          - type: euclidean_pearson
            value: 82.20496332547978
          - type: euclidean_spearman
            value: 80.43195317854409
          - type: manhattan_pearson
            value: 81.4836610720397
          - type: manhattan_spearman
            value: 79.65904400101908
      - task:
          type: Classification
        dataset:
          type: mteb/banking77
          name: MTEB Banking77Classification
          config: default
          split: test
          revision: 44fa15921b4c889113cc5df03dd4901b49161ab7
        metrics:
          - type: accuracy
            value: 81.8603896103896
          - type: f1
            value: 81.28027245637479
      - task:
          type: Clustering
        dataset:
          type: mteb/biorxiv-clustering-p2p
          name: MTEB BiorxivClusteringP2P
          config: default
          split: test
          revision: 11d0121201d1f1f280e8cc8f3d98fb9c4d9f9c55
        metrics:
          - type: v_measure
            value: 39.616605133625185
      - task:
          type: Clustering
        dataset:
          type: mteb/biorxiv-clustering-s2s
          name: MTEB BiorxivClusteringS2S
          config: default
          split: test
          revision: c0fab014e1bcb8d3a5e31b2088972a1e01547dc1
        metrics:
          - type: v_measure
            value: 35.02442407186902
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackAndroidRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 36.036
          - type: map_at_10
            value: 49.302
          - type: map_at_100
            value: 50.956
          - type: map_at_1000
            value: 51.080000000000005
          - type: map_at_3
            value: 45.237
          - type: map_at_5
            value: 47.353
          - type: ndcg_at_1
            value: 45.207
          - type: ndcg_at_10
            value: 56.485
          - type: ndcg_at_100
            value: 61.413
          - type: ndcg_at_1000
            value: 62.870000000000005
          - type: ndcg_at_3
            value: 51.346000000000004
          - type: ndcg_at_5
            value: 53.486
          - type: precision_at_1
            value: 45.207
          - type: precision_at_10
            value: 11.144
          - type: precision_at_100
            value: 1.735
          - type: precision_at_1000
            value: 0.22100000000000003
          - type: precision_at_3
            value: 24.94
          - type: precision_at_5
            value: 17.997
          - type: recall_at_1
            value: 36.036
          - type: recall_at_10
            value: 69.191
          - type: recall_at_100
            value: 89.423
          - type: recall_at_1000
            value: 98.425
          - type: recall_at_3
            value: 53.849999999999994
          - type: recall_at_5
            value: 60.107
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackEnglishRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 32.92
          - type: map_at_10
            value: 45.739999999999995
          - type: map_at_100
            value: 47.309
          - type: map_at_1000
            value: 47.443000000000005
          - type: map_at_3
            value: 42.154
          - type: map_at_5
            value: 44.207
          - type: ndcg_at_1
            value: 42.229
          - type: ndcg_at_10
            value: 52.288999999999994
          - type: ndcg_at_100
            value: 57.04900000000001
          - type: ndcg_at_1000
            value: 58.788
          - type: ndcg_at_3
            value: 47.531
          - type: ndcg_at_5
            value: 49.861
          - type: precision_at_1
            value: 42.229
          - type: precision_at_10
            value: 10.299
          - type: precision_at_100
            value: 1.68
          - type: precision_at_1000
            value: 0.213
          - type: precision_at_3
            value: 23.673
          - type: precision_at_5
            value: 17.006
          - type: recall_at_1
            value: 32.92
          - type: recall_at_10
            value: 63.865
          - type: recall_at_100
            value: 84.06700000000001
          - type: recall_at_1000
            value: 94.536
          - type: recall_at_3
            value: 49.643
          - type: recall_at_5
            value: 56.119
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackGamingRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 40.695
          - type: map_at_10
            value: 53.787
          - type: map_at_100
            value: 54.778000000000006
          - type: map_at_1000
            value: 54.827000000000005
          - type: map_at_3
            value: 50.151999999999994
          - type: map_at_5
            value: 52.207
          - type: ndcg_at_1
            value: 46.52
          - type: ndcg_at_10
            value: 60.026
          - type: ndcg_at_100
            value: 63.81099999999999
          - type: ndcg_at_1000
            value: 64.741
          - type: ndcg_at_3
            value: 53.83
          - type: ndcg_at_5
            value: 56.928999999999995
          - type: precision_at_1
            value: 46.52
          - type: precision_at_10
            value: 9.754999999999999
          - type: precision_at_100
            value: 1.2670000000000001
          - type: precision_at_1000
            value: 0.13799999999999998
          - type: precision_at_3
            value: 24.096
          - type: precision_at_5
            value: 16.689999999999998
          - type: recall_at_1
            value: 40.695
          - type: recall_at_10
            value: 75.181
          - type: recall_at_100
            value: 91.479
          - type: recall_at_1000
            value: 98.06899999999999
          - type: recall_at_3
            value: 58.707
          - type: recall_at_5
            value: 66.295
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackGisRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 29.024
          - type: map_at_10
            value: 38.438
          - type: map_at_100
            value: 39.576
          - type: map_at_1000
            value: 39.645
          - type: map_at_3
            value: 34.827999999999996
          - type: map_at_5
            value: 36.947
          - type: ndcg_at_1
            value: 31.299
          - type: ndcg_at_10
            value: 44.268
          - type: ndcg_at_100
            value: 49.507
          - type: ndcg_at_1000
            value: 51.205999999999996
          - type: ndcg_at_3
            value: 37.248999999999995
          - type: ndcg_at_5
            value: 40.861999999999995
          - type: precision_at_1
            value: 31.299
          - type: precision_at_10
            value: 6.949
          - type: precision_at_100
            value: 1.012
          - type: precision_at_1000
            value: 0.11900000000000001
          - type: precision_at_3
            value: 15.518
          - type: precision_at_5
            value: 11.366999999999999
          - type: recall_at_1
            value: 29.024
          - type: recall_at_10
            value: 60.404
          - type: recall_at_100
            value: 83.729
          - type: recall_at_1000
            value: 96.439
          - type: recall_at_3
            value: 41.65
          - type: recall_at_5
            value: 50.263999999999996
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackMathematicaRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 17.774
          - type: map_at_10
            value: 28.099
          - type: map_at_100
            value: 29.603
          - type: map_at_1000
            value: 29.709999999999997
          - type: map_at_3
            value: 25.036
          - type: map_at_5
            value: 26.657999999999998
          - type: ndcg_at_1
            value: 22.139
          - type: ndcg_at_10
            value: 34.205999999999996
          - type: ndcg_at_100
            value: 40.844
          - type: ndcg_at_1000
            value: 43.144
          - type: ndcg_at_3
            value: 28.732999999999997
          - type: ndcg_at_5
            value: 31.252000000000002
          - type: precision_at_1
            value: 22.139
          - type: precision_at_10
            value: 6.567
          - type: precision_at_100
            value: 1.147
          - type: precision_at_1000
            value: 0.146
          - type: precision_at_3
            value: 14.386
          - type: precision_at_5
            value: 10.423
          - type: recall_at_1
            value: 17.774
          - type: recall_at_10
            value: 48.32
          - type: recall_at_100
            value: 76.373
          - type: recall_at_1000
            value: 92.559
          - type: recall_at_3
            value: 33.478
          - type: recall_at_5
            value: 39.872
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackPhysicsRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 31.885
          - type: map_at_10
            value: 44.289
          - type: map_at_100
            value: 45.757999999999996
          - type: map_at_1000
            value: 45.86
          - type: map_at_3
            value: 40.459
          - type: map_at_5
            value: 42.662
          - type: ndcg_at_1
            value: 39.75
          - type: ndcg_at_10
            value: 50.975
          - type: ndcg_at_100
            value: 56.528999999999996
          - type: ndcg_at_1000
            value: 58.06099999999999
          - type: ndcg_at_3
            value: 45.327
          - type: ndcg_at_5
            value: 48.041
          - type: precision_at_1
            value: 39.75
          - type: precision_at_10
            value: 9.557
          - type: precision_at_100
            value: 1.469
          - type: precision_at_1000
            value: 0.17700000000000002
          - type: precision_at_3
            value: 22.073
          - type: precision_at_5
            value: 15.765
          - type: recall_at_1
            value: 31.885
          - type: recall_at_10
            value: 64.649
          - type: recall_at_100
            value: 87.702
          - type: recall_at_1000
            value: 97.327
          - type: recall_at_3
            value: 48.61
          - type: recall_at_5
            value: 55.882
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackProgrammersRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 26.454
          - type: map_at_10
            value: 37.756
          - type: map_at_100
            value: 39.225
          - type: map_at_1000
            value: 39.332
          - type: map_at_3
            value: 34.115
          - type: map_at_5
            value: 35.942
          - type: ndcg_at_1
            value: 32.42
          - type: ndcg_at_10
            value: 44.165
          - type: ndcg_at_100
            value: 50.202000000000005
          - type: ndcg_at_1000
            value: 52.188
          - type: ndcg_at_3
            value: 38.381
          - type: ndcg_at_5
            value: 40.849000000000004
          - type: precision_at_1
            value: 32.42
          - type: precision_at_10
            value: 8.482000000000001
          - type: precision_at_100
            value: 1.332
          - type: precision_at_1000
            value: 0.169
          - type: precision_at_3
            value: 18.683
          - type: precision_at_5
            value: 13.539000000000001
          - type: recall_at_1
            value: 26.454
          - type: recall_at_10
            value: 57.937000000000005
          - type: recall_at_100
            value: 83.76
          - type: recall_at_1000
            value: 96.82600000000001
          - type: recall_at_3
            value: 41.842
          - type: recall_at_5
            value: 48.285
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 27.743666666666666
          - type: map_at_10
            value: 38.75416666666667
          - type: map_at_100
            value: 40.133250000000004
          - type: map_at_1000
            value: 40.24616666666667
          - type: map_at_3
            value: 35.267250000000004
          - type: map_at_5
            value: 37.132749999999994
          - type: ndcg_at_1
            value: 33.14358333333333
          - type: ndcg_at_10
            value: 44.95916666666667
          - type: ndcg_at_100
            value: 50.46375
          - type: ndcg_at_1000
            value: 52.35508333333334
          - type: ndcg_at_3
            value: 39.17883333333334
          - type: ndcg_at_5
            value: 41.79724999999999
          - type: precision_at_1
            value: 33.14358333333333
          - type: precision_at_10
            value: 8.201083333333333
          - type: precision_at_100
            value: 1.3085
          - type: precision_at_1000
            value: 0.1665833333333333
          - type: precision_at_3
            value: 18.405583333333333
          - type: precision_at_5
            value: 13.233166666666666
          - type: recall_at_1
            value: 27.743666666666666
          - type: recall_at_10
            value: 58.91866666666667
          - type: recall_at_100
            value: 82.76216666666666
          - type: recall_at_1000
            value: 95.56883333333333
          - type: recall_at_3
            value: 42.86925
          - type: recall_at_5
            value: 49.553333333333335
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackStatsRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 25.244
          - type: map_at_10
            value: 33.464
          - type: map_at_100
            value: 34.633
          - type: map_at_1000
            value: 34.721999999999994
          - type: map_at_3
            value: 30.784
          - type: map_at_5
            value: 32.183
          - type: ndcg_at_1
            value: 28.681
          - type: ndcg_at_10
            value: 38.149
          - type: ndcg_at_100
            value: 43.856
          - type: ndcg_at_1000
            value: 46.026
          - type: ndcg_at_3
            value: 33.318
          - type: ndcg_at_5
            value: 35.454
          - type: precision_at_1
            value: 28.681
          - type: precision_at_10
            value: 6.304
          - type: precision_at_100
            value: 0.992
          - type: precision_at_1000
            value: 0.125
          - type: precision_at_3
            value: 14.673
          - type: precision_at_5
            value: 10.245
          - type: recall_at_1
            value: 25.244
          - type: recall_at_10
            value: 49.711
          - type: recall_at_100
            value: 75.928
          - type: recall_at_1000
            value: 91.79899999999999
          - type: recall_at_3
            value: 36.325
          - type: recall_at_5
            value: 41.752
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackTexRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 18.857
          - type: map_at_10
            value: 27.794
          - type: map_at_100
            value: 29.186
          - type: map_at_1000
            value: 29.323
          - type: map_at_3
            value: 24.779
          - type: map_at_5
            value: 26.459
          - type: ndcg_at_1
            value: 23.227999999999998
          - type: ndcg_at_10
            value: 33.353
          - type: ndcg_at_100
            value: 39.598
          - type: ndcg_at_1000
            value: 42.268
          - type: ndcg_at_3
            value: 28.054000000000002
          - type: ndcg_at_5
            value: 30.566
          - type: precision_at_1
            value: 23.227999999999998
          - type: precision_at_10
            value: 6.397
          - type: precision_at_100
            value: 1.129
          - type: precision_at_1000
            value: 0.155
          - type: precision_at_3
            value: 13.616
          - type: precision_at_5
            value: 10.116999999999999
          - type: recall_at_1
            value: 18.857
          - type: recall_at_10
            value: 45.797
          - type: recall_at_100
            value: 73.615
          - type: recall_at_1000
            value: 91.959
          - type: recall_at_3
            value: 31.129
          - type: recall_at_5
            value: 37.565
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackUnixRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 27.486
          - type: map_at_10
            value: 39.164
          - type: map_at_100
            value: 40.543
          - type: map_at_1000
            value: 40.636
          - type: map_at_3
            value: 35.52
          - type: map_at_5
            value: 37.355
          - type: ndcg_at_1
            value: 32.275999999999996
          - type: ndcg_at_10
            value: 45.414
          - type: ndcg_at_100
            value: 51.254
          - type: ndcg_at_1000
            value: 53.044000000000004
          - type: ndcg_at_3
            value: 39.324999999999996
          - type: ndcg_at_5
            value: 41.835
          - type: precision_at_1
            value: 32.275999999999996
          - type: precision_at_10
            value: 8.144
          - type: precision_at_100
            value: 1.237
          - type: precision_at_1000
            value: 0.15
          - type: precision_at_3
            value: 18.501
          - type: precision_at_5
            value: 13.134
          - type: recall_at_1
            value: 27.486
          - type: recall_at_10
            value: 60.449
          - type: recall_at_100
            value: 85.176
          - type: recall_at_1000
            value: 97.087
          - type: recall_at_3
            value: 43.59
          - type: recall_at_5
            value: 50.08899999999999
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackWebmastersRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 26.207
          - type: map_at_10
            value: 37.255
          - type: map_at_100
            value: 39.043
          - type: map_at_1000
            value: 39.273
          - type: map_at_3
            value: 33.487
          - type: map_at_5
            value: 35.441
          - type: ndcg_at_1
            value: 31.423000000000002
          - type: ndcg_at_10
            value: 44.235
          - type: ndcg_at_100
            value: 50.49
          - type: ndcg_at_1000
            value: 52.283
          - type: ndcg_at_3
            value: 37.602000000000004
          - type: ndcg_at_5
            value: 40.518
          - type: precision_at_1
            value: 31.423000000000002
          - type: precision_at_10
            value: 8.715
          - type: precision_at_100
            value: 1.7590000000000001
          - type: precision_at_1000
            value: 0.257
          - type: precision_at_3
            value: 17.523
          - type: precision_at_5
            value: 13.161999999999999
          - type: recall_at_1
            value: 26.207
          - type: recall_at_10
            value: 59.17099999999999
          - type: recall_at_100
            value: 86.166
          - type: recall_at_1000
            value: 96.54700000000001
          - type: recall_at_3
            value: 41.18
          - type: recall_at_5
            value: 48.083999999999996
      - task:
          type: Retrieval
        dataset:
          type: BeIR/cqadupstack
          name: MTEB CQADupstackWordpressRetrieval
          config: default
          split: test
          revision: 2b9f5791698b5be7bc5e10535c8690f20043c3db
        metrics:
          - type: map_at_1
            value: 20.342
          - type: map_at_10
            value: 29.962
          - type: map_at_100
            value: 30.989
          - type: map_at_1000
            value: 31.102999999999998
          - type: map_at_3
            value: 26.656000000000002
          - type: map_at_5
            value: 28.179
          - type: ndcg_at_1
            value: 22.551
          - type: ndcg_at_10
            value: 35.945
          - type: ndcg_at_100
            value: 41.012
          - type: ndcg_at_1000
            value: 43.641999999999996
          - type: ndcg_at_3
            value: 29.45
          - type: ndcg_at_5
            value: 31.913999999999998
          - type: precision_at_1
            value: 22.551
          - type: precision_at_10
            value: 6.1
          - type: precision_at_100
            value: 0.943
          - type: precision_at_1000
            value: 0.129
          - type: precision_at_3
            value: 13.184999999999999
          - type: precision_at_5
            value: 9.353
          - type: recall_at_1
            value: 20.342
          - type: recall_at_10
            value: 52.349000000000004
          - type: recall_at_100
            value: 75.728
          - type: recall_at_1000
            value: 95.253
          - type: recall_at_3
            value: 34.427
          - type: recall_at_5
            value: 40.326
      - task:
          type: Retrieval
        dataset:
          type: climate-fever
          name: MTEB ClimateFEVER
          config: default
          split: test
          revision: 392b78eb68c07badcd7c2cd8f39af108375dfcce
        metrics:
          - type: map_at_1
            value: 7.71
          - type: map_at_10
            value: 14.81
          - type: map_at_100
            value: 16.536
          - type: map_at_1000
            value: 16.744999999999997
          - type: map_at_3
            value: 12.109
          - type: map_at_5
            value: 13.613
          - type: ndcg_at_1
            value: 18.046
          - type: ndcg_at_10
            value: 21.971
          - type: ndcg_at_100
            value: 29.468
          - type: ndcg_at_1000
            value: 33.428999999999995
          - type: ndcg_at_3
            value: 17.227999999999998
          - type: ndcg_at_5
            value: 19.189999999999998
          - type: precision_at_1
            value: 18.046
          - type: precision_at_10
            value: 7.192
          - type: precision_at_100
            value: 1.51
          - type: precision_at_1000
            value: 0.22499999999999998
          - type: precision_at_3
            value: 13.312
          - type: precision_at_5
            value: 10.775
          - type: recall_at_1
            value: 7.71
          - type: recall_at_10
            value: 27.908
          - type: recall_at_100
            value: 54.452
          - type: recall_at_1000
            value: 76.764
          - type: recall_at_3
            value: 16.64
          - type: recall_at_5
            value: 21.631
      - task:
          type: Retrieval
        dataset:
          type: dbpedia-entity
          name: MTEB DBPedia
          config: default
          split: test
          revision: f097057d03ed98220bc7309ddb10b71a54d667d6
        metrics:
          - type: map_at_1
            value: 6.8180000000000005
          - type: map_at_10
            value: 14.591000000000001
          - type: map_at_100
            value: 19.855999999999998
          - type: map_at_1000
            value: 21.178
          - type: map_at_3
            value: 10.345
          - type: map_at_5
            value: 12.367
          - type: ndcg_at_1
            value: 39.25
          - type: ndcg_at_10
            value: 32.088
          - type: ndcg_at_100
            value: 36.019
          - type: ndcg_at_1000
            value: 43.649
          - type: ndcg_at_3
            value: 35.132999999999996
          - type: ndcg_at_5
            value: 33.777
          - type: precision_at_1
            value: 49.5
          - type: precision_at_10
            value: 25.624999999999996
          - type: precision_at_100
            value: 8.043
          - type: precision_at_1000
            value: 1.7409999999999999
          - type: precision_at_3
            value: 38.417
          - type: precision_at_5
            value: 33.2
          - type: recall_at_1
            value: 6.8180000000000005
          - type: recall_at_10
            value: 20.399
          - type: recall_at_100
            value: 42.8
          - type: recall_at_1000
            value: 68.081
          - type: recall_at_3
            value: 11.928999999999998
          - type: recall_at_5
            value: 15.348999999999998
      - task:
          type: Classification
        dataset:
          type: mteb/emotion
          name: MTEB EmotionClassification
          config: default
          split: test
          revision: 829147f8f75a25f005913200eb5ed41fae320aa1
        metrics:
          - type: accuracy
            value: 39.725
          - type: f1
            value: 35.19385687310605
      - task:
          type: Retrieval
        dataset:
          type: fever
          name: MTEB FEVER
          config: default
          split: test
          revision: 1429cf27e393599b8b359b9b72c666f96b2525f9
        metrics:
          - type: map_at_1
            value: 31.901000000000003
          - type: map_at_10
            value: 44.156
          - type: map_at_100
            value: 44.901
          - type: map_at_1000
            value: 44.939
          - type: map_at_3
            value: 41.008
          - type: map_at_5
            value: 42.969
          - type: ndcg_at_1
            value: 34.263
          - type: ndcg_at_10
            value: 50.863
          - type: ndcg_at_100
            value: 54.336
          - type: ndcg_at_1000
            value: 55.297
          - type: ndcg_at_3
            value: 44.644
          - type: ndcg_at_5
            value: 48.075
          - type: precision_at_1
            value: 34.263
          - type: precision_at_10
            value: 7.542999999999999
          - type: precision_at_100
            value: 0.9400000000000001
          - type: precision_at_1000
            value: 0.104
          - type: precision_at_3
            value: 18.912000000000003
          - type: precision_at_5
            value: 13.177
          - type: recall_at_1
            value: 31.901000000000003
          - type: recall_at_10
            value: 68.872
          - type: recall_at_100
            value: 84.468
          - type: recall_at_1000
            value: 91.694
          - type: recall_at_3
            value: 52.272
          - type: recall_at_5
            value: 60.504999999999995
      - task:
          type: Retrieval
        dataset:
          type: fiqa
          name: MTEB FiQA2018
          config: default
          split: test
          revision: 41b686a7f28c59bcaaa5791efd47c67c8ebe28be
        metrics:
          - type: map_at_1
            value: 24.4
          - type: map_at_10
            value: 41.117
          - type: map_at_100
            value: 43.167
          - type: map_at_1000
            value: 43.323
          - type: map_at_3
            value: 35.744
          - type: map_at_5
            value: 38.708
          - type: ndcg_at_1
            value: 49.074
          - type: ndcg_at_10
            value: 49.963
          - type: ndcg_at_100
            value: 56.564
          - type: ndcg_at_1000
            value: 58.931999999999995
          - type: ndcg_at_3
            value: 45.489000000000004
          - type: ndcg_at_5
            value: 47.133
          - type: precision_at_1
            value: 49.074
          - type: precision_at_10
            value: 13.889000000000001
          - type: precision_at_100
            value: 2.091
          - type: precision_at_1000
            value: 0.251
          - type: precision_at_3
            value: 30.658
          - type: precision_at_5
            value: 22.593
          - type: recall_at_1
            value: 24.4
          - type: recall_at_10
            value: 58.111999999999995
          - type: recall_at_100
            value: 81.96900000000001
          - type: recall_at_1000
            value: 96.187
          - type: recall_at_3
            value: 41.661
          - type: recall_at_5
            value: 49.24
      - task:
          type: Retrieval
        dataset:
          type: hotpotqa
          name: MTEB HotpotQA
          config: default
          split: test
          revision: 766870b35a1b9ca65e67a0d1913899973551fc6c
        metrics:
          - type: map_at_1
            value: 22.262
          - type: map_at_10
            value: 31.266
          - type: map_at_100
            value: 32.202
          - type: map_at_1000
            value: 32.300000000000004
          - type: map_at_3
            value: 28.874
          - type: map_at_5
            value: 30.246000000000002
          - type: ndcg_at_1
            value: 44.524
          - type: ndcg_at_10
            value: 39.294000000000004
          - type: ndcg_at_100
            value: 43.296
          - type: ndcg_at_1000
            value: 45.561
          - type: ndcg_at_3
            value: 35.013
          - type: ndcg_at_5
            value: 37.177
          - type: precision_at_1
            value: 44.524
          - type: precision_at_10
            value: 8.52
          - type: precision_at_100
            value: 1.169
          - type: precision_at_1000
            value: 0.147
          - type: precision_at_3
            value: 22.003
          - type: precision_at_5
            value: 14.914
          - type: recall_at_1
            value: 22.262
          - type: recall_at_10
            value: 42.6
          - type: recall_at_100
            value: 58.46
          - type: recall_at_1000
            value: 73.565
          - type: recall_at_3
            value: 33.005
          - type: recall_at_5
            value: 37.286
      - task:
          type: Classification
        dataset:
          type: mteb/imdb
          name: MTEB ImdbClassification
          config: default
          split: test
          revision: 8d743909f834c38949e8323a8a6ce8721ea6c7f4
        metrics:
          - type: accuracy
            value: 70.7156
          - type: ap
            value: 64.89470531959896
          - type: f1
            value: 70.53051887683772
      - task:
          type: Retrieval
        dataset:
          type: msmarco
          name: MTEB MSMARCO
          config: default
          split: dev
          revision: e6838a846e2408f22cf5cc337ebc83e0bcf77849
        metrics:
          - type: map_at_1
            value: 21.174
          - type: map_at_10
            value: 33
          - type: map_at_100
            value: 34.178
          - type: map_at_1000
            value: 34.227000000000004
          - type: map_at_3
            value: 29.275000000000002
          - type: map_at_5
            value: 31.341
          - type: ndcg_at_1
            value: 21.776999999999997
          - type: ndcg_at_10
            value: 39.745999999999995
          - type: ndcg_at_100
            value: 45.488
          - type: ndcg_at_1000
            value: 46.733999999999995
          - type: ndcg_at_3
            value: 32.086
          - type: ndcg_at_5
            value: 35.792
          - type: precision_at_1
            value: 21.776999999999997
          - type: precision_at_10
            value: 6.324000000000001
          - type: precision_at_100
            value: 0.922
          - type: precision_at_1000
            value: 0.10300000000000001
          - type: precision_at_3
            value: 13.696
          - type: precision_at_5
            value: 10.100000000000001
          - type: recall_at_1
            value: 21.174
          - type: recall_at_10
            value: 60.488
          - type: recall_at_100
            value: 87.234
          - type: recall_at_1000
            value: 96.806
          - type: recall_at_3
            value: 39.582
          - type: recall_at_5
            value: 48.474000000000004
      - task:
          type: Classification
        dataset:
          type: mteb/mtop_domain
          name: MTEB MTOPDomainClassification (en)
          config: en
          split: test
          revision: a7e2a951126a26fc8c6a69f835f33a346ba259e3
        metrics:
          - type: accuracy
            value: 92.07934336525308
          - type: f1
            value: 91.93440027035814
      - task:
          type: Classification
        dataset:
          type: mteb/mtop_intent
          name: MTEB MTOPIntentClassification (en)
          config: en
          split: test
          revision: 6299947a7777084cc2d4b64235bf7190381ce755
        metrics:
          - type: accuracy
            value: 70.20975832193344
          - type: f1
            value: 48.571776628850074
      - task:
          type: Classification
        dataset:
          type: mteb/amazon_massive_intent
          name: MTEB MassiveIntentClassification (en)
          config: en
          split: test
          revision: 072a486a144adf7f4479a4a0dddb2152e161e1ea
        metrics:
          - type: accuracy
            value: 69.56624075319435
          - type: f1
            value: 67.64419185784621
      - task:
          type: Classification
        dataset:
          type: mteb/amazon_massive_scenario
          name: MTEB MassiveScenarioClassification (en)
          config: en
          split: test
          revision: 7d571f92784cd94a019292a1f45445077d0ef634
        metrics:
          - type: accuracy
            value: 76.01210490921318
          - type: f1
            value: 75.1934366365826
      - task:
          type: Clustering
        dataset:
          type: mteb/medrxiv-clustering-p2p
          name: MTEB MedrxivClusteringP2P
          config: default
          split: test
          revision: dcefc037ef84348e49b0d29109e891c01067226b
        metrics:
          - type: v_measure
            value: 35.58002813186373
      - task:
          type: Clustering
        dataset:
          type: mteb/medrxiv-clustering-s2s
          name: MTEB MedrxivClusteringS2S
          config: default
          split: test
          revision: 3cd0e71dfbe09d4de0f9e5ecba43e7ce280959dc
        metrics:
          - type: v_measure
            value: 32.872725562410444
      - task:
          type: Reranking
        dataset:
          type: mteb/mind_small
          name: MTEB MindSmallReranking
          config: default
          split: test
          revision: 3bdac13927fdc888b903db93b2ffdbd90b295a69
        metrics:
          - type: map
            value: 30.965343604861328
          - type: mrr
            value: 31.933710165863594
      - task:
          type: Retrieval
        dataset:
          type: nfcorpus
          name: MTEB NFCorpus
          config: default
          split: test
          revision: 7eb63cc0c1eb59324d709ebed25fcab851fa7610
        metrics:
          - type: map_at_1
            value: 4.938
          - type: map_at_10
            value: 12.034
          - type: map_at_100
            value: 15.675
          - type: map_at_1000
            value: 17.18
          - type: map_at_3
            value: 8.471
          - type: map_at_5
            value: 10.128
          - type: ndcg_at_1
            value: 40.402
          - type: ndcg_at_10
            value: 33.289
          - type: ndcg_at_100
            value: 31.496000000000002
          - type: ndcg_at_1000
            value: 40.453
          - type: ndcg_at_3
            value: 37.841
          - type: ndcg_at_5
            value: 36.215
          - type: precision_at_1
            value: 41.796
          - type: precision_at_10
            value: 25.294
          - type: precision_at_100
            value: 8.381
          - type: precision_at_1000
            value: 2.1260000000000003
          - type: precision_at_3
            value: 36.429
          - type: precision_at_5
            value: 32.446000000000005
          - type: recall_at_1
            value: 4.938
          - type: recall_at_10
            value: 16.637
          - type: recall_at_100
            value: 33.853
          - type: recall_at_1000
            value: 66.07
          - type: recall_at_3
            value: 9.818
          - type: recall_at_5
            value: 12.544
      - task:
          type: Retrieval
        dataset:
          type: nq
          name: MTEB NQ
          config: default
          split: test
          revision: 6062aefc120bfe8ece5897809fb2e53bfe0d128c
        metrics:
          - type: map_at_1
            value: 27.124
          - type: map_at_10
            value: 42.418
          - type: map_at_100
            value: 43.633
          - type: map_at_1000
            value: 43.66
          - type: map_at_3
            value: 37.766
          - type: map_at_5
            value: 40.482
          - type: ndcg_at_1
            value: 30.794
          - type: ndcg_at_10
            value: 50.449999999999996
          - type: ndcg_at_100
            value: 55.437999999999995
          - type: ndcg_at_1000
            value: 56.084
          - type: ndcg_at_3
            value: 41.678
          - type: ndcg_at_5
            value: 46.257
          - type: precision_at_1
            value: 30.794
          - type: precision_at_10
            value: 8.656
          - type: precision_at_100
            value: 1.141
          - type: precision_at_1000
            value: 0.12
          - type: precision_at_3
            value: 19.37
          - type: precision_at_5
            value: 14.218
          - type: recall_at_1
            value: 27.124
          - type: recall_at_10
            value: 72.545
          - type: recall_at_100
            value: 93.938
          - type: recall_at_1000
            value: 98.788
          - type: recall_at_3
            value: 49.802
          - type: recall_at_5
            value: 60.426
      - task:
          type: Retrieval
        dataset:
          type: quora
          name: MTEB QuoraRetrieval
          config: default
          split: test
          revision: 6205996560df11e3a3da9ab4f926788fc30a7db4
        metrics:
          - type: map_at_1
            value: 69.33500000000001
          - type: map_at_10
            value: 83.554
          - type: map_at_100
            value: 84.237
          - type: map_at_1000
            value: 84.251
          - type: map_at_3
            value: 80.456
          - type: map_at_5
            value: 82.395
          - type: ndcg_at_1
            value: 80.06
          - type: ndcg_at_10
            value: 87.46199999999999
          - type: ndcg_at_100
            value: 88.774
          - type: ndcg_at_1000
            value: 88.864
          - type: ndcg_at_3
            value: 84.437
          - type: ndcg_at_5
            value: 86.129
          - type: precision_at_1
            value: 80.06
          - type: precision_at_10
            value: 13.418
          - type: precision_at_100
            value: 1.536
          - type: precision_at_1000
            value: 0.157
          - type: precision_at_3
            value: 37.103
          - type: precision_at_5
            value: 24.522
          - type: recall_at_1
            value: 69.33500000000001
          - type: recall_at_10
            value: 95.03200000000001
          - type: recall_at_100
            value: 99.559
          - type: recall_at_1000
            value: 99.98700000000001
          - type: recall_at_3
            value: 86.404
          - type: recall_at_5
            value: 91.12400000000001
      - task:
          type: Clustering
        dataset:
          type: mteb/reddit-clustering
          name: MTEB RedditClustering
          config: default
          split: test
          revision: b2805658ae38990172679479369a78b86de8c390
        metrics:
          - type: v_measure
            value: 54.824256698437324
      - task:
          type: Clustering
        dataset:
          type: mteb/reddit-clustering-p2p
          name: MTEB RedditClusteringP2P
          config: default
          split: test
          revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
        metrics:
          - type: v_measure
            value: 56.768972678049366
      - task:
          type: Retrieval
        dataset:
          type: scidocs
          name: MTEB SCIDOCS
          config: default
          split: test
          revision: 5c59ef3e437a0a9651c8fe6fde943e7dce59fba5
        metrics:
          - type: map_at_1
            value: 5.192
          - type: map_at_10
            value: 14.426
          - type: map_at_100
            value: 17.18
          - type: map_at_1000
            value: 17.580000000000002
          - type: map_at_3
            value: 9.94
          - type: map_at_5
            value: 12.077
          - type: ndcg_at_1
            value: 25.5
          - type: ndcg_at_10
            value: 23.765
          - type: ndcg_at_100
            value: 33.664
          - type: ndcg_at_1000
            value: 39.481
          - type: ndcg_at_3
            value: 21.813
          - type: ndcg_at_5
            value: 19.285
          - type: precision_at_1
            value: 25.5
          - type: precision_at_10
            value: 12.690000000000001
          - type: precision_at_100
            value: 2.71
          - type: precision_at_1000
            value: 0.409
          - type: precision_at_3
            value: 20.732999999999997
          - type: precision_at_5
            value: 17.24
          - type: recall_at_1
            value: 5.192
          - type: recall_at_10
            value: 25.712000000000003
          - type: recall_at_100
            value: 54.99699999999999
          - type: recall_at_1000
            value: 82.97200000000001
          - type: recall_at_3
            value: 12.631999999999998
          - type: recall_at_5
            value: 17.497
      - task:
          type: STS
        dataset:
          type: mteb/sickr-sts
          name: MTEB SICK-R
          config: default
          split: test
          revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
        metrics:
          - type: cos_sim_pearson
            value: 84.00280838354293
          - type: cos_sim_spearman
            value: 80.5854192844009
          - type: euclidean_pearson
            value: 80.55974827073891
          - type: euclidean_spearman
            value: 80.58541460172292
          - type: manhattan_pearson
            value: 80.27294578437488
          - type: manhattan_spearman
            value: 80.33176193921884
      - task:
          type: STS
        dataset:
          type: mteb/sts12-sts
          name: MTEB STS12
          config: default
          split: test
          revision: fdf84275bb8ce4b49c971d02e84dd1abc677a50f
        metrics:
          - type: cos_sim_pearson
            value: 83.2801353818369
          - type: cos_sim_spearman
            value: 72.63427853822449
          - type: euclidean_pearson
            value: 79.01343235899544
          - type: euclidean_spearman
            value: 72.63178302036903
          - type: manhattan_pearson
            value: 78.65899981586094
          - type: manhattan_spearman
            value: 72.26646573268035
      - task:
          type: STS
        dataset:
          type: mteb/sts13-sts
          name: MTEB STS13
          config: default
          split: test
          revision: 1591bfcbe8c69d4bf7fe2a16e2451017832cafb9
        metrics:
          - type: cos_sim_pearson
            value: 83.20700572036095
          - type: cos_sim_spearman
            value: 83.48499016384896
          - type: euclidean_pearson
            value: 82.82555353364394
          - type: euclidean_spearman
            value: 83.48499008964005
          - type: manhattan_pearson
            value: 82.46034885462956
          - type: manhattan_spearman
            value: 83.09829447251937
      - task:
          type: STS
        dataset:
          type: mteb/sts14-sts
          name: MTEB STS14
          config: default
          split: test
          revision: e2125984e7df8b7871f6ae9949cf6b6795e7c54b
        metrics:
          - type: cos_sim_pearson
            value: 82.27113025749529
          - type: cos_sim_spearman
            value: 78.0001371342168
          - type: euclidean_pearson
            value: 80.62651938409732
          - type: euclidean_spearman
            value: 78.0001341029446
          - type: manhattan_pearson
            value: 80.25786381999085
          - type: manhattan_spearman
            value: 77.68750207429126
      - task:
          type: STS
        dataset:
          type: mteb/sts15-sts
          name: MTEB STS15
          config: default
          split: test
          revision: 1cd7298cac12a96a373b6a2f18738bb3e739a9b6
        metrics:
          - type: cos_sim_pearson
            value: 84.98824030948605
          - type: cos_sim_spearman
            value: 85.66275391649481
          - type: euclidean_pearson
            value: 84.88733530073506
          - type: euclidean_spearman
            value: 85.66275062257034
          - type: manhattan_pearson
            value: 84.70100813924223
          - type: manhattan_spearman
            value: 85.50318526944764
      - task:
          type: STS
        dataset:
          type: mteb/sts16-sts
          name: MTEB STS16
          config: default
          split: test
          revision: 360a0b2dff98700d09e634a01e1cc1624d3e42cd
        metrics:
          - type: cos_sim_pearson
            value: 78.82478639193744
          - type: cos_sim_spearman
            value: 80.03011315645662
          - type: euclidean_pearson
            value: 79.84794502236802
          - type: euclidean_spearman
            value: 80.03011258077692
          - type: manhattan_pearson
            value: 79.47012152325492
          - type: manhattan_spearman
            value: 79.60652985087651
      - task:
          type: STS
        dataset:
          type: mteb/sts17-crosslingual-sts
          name: MTEB STS17 (en-en)
          config: en-en
          split: test
          revision: 9fc37e8c632af1c87a3d23e685d49552a02582a0
        metrics:
          - type: cos_sim_pearson
            value: 90.90804154377126
          - type: cos_sim_spearman
            value: 90.59523263123734
          - type: euclidean_pearson
            value: 89.8466957775513
          - type: euclidean_spearman
            value: 90.59523263123734
          - type: manhattan_pearson
            value: 89.82268413033941
          - type: manhattan_spearman
            value: 90.68706496728889
      - task:
          type: STS
        dataset:
          type: mteb/sts22-crosslingual-sts
          name: MTEB STS22 (en)
          config: en
          split: test
          revision: 2de6ce8c1921b71a755b262c6b57fef195dd7906
        metrics:
          - type: cos_sim_pearson
            value: 66.78771571400975
          - type: cos_sim_spearman
            value: 67.94534221542501
          - type: euclidean_pearson
            value: 68.62534447097993
          - type: euclidean_spearman
            value: 67.94534221542501
          - type: manhattan_pearson
            value: 68.35916011329631
          - type: manhattan_spearman
            value: 67.58212723406085
      - task:
          type: STS
        dataset:
          type: mteb/stsbenchmark-sts
          name: MTEB STSBenchmark
          config: default
          split: test
          revision: 8913289635987208e6e7c72789e4be2fe94b6abd
        metrics:
          - type: cos_sim_pearson
            value: 84.03996099800993
          - type: cos_sim_spearman
            value: 83.421898505618
          - type: euclidean_pearson
            value: 83.78671249317563
          - type: euclidean_spearman
            value: 83.4219042133061
          - type: manhattan_pearson
            value: 83.44085827249334
          - type: manhattan_spearman
            value: 83.02901331535297
      - task:
          type: Reranking
        dataset:
          type: mteb/scidocs-reranking
          name: MTEB SciDocsRR
          config: default
          split: test
          revision: 56a6d0140cf6356659e2a7c1413286a774468d44
        metrics:
          - type: map
            value: 88.65396986895777
          - type: mrr
            value: 96.60209525405604
      - task:
          type: Retrieval
        dataset:
          type: scifact
          name: MTEB SciFact
          config: default
          split: test
          revision: a75ae049398addde9b70f6b268875f5cbce99089
        metrics:
          - type: map_at_1
            value: 51.456
          - type: map_at_10
            value: 60.827
          - type: map_at_100
            value: 61.595
          - type: map_at_1000
            value: 61.629999999999995
          - type: map_at_3
            value: 57.518
          - type: map_at_5
            value: 59.435
          - type: ndcg_at_1
            value: 53.333
          - type: ndcg_at_10
            value: 65.57
          - type: ndcg_at_100
            value: 68.911
          - type: ndcg_at_1000
            value: 69.65299999999999
          - type: ndcg_at_3
            value: 60.009
          - type: ndcg_at_5
            value: 62.803
          - type: precision_at_1
            value: 53.333
          - type: precision_at_10
            value: 8.933
          - type: precision_at_100
            value: 1.0699999999999998
          - type: precision_at_1000
            value: 0.11299999999999999
          - type: precision_at_3
            value: 23.333000000000002
          - type: precision_at_5
            value: 15.8
          - type: recall_at_1
            value: 51.456
          - type: recall_at_10
            value: 79.011
          - type: recall_at_100
            value: 94.167
          - type: recall_at_1000
            value: 99.667
          - type: recall_at_3
            value: 64.506
          - type: recall_at_5
            value: 71.211
      - task:
          type: PairClassification
        dataset:
          type: mteb/sprintduplicatequestions-pairclassification
          name: MTEB SprintDuplicateQuestions
          config: default
          split: test
          revision: 5a8256d0dff9c4bd3be3ba3e67e4e70173f802ea
        metrics:
          - type: cos_sim_accuracy
            value: 99.65940594059406
          - type: cos_sim_ap
            value: 90.1455141683116
          - type: cos_sim_f1
            value: 82.26044226044226
          - type: cos_sim_precision
            value: 80.8695652173913
          - type: cos_sim_recall
            value: 83.7
          - type: dot_accuracy
            value: 99.65940594059406
          - type: dot_ap
            value: 90.1455141683116
          - type: dot_f1
            value: 82.26044226044226
          - type: dot_precision
            value: 80.8695652173913
          - type: dot_recall
            value: 83.7
          - type: euclidean_accuracy
            value: 99.65940594059406
          - type: euclidean_ap
            value: 90.14551416831162
          - type: euclidean_f1
            value: 82.26044226044226
          - type: euclidean_precision
            value: 80.8695652173913
          - type: euclidean_recall
            value: 83.7
          - type: manhattan_accuracy
            value: 99.64950495049504
          - type: manhattan_ap
            value: 89.5492617367771
          - type: manhattan_f1
            value: 81.58280410356619
          - type: manhattan_precision
            value: 79.75167144221585
          - type: manhattan_recall
            value: 83.5
          - type: max_accuracy
            value: 99.65940594059406
          - type: max_ap
            value: 90.14551416831162
          - type: max_f1
            value: 82.26044226044226
      - task:
          type: Clustering
        dataset:
          type: mteb/stackexchange-clustering
          name: MTEB StackExchangeClustering
          config: default
          split: test
          revision: 70a89468f6dccacc6aa2b12a6eac54e74328f235
        metrics:
          - type: v_measure
            value: 53.80048409076929
      - task:
          type: Clustering
        dataset:
          type: mteb/stackexchange-clustering-p2p
          name: MTEB StackExchangeClusteringP2P
          config: default
          split: test
          revision: d88009ab563dd0b16cfaf4436abaf97fa3550cf0
        metrics:
          - type: v_measure
            value: 34.280269334397545
      - task:
          type: Reranking
        dataset:
          type: mteb/stackoverflowdupquestions-reranking
          name: MTEB StackOverflowDupQuestions
          config: default
          split: test
          revision: ef807ea29a75ec4f91b50fd4191cb4ee4589a9f9
        metrics:
          - type: map
            value: 51.97907654945493
          - type: mrr
            value: 52.82873376623376
      - task:
          type: Summarization
        dataset:
          type: mteb/summeval
          name: MTEB SummEval
          config: default
          split: test
          revision: 8753c2788d36c01fc6f05d03fe3f7268d63f9122
        metrics:
          - type: cos_sim_pearson
            value: 28.364293841556304
          - type: cos_sim_spearman
            value: 27.485869639926136
          - type: dot_pearson
            value: 28.364295910221145
          - type: dot_spearman
            value: 27.485869639926136
      - task:
          type: Retrieval
        dataset:
          type: trec-covid
          name: MTEB TRECCOVID
          config: default
          split: test
          revision: 2c8041b2c07a79b6f7ba8fe6acc72e5d9f92d217
        metrics:
          - type: map_at_1
            value: 0.19499999999999998
          - type: map_at_10
            value: 1.218
          - type: map_at_100
            value: 7.061000000000001
          - type: map_at_1000
            value: 19.735
          - type: map_at_3
            value: 0.46499999999999997
          - type: map_at_5
            value: 0.672
          - type: ndcg_at_1
            value: 60
          - type: ndcg_at_10
            value: 51.32600000000001
          - type: ndcg_at_100
            value: 41.74
          - type: ndcg_at_1000
            value: 43.221
          - type: ndcg_at_3
            value: 54.989
          - type: ndcg_at_5
            value: 52.905
          - type: precision_at_1
            value: 66
          - type: precision_at_10
            value: 55.60000000000001
          - type: precision_at_100
            value: 43.34
          - type: precision_at_1000
            value: 19.994
          - type: precision_at_3
            value: 59.333000000000006
          - type: precision_at_5
            value: 57.199999999999996
          - type: recall_at_1
            value: 0.19499999999999998
          - type: recall_at_10
            value: 1.473
          - type: recall_at_100
            value: 10.596
          - type: recall_at_1000
            value: 42.466
          - type: recall_at_3
            value: 0.49899999999999994
          - type: recall_at_5
            value: 0.76
      - task:
          type: Retrieval
        dataset:
          type: webis-touche2020
          name: MTEB Touche2020
          config: default
          split: test
          revision: 527b7d77e16e343303e68cb6af11d6e18b9f7b3b
        metrics:
          - type: map_at_1
            value: 1.997
          - type: map_at_10
            value: 7.5569999999999995
          - type: map_at_100
            value: 12.238
          - type: map_at_1000
            value: 13.773
          - type: map_at_3
            value: 4.334
          - type: map_at_5
            value: 5.5
          - type: ndcg_at_1
            value: 22.448999999999998
          - type: ndcg_at_10
            value: 19.933999999999997
          - type: ndcg_at_100
            value: 30.525999999999996
          - type: ndcg_at_1000
            value: 43.147999999999996
          - type: ndcg_at_3
            value: 22.283
          - type: ndcg_at_5
            value: 21.224
          - type: precision_at_1
            value: 24.490000000000002
          - type: precision_at_10
            value: 17.551
          - type: precision_at_100
            value: 6.4079999999999995
          - type: precision_at_1000
            value: 1.463
          - type: precision_at_3
            value: 23.128999999999998
          - type: precision_at_5
            value: 20.816000000000003
          - type: recall_at_1
            value: 1.997
          - type: recall_at_10
            value: 13.001999999999999
          - type: recall_at_100
            value: 40.98
          - type: recall_at_1000
            value: 79.40899999999999
          - type: recall_at_3
            value: 5.380999999999999
          - type: recall_at_5
            value: 7.721
      - task:
          type: Classification
        dataset:
          type: mteb/toxic_conversations_50k
          name: MTEB ToxicConversationsClassification
          config: default
          split: test
          revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
        metrics:
          - type: accuracy
            value: 60.861200000000004
          - type: ap
            value: 11.39641747026629
          - type: f1
            value: 47.80230380517065
      - task:
          type: Classification
        dataset:
          type: mteb/tweet_sentiment_extraction
          name: MTEB TweetSentimentExtractionClassification
          config: default
          split: test
          revision: 62146448f05be9e52a36b8ee9936447ea787eede
        metrics:
          - type: accuracy
            value: 55.464063384267114
          - type: f1
            value: 55.759039643764666
      - task:
          type: Clustering
        dataset:
          type: mteb/twentynewsgroups-clustering
          name: MTEB TwentyNewsgroupsClustering
          config: default
          split: test
          revision: 091a54f9a36281ce7d6590ec8c75dd485e7e01d4
        metrics:
          - type: v_measure
            value: 49.74455348083809
      - task:
          type: PairClassification
        dataset:
          type: mteb/twittersemeval2015-pairclassification
          name: MTEB TwitterSemEval2015
          config: default
          split: test
          revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
        metrics:
          - type: cos_sim_accuracy
            value: 86.07617571675507
          - type: cos_sim_ap
            value: 73.85398650568216
          - type: cos_sim_f1
            value: 68.50702798531087
          - type: cos_sim_precision
            value: 65.86316045775506
          - type: cos_sim_recall
            value: 71.37203166226914
          - type: dot_accuracy
            value: 86.07617571675507
          - type: dot_ap
            value: 73.85398346238429
          - type: dot_f1
            value: 68.50702798531087
          - type: dot_precision
            value: 65.86316045775506
          - type: dot_recall
            value: 71.37203166226914
          - type: euclidean_accuracy
            value: 86.07617571675507
          - type: euclidean_ap
            value: 73.85398625060357
          - type: euclidean_f1
            value: 68.50702798531087
          - type: euclidean_precision
            value: 65.86316045775506
          - type: euclidean_recall
            value: 71.37203166226914
          - type: manhattan_accuracy
            value: 85.98676759849795
          - type: manhattan_ap
            value: 73.86874126878737
          - type: manhattan_f1
            value: 68.55096559662361
          - type: manhattan_precision
            value: 66.51774633904195
          - type: manhattan_recall
            value: 70.71240105540898
          - type: max_accuracy
            value: 86.07617571675507
          - type: max_ap
            value: 73.86874126878737
          - type: max_f1
            value: 68.55096559662361
      - task:
          type: PairClassification
        dataset:
          type: mteb/twitterurlcorpus-pairclassification
          name: MTEB TwitterURLCorpus
          config: default
          split: test
          revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
        metrics:
          - type: cos_sim_accuracy
            value: 88.51631932316529
          - type: cos_sim_ap
            value: 85.10831084479727
          - type: cos_sim_f1
            value: 77.14563397129186
          - type: cos_sim_precision
            value: 74.9709386806161
          - type: cos_sim_recall
            value: 79.45026178010471
          - type: dot_accuracy
            value: 88.51631932316529
          - type: dot_ap
            value: 85.10831188797107
          - type: dot_f1
            value: 77.14563397129186
          - type: dot_precision
            value: 74.9709386806161
          - type: dot_recall
            value: 79.45026178010471
          - type: euclidean_accuracy
            value: 88.51631932316529
          - type: euclidean_ap
            value: 85.10829618408616
          - type: euclidean_f1
            value: 77.14563397129186
          - type: euclidean_precision
            value: 74.9709386806161
          - type: euclidean_recall
            value: 79.45026178010471
          - type: manhattan_accuracy
            value: 88.50467652423643
          - type: manhattan_ap
            value: 85.08329502055064
          - type: manhattan_f1
            value: 77.11157455683002
          - type: manhattan_precision
            value: 74.67541834968263
          - type: manhattan_recall
            value: 79.71204188481676
          - type: max_accuracy
            value: 88.51631932316529
          - type: max_ap
            value: 85.10831188797107
          - type: max_f1
            value: 77.14563397129186

all-mpnet-base-v2

This is a sentence-transformers model: It maps sentences & paragraphs to a 768 dimensional dense vector space and can be used for tasks like clustering or semantic search.

Usage (Sentence-Transformers)

Using this model becomes easy when you have sentence-transformers installed:

pip install -U sentence-transformers

Then you can use the model like this:

from sentence_transformers import SentenceTransformer
sentences = ["This is an example sentence", "Each sentence is converted"]

model = SentenceTransformer('sentence-transformers/all-mpnet-base-v2')
embeddings = model.encode(sentences)
print(embeddings)

Usage (HuggingFace Transformers)

Without sentence-transformers, you can use the model like this: First, you pass your input through the transformer model, then you have to apply the right pooling-operation on-top of the contextualized word embeddings.

from transformers import AutoTokenizer, AutoModel
import torch
import torch.nn.functional as F

#Mean Pooling - Take attention mask into account for correct averaging
def mean_pooling(model_output, attention_mask):
    token_embeddings = model_output[0] #First element of model_output contains all token embeddings
    input_mask_expanded = attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
    return torch.sum(token_embeddings * input_mask_expanded, 1) / torch.clamp(input_mask_expanded.sum(1), min=1e-9)


# Sentences we want sentence embeddings for
sentences = ['This is an example sentence', 'Each sentence is converted']

# Load model from HuggingFace Hub
tokenizer = AutoTokenizer.from_pretrained('sentence-transformers/all-mpnet-base-v2')
model = AutoModel.from_pretrained('sentence-transformers/all-mpnet-base-v2')

# Tokenize sentences
encoded_input = tokenizer(sentences, padding=True, truncation=True, return_tensors='pt')

# Compute token embeddings
with torch.no_grad():
    model_output = model(**encoded_input)

# Perform pooling
sentence_embeddings = mean_pooling(model_output, encoded_input['attention_mask'])

# Normalize embeddings
sentence_embeddings = F.normalize(sentence_embeddings, p=2, dim=1)

print("Sentence embeddings:")
print(sentence_embeddings)

Evaluation Results

For an automated evaluation of this model, see MTEB: https://huggingface.co/spaces/mteb/leaderboard or the Sentence Embeddings Benchmark: https://seb.sbert.net

Background

The project aims to train sentence embedding models on very large sentence level datasets using a self-supervised contrastive learning objective. We used the pretrained microsoft/mpnet-base model and fine-tuned in on a 1B sentence pairs dataset. We use a contrastive learning objective: given a sentence from the pair, the model should predict which out of a set of randomly sampled other sentences, was actually paired with it in our dataset.

We developped this model during the Community week using JAX/Flax for NLP & CV, organized by Hugging Face. We developped this model as part of the project: Train the Best Sentence Embedding Model Ever with 1B Training Pairs. We benefited from efficient hardware infrastructure to run the project: 7 TPUs v3-8, as well as intervention from Googles Flax, JAX, and Cloud team member about efficient deep learning frameworks.

Intended uses

Our model is intented to be used as a sentence and short paragraph encoder. Given an input text, it ouptuts a vector which captures the semantic information. The sentence vector may be used for information retrieval, clustering or sentence similarity tasks.

By default, input text longer than 384 word pieces is truncated.

Training procedure

Pre-training

We use the pretrained microsoft/mpnet-base model. Please refer to the model card for more detailed information about the pre-training procedure.

Fine-tuning

We fine-tune the model using a contrastive objective. Formally, we compute the cosine similarity from each possible sentence pairs from the batch. We then apply the cross entropy loss by comparing with true pairs.

Hyper parameters

We trained ou model on a TPU v3-8. We train the model during 100k steps using a batch size of 1024 (128 per TPU core). We use a learning rate warm up of 500. The sequence length was limited to 128 tokens. We used the AdamW optimizer with a 2e-5 learning rate. The full training script is accessible in this current repository: train_script.py.

Training data

We use the concatenation from multiple datasets to fine-tune our model. The total number of sentence pairs is above 1 billion sentences. We sampled each dataset given a weighted probability which configuration is detailed in the data_config.json file.

Dataset	Paper	Number of training tuples
Reddit comments (2015-2018)	paper	726,484,430
S2ORC Citation pairs (Abstracts)	paper	116,288,806
WikiAnswers Duplicate question pairs	paper	77,427,422
PAQ (Question, Answer) pairs	paper	64,371,441
S2ORC Citation pairs (Titles)	paper	52,603,982
S2ORC (Title, Abstract)	paper	41,769,185
Stack Exchange (Title, Body) pairs	-	25,316,456
Stack Exchange (Title+Body, Answer) pairs	-	21,396,559
Stack Exchange (Title, Answer) pairs	-	21,396,559
MS MARCO triplets	paper	9,144,553
GOOAQ: Open Question Answering with Diverse Answer Types	paper	3,012,496
Yahoo Answers (Title, Answer)	paper	1,198,260
Code Search	-	1,151,414
COCO Image captions	paper	828,395
SPECTER citation triplets	paper	684,100
Yahoo Answers (Question, Answer)	paper	681,164
Yahoo Answers (Title, Question)	paper	659,896
SearchQA	paper	582,261
Eli5	paper	325,475
Flickr 30k	paper	317,695
Stack Exchange Duplicate questions (titles)		304,525
AllNLI (SNLI and MultiNLI	paper SNLI, paper MultiNLI	277,230
Stack Exchange Duplicate questions (bodies)		250,519
Stack Exchange Duplicate questions (titles+bodies)		250,460
Sentence Compression	paper	180,000
Wikihow	paper	128,542
Altlex	paper	112,696
Quora Question Triplets	-	103,663
Simple Wikipedia	paper	102,225
Natural Questions (NQ)	paper	100,231
SQuAD2.0	paper	87,599
TriviaQA	-	73,346
Total		1,170,060,424