Spaces:
Running
Running
Merge pull request #7 from embeddings-benchmark/fix_pawsx
Browse files
boards_data/en/data_overall/default.jsonl
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{"index":91,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Salesforce\/SFR-Embedding-2_R\">SFR-Embedding-2_R<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":70.31,"Classification Average (12 datasets)":89.05,"Clustering Average (11 datasets)":56.17,"PairClassification Average (3 datasets)":88.07,"Reranking Average (4 datasets)":60.14,"Retrieval Average (15 datasets)":60.18,"STS Average (10 datasets)":81.26,"Summarization Average (1 datasets)":30.71}
|
2 |
-
{"index":16,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":
|
3 |
{"index":48,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Intel\/neural-embedding-v1\">neural-embedding-v1<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":69.94,"Classification Average (12 datasets)":87.91,"Clustering Average (11 datasets)":54.32,"PairClassification Average (3 datasets)":87.68,"Reranking Average (4 datasets)":61.49,"Retrieval Average (15 datasets)":58.12,"STS Average (10 datasets)":85.24,"Summarization Average (1 datasets)":30.87}
|
4 |
{"index":197,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/nvidia\/NV-Embed-v1\">NV-Embed-v1<\/a>","Model Size (Million Parameters)":7851,"Memory Usage (GB, fp32)":29.25,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":69.32,"Classification Average (12 datasets)":87.35,"Clustering Average (11 datasets)":52.8,"PairClassification Average (3 datasets)":86.91,"Reranking Average (4 datasets)":60.54,"Retrieval Average (15 datasets)":59.36,"STS Average (10 datasets)":82.84,"Summarization Average (1 datasets)":31.2}
|
5 |
{"index":6,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-large-2-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":16000,"Average (56 datasets)":68.28,"Classification Average (12 datasets)":81.49,"Clustering Average (11 datasets)":53.35,"PairClassification Average (3 datasets)":89.24,"Reranking Average (4 datasets)":60.09,"Retrieval Average (15 datasets)":58.28,"STS Average (10 datasets)":84.58,"Summarization Average (1 datasets)":30.84}
|
6 |
{"index":54,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Linq-AI-Research\/Linq-Embed-Mistral\">Linq-Embed-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":68.17,"Classification Average (12 datasets)":80.2,"Clustering Average (11 datasets)":51.42,"PairClassification Average (3 datasets)":88.35,"Reranking Average (4 datasets)":60.29,"Retrieval Average (15 datasets)":60.19,"STS Average (10 datasets)":84.97,"Summarization Average (1 datasets)":30.98}
|
7 |
{"index":92,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Salesforce\/SFR-Embedding-Mistral\">SFR-Embedding-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":67.56,"Classification Average (12 datasets)":78.33,"Clustering Average (11 datasets)":51.67,"PairClassification Average (3 datasets)":88.54,"Reranking Average (4 datasets)":60.64,"Retrieval Average (15 datasets)":59.0,"STS Average (10 datasets)":85.05,"Summarization Average (1 datasets)":31.16}
|
8 |
{"index":14,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen1.5-7B-instruct\">gte-Qwen1.5-7B-instruct<\/a>","Model Size (Million Parameters)":7099,"Memory Usage (GB, fp32)":26.45,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":67.34,"Classification Average (12 datasets)":79.6,"Clustering Average (11 datasets)":55.83,"PairClassification Average (3 datasets)":87.38,"Reranking Average (4 datasets)":60.13,"Retrieval Average (15 datasets)":56.24,"STS Average (10 datasets)":82.42,"Summarization Average (1 datasets)":31.46}
|
9 |
-
{"index":15,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":
|
10 |
{"index":9,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-lite-02-instruct<\/a>","Model Size (Million Parameters)":1220,"Memory Usage (GB, fp32)":4.54,"Embedding Dimensions":1024,"Max Tokens":4000,"Average (56 datasets)":67.13,"Classification Average (12 datasets)":79.25,"Clustering Average (11 datasets)":52.42,"PairClassification Average (3 datasets)":86.87,"Reranking Average (4 datasets)":58.24,"Retrieval Average (15 datasets)":56.6,"STS Average (10 datasets)":85.79,"Summarization Average (1 datasets)":31.01}
|
11 |
{"index":39,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7242,"Memory Usage (GB, fp32)":26.98,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":66.76,"Classification Average (12 datasets)":79.46,"Clustering Average (11 datasets)":50.61,"PairClassification Average (3 datasets)":87.16,"Reranking Average (4 datasets)":60.49,"Retrieval Average (15 datasets)":57.41,"STS Average (10 datasets)":83.35,"Summarization Average (1 datasets)":30.37}
|
12 |
{"index":142,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":66.63,"Classification Average (12 datasets)":78.47,"Clustering Average (11 datasets)":50.26,"PairClassification Average (3 datasets)":88.34,"Reranking Average (4 datasets)":60.21,"Retrieval Average (15 datasets)":56.89,"STS Average (10 datasets)":84.63,"Summarization Average (1 datasets)":31.4}
|
|
|
1 |
{"index":91,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Salesforce\/SFR-Embedding-2_R\">SFR-Embedding-2_R<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":70.31,"Classification Average (12 datasets)":89.05,"Clustering Average (11 datasets)":56.17,"PairClassification Average (3 datasets)":88.07,"Reranking Average (4 datasets)":60.14,"Retrieval Average (15 datasets)":60.18,"STS Average (10 datasets)":81.26,"Summarization Average (1 datasets)":30.71}
|
2 |
+
{"index":16,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":32768,"Average (56 datasets)":70.24,"Classification Average (12 datasets)":86.58,"Clustering Average (11 datasets)":56.92,"PairClassification Average (3 datasets)":85.79,"Reranking Average (4 datasets)":61.42,"Retrieval Average (15 datasets)":60.25,"STS Average (10 datasets)":83.04,"Summarization Average (1 datasets)":31.35}
|
3 |
{"index":48,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Intel\/neural-embedding-v1\">neural-embedding-v1<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (56 datasets)":69.94,"Classification Average (12 datasets)":87.91,"Clustering Average (11 datasets)":54.32,"PairClassification Average (3 datasets)":87.68,"Reranking Average (4 datasets)":61.49,"Retrieval Average (15 datasets)":58.12,"STS Average (10 datasets)":85.24,"Summarization Average (1 datasets)":30.87}
|
4 |
{"index":197,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/nvidia\/NV-Embed-v1\">NV-Embed-v1<\/a>","Model Size (Million Parameters)":7851,"Memory Usage (GB, fp32)":29.25,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":69.32,"Classification Average (12 datasets)":87.35,"Clustering Average (11 datasets)":52.8,"PairClassification Average (3 datasets)":86.91,"Reranking Average (4 datasets)":60.54,"Retrieval Average (15 datasets)":59.36,"STS Average (10 datasets)":82.84,"Summarization Average (1 datasets)":31.2}
|
5 |
{"index":6,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-large-2-instruct<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":16000,"Average (56 datasets)":68.28,"Classification Average (12 datasets)":81.49,"Clustering Average (11 datasets)":53.35,"PairClassification Average (3 datasets)":89.24,"Reranking Average (4 datasets)":60.09,"Retrieval Average (15 datasets)":58.28,"STS Average (10 datasets)":84.58,"Summarization Average (1 datasets)":30.84}
|
6 |
{"index":54,"Rank":6,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Linq-AI-Research\/Linq-Embed-Mistral\">Linq-Embed-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":68.17,"Classification Average (12 datasets)":80.2,"Clustering Average (11 datasets)":51.42,"PairClassification Average (3 datasets)":88.35,"Reranking Average (4 datasets)":60.29,"Retrieval Average (15 datasets)":60.19,"STS Average (10 datasets)":84.97,"Summarization Average (1 datasets)":30.98}
|
7 |
{"index":92,"Rank":7,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Salesforce\/SFR-Embedding-Mistral\">SFR-Embedding-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":67.56,"Classification Average (12 datasets)":78.33,"Clustering Average (11 datasets)":51.67,"PairClassification Average (3 datasets)":88.54,"Reranking Average (4 datasets)":60.64,"Retrieval Average (15 datasets)":59.0,"STS Average (10 datasets)":85.05,"Summarization Average (1 datasets)":31.16}
|
8 |
{"index":14,"Rank":8,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen1.5-7B-instruct\">gte-Qwen1.5-7B-instruct<\/a>","Model Size (Million Parameters)":7099,"Memory Usage (GB, fp32)":26.45,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":67.34,"Classification Average (12 datasets)":79.6,"Clustering Average (11 datasets)":55.83,"PairClassification Average (3 datasets)":87.38,"Reranking Average (4 datasets)":60.13,"Retrieval Average (15 datasets)":56.24,"STS Average (10 datasets)":82.42,"Summarization Average (1 datasets)":31.46}
|
9 |
+
{"index":15,"Rank":9,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":67.16,"Classification Average (12 datasets)":82.47,"Clustering Average (11 datasets)":48.75,"PairClassification Average (3 datasets)":87.51,"Reranking Average (4 datasets)":59.98,"Retrieval Average (15 datasets)":58.29,"STS Average (10 datasets)":82.73,"Summarization Average (1 datasets)":31.17}
|
10 |
{"index":9,"Rank":10,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-lite-02-instruct<\/a>","Model Size (Million Parameters)":1220,"Memory Usage (GB, fp32)":4.54,"Embedding Dimensions":1024,"Max Tokens":4000,"Average (56 datasets)":67.13,"Classification Average (12 datasets)":79.25,"Clustering Average (11 datasets)":52.42,"PairClassification Average (3 datasets)":86.87,"Reranking Average (4 datasets)":58.24,"Retrieval Average (15 datasets)":56.6,"STS Average (10 datasets)":85.79,"Summarization Average (1 datasets)":31.01}
|
11 |
{"index":39,"Rank":11,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/GritLM\/GritLM-7B\">GritLM-7B<\/a>","Model Size (Million Parameters)":7242,"Memory Usage (GB, fp32)":26.98,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":66.76,"Classification Average (12 datasets)":79.46,"Clustering Average (11 datasets)":50.61,"PairClassification Average (3 datasets)":87.16,"Reranking Average (4 datasets)":60.49,"Retrieval Average (15 datasets)":57.41,"STS Average (10 datasets)":83.35,"Summarization Average (1 datasets)":30.37}
|
12 |
{"index":142,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/intfloat\/e5-mistral-7b-instruct\">e5-mistral-7b-instruct<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (56 datasets)":66.63,"Classification Average (12 datasets)":78.47,"Clustering Average (11 datasets)":50.26,"PairClassification Average (3 datasets)":88.34,"Reranking Average (4 datasets)":60.21,"Retrieval Average (15 datasets)":56.89,"STS Average (10 datasets)":84.63,"Summarization Average (1 datasets)":31.4}
|
boards_data/fr/data_overall/default.jsonl
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
-
{"index":9,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":
|
2 |
-
{"index":8,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":
|
3 |
{"index":4,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-multilingual-2<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":32000,"Average (26 datasets)":61.65,"Classification Average (6 datasets)":68.56,"Clustering Average (7 datasets)":46.57,"PairClassification Average (2 datasets)":78.66,"Reranking Average (2 datasets)":82.59,"Retrieval Average (5 datasets)":54.56,"STS Average (3 datasets)":80.13,"Summarization Average (1 datasets)":29.96}
|
4 |
{"index":3,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-law-2<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":16000,"Average (26 datasets)":60.58,"Classification Average (6 datasets)":68.45,"Clustering Average (7 datasets)":44.23,"PairClassification Average (2 datasets)":77.3,"Reranking Average (2 datasets)":82.06,"Retrieval Average (5 datasets)":52.98,"STS Average (3 datasets)":80.29,"Summarization Average (1 datasets)":30.34}
|
5 |
{"index":0,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.mistral.ai\/guides\/embeddings\">mistral-embed<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":"","Average (26 datasets)":59.41,"Classification Average (6 datasets)":68.61,"Clustering Average (7 datasets)":44.74,"PairClassification Average (2 datasets)":77.32,"Reranking Average (2 datasets)":80.46,"Retrieval Average (5 datasets)":46.81,"STS Average (3 datasets)":79.56,"Summarization Average (1 datasets)":31.47}
|
|
|
1 |
+
{"index":9,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":32768,"Average (26 datasets)":68.25,"Classification Average (6 datasets)":81.76,"Clustering Average (7 datasets)":55.56,"PairClassification Average (2 datasets)":90.43,"Reranking Average (2 datasets)":78.7,"Retrieval Average (5 datasets)":55.65,"STS Average (3 datasets)":82.31,"Summarization Average (1 datasets)":31.45}
|
2 |
+
{"index":8,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (26 datasets)":66.6,"Classification Average (6 datasets)":78.02,"Clustering Average (7 datasets)":55.01,"PairClassification Average (2 datasets)":86.88,"Reranking Average (2 datasets)":83.76,"Retrieval Average (5 datasets)":52.56,"STS Average (3 datasets)":81.26,"Summarization Average (1 datasets)":30.5}
|
3 |
{"index":4,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-multilingual-2<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":32000,"Average (26 datasets)":61.65,"Classification Average (6 datasets)":68.56,"Clustering Average (7 datasets)":46.57,"PairClassification Average (2 datasets)":78.66,"Reranking Average (2 datasets)":82.59,"Retrieval Average (5 datasets)":54.56,"STS Average (3 datasets)":80.13,"Summarization Average (1 datasets)":29.96}
|
4 |
{"index":3,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.voyageai.com\/embeddings\/\">voyage-law-2<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":16000,"Average (26 datasets)":60.58,"Classification Average (6 datasets)":68.45,"Clustering Average (7 datasets)":44.23,"PairClassification Average (2 datasets)":77.3,"Reranking Average (2 datasets)":82.06,"Retrieval Average (5 datasets)":52.98,"STS Average (3 datasets)":80.29,"Summarization Average (1 datasets)":30.34}
|
5 |
{"index":0,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/docs.mistral.ai\/guides\/embeddings\">mistral-embed<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":"","Average (26 datasets)":59.41,"Classification Average (6 datasets)":68.61,"Clustering Average (7 datasets)":44.74,"PairClassification Average (2 datasets)":77.32,"Reranking Average (2 datasets)":80.46,"Retrieval Average (5 datasets)":46.81,"STS Average (3 datasets)":79.56,"Summarization Average (1 datasets)":31.47}
|
boards_data/pl/data_overall/default.jsonl
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
-
{"index":2,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":
|
2 |
-
{"index":1,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":
|
3 |
{"index":34,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sdadas\/mmlw-roberta-large\">mmlw-roberta-large<\/a>","Model Size (Million Parameters)":435,"Memory Usage (GB, fp32)":1.62,"Embedding Dimensions":1024,"Max Tokens":514,"Average (26 datasets)":63.23,"Classification Average (7 datasets)":66.39,"Clustering Average (1 datasets)":31.16,"PairClassification Average (4 datasets)":89.13,"Retrieval Average (11 datasets)":52.71,"STS Average (3 datasets)":70.59}
|
4 |
{"index":31,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sdadas\/mmlw-e5-large\">mmlw-e5-large<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"Average (26 datasets)":61.17,"Classification Average (7 datasets)":61.07,"Clustering Average (1 datasets)":30.62,"PairClassification Average (4 datasets)":85.9,"Retrieval Average (11 datasets)":52.63,"STS Average (3 datasets)":69.98}
|
5 |
{"index":33,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sdadas\/mmlw-roberta-base\">mmlw-roberta-base<\/a>","Model Size (Million Parameters)":124,"Memory Usage (GB, fp32)":0.46,"Embedding Dimensions":768,"Max Tokens":514,"Average (26 datasets)":61.05,"Classification Average (7 datasets)":62.92,"Clustering Average (1 datasets)":33.08,"PairClassification Average (4 datasets)":88.14,"Retrieval Average (11 datasets)":49.92,"STS Average (3 datasets)":70.7}
|
|
|
1 |
+
{"index":2,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":32768,"Average (26 datasets)":67.86,"Classification Average (7 datasets)":77.84,"Clustering Average (1 datasets)":51.36,"PairClassification Average (4 datasets)":88.48,"Retrieval Average (11 datasets)":54.69,"STS Average (3 datasets)":70.86}
|
2 |
+
{"index":1,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (26 datasets)":64.04,"Classification Average (7 datasets)":72.29,"Clustering Average (1 datasets)":44.59,"PairClassification Average (4 datasets)":84.87,"Retrieval Average (11 datasets)":51.88,"STS Average (3 datasets)":68.12}
|
3 |
{"index":34,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sdadas\/mmlw-roberta-large\">mmlw-roberta-large<\/a>","Model Size (Million Parameters)":435,"Memory Usage (GB, fp32)":1.62,"Embedding Dimensions":1024,"Max Tokens":514,"Average (26 datasets)":63.23,"Classification Average (7 datasets)":66.39,"Clustering Average (1 datasets)":31.16,"PairClassification Average (4 datasets)":89.13,"Retrieval Average (11 datasets)":52.71,"STS Average (3 datasets)":70.59}
|
4 |
{"index":31,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sdadas\/mmlw-e5-large\">mmlw-e5-large<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"Average (26 datasets)":61.17,"Classification Average (7 datasets)":61.07,"Clustering Average (1 datasets)":30.62,"PairClassification Average (4 datasets)":85.9,"Retrieval Average (11 datasets)":52.63,"STS Average (3 datasets)":69.98}
|
5 |
{"index":33,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sdadas\/mmlw-roberta-base\">mmlw-roberta-base<\/a>","Model Size (Million Parameters)":124,"Memory Usage (GB, fp32)":0.46,"Embedding Dimensions":768,"Max Tokens":514,"Average (26 datasets)":61.05,"Classification Average (7 datasets)":62.92,"Clustering Average (1 datasets)":33.08,"PairClassification Average (4 datasets)":88.14,"Retrieval Average (11 datasets)":49.92,"STS Average (3 datasets)":70.7}
|
boards_data/zh/data_overall/default.jsonl
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{"index":194,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/lier007\/xiaobu-embedding-v2\">xiaobu-embedding-v2<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1792,"Max Tokens":512,"Average (35 datasets)":72.43,"Classification Average (9 datasets)":74.67,"Clustering Average (4 datasets)":65.17,"PairClassification Average (2 datasets)":91.87,"Reranking Average (4 datasets)":72.58,"Retrieval Average (8 datasets)":76.5,"STS Average (8 datasets)":64.53}
|
2 |
-
{"index":17,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":
|
3 |
{"index":154,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/iampanda\/zpoint_large_embedding_zh\">zpoint_large_embedding_zh<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1792,"Max Tokens":512,"Average (35 datasets)":71.88,"Classification Average (9 datasets)":74.43,"Clustering Average (4 datasets)":62.23,"PairClassification Average (2 datasets)":91.55,"Reranking Average (4 datasets)":72.34,"Retrieval Average (8 datasets)":76.36,"STS Average (8 datasets)":64.22}
|
4 |
{"index":48,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Erin\/IYun-large-zh\">IYun-large-zh<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (35 datasets)":71.04,"Classification Average (9 datasets)":74.18,"Clustering Average (4 datasets)":66.35,"PairClassification Average (2 datasets)":90.87,"Reranking Average (4 datasets)":69.3,"Retrieval Average (8 datasets)":73.56,"STS Average (8 datasets)":63.23}
|
5 |
{"index":237,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sensenova\/piccolo-large-zh-v2\">piccolo-large-zh-v2<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (35 datasets)":70.95,"Classification Average (9 datasets)":74.59,"Clustering Average (4 datasets)":62.17,"PairClassification Average (2 datasets)":90.24,"Reranking Average (4 datasets)":70.0,"Retrieval Average (8 datasets)":74.36,"STS Average (8 datasets)":63.5}
|
@@ -12,7 +12,7 @@
|
|
12 |
{"index":161,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/infgrad\/stella-large-zh-v3-1792d\">stella-large-zh-v3-1792d<\/a>","Model Size (Million Parameters)":325,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1792,"Max Tokens":512,"Average (35 datasets)":68.48,"Classification Average (9 datasets)":71.5,"Clustering Average (4 datasets)":53.9,"PairClassification Average (2 datasets)":88.1,"Reranking Average (4 datasets)":68.26,"Retrieval Average (8 datasets)":73.6,"STS Average (8 datasets)":62.46}
|
13 |
{"index":298,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/platform.baichuan-ai.com\/docs\/text-Embedding\">Baichuan-text-embedding<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":512,"Average (35 datasets)":68.34,"Classification Average (9 datasets)":72.84,"Clustering Average (4 datasets)":56.88,"PairClassification Average (2 datasets)":82.32,"Reranking Average (4 datasets)":69.67,"Retrieval Average (8 datasets)":73.12,"STS Average (8 datasets)":60.07}
|
14 |
{"index":158,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/infgrad\/stella-base-zh-v3-1792d\">stella-base-zh-v3-1792d<\/a>","Model Size (Million Parameters)":102,"Memory Usage (GB, fp32)":0.38,"Embedding Dimensions":1792,"Max Tokens":1024,"Average (35 datasets)":67.96,"Classification Average (9 datasets)":71.12,"Clustering Average (4 datasets)":53.3,"PairClassification Average (2 datasets)":87.93,"Reranking Average (4 datasets)":67.84,"Retrieval Average (8 datasets)":72.28,"STS Average (8 datasets)":62.49}
|
15 |
-
{"index":16,"Rank":15,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":
|
16 |
{"index":44,"Rank":16,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/DMetaSoul\/Dmeta-embedding-zh\">Dmeta-embedding-zh<\/a>","Model Size (Million Parameters)":103,"Memory Usage (GB, fp32)":0.38,"Embedding Dimensions":768,"Max Tokens":1024,"Average (35 datasets)":67.51,"Classification Average (9 datasets)":70.0,"Clustering Average (4 datasets)":50.96,"PairClassification Average (2 datasets)":88.92,"Reranking Average (4 datasets)":67.17,"Retrieval Average (8 datasets)":70.41,"STS Average (8 datasets)":64.89}
|
17 |
{"index":193,"Rank":17,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/lier007\/xiaobu-embedding\">xiaobu-embedding<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1024,"Max Tokens":512,"Average (35 datasets)":67.28,"Classification Average (9 datasets)":71.2,"Clustering Average (4 datasets)":54.62,"PairClassification Average (2 datasets)":85.3,"Reranking Average (4 datasets)":67.34,"Retrieval Average (8 datasets)":73.41,"STS Average (8 datasets)":58.52}
|
18 |
{"index":102,"Rank":18,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Pristinenlp\/alime-embedding-large-zh\">alime-embedding-large-zh<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1024,"Max Tokens":512,"Average (35 datasets)":67.17,"Classification Average (9 datasets)":71.35,"Clustering Average (4 datasets)":54.0,"PairClassification Average (2 datasets)":84.34,"Reranking Average (4 datasets)":67.61,"Retrieval Average (8 datasets)":73.3,"STS Average (8 datasets)":58.41}
|
@@ -94,7 +94,7 @@
|
|
94 |
{"index":66,"Rank":104,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lajavaness\/bilingual-embedding-base\">bilingual-embedding-base<\/a>","Model Size (Million Parameters)":278,"Memory Usage (GB, fp32)":1.04,"Embedding Dimensions":768,"Max Tokens":514,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
95 |
{"index":67,"Rank":105,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lajavaness\/bilingual-embedding-large\">bilingual-embedding-large<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
96 |
{"index":68,"Rank":106,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lajavaness\/bilingual-embedding-large-8k\">bilingual-embedding-large-8k<\/a>","Model Size (Million Parameters)":568,"Memory Usage (GB, fp32)":2.12,"Embedding Dimensions":1024,"Max Tokens":8194,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
97 |
-
{"index":69,"Rank":107,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lenovo-Zhihui\/Zhihui_LLM_Embedding\">Zhihui_LLM_Embedding<\/a>","Model Size (Million Parameters)":7069,"Memory Usage (GB, fp32)":26.33,"Embedding Dimensions":3584,"Max Tokens":
|
98 |
{"index":70,"Rank":108,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Linq-AI-Research\/Linq-Embed-Mistral\">Linq-Embed-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
99 |
{"index":72,"Rank":110,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/McGill-NLP\/LLM2Vec-Llama-2-7b-chat-hf-mntp-supervised\">LLM2Vec-Llama-2-supervised<\/a>","Model Size (Million Parameters)":6607,"Memory Usage (GB, fp32)":24.61,"Embedding Dimensions":4096,"Max Tokens":4096,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
100 |
{"index":73,"Rank":111,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/McGill-NLP\/LLM2Vec-Llama-2-7b-chat-hf-mntp-unsup-simcse\">LLM2Vec-Llama-2-unsupervised<\/a>","Model Size (Million Parameters)":6607,"Memory Usage (GB, fp32)":24.61,"Embedding Dimensions":4096,"Max Tokens":4096,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
|
|
1 |
{"index":194,"Rank":1,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/lier007\/xiaobu-embedding-v2\">xiaobu-embedding-v2<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1792,"Max Tokens":512,"Average (35 datasets)":72.43,"Classification Average (9 datasets)":74.67,"Clustering Average (4 datasets)":65.17,"PairClassification Average (2 datasets)":91.87,"Reranking Average (4 datasets)":72.58,"Retrieval Average (8 datasets)":76.5,"STS Average (8 datasets)":64.53}
|
2 |
+
{"index":17,"Rank":2,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-7B-instruct\">gte-Qwen2-7B-instruct<\/a>","Model Size (Million Parameters)":7613,"Memory Usage (GB, fp32)":28.36,"Embedding Dimensions":3584,"Max Tokens":32768,"Average (35 datasets)":72.05,"Classification Average (9 datasets)":75.09,"Clustering Average (4 datasets)":66.06,"PairClassification Average (2 datasets)":87.48,"Reranking Average (4 datasets)":68.92,"Retrieval Average (8 datasets)":76.03,"STS Average (8 datasets)":65.33}
|
3 |
{"index":154,"Rank":3,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/iampanda\/zpoint_large_embedding_zh\">zpoint_large_embedding_zh<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1792,"Max Tokens":512,"Average (35 datasets)":71.88,"Classification Average (9 datasets)":74.43,"Clustering Average (4 datasets)":62.23,"PairClassification Average (2 datasets)":91.55,"Reranking Average (4 datasets)":72.34,"Retrieval Average (8 datasets)":76.36,"STS Average (8 datasets)":64.22}
|
4 |
{"index":48,"Rank":4,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Erin\/IYun-large-zh\">IYun-large-zh<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (35 datasets)":71.04,"Classification Average (9 datasets)":74.18,"Clustering Average (4 datasets)":66.35,"PairClassification Average (2 datasets)":90.87,"Reranking Average (4 datasets)":69.3,"Retrieval Average (8 datasets)":73.56,"STS Average (8 datasets)":63.23}
|
5 |
{"index":237,"Rank":5,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/sensenova\/piccolo-large-zh-v2\">piccolo-large-zh-v2<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":"","Max Tokens":"","Average (35 datasets)":70.95,"Classification Average (9 datasets)":74.59,"Clustering Average (4 datasets)":62.17,"PairClassification Average (2 datasets)":90.24,"Reranking Average (4 datasets)":70.0,"Retrieval Average (8 datasets)":74.36,"STS Average (8 datasets)":63.5}
|
|
|
12 |
{"index":161,"Rank":12,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/infgrad\/stella-large-zh-v3-1792d\">stella-large-zh-v3-1792d<\/a>","Model Size (Million Parameters)":325,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1792,"Max Tokens":512,"Average (35 datasets)":68.48,"Classification Average (9 datasets)":71.5,"Clustering Average (4 datasets)":53.9,"PairClassification Average (2 datasets)":88.1,"Reranking Average (4 datasets)":68.26,"Retrieval Average (8 datasets)":73.6,"STS Average (8 datasets)":62.46}
|
13 |
{"index":298,"Rank":13,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/platform.baichuan-ai.com\/docs\/text-Embedding\">Baichuan-text-embedding<\/a>","Model Size (Million Parameters)":"","Memory Usage (GB, fp32)":"","Embedding Dimensions":1024,"Max Tokens":512,"Average (35 datasets)":68.34,"Classification Average (9 datasets)":72.84,"Clustering Average (4 datasets)":56.88,"PairClassification Average (2 datasets)":82.32,"Reranking Average (4 datasets)":69.67,"Retrieval Average (8 datasets)":73.12,"STS Average (8 datasets)":60.07}
|
14 |
{"index":158,"Rank":14,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/infgrad\/stella-base-zh-v3-1792d\">stella-base-zh-v3-1792d<\/a>","Model Size (Million Parameters)":102,"Memory Usage (GB, fp32)":0.38,"Embedding Dimensions":1792,"Max Tokens":1024,"Average (35 datasets)":67.96,"Classification Average (9 datasets)":71.12,"Clustering Average (4 datasets)":53.3,"PairClassification Average (2 datasets)":87.93,"Reranking Average (4 datasets)":67.84,"Retrieval Average (8 datasets)":72.28,"STS Average (8 datasets)":62.49}
|
15 |
+
{"index":16,"Rank":15,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Alibaba-NLP\/gte-Qwen2-1.5B-instruct\">gte-Qwen2-1.5B-instruct<\/a>","Model Size (Million Parameters)":1776,"Memory Usage (GB, fp32)":6.62,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (35 datasets)":67.65,"Classification Average (9 datasets)":71.12,"Clustering Average (4 datasets)":54.61,"PairClassification Average (2 datasets)":86.91,"Reranking Average (4 datasets)":68.21,"Retrieval Average (8 datasets)":71.86,"STS Average (8 datasets)":60.96}
|
16 |
{"index":44,"Rank":16,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/DMetaSoul\/Dmeta-embedding-zh\">Dmeta-embedding-zh<\/a>","Model Size (Million Parameters)":103,"Memory Usage (GB, fp32)":0.38,"Embedding Dimensions":768,"Max Tokens":1024,"Average (35 datasets)":67.51,"Classification Average (9 datasets)":70.0,"Clustering Average (4 datasets)":50.96,"PairClassification Average (2 datasets)":88.92,"Reranking Average (4 datasets)":67.17,"Retrieval Average (8 datasets)":70.41,"STS Average (8 datasets)":64.89}
|
17 |
{"index":193,"Rank":17,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/lier007\/xiaobu-embedding\">xiaobu-embedding<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1024,"Max Tokens":512,"Average (35 datasets)":67.28,"Classification Average (9 datasets)":71.2,"Clustering Average (4 datasets)":54.62,"PairClassification Average (2 datasets)":85.3,"Reranking Average (4 datasets)":67.34,"Retrieval Average (8 datasets)":73.41,"STS Average (8 datasets)":58.52}
|
18 |
{"index":102,"Rank":18,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Pristinenlp\/alime-embedding-large-zh\">alime-embedding-large-zh<\/a>","Model Size (Million Parameters)":326,"Memory Usage (GB, fp32)":1.21,"Embedding Dimensions":1024,"Max Tokens":512,"Average (35 datasets)":67.17,"Classification Average (9 datasets)":71.35,"Clustering Average (4 datasets)":54.0,"PairClassification Average (2 datasets)":84.34,"Reranking Average (4 datasets)":67.61,"Retrieval Average (8 datasets)":73.3,"STS Average (8 datasets)":58.41}
|
|
|
94 |
{"index":66,"Rank":104,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lajavaness\/bilingual-embedding-base\">bilingual-embedding-base<\/a>","Model Size (Million Parameters)":278,"Memory Usage (GB, fp32)":1.04,"Embedding Dimensions":768,"Max Tokens":514,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
95 |
{"index":67,"Rank":105,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lajavaness\/bilingual-embedding-large\">bilingual-embedding-large<\/a>","Model Size (Million Parameters)":560,"Memory Usage (GB, fp32)":2.09,"Embedding Dimensions":1024,"Max Tokens":514,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
96 |
{"index":68,"Rank":106,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lajavaness\/bilingual-embedding-large-8k\">bilingual-embedding-large-8k<\/a>","Model Size (Million Parameters)":568,"Memory Usage (GB, fp32)":2.12,"Embedding Dimensions":1024,"Max Tokens":8194,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
97 |
+
{"index":69,"Rank":107,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Lenovo-Zhihui\/Zhihui_LLM_Embedding\">Zhihui_LLM_Embedding<\/a>","Model Size (Million Parameters)":7069,"Memory Usage (GB, fp32)":26.33,"Embedding Dimensions":3584,"Max Tokens":32768,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":76.74,"STS Average (8 datasets)":""}
|
98 |
{"index":70,"Rank":108,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/Linq-AI-Research\/Linq-Embed-Mistral\">Linq-Embed-Mistral<\/a>","Model Size (Million Parameters)":7111,"Memory Usage (GB, fp32)":26.49,"Embedding Dimensions":4096,"Max Tokens":32768,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
99 |
{"index":72,"Rank":110,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/McGill-NLP\/LLM2Vec-Llama-2-7b-chat-hf-mntp-supervised\">LLM2Vec-Llama-2-supervised<\/a>","Model Size (Million Parameters)":6607,"Memory Usage (GB, fp32)":24.61,"Embedding Dimensions":4096,"Max Tokens":4096,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
100 |
{"index":73,"Rank":111,"Model":"<a target=\"_blank\" style=\"text-decoration: underline\" href=\"https:\/\/huggingface.co\/McGill-NLP\/LLM2Vec-Llama-2-7b-chat-hf-mntp-unsup-simcse\">LLM2Vec-Llama-2-unsupervised<\/a>","Model Size (Million Parameters)":6607,"Memory Usage (GB, fp32)":24.61,"Embedding Dimensions":4096,"Max Tokens":4096,"Average (35 datasets)":"","Classification Average (9 datasets)":"","Clustering Average (4 datasets)":"","PairClassification Average (2 datasets)":"","Reranking Average (4 datasets)":"","Retrieval Average (8 datasets)":"","STS Average (8 datasets)":""}
|
refresh.py
CHANGED
@@ -323,8 +323,17 @@ def get_mteb_data(tasks=["Clustering"], langs=[], datasets=[], fillna=True, add_
|
|
323 |
df['MLSUMClusteringS2S (fr)'] = df['MLSUMClusteringS2S (fr)'].fillna(df['MLSUMClusteringS2S'])
|
324 |
datasets.remove('MLSUMClusteringS2S')
|
325 |
if ('PawsXPairClassification (fr)' in datasets) and ('PawsX (fr)' in cols):
|
326 |
-
|
|
|
|
|
|
|
|
|
|
|
327 |
datasets.remove('PawsX (fr)')
|
|
|
|
|
|
|
|
|
328 |
# Filter invalid columns
|
329 |
cols = [col for col in cols if col in base_columns + datasets]
|
330 |
i = 0
|
@@ -353,7 +362,6 @@ def get_mteb_average(task_dict: dict):
|
|
353 |
)
|
354 |
# Debugging:
|
355 |
# DATA_OVERALL.to_csv("overall.csv")
|
356 |
-
|
357 |
DATA_OVERALL.insert(1, f"Average ({len(all_tasks)} datasets)", DATA_OVERALL[all_tasks].mean(axis=1, skipna=False))
|
358 |
for i, (task_category, task_category_list) in enumerate(task_dict.items()):
|
359 |
DATA_OVERALL.insert(i+2, f"{task_category} Average ({len(task_category_list)} datasets)", DATA_OVERALL[task_category_list].mean(axis=1, skipna=False))
|
@@ -420,7 +428,7 @@ def refresh_leaderboard():
|
|
420 |
|
421 |
|
422 |
|
423 |
-
def write_out_results(item
|
424 |
"""
|
425 |
Due to their complex structure, let's recursively create subfolders until we reach the end
|
426 |
of the item and then save the DFs as jsonl files
|
|
|
323 |
df['MLSUMClusteringS2S (fr)'] = df['MLSUMClusteringS2S (fr)'].fillna(df['MLSUMClusteringS2S'])
|
324 |
datasets.remove('MLSUMClusteringS2S')
|
325 |
if ('PawsXPairClassification (fr)' in datasets) and ('PawsX (fr)' in cols):
|
326 |
+
# for the first bit no model has it, hence no column for it. We can remove this in a month or so
|
327 |
+
if "PawsXPairClassification (fr)" not in cols:
|
328 |
+
df['PawsXPairClassification (fr)'] = df['PawsX (fr)']
|
329 |
+
else:
|
330 |
+
df['PawsXPairClassification (fr)'] = df['PawsXPairClassification (fr)'].fillna(df['PawsX (fr)'])
|
331 |
+
# make all the columns the same
|
332 |
datasets.remove('PawsX (fr)')
|
333 |
+
cols.remove('PawsX (fr)')
|
334 |
+
df.drop(columns=['PawsX (fr)'], inplace=True)
|
335 |
+
cols.append('PawsXPairClassification (fr)')
|
336 |
+
|
337 |
# Filter invalid columns
|
338 |
cols = [col for col in cols if col in base_columns + datasets]
|
339 |
i = 0
|
|
|
362 |
)
|
363 |
# Debugging:
|
364 |
# DATA_OVERALL.to_csv("overall.csv")
|
|
|
365 |
DATA_OVERALL.insert(1, f"Average ({len(all_tasks)} datasets)", DATA_OVERALL[all_tasks].mean(axis=1, skipna=False))
|
366 |
for i, (task_category, task_category_list) in enumerate(task_dict.items()):
|
367 |
DATA_OVERALL.insert(i+2, f"{task_category} Average ({len(task_category_list)} datasets)", DATA_OVERALL[task_category_list].mean(axis=1, skipna=False))
|
|
|
428 |
|
429 |
|
430 |
|
431 |
+
def write_out_results(item, item_name: str):
|
432 |
"""
|
433 |
Due to their complex structure, let's recursively create subfolders until we reach the end
|
434 |
of the item and then save the DFs as jsonl files
|