huseinzol05 committed on
Commit
8cb674a
•
1 Parent(s): 18566fa

added more models

Browse files
Files changed (1) hide show
  1. app.py +40 -18
app.py CHANGED
@@ -2,10 +2,10 @@ import gradio as gr
2
  import pandas as pd
3
  from css_html_js import custom_css
4
 
5
- TITLE = """<h1 align="center" id="space-title">🇲🇾 Malaysian Embedding Leaderboard</h1>"""
6
 
7
  INTRODUCTION_TEXT = """
8
- πŸ“ The πŸ‡²πŸ‡Ύ Malaysian Embedding Leaderboard aims to track, rank and evaluate Top-k retrieval using embedding models. All notebooks at https://github.com/mesolitica/embedding-benchmarks, feel free to submit your own score at https://huggingface.co/spaces/mesolitica/Malaysian-Embedding-Leaderboard/discussions with link to the notebook.
9
 
10
  ## Dataset
11
 
@@ -52,27 +52,49 @@ open_source = [
52
  'lom.agc.gov.my top-5': 0.1717699775952203,
53
  'lom.agc.gov.my top-10': 0.23089370176748816,
54
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  {
56
  'model': '[llama2-embedding-600m-8k-contrastive](https://huggingface.co/mesolitica/llama2-embedding-600m-8k)',
57
- 'Crossref Melayu top-1': 0.11015162164875991,
58
- 'Crossref Melayu top-3': 0.23707199518023897,
59
- 'Crossref Melayu top-5': 0.30916758710713926,
60
- 'Crossref Melayu top-10': 0.4196204438196606,
61
- 'lom.agc.gov.my top-1': 0.05414488424197162,
62
- 'lom.agc.gov.my top-3': 0.11600697037590242,
63
- 'lom.agc.gov.my top-5': 0.16143888473985563,
64
- 'lom.agc.gov.my top-10': 0.23823749066467514,
65
  },
66
  {
67
  'model': '[llama2-embedding-1b-8k-contrastive](https://huggingface.co/mesolitica/llama2-embedding-1b-8k)',
68
- 'Crossref Melayu top-1': 0.16306858118284967,
69
- 'Crossref Melayu top-3': 0.32824580781202933,
70
- 'Crossref Melayu top-5': 0.41409780098403454,
71
- 'Crossref Melayu top-10': 0.5312782407872276,
72
- 'lom.agc.gov.my top-1': 0.08824993776450087,
73
- 'lom.agc.gov.my top-3': 0.17836694050286284,
74
- 'lom.agc.gov.my top-5': 0.2399800846402788,
75
- 'lom.agc.gov.my top-10': 0.3343291013193926,
76
  },
77
  ]
78
 
 
2
  import pandas as pd
3
  from css_html_js import custom_css
4
 
5
+ TITLE = """<h1 align="center" id="space-title">🇲🇾 Malaysian RAG Embedding Leaderboard</h1>"""
6
 
7
  INTRODUCTION_TEXT = """
8
+ πŸ“ The πŸ‡²πŸ‡Ύ Malaysian RAG Embedding Leaderboard aims to track, rank and evaluate Top-k retrieval using embedding models. All notebooks at https://github.com/mesolitica/embedding-benchmarks, feel free to submit your own score at https://huggingface.co/spaces/mesolitica/Malaysian-Embedding-Leaderboard/discussions with link to the notebook.
9
 
10
  ## Dataset
11
 
 
52
  'lom.agc.gov.my top-5': 0.1717699775952203,
53
  'lom.agc.gov.my top-10': 0.23089370176748816,
54
  },
55
+ {
56
+ 'model': '[mistral-embedding-191m-8k-contrastive](https://huggingface.co/mesolitica/mistral-embedding-191m-8k-contrastive)',
57
+ 'Crossref Melayu top-1': 0.08001654088700506,
58
+ 'Crossref Melayu top-3': 0.17378269409697095,
59
+ 'Crossref Melayu top-5': 0.232192701333609,
60
+ 'Crossref Melayu top-10': 0.32482166856197664,
61
+ 'lom.agc.gov.my top-1': 0.041075429424943986,
62
+ 'lom.agc.gov.my top-3': 0.09148618371919343,
63
+ 'lom.agc.gov.my top-5': 0.12758277321384118,
64
+ 'lom.agc.gov.my top-10': 0.18707991038088126,
65
+ },
66
+ {
67
+ 'model': '[mistral-embedding-349m-8k-contrastive](https://huggingface.co/mesolitica/mistral-embedding-349m-8k-contrastive)',
68
+ 'Crossref Melayu top-1': 0.09045797580895276,
69
+ 'Crossref Melayu top-3': 0.18742892587615012,
70
+ 'Crossref Melayu top-5': 0.2444949860436266,
71
+ 'Crossref Melayu top-10': 0.3398118474103174,
72
+ 'lom.agc.gov.my top-1': 0.039581777445855115,
73
+ 'lom.agc.gov.my top-3': 0.08849887976101568,
74
+ 'lom.agc.gov.my top-5': 0.12335075927308937,
75
+ 'lom.agc.gov.my top-10': 0.18558625840179238,
76
+ },
77
  {
78
  'model': '[llama2-embedding-600m-8k-contrastive](https://huggingface.co/mesolitica/llama2-embedding-600m-8k)',
79
+ 'Crossref Melayu top-1': 0.11516592577276956,
80
+ 'Crossref Melayu top-3': 0.2412901891863951,
81
+ 'Crossref Melayu top-5': 0.3201695440918019,
82
+ 'Crossref Melayu top-10': 0.4337847617078466,
83
+ 'lom.agc.gov.my top-1': 0.05738113019666418,
84
+ 'lom.agc.gov.my top-3': 0.12571570823998007,
85
+ 'lom.agc.gov.my top-5': 0.16455065969629076,
86
+ 'lom.agc.gov.my top-10': 0.24446104057754542,
87
  },
88
  {
89
  'model': '[llama2-embedding-1b-8k-contrastive](https://huggingface.co/mesolitica/llama2-embedding-1b-8k)',
90
+ 'Crossref Melayu top-1': 0.16489196733174816,
91
+ 'Crossref Melayu top-3': 0.3281298459629898,
92
+ 'Crossref Melayu top-5': 0.42623798201178537,
93
+ 'Crossref Melayu top-10': 0.5487439263930528,
94
+ 'lom.agc.gov.my top-1': 0.09123724172267862,
95
+ 'lom.agc.gov.my top-3': 0.18309683843664426,
96
+ 'lom.agc.gov.my top-5': 0.24271844660194175,
97
+ 'lom.agc.gov.my top-10': 0.3354493403037092,
98
  },
99
  ]
100