OpenLLMFrenchLeaderboard

Running on CPU Upgrade

App Files Community

malhajar committed on Oct 18

Commit

53e53d2

•

1 Parent(s): fd6bbaa

Update src/display/about.py

Browse files

Files changed (1) hide show

src/display/about.py +16 -15

src/display/about.py CHANGED Viewed

@@ -11,28 +11,29 @@ class Task:
 # Init: to update with your specific keys
 class Tasks(Enum):
     # task_key in the json file, metric_key in the json file, name to display in the leaderboard
-    task0 = Task("MMLU", "metric_name", "MMLU")
-    task1 = Task("Truthful_qa", "metric_name", "Truthful_qa")
-    task2 = Task("ARC", "metric_name", "ARC")
-    task3 = Task("HellaSwag", "metric_name", "HellaSwag")
     task4 = Task("GSM8K", "metric_name", "GSM8K")
-    task5 = Task("Winogrande", "metric_name", "Winogrande")
 # Your leaderboard name
-TITLE = """<h1 align="center" id="space-title"> OpenLLM Turkish leaderboard v0.2</h1>"""
 # What does your leaderboard evaluate?
 INTRODUCTION_TEXT = """
-Welcome to the Turkish LLM Leaderboard, a pioneering platform dedicated to evaluating Turkish Large Language Models (LLMs). As multilingual LLMs advance, my mission is to specifically highlight models excelling in Turkish, providing benchmarks that drive progress in Turkish LLM and Generative AI for the Turkish language.
-The Leadboard uses [this](https://huggingface.co/collections/malhajar/openllmturkishleadboard-v02-datasets-662a8593043e73938e2f6b1e) currfelly curated benchmarks for evaluation.
-The benchmarks are generated and checked using both GPT-4 and Human annotation rendering the leadboard the most valuable and accurate test in the LLM arena for Turkish evaluation.
-🚀 Submit Your Model 🚀
-Got a Turkish LLM? Submit it for evaluation (Currently Manually, due to the lack of resources! Hoping to automate this with the community's support!), leveraging the Eleuther AI Language Model Evaluation Harness for in-depth performance analysis. Learn more and contribute to Turkish AI advancements on the "About" page.
-Join the forefront of Turkish language technology. Submit your model, and let's advance Turkish LLM's together!
 """
@@ -100,11 +101,11 @@ If everything is done, check you can launch the EleutherAIHarness on your model
 CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
 CITATION_BUTTON_TEXT = r"""
-@misc{openllm-Turkish-leaderboard,
   author = {Mohamad Alhajar},
-  title = {Open LLM Turkish Leaderboard v0.2},
   year = {2024},
   publisher = {Mohamad Alhajar},
-  howpublished = "\url{https://huggingface.co/spaces/malhajar/OpenLLMTurkishLeaderboard}"
 }
 """

 # Init: to update with your specific keys
 class Tasks(Enum):
     # task_key in the json file, metric_key in the json file, name to display in the leaderboard
+    task0 = Task("BBH", "metric_name", "BBH")
+    task1 = Task("GPQA", "metric_name", "GPQA")
+    task2 = Task("IFEval", "metric_name", "IFEval")
+    task3 = Task("MUSR", "metric_name", "MUSR")
     task4 = Task("GSM8K", "metric_name", "GSM8K")
+    task5 = Task("MMMLU-fr", "metric_name", "MMMLU-fr")
 # Your leaderboard name
+TITLE = """<h1 align="center" id="space-title"> OpenLLM French leaderboard 🇫🇷</h1>"""
 # What does your leaderboard evaluate?
 INTRODUCTION_TEXT = """
+Bienvenue sur le Leaderboard des LLM en français, une plateforme pionnière dédiée à l'évaluation des grands modèles de langage (LLM) en français. Alors que les LLM multilingues progressent, ma mission est de mettre en lumière spécifiquement les modèles qui excellent en langue française,
+en fournissant des benchmarks qui stimulent les avancées dans les LLM en français et l'IA générative pour la langue française. Le Leaderboard utilise ce lien (https://huggingface.co/collections/le-leadboard/openllmfrenchleadboard-jeu-de-donnees-67126437539a23c65554fd88) pour ses benchmarks soigneusement sélectionnés. Les évaluations sont générées et vérifiées à la fois par GPT-4 et par annotation humaine,
+rendant ainsi ce Leaderboard l'outil le plus précieux et le plus précis pour l'évaluation des LLM en français.
+🚀 Soumettez votre Modèle 🚀
+Vous avez un LLM en français ? Soumettez-le pour évaluation (Actuellement manuelle, faute de ressources ! En espérant automatiser ce processus avec le soutien de la communauté !), en utilisant le Eleuther AI Language Model Evaluation Harness pour une analyse approfondie des performances. Apprenez-en plus et contribuez aux avancées de l'IA en français sur la page "À propos".
+Rejoignez l'avant-garde de la technologie linguistique en français. Soumettez votre modèle et faisons progresser ensemble les LLM en français !
 """
 CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
 CITATION_BUTTON_TEXT = r"""
+@misc{openllm-French-leaderboard,
   author = {Mohamad Alhajar},
+  title = {Open LLM French Leaderboard v0.2},
   year = {2024},
   publisher = {Mohamad Alhajar},
+  howpublished = "\url{https://huggingface.co/spaces/le-leadboard/OpenLLMFrenchLeaderboard}"
 }
 """