tabedini commited on
Commit
b7e5f47
·
verified ·
1 Parent(s): 19236c8

Update leaderboard_data.jsonl

Browse files
Files changed (1) hide show
  1. leaderboard_data.jsonl +8 -0
leaderboard_data.jsonl CHANGED
@@ -14,3 +14,11 @@
14
  {"Model":"google/gemma-2-27b-it", "Precision": "bfloat16", "#Params (B)": 27.2, "Part Multiple Choice": 46.03, "ARC Easy": 95.98, "ARC Challenge": 85.91, "MMLU Pro": 36.28, "AUT Multiple Choice Persian": 63.12, "Hub License": "gemma", "Model sha": "main", "model_name_for_query": "google/gemma-2-27b-it"}
15
  {"Model":"universitytehran/PersianMind-v1.0", "Precision": "bfloat16", "#Params (B)": 6.82, "Part Multiple Choice": 29.27, "ARC Easy": 58.91, "ARC Challenge": 48.32, "MMLU Pro": 15.51, "AUT Multiple Choice Persian": 45.36, "Hub License": "cc-by-nc-sa-4.0", "Model sha": "main", "model_name_for_query": "universitytehran/PersianMind-v1.0"}
16
  {"Model":"MaralGPT/Maral-7B-alpha-1", "Precision": "bfloat16", "#Params (B)": 7.24, "Part Multiple Choice": 26.67, "ARC Easy": 44.54, "ARC Challenge": 30.87, "MMLU Pro": 15.99, "AUT Multiple Choice Persian": 36.09, "Hub License": "mit", "Model sha": "main", "model_name_for_query": "MaralGPT/Maral-7B-alpha-1"}
 
 
 
 
 
 
 
 
 
14
  {"Model":"google/gemma-2-27b-it", "Precision": "bfloat16", "#Params (B)": 27.2, "Part Multiple Choice": 46.03, "ARC Easy": 95.98, "ARC Challenge": 85.91, "MMLU Pro": 36.28, "AUT Multiple Choice Persian": 63.12, "Hub License": "gemma", "Model sha": "main", "model_name_for_query": "google/gemma-2-27b-it"}
15
  {"Model":"universitytehran/PersianMind-v1.0", "Precision": "bfloat16", "#Params (B)": 6.82, "Part Multiple Choice": 29.27, "ARC Easy": 58.91, "ARC Challenge": 48.32, "MMLU Pro": 15.51, "AUT Multiple Choice Persian": 45.36, "Hub License": "cc-by-nc-sa-4.0", "Model sha": "main", "model_name_for_query": "universitytehran/PersianMind-v1.0"}
16
  {"Model":"MaralGPT/Maral-7B-alpha-1", "Precision": "bfloat16", "#Params (B)": 7.24, "Part Multiple Choice": 26.67, "ARC Easy": 44.54, "ARC Challenge": 30.87, "MMLU Pro": 15.99, "AUT Multiple Choice Persian": 36.09, "Hub License": "mit", "Model sha": "main", "model_name_for_query": "MaralGPT/Maral-7B-alpha-1"}
17
+ {"Model":"meta-llama/Llama-3.1-8B", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 35.52, "ARC Easy": 75.28, "ARC Challenge": 53.02, "MMLU Pro": 24.10, "AUT Multiple Choice Persian": 53.45, "Hub License": "llama3.1", "Model sha": "main", "model_name_for_query": "meta-llama/Llama-3.1-8B"}
18
+ {"Model":"meta-llama/Meta-Llama-3-8B", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 34.32, "ARC Easy": 72.12, "ARC Challenge": 56.37, "MMLU Pro": 19.33, "AUT Multiple Choice Persian": 48.32, "Hub License": "llama3", "Model sha": "main", "model_name_for_query": "meta-llama/Meta-Llama-3-8B"}
19
+ {"Model":"PartAI/Dorna-1.1-Llama3.1-8B-Instruct", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 34.48, "ARC Easy": 79.59, "ARC Challenge": 64.42, "MMLU Pro": 21.47, "AUT Multiple Choice Persian": 53.64, "Hub License": "llama3.1", "Model sha": "main", "model_name_for_query": "PartAI/Dorna-1.1-Llama3.1-8B-Instruct"}
20
+ {"Model":"lightblue/suzume-llama-3-8B-multilingual", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 34.39, "ARC Easy": 72.41, "ARC Challenge": 56.37, "MMLU Pro": 21.95, "AUT Multiple Choice Persian": 51.28, "Hub License": "llama3", "Model sha": "main", "model_name_for_query": "lightblue/suzume-llama-3-8B-multilingual"}
21
+ {"Model":"Skywork/Skywork-o1-Open-Llama-3.1-8B", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 27.02, "ARC Easy": 47.12, "ARC Challenge": 41.61, "MMLU Pro": 14.55, "AUT Multiple Choice Persian": 40.43, "Hub License": "llama3.1", "Model sha": "main", "model_name_for_query": "Skywork/Skywork-o1-Open-Llama-3.1-8B"}
22
+ {"Model":"O1-OPEN/OpenO1-LLama-8B-v0.1", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 34.66, "ARC Easy": 77.87, "ARC Challenge": 63.08, "MMLU Pro": 21.24, "AUT Multiple Choice Persian": 54.24, "Hub License": "None", "Model sha": "main", "model_name_for_query": "O1-OPEN/OpenO1-LLama-8B-v0.1"}
23
+ {"Model":"PrincetonPLI/Llama-3-8B-Instruct-SkillMix", "Precision": "bfloat16", "#Params (B)": 8.03, "Part Multiple Choice": 34.67, "ARC Easy": 72.98, "ARC Challenge": 60.40, "MMLU Pro": 23.38, "AUT Multiple Choice Persian": 54.04, "Hub License": "llama3", "Model sha": "main", "model_name_for_query": "PrincetonPLI/Llama-3-8B-Instruct-SkillMix"}
24
+ {"Model":"Qwen/QwQ-32B-Preview", "Precision": "bfloat16", "#Params (B)": 32.8, "Part Multiple Choice": 46.64, "ARC Easy": 91.95, "ARC Challenge": 87.24, "MMLU Pro": 37.94, "AUT Multiple Choice Persian": 60.15, "Hub License": "apache-2.0", "Model sha": "main", "model_name_for_query": "Qwen/QwQ-32B-Preview"}