Yeyito committed on
Commit
a57e40e
•
1 Parent(s): 29d2eff

Current evals

Browse files
Files changed (1) hide show
  1. data/code_eval_board.csv +4 -5
data/code_eval_board.csv CHANGED
@@ -5,6 +5,7 @@ T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
5
  🟢,mistralai/Mistral-7B-v0.1,0.54,0.51,0.46,0.75,0,0.91,huggyllama/llama-7b
6
  🔶,rishiraj/meow,0.11,0.49,0.28,0.36,0.02,0.95,huggyllama/llama-7b
7
  🔶,Q-bert/MetaMath-Cybertron-Starling,0.52,0.64,0.51,0.75,0.01,0.99,huggyllama/llama-7b
 
8
  🔶,AIDC-ai-business/Marcoroni-7B-v3,0.1,0.14,0.2,0.41,0.0,0.95,mistralai/Mistral-7B-v0.1
9
  🔶,amazon/MistralLite,0.09,0.14,0.2,0.43,0.0,0.73,mistralai/Mistral-7B-v0.1
10
  🔶,openchat/openchat_3.5,0.13,0.13,0.23,0.45,0.0,0.97,mistralai/Mistral-7B-v0.1
@@ -13,6 +14,7 @@ T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
13
  🔶,microsoft/Orca-2-7b,0.88,0.8,0.77,0.91,0.0,1.0,mistralai/Mistral-7B-v0.1
14
  🔶,WizardLM/WizardMath-7B-V1.1,0.1,0.11,0.21,0.4,0.0,0.99,mistralai/Mistral-7B-v0.1
15
  🔶,01-ai/Yi-6B-200K,0.19,0.3,0.3,0.6,0.0,0.93,mistralai/Mistral-7B-v0.1
 
16
  🔶,mistralai/Mistral-7B-Instruct-v0.2,0.06,0.21,0.17,0.48,0.0,0.95,mistralai/Mistral-7B-v0.1
17
  🔶,Yhyu13/LMCocktail-10.7B-v1,0.1,0.44,0.23,0.51,0.0,0.97,mistralai/Mistral-7B-v0.1
18
  🔶,ehartford/dolphin-2.1-mistral-7b,0.08,0.1,0.2,0.4,0.0,0.92,mistralai/Mistral-7B-v0.1
@@ -32,14 +34,11 @@ T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
32
  🟢,huggyllama/llama-7b,0.11,0.17,0.22,0.46,0.0,0.79,mistralai/Mistral-7B-v0.1
33
  🟢,tiiuae/falcon-7b-instruct,0.06,0.16,0.19,0.56,0.0,0.98,mistralai/Mistral-7B-v0.1
34
  🔶,NousResearch/Nous-Hermes-llama-2-7b,0.09,0.18,0.26,0.5,0.0,0.96,mistralai/Mistral-7B-v0.1
35
- 🔶,openaccess-ai-collective/DPOpenHermes-7B-v2,0.08,0.11,0.22,0.41,0.0,0.96,mistralai/Mistral-7B-v0.1
36
- 🟢,01-ai/Yi-6B,0.28,0.32,0.3,0.62,0.02,0.94,mistralai/Mistral-7B-v0.1
37
  🔶,Intel/neural-chat-7b-v3-1,0.1,0.15,0.18,0.49,0.0,0.81,mistralai/Mistral-7B-v0.1
38
  🔶,fblgit/juanako-7b-UNA,0.09,0.15,0.18,0.46,0.0,0.81,mistralai/Mistral-7B-v0.1
39
  🔶,Intel/neural-chat-7b-v3-2,0.12,0.14,0.2,0.5,0.0,0.93,mistralai/Mistral-7B-v0.1
40
  🔶,fblgit/una-cybertron-7b-v2-bf16,0.1,0.12,0.21,0.46,0.0,0.92,mistralai/Mistral-7B-v0.1
41
- 🔶,Intel/neural-chat-7b-v3-3,0.06,0.15,0.18,0.47,0.0,0.98,mistralai/Mistral-7B-v0.1
42
  🔶,fblgit/una-cybertron-7b-v3-OMA,0.04,0.16,0.17,0.36,0.0,0.94,mistralai/Mistral-7B-v0.1
43
- 🔶,fblgit/una-xaberius-34b-v1beta,0.37,0.54,0.33,0.61,0.04,0.96,huggyllama/llama-7b
44
- 🔶,upstage/SOLAR-10.7B-Instruct-v1.0,0.11,0.49,0.28,0.36,0.01,0.96,huggyllama/llama-7b
45
  🔶,VAGOsolutions/SauerkrautLM-SOLAR-Instruct,0.12,0.54,0.32,0.34,0.01,0.96,huggyllama/llama-7b
 
 
 
5
  🟢,mistralai/Mistral-7B-v0.1,0.54,0.51,0.46,0.75,0,0.91,huggyllama/llama-7b
6
  🔶,rishiraj/meow,0.11,0.49,0.28,0.36,0.02,0.95,huggyllama/llama-7b
7
  🔶,Q-bert/MetaMath-Cybertron-Starling,0.52,0.64,0.51,0.75,0.01,0.99,huggyllama/llama-7b
8
+ 🔶,upstage/SOLAR-10.7B-Instruct-v1.0,0.11,0.49,0.28,0.36,0.01,0.96,huggyllama/llama-7b
9
  🔶,AIDC-ai-business/Marcoroni-7B-v3,0.1,0.14,0.2,0.41,0.0,0.95,mistralai/Mistral-7B-v0.1
10
  🔶,amazon/MistralLite,0.09,0.14,0.2,0.43,0.0,0.73,mistralai/Mistral-7B-v0.1
11
  🔶,openchat/openchat_3.5,0.13,0.13,0.23,0.45,0.0,0.97,mistralai/Mistral-7B-v0.1
 
14
  🔶,microsoft/Orca-2-7b,0.88,0.8,0.77,0.91,0.0,1.0,mistralai/Mistral-7B-v0.1
15
  🔶,WizardLM/WizardMath-7B-V1.1,0.1,0.11,0.21,0.4,0.0,0.99,mistralai/Mistral-7B-v0.1
16
  🔶,01-ai/Yi-6B-200K,0.19,0.3,0.3,0.6,0.0,0.93,mistralai/Mistral-7B-v0.1
17
+ 🔶,Intel/neural-chat-7b-v3-3,0.06,0.15,0.18,0.47,0.0,0.98,mistralai/Mistral-7B-v0.1
18
  🔶,mistralai/Mistral-7B-Instruct-v0.2,0.06,0.21,0.17,0.48,0.0,0.95,mistralai/Mistral-7B-v0.1
19
  🔶,Yhyu13/LMCocktail-10.7B-v1,0.1,0.44,0.23,0.51,0.0,0.97,mistralai/Mistral-7B-v0.1
20
  🔶,ehartford/dolphin-2.1-mistral-7b,0.08,0.1,0.2,0.4,0.0,0.92,mistralai/Mistral-7B-v0.1
 
34
  🟢,huggyllama/llama-7b,0.11,0.17,0.22,0.46,0.0,0.79,mistralai/Mistral-7B-v0.1
35
  🟢,tiiuae/falcon-7b-instruct,0.06,0.16,0.19,0.56,0.0,0.98,mistralai/Mistral-7B-v0.1
36
  🔶,NousResearch/Nous-Hermes-llama-2-7b,0.09,0.18,0.26,0.5,0.0,0.96,mistralai/Mistral-7B-v0.1
 
 
37
  🔶,Intel/neural-chat-7b-v3-1,0.1,0.15,0.18,0.49,0.0,0.81,mistralai/Mistral-7B-v0.1
38
  🔶,fblgit/juanako-7b-UNA,0.09,0.15,0.18,0.46,0.0,0.81,mistralai/Mistral-7B-v0.1
39
  🔶,Intel/neural-chat-7b-v3-2,0.12,0.14,0.2,0.5,0.0,0.93,mistralai/Mistral-7B-v0.1
40
  🔶,fblgit/una-cybertron-7b-v2-bf16,0.1,0.12,0.21,0.46,0.0,0.92,mistralai/Mistral-7B-v0.1
 
41
  🔶,fblgit/una-cybertron-7b-v3-OMA,0.04,0.16,0.17,0.36,0.0,0.94,mistralai/Mistral-7B-v0.1
 
 
42
  🔶,VAGOsolutions/SauerkrautLM-SOLAR-Instruct,0.12,0.54,0.32,0.34,0.01,0.96,huggyllama/llama-7b
43
+ 🔶,openaccess-ai-collective/DPOpenHermes-7B-v2,0.08,0.11,0.22,0.41,0.0,0.96,mistralai/Mistral-7B-v0.1
44
+ 🟢,01-ai/Yi-6B,0.28,0.32,0.3,0.62,0.02,0.94,mistralai/Mistral-7B-v0.1