Yeyito committed on
Commit
39963b1
•
1 Parent(s): f915caf

current eval

Browse files
Files changed (2) hide show
  1. data/code_eval_board.csv +2 -0
  2. data/queue.csv +4 -6
data/code_eval_board.csv CHANGED
@@ -6,3 +6,5 @@ T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
6
  🔶,rishiraj/meow,0.11,0.49,0.28,0.36,0.02,0.95,huggyllama/llama-7b
7
  🔶,Q-bert/MetaMath-Cybertron-Starling,0.52,0.64,0.51,0.75,0.01,0.99,huggyllama/llama-7b
8
  🔶,upstage/SOLAR-10.7B-Instruct-v1.0,0.11,0.49,0.28,0.36,0.01,0.96,huggyllama/llama-7b
 
 
 
6
  🔶,rishiraj/meow,0.11,0.49,0.28,0.36,0.02,0.95,huggyllama/llama-7b
7
  🔶,Q-bert/MetaMath-Cybertron-Starling,0.52,0.64,0.51,0.75,0.01,0.99,huggyllama/llama-7b
8
  🔶,upstage/SOLAR-10.7B-Instruct-v1.0,0.11,0.49,0.28,0.36,0.01,0.96,huggyllama/llama-7b
9
+ 🔶,AIDC-ai-business/Marcoroni-7B-v3,0.1,0.14,0.2,0.41,0.0,0.95,mistralai/Mistral-7B-v0.1
10
+ 🔶,amazon/MistralLite,0.09,0.14,0.2,0.43,0.0,0.73,mistralai/Mistral-7B-v0.1
data/queue.csv CHANGED
@@ -1,5 +1,4 @@
1
  Type,Model,ref_model
2
- 🔶 finetuned,AIDC-ai-business/Marcoroni-7B-v3,mistralai/Mistral-7B-v0.1
3
  🔶 finetuned,openchat/openchat_3.5,mistralai/Mistral-7B-v0.1
4
  🔶 finetuned,teknium/OpenHermes-2.5-Mistral-7B,mistralai/Mistral-7B-v0.1
5
  🔶 finetuned,WizardLM/WizardMath-7B-V1.1,mistralai/Mistral-7B-v0.1
@@ -9,13 +8,12 @@ Type,Model,ref_model
9
  🔶 finetuned,HuggingFaceH4/zephyr-7b-beta,mistralai/Mistral-7B-v0.1
10
  🔶 finetuned,berkeley-nest/Starling-LM-7B-alpha,mistralai/Mistral-7B-v0.1
11
  🔶 finetuned,Open-Orca/Mistral-7B-OpenOrca,mistralai/Mistral-7B-v0.1
12
- 🔶 finetuned,amazon/MistralLite,mistralai/Mistral-7B-v0.1
13
  🔶 finetuned,meta-math/MetaMath-Mistral-7B,mistralai/Mistral-7B-v0.1
14
  🔶 finetuned,microsoft/Orca-2-7b,mistralai/Mistral-7B-v0.1
15
  🔶 finetuned,01-ai/Yi-6B-200K,mistralai/Mistral-7B-v0.1
16
  🔶 finetuned,Yhyu13/LMCocktail-10.7B-v1,mistralai/Mistral-7B-v0.1
17
  🔶 finetuned,openchat/openchat-3.5-1210,mistralai/Mistral-7B-v0.1
18
- 🔶 finetuned, Sao10K/Ana-v1-m7, mistralai/Mistral-7B-v0.1
19
- 🔶 finetuned, jondurbin/bagel-dpo-7b-v0.1, mistralai/Mistral-7B-v0.1
20
- 🔶 finetuned, rwitz/go-bruins-v2, mistralai/Mistral-7B-v0.1
21
- 🔶 finetuned, chargoddard/loyal-piano-m7, mistralai/Mistral-7B-v0.1
 
1
  Type,Model,ref_model
 
2
  🔶 finetuned,openchat/openchat_3.5,mistralai/Mistral-7B-v0.1
3
  🔶 finetuned,teknium/OpenHermes-2.5-Mistral-7B,mistralai/Mistral-7B-v0.1
4
  🔶 finetuned,WizardLM/WizardMath-7B-V1.1,mistralai/Mistral-7B-v0.1
 
8
  🔶 finetuned,HuggingFaceH4/zephyr-7b-beta,mistralai/Mistral-7B-v0.1
9
  🔶 finetuned,berkeley-nest/Starling-LM-7B-alpha,mistralai/Mistral-7B-v0.1
10
  🔶 finetuned,Open-Orca/Mistral-7B-OpenOrca,mistralai/Mistral-7B-v0.1
 
11
  🔶 finetuned,meta-math/MetaMath-Mistral-7B,mistralai/Mistral-7B-v0.1
12
  🔶 finetuned,microsoft/Orca-2-7b,mistralai/Mistral-7B-v0.1
13
  🔶 finetuned,01-ai/Yi-6B-200K,mistralai/Mistral-7B-v0.1
14
  🔶 finetuned,Yhyu13/LMCocktail-10.7B-v1,mistralai/Mistral-7B-v0.1
15
  🔶 finetuned,openchat/openchat-3.5-1210,mistralai/Mistral-7B-v0.1
16
+ 🔶 finetuned,Sao10K/Ana-v1-m7, mistralai/Mistral-7B-v0.1
17
+ 🔶 finetuned,jondurbin/bagel-dpo-7b-v0.1, mistralai/Mistral-7B-v0.1
18
+ 🔶 finetuned,rwitz/go-bruins-v2, mistralai/Mistral-7B-v0.1
19
+ 🔶 finetuned,chargoddard/loyal-piano-m7, mistralai/Mistral-7B-v0.1