Adding Evaluation Results

#6
by T145 - opened
Files changed (1)
  1. README.md +5 -5
README.md CHANGED
@@ -177,7 +177,7 @@ model-index:
177
  num_few_shot: 0
178
  metrics:
179
  - type: inst_level_strict_acc and prompt_level_strict_acc
180
- value: 65.24
181
  name: strict accuracy
182
  source:
183
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
@@ -207,7 +207,7 @@ model-index:
207
  num_few_shot: 4
208
  metrics:
209
  - type: exact_match
210
- value: 11.63
211
  name: exact match
212
  source:
213
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
@@ -222,7 +222,7 @@ model-index:
222
  num_few_shot: 0
223
  metrics:
224
  - type: acc_norm
225
- value: 8.95
226
  name: acc_norm
227
  source:
228
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
@@ -237,7 +237,7 @@ model-index:
237
  num_few_shot: 0
238
  metrics:
239
  - type: acc_norm
240
- value: 7.19
241
  name: acc_norm
242
  source:
243
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
@@ -254,7 +254,7 @@ model-index:
254
  num_few_shot: 5
255
  metrics:
256
  - type: acc
257
- value: 26.38
258
  name: accuracy
259
  source:
260
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
 
177
  num_few_shot: 0
178
  metrics:
179
  - type: inst_level_strict_acc and prompt_level_strict_acc
180
+ value: 64.96
181
  name: strict accuracy
182
  source:
183
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
 
207
  num_few_shot: 4
208
  metrics:
209
  - type: exact_match
210
+ value: 12.92
211
  name: exact match
212
  source:
213
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
 
222
  num_few_shot: 0
223
  metrics:
224
  - type: acc_norm
225
+ value: 8.05
226
  name: acc_norm
227
  source:
228
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
 
237
  num_few_shot: 0
238
  metrics:
239
  - type: acc_norm
240
+ value: 7.46
241
  name: acc_norm
242
  source:
243
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2
 
254
  num_few_shot: 5
255
  metrics:
256
  - type: acc
257
+ value: 26.46
258
  name: accuracy
259
  source:
260
  url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=ValiantLabs/Llama3.1-8B-ShiningValiant2