T145
/

ZEUS-8B-V10

@@ -11,104 +11,6 @@ base_model:
 model-index:
 - name: ZEUS-8B-V10
   results:
-  - task:
-      type: text-generation
-      name: Text Generation
-    dataset:
-      name: IFEval (0-Shot)
-      type: HuggingFaceH4/ifeval
-      args:
-        num_few_shot: 0
-    metrics:
-    - type: inst_level_strict_acc and prompt_level_strict_acc
-      value: 77.07
-      name: strict accuracy
-    source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=T145/ZEUS-8B-V10
-      name: Open LLM Leaderboard
-  - task:
-      type: text-generation
-      name: Text Generation
-    dataset:
-      name: BBH (3-Shot)
-      type: BBH
-      args:
-        num_few_shot: 3
-    metrics:
-    - type: acc_norm
-      value: 32.7
-      name: normalized accuracy
-    source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=T145/ZEUS-8B-V10
-      name: Open LLM Leaderboard
-  - task:
-      type: text-generation
-      name: Text Generation
-    dataset:
-      name: MATH Lvl 5 (4-Shot)
-      type: hendrycks/competition_math
-      args:
-        num_few_shot: 4
-    metrics:
-    - type: exact_match
-      value: 20.09
-      name: exact match
-    source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=T145/ZEUS-8B-V10
-      name: Open LLM Leaderboard
-  - task:
-      type: text-generation
-      name: Text Generation
-    dataset:
-      name: GPQA (0-shot)
-      type: Idavidrein/gpqa
-      args:
-        num_few_shot: 0
-    metrics:
-    - type: acc_norm
-      value: 9.96
-      name: acc_norm
-    source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=T145/ZEUS-8B-V10
-      name: Open LLM Leaderboard
-  - task:
-      type: text-generation
-      name: Text Generation
-    dataset:
-      name: MuSR (0-shot)
-      type: TAUR-Lab/MuSR
-      args:
-        num_few_shot: 0
-    metrics:
-    - type: acc_norm
-      value: 9.09
-      name: acc_norm
-    - type: acc_norm
-      value: 9.09
-      name: acc_norm
-    source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=T145/ZEUS-8B-V10
-      name: Open LLM Leaderboard
-  - task:
-      type: text-generation
-      name: Text Generation
-    dataset:
-      name: MMLU-PRO (5-shot)
-      type: TIGER-Lab/MMLU-Pro
-      config: main
-      split: test
-      args:
-        num_few_shot: 5
-    metrics:
-    - type: acc
-      value: 32.26
-      name: accuracy
-    - type: acc
-      value: 32.26
-      name: accuracy
-    source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=T145/ZEUS-8B-V10
-      name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
@@ -231,29 +133,6 @@ tokenizer_source: union
 ```
 # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
-Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/T145__ZEUS-8B-V10-details)
-|      Metric       |Value|
-|-------------------|----:|
-|Avg.               |30.19|
-|IFEval (0-Shot)    |77.07|
-|BBH (3-Shot)       |32.70|
-|MATH Lvl 5 (4-Shot)|20.09|
-|GPQA (0-shot)      | 9.96|
-|MuSR (0-shot)      | 9.09|
-|MMLU-PRO (5-shot)  |32.26|
-## Changes over V2
-|      Metric       |Change|
-|-------------------|-----:|
-|Avg.               |+0.12|
-|IFEval (0-Shot)    |-3.22|
-|BBH (3-Shot)       |+1.09|
-|MATH Lvl 5 (4-Shot)|-1.06|
-|GPQA (0-shot)      |+3.02|
-|MuSR (0-shot)      |+0.85|
-|MMLU-PRO (5-shot)  |+0.08|
-# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
 Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/T145__ZEUS-8B-V10-details)!
 Summarized results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/contents/viewer/default/train?q=T145/ZEUS-8B-V10)!
@@ -267,3 +146,15 @@ Summarized results can be found [here](https://huggingface.co/datasets/open-llm-
 |MuSR (0-shot)      |     9.09|
 |MMLU-PRO (5-shot)  |    32.26|

 model-index:
 - name: ZEUS-8B-V10
   results:
   - task:
       type: text-generation
       name: Text Generation
 ```
 # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
 Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/T145__ZEUS-8B-V10-details)!
 Summarized results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/contents/viewer/default/train?q=T145/ZEUS-8B-V10)!
 |MuSR (0-shot)      |     9.09|
 |MMLU-PRO (5-shot)  |    32.26|
+## Changes over V2
+|      Metric       |Change|
+|-------------------|-----:|
+|Avg.               |+0.12|
+|IFEval (0-Shot)    |-3.22|
+|BBH (3-Shot)       |+1.09|
+|MATH Lvl 5 (4-Shot)|-1.06|
+|GPQA (0-shot)      |+3.02|
+|MuSR (0-shot)      |+0.85|
+|MMLU-PRO (5-shot)  |+0.08|