CultriX committed on
Commit
cf88a41
1 Parent(s): 7f363ce

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +17 -8
README.md CHANGED
@@ -30,7 +30,8 @@ model-index:
30
  value: 56.85
31
  name: strict accuracy
32
  source:
33
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
 
34
  name: Open LLM Leaderboard
35
  - task:
36
  type: text-generation
@@ -45,7 +46,8 @@ model-index:
45
  value: 51.01
46
  name: normalized accuracy
47
  source:
48
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
 
49
  name: Open LLM Leaderboard
50
  - task:
51
  type: text-generation
@@ -60,7 +62,8 @@ model-index:
60
  value: 27.34
61
  name: exact match
62
  source:
63
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
 
64
  name: Open LLM Leaderboard
65
  - task:
66
  type: text-generation
@@ -75,7 +78,8 @@ model-index:
75
  value: 16.44
76
  name: acc_norm
77
  source:
78
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
 
79
  name: Open LLM Leaderboard
80
  - task:
81
  type: text-generation
@@ -90,7 +94,8 @@ model-index:
90
  value: 17.85
91
  name: acc_norm
92
  source:
93
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
 
94
  name: Open LLM Leaderboard
95
  - task:
96
  type: text-generation
@@ -107,8 +112,13 @@ model-index:
107
  value: 48.84
108
  name: accuracy
109
  source:
110
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
 
111
  name: Open LLM Leaderboard
 
 
 
 
112
  ---
113
  # merge
114
 
@@ -168,5 +178,4 @@ Detailed results can be found [here](https://huggingface.co/datasets/open-llm-le
168
  |MATH Lvl 5 (4-Shot)|27.34|
169
  |GPQA (0-shot) |16.44|
170
  |MuSR (0-shot) |17.85|
171
- |MMLU-PRO (5-shot) |48.84|
172
-
 
30
  value: 56.85
31
  name: strict accuracy
32
  source:
33
+ url: >-
34
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
35
  name: Open LLM Leaderboard
36
  - task:
37
  type: text-generation
 
46
  value: 51.01
47
  name: normalized accuracy
48
  source:
49
+ url: >-
50
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
51
  name: Open LLM Leaderboard
52
  - task:
53
  type: text-generation
 
62
  value: 27.34
63
  name: exact match
64
  source:
65
+ url: >-
66
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
67
  name: Open LLM Leaderboard
68
  - task:
69
  type: text-generation
 
78
  value: 16.44
79
  name: acc_norm
80
  source:
81
+ url: >-
82
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
83
  name: Open LLM Leaderboard
84
  - task:
85
  type: text-generation
 
94
  value: 17.85
95
  name: acc_norm
96
  source:
97
+ url: >-
98
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
99
  name: Open LLM Leaderboard
100
  - task:
101
  type: text-generation
 
112
  value: 48.84
113
  name: accuracy
114
  source:
115
+ url: >-
116
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=CultriX/Qwen2.5-14B-MergeStock
117
  name: Open LLM Leaderboard
118
+ license: apache-2.0
119
+ language:
120
+ - en
121
+ pipeline_tag: text-generation
122
  ---
123
  # merge
124
 
 
178
  |MATH Lvl 5 (4-Shot)|27.34|
179
  |GPQA (0-shot) |16.44|
180
  |MuSR (0-shot) |17.85|
181
+ |MMLU-PRO (5-shot) |48.84|