Weyaxi committed on
Commit
3e08111
1 Parent(s): ea6c2a7

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +36 -29
README.md CHANGED
@@ -2,6 +2,8 @@
2
  model-index:
3
  - name: Dolphin2.1-OpenOrca-7B
4
  results:
 
 
5
  # AI2 Reasoning Challenge (25-Shot)
6
  - task:
7
  type: text-generation
@@ -21,6 +23,7 @@ model-index:
21
  name: Open LLM Leaderboard
22
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
23
 
 
24
  # HellaSwag (10-shot)
25
  - task:
26
  type: text-generation
@@ -39,77 +42,81 @@ model-index:
39
  name: Open LLM Leaderboard
40
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
41
 
42
- # TruthfulQA (0-shot)
 
43
  - task:
44
  type: text-generation
45
  name: Text Generation
46
  dataset:
47
- name: TruthfulQA (0-shot)
48
- type: truthful_qa
49
- config: multiple_choice
50
- split: validation
51
  args:
52
- num_few_shot: 0
53
  metrics:
54
- - type: mc2
55
- value: 53.84
 
56
  source:
57
  name: Open LLM Leaderboard
58
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
59
 
60
- # GSM8k (5-shot)
 
61
  - task:
62
  type: text-generation
63
  name: Text Generation
64
  dataset:
65
- name: GSM8k (5-shot)
66
- type: gsm8k
67
- config: main
68
- split: test
69
  args:
70
- num_few_shot: 5
71
  metrics:
72
- - type: acc
73
- name: accuracy
74
- value: 19.94
75
  source:
76
  name: Open LLM Leaderboard
77
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
78
 
79
- # MMLU (5-Shot)
 
80
  - task:
81
  type: text-generation
82
  name: Text Generation
83
  dataset:
84
- name: MMLU (5-Shot)
85
- type: cais/mmlu
86
- config: all
87
- split: test
88
  args:
89
  num_few_shot: 5
90
  metrics:
91
  - type: acc
92
  name: accuracy
93
- value: 62.66
94
  source:
95
  name: Open LLM Leaderboard
96
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
97
 
98
- # Winogrande (5-shot)
 
99
  - task:
100
  type: text-generation
101
  name: Text Generation
102
  dataset:
103
- name: Winogrande (5-shot)
104
- type: winogrande
105
- config: winogrande_xl
106
- split: validation
107
  args:
108
  num_few_shot: 5
109
  metrics:
110
  - type: acc
111
  name: accuracy
112
- value: 78.22
113
  source:
114
  name: Open LLM Leaderboard
115
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
 
2
  model-index:
3
  - name: Dolphin2.1-OpenOrca-7B
4
  results:
5
+
6
+
7
  # AI2 Reasoning Challenge (25-Shot)
8
  - task:
9
  type: text-generation
 
23
  name: Open LLM Leaderboard
24
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
25
 
26
+
27
  # HellaSwag (10-shot)
28
  - task:
29
  type: text-generation
 
42
  name: Open LLM Leaderboard
43
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
44
 
45
+
46
+ # MMLU (5-Shot)
47
  - task:
48
  type: text-generation
49
  name: Text Generation
50
  dataset:
51
+ name: MMLU (5-Shot)
52
+ type: cais/mmlu
53
+ config: all
54
+ split: test
55
  args:
56
+ num_few_shot: 5
57
  metrics:
58
+ - type: acc
59
+ name: accuracy
60
+ value: 62.66
61
  source:
62
  name: Open LLM Leaderboard
63
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
64
 
65
+
66
+ # TruthfulQA (0-shot)
67
  - task:
68
  type: text-generation
69
  name: Text Generation
70
  dataset:
71
+ name: TruthfulQA (0-shot)
72
+ type: truthful_qa
73
+ config: multiple_choice
74
+ split: validation
75
  args:
76
+ num_few_shot: 0
77
  metrics:
78
+ - type: mc2
79
+ value: 53.84
 
80
  source:
81
  name: Open LLM Leaderboard
82
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
83
 
84
+
85
+ # Winogrande (5-shot)
86
  - task:
87
  type: text-generation
88
  name: Text Generation
89
  dataset:
90
+ name: Winogrande (5-shot)
91
+ type: winogrande
92
+ config: winogrande_xl
93
+ split: validation
94
  args:
95
  num_few_shot: 5
96
  metrics:
97
  - type: acc
98
  name: accuracy
99
+ value: 78.22
100
  source:
101
  name: Open LLM Leaderboard
102
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B
103
 
104
+
105
+ # GSM8k (5-shot)
106
  - task:
107
  type: text-generation
108
  name: Text Generation
109
  dataset:
110
+ name: GSM8k (5-shot)
111
+ type: gsm8k
112
+ config: main
113
+ split: test
114
  args:
115
  num_few_shot: 5
116
  metrics:
117
  - type: acc
118
  name: accuracy
119
+ value: 19.94
120
  source:
121
  name: Open LLM Leaderboard
122
  url: https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard?query=Weyaxi/Dolphin2.1-OpenOrca-7B