Add official results for AlpacaEval
Browse files
README.md
CHANGED
@@ -128,11 +128,11 @@ model-index:
|
|
128 |
type: AlpacaEval
|
129 |
metrics:
|
130 |
- type: AlpacaEval 1.0
|
131 |
-
value: 91.
|
132 |
name: Win Rate
|
133 |
source:
|
134 |
-
url: https://
|
135 |
-
name:
|
136 |
- task:
|
137 |
type: text-generation
|
138 |
dataset:
|
@@ -140,11 +140,11 @@ model-index:
|
|
140 |
type: AlpacaEval
|
141 |
metrics:
|
142 |
- type: AlpacaEval 2.0
|
143 |
-
value: 12.
|
144 |
name: Win Rate
|
145 |
source:
|
146 |
-
url: https://
|
147 |
-
name:
|
148 |
- task:
|
149 |
type: text-generation
|
150 |
dataset:
|
|
|
128 |
type: AlpacaEval
|
129 |
metrics:
|
130 |
- type: AlpacaEval 1.0
|
131 |
+
value: 91.16%
|
132 |
name: Win Rate
|
133 |
source:
|
134 |
+
url: https://tatsu-lab.github.io/alpaca_eval/
|
135 |
+
name: Leaderboard
|
136 |
- task:
|
137 |
type: text-generation
|
138 |
dataset:
|
|
|
140 |
type: AlpacaEval
|
141 |
metrics:
|
142 |
- type: AlpacaEval 2.0
|
143 |
+
value: 12.57%
|
144 |
name: Win Rate
|
145 |
source:
|
146 |
+
url: https://tatsu-lab.github.io/alpaca_eval/
|
147 |
+
name: Leaderboard
|
148 |
- task:
|
149 |
type: text-generation
|
150 |
dataset:
|