JW17 committed on
Commit
1050739
1 Parent(s): c3693da

Add official results for AlpacaEval

Browse files
Files changed (1) hide show
  1. README.md +6 -6
README.md CHANGED
@@ -128,11 +128,11 @@ model-index:
128
  type: AlpacaEval
129
  metrics:
130
  - type: AlpacaEval 1.0
131
- value: 91.41%
132
  name: Win Rate
133
  source:
134
- url: https://github.com/tatsu-lab/alpaca_eval
135
- name: self-reported
136
  - task:
137
  type: text-generation
138
  dataset:
@@ -140,11 +140,11 @@ model-index:
140
  type: AlpacaEval
141
  metrics:
142
  - type: AlpacaEval 2.0
143
- value: 12.20%
144
  name: Win Rate
145
  source:
146
- url: https://github.com/tatsu-lab/alpaca_eval
147
- name: self-reported
148
  - task:
149
  type: text-generation
150
  dataset:
 
128
  type: AlpacaEval
129
  metrics:
130
  - type: AlpacaEval 1.0
131
+ value: 91.16%
132
  name: Win Rate
133
  source:
134
+ url: https://tatsu-lab.github.io/alpaca_eval/
135
+ name: Leaderboard
136
  - task:
137
  type: text-generation
138
  dataset:
 
140
  type: AlpacaEval
141
  metrics:
142
  - type: AlpacaEval 2.0
143
+ value: 12.57%
144
  name: Win Rate
145
  source:
146
+ url: https://tatsu-lab.github.io/alpaca_eval/
147
+ name: Leaderboard
148
  - task:
149
  type: text-generation
150
  dataset: