Add evaluation results on the autoevaluate--squad-sample config and test split of autoevaluate/squad-sample
Browse files

Beep boop, I am a bot from Hugging Face's automatic model evaluator 👋!\
Your model has been evaluated on the autoevaluate--squad-sample config and test split of the [autoevaluate/squad-sample](https://huggingface.co/datasets/autoevaluate/squad-sample) dataset by @lewtun, using the predictions stored [here](https://huggingface.co/datasets/autoevaluate/autoeval-staging-eval-project-c3da4aa4-0386-41d1-9c7c-12d712dd287c-126120).\
Accept this pull request to see the results displayed on the [Hub leaderboard](https://huggingface.co/spaces/autoevaluate/leaderboards?dataset=autoevaluate/squad-sample).\
Evaluate your model on more datasets [here](https://huggingface.co/spaces/autoevaluate/model-evaluator?dataset=autoevaluate/squad-sample).
README.md
CHANGED
@@ -1,10 +1,37 @@
|
|
1 |
---
|
2 |
-
language:
|
|
|
3 |
datasets:
|
4 |
- squad
|
5 |
metrics:
|
6 |
- squad
|
7 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
---
|
9 |
|
10 |
# DistilBERT base cased distilled SQuAD
|
|
|
1 |
---
|
2 |
+
language: en
|
3 |
+
license: apache-2.0
|
4 |
datasets:
|
5 |
- squad
|
6 |
metrics:
|
7 |
- squad
|
8 |
+
model-index:
|
9 |
+
- name: autoevaluate/distilbert-base-cased-distilled-squad
|
10 |
+
results:
|
11 |
+
- task:
|
12 |
+
type: question-answering
|
13 |
+
name: Question Answering
|
14 |
+
dataset:
|
15 |
+
name: autoevaluate/squad-sample
|
16 |
+
type: autoevaluate/squad-sample
|
17 |
+
config: autoevaluate--squad-sample
|
18 |
+
split: test
|
19 |
+
metrics:
|
20 |
+
- type: f1
|
21 |
+
value: 87.8248
|
22 |
+
name: F1
|
23 |
+
verified: true
|
24 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNTBiYzkyNGNmMWRhNDIwMDhhOTBlMzU2OTQyZTMxMzNiODM3YzA0Mjk3NzY0YTI0ZWNiZjRlMDIzM2EzY2E5OCIsInZlcnNpb24iOjF9.xEOZCY6PgAuoh1I9zox8ZNPv3uT-Nx1c9I1GCAYOtY0QJPMw47ph0f-dagKStf9tbLLtcE6XUz-72EZtK6mzAw
|
25 |
+
- type: exact_match
|
26 |
+
value: 84.0
|
27 |
+
name: Exact Match
|
28 |
+
verified: true
|
29 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYTdlODFkNDgyNDU5YjU1NDE0ZjVjYWU0Mzk5ZTA2ODRjYWRhMTg1MjFiNTg5ODA0NjE5OGVkZDc3ZjQ5N2E0NyIsInZlcnNpb24iOjF9.OPqpfiA6kRUzYEwqiYz-WVUMSBSlNn0T9v4uJUUKeQ4k0L7SKAfkqbR0LAg9xm6rh0-KadiUznFn3zDH2XUpDQ
|
30 |
+
- type: loss
|
31 |
+
value: 0.9980762600898743
|
32 |
+
name: loss
|
33 |
+
verified: true
|
34 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiM2Q0NDVkN2JlNmRmMmU1YzZhYWJiMDJhYmE0ZTUxOTA3MGEzMGMwYjI4M2EzNmYwY2FiNzMwOGIyYmUxYTIxZCIsInZlcnNpb24iOjF9.MQXuMC8iVbhMxSjgdMMOa9f1a_0ej7PoH2F_JbsOcYrfpt0c2q0KZmlasIaQFkjV-To62NhLts2oLWKgRQpwCw
|
35 |
---
|
36 |
|
37 |
# DistilBERT base cased distilled SQuAD
|