Commit
•
dce3153
1
Parent(s):
c2d9067
Add verifyToken field to verify evaluation results are produced by Hugging Face's automatic model evaluator
Browse files
Beep boop, I am a bot from Hugging Face's automatic model evaluator 👋! We've added a new `verifyToken` field to your evaluation results to verify that they are produced by the model evaluator. Accept this PR to ensure that your results remain listed as **verified** on the [Hub leaderboard](https://huggingface.co/spaces/autoevaluate/leaderboards).
README.md
CHANGED
@@ -12,16 +12,16 @@ model-index:
|
|
12 |
- name: bert-base-uncased-mnli
|
13 |
results:
|
14 |
- task:
|
15 |
-
name: Text Classification
|
16 |
type: text-classification
|
|
|
17 |
dataset:
|
18 |
name: GLUE MNLI
|
19 |
type: glue
|
20 |
args: mnli
|
21 |
metrics:
|
22 |
-
-
|
23 |
-
type: accuracy
|
24 |
value: 0.8500813669650122
|
|
|
25 |
- task:
|
26 |
type: natural-language-inference
|
27 |
name: Natural Language Inference
|
@@ -31,50 +31,61 @@ model-index:
|
|
31 |
config: mnli_matched
|
32 |
split: validation
|
33 |
metrics:
|
34 |
-
-
|
35 |
-
type: accuracy
|
36 |
value: 0.8467651553744269
|
|
|
37 |
verified: true
|
38 |
-
|
39 |
-
|
40 |
value: 0.8460148987014974
|
|
|
41 |
verified: true
|
42 |
-
|
43 |
-
|
44 |
value: 0.8467651553744269
|
|
|
45 |
verified: true
|
46 |
-
|
47 |
-
|
48 |
value: 0.8475656756385261
|
|
|
49 |
verified: true
|
50 |
-
|
51 |
-
|
52 |
value: 0.8463172075485045
|
|
|
53 |
verified: true
|
54 |
-
|
55 |
-
|
56 |
value: 0.8467651553744269
|
|
|
57 |
verified: true
|
58 |
-
|
59 |
-
|
60 |
value: 0.8467651553744269
|
|
|
61 |
verified: true
|
62 |
-
|
63 |
-
|
64 |
value: 0.8459654597797398
|
|
|
65 |
verified: true
|
66 |
-
|
67 |
-
|
68 |
value: 0.8467651553744269
|
|
|
69 |
verified: true
|
70 |
-
|
71 |
-
|
72 |
value: 0.8469586362613581
|
|
|
73 |
verified: true
|
74 |
-
|
75 |
-
|
76 |
value: 0.42515239119529724
|
|
|
77 |
verified: true
|
|
|
78 |
---
|
79 |
|
80 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
12 |
- name: bert-base-uncased-mnli
|
13 |
results:
|
14 |
- task:
|
|
|
15 |
type: text-classification
|
16 |
+
name: Text Classification
|
17 |
dataset:
|
18 |
name: GLUE MNLI
|
19 |
type: glue
|
20 |
args: mnli
|
21 |
metrics:
|
22 |
+
- type: accuracy
|
|
|
23 |
value: 0.8500813669650122
|
24 |
+
name: Accuracy
|
25 |
- task:
|
26 |
type: natural-language-inference
|
27 |
name: Natural Language Inference
|
|
|
31 |
config: mnli_matched
|
32 |
split: validation
|
33 |
metrics:
|
34 |
+
- type: accuracy
|
|
|
35 |
value: 0.8467651553744269
|
36 |
+
name: Accuracy
|
37 |
verified: true
|
38 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiN2MwZjZhM2RlMmU5Mjg5NzE0MTA3ODdjZGQwN2U5ZWNhYWUzMmRjMmVhMGEyMjQ3ZGMwOGRjNzkzM2VlNmUyOCIsInZlcnNpb24iOjF9.C6QBegyKVg-5xN06res-t3KxhUbC3kloOy_zf8Lxv981N2aNtmzpVPmiUimrESQj2j9h8PRhH3_shVd_iCpfCA
|
39 |
+
- type: precision
|
40 |
value: 0.8460148987014974
|
41 |
+
name: Precision Macro
|
42 |
verified: true
|
43 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNWViM2QzYjgxZWFkMzlhMzA4ZjdiYzJjZTRhMDQwMjYwZmU3ZmQ5ZmU5YjgzY2FkOWNhMThhODczNjhiMWRiMyIsInZlcnNpb24iOjF9.yLUl2HVaLNjaQImJELdCZjGIqFoBjoCLMh4iijrlneVn87_fJxaieaES-lf6za141LSPSnHmp1H6SKo1L7GGCQ
|
44 |
+
- type: precision
|
45 |
value: 0.8467651553744269
|
46 |
+
name: Precision Micro
|
47 |
verified: true
|
48 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiOGIzMjJlMjIwNzA4YzAxYzQ5NGIxZjM0MWE2OWFlYTlmOTU5NzNjZTg0MTJiOTQ2N2U4NmE0NDFmNTc1MGQ5ZCIsInZlcnNpb24iOjF9.u-6lo01PvyYYLnVSc11mzEzga-p6b3gKxWLi_6ziAFZH_3HLZIqrdBoedqhkuRau5u6DcdUlGlWvs0k_7gxCBg
|
49 |
+
- type: precision
|
50 |
value: 0.8475656756385261
|
51 |
+
name: Precision Weighted
|
52 |
verified: true
|
53 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiY2FlZmE0MTMwNjRlN2MwZjZiMWY1OWE2OTM5MTc3N2Q2ZTVkMzBiYWUyMjU5YThlYjE1MGJkN2ViZTM3ODBhOCIsInZlcnNpb24iOjF9.0u0DToJ9Y_xstI5UB2yXydcHWPasql0z60zLONiRVWEjR6dbs2JzAHmRUrN3IO1QDRz5ssH0w979VRa-lyk3AA
|
54 |
+
- type: recall
|
55 |
value: 0.8463172075485045
|
56 |
+
name: Recall Macro
|
57 |
verified: true
|
58 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNzQ3MjA4MDI1YWZhYTg0NDliYjQ3NGQ5Y2I2NGI1NDNmNTQ3NjdkMmMxYWQ0NDExMzdhNzdmZWFmZTkyNGM5YiIsInZlcnNpb24iOjF9.veXK2iXkDSCDqM3_y3PyGwbZWsQRO_tvNRdmQB3vbvK1Bv4BYYL8WKUfIXm2Apr6IPRA0zeJNvfWIGnigX37Dg
|
59 |
+
- type: recall
|
60 |
value: 0.8467651553744269
|
61 |
+
name: Recall Micro
|
62 |
verified: true
|
63 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiMDdlMzcwMzEyNWYxZGFhY2JkNzZmZWQ5NzU4ODQ2MjU3ODMzZGRmZmNlYTM2YTBkNTI4MjAzM2FkOWUxNDBlZSIsInZlcnNpb24iOjF9.rRyz3xQyJ4plzLAc7bJhSbTWdJB7ioX4qhaX6k0e52JL5RdBfwmMJc9lVPUhE70__10Hk_MdzLor5sFF1yaFAA
|
64 |
+
- type: recall
|
65 |
value: 0.8467651553744269
|
66 |
+
name: Recall Weighted
|
67 |
verified: true
|
68 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiNTc2YzUwMWZjNGYyMjczNzk1YWJkZjkxMDI5NGRjMzdlMTU3YzZlZDQxNmI2YWE3MTQ3ZDVkMDAwY2NlNTA2NSIsInZlcnNpb24iOjF9.j4Kdqqo9LQxsb0A1TEd5K2U7j0qXrv50pbIc9DVdhoIrfIyFiSHuhPHIPZLubr-w0gVjn6aYl-kcM9EiGOSgCg
|
69 |
+
- type: f1
|
70 |
value: 0.8459654597797398
|
71 |
+
name: F1 Macro
|
72 |
verified: true
|
73 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZjcxOWM1YjBiNDVlODZlMjUyZTMwNDUzOTM2MmM4MGNiN2QwOGY1MTE2YjhkZDJjNTlhM2JhMzI4MTcwZjMyYyIsInZlcnNpb24iOjF9.T7zjSHGRWPNMYIiEWGRQTeqY9LHMm0j-3RE3wmYJ5je--eoMhBa7AvRefmSQwZgJtmxwITGGpvXz-0qdfel3Ag
|
74 |
+
- type: f1
|
75 |
value: 0.8467651553744269
|
76 |
+
name: F1 Micro
|
77 |
verified: true
|
78 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiYzIzMjFlYzZmMmEyMDRlNDY5ZmYxOGMxZWM2ZjFjYmZlMTRlOTFiMjg3MWJmNmFjMzdkYTM2ODJlOGEwZWY1MSIsInZlcnNpb24iOjF9.1ZvHppu3JfoorjOpQooRVUFlsR1lLLoW_NoswdSsIUwyArbIDg6KRZLwxf-G40efl7hbdXZbr7Ey1WsyTdc0Dw
|
79 |
+
- type: f1
|
80 |
value: 0.8469586362613581
|
81 |
+
name: F1 Weighted
|
82 |
verified: true
|
83 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDM0MTlhYjZlNzBjNjIwNTQyMWIzN2VlNDU5ZmE5YWRlNGYyMGJmZTA4YzFjMGZmMmJlYTNiMzc0YjVhZjQ1NSIsInZlcnNpb24iOjF9.Na8fUEOkFTbctyzR7oSKJNTn2DCwHs-kEXUOBhz9_nxedczUDKiB1xOR372db9b3ot8ttlmceaNgBOnPIiBCBw
|
84 |
+
- type: loss
|
85 |
value: 0.42515239119529724
|
86 |
+
name: loss
|
87 |
verified: true
|
88 |
+
verifyToken: eyJhbGciOiJFZERTQSIsInR5cCI6IkpXVCJ9.eyJoYXNoIjoiZDg5NWViMWNmYjczN2ZmMjIzODg2ZGYxZmU2ZjdjM2M2MDZjYTI0ZDc4OTUwZDk3YzBiZmFlMjI4ZmQ4Zjg0YSIsInZlcnNpb24iOjF9.4g708h4xeFXdR0vYBgU70gr-I-rLns2RrPWUg4hEQTO4RzQ1fCe-54gH5kH3DTRwLJU4qJYL4SQNZOE-62ahDg
|
89 |
---
|
90 |
|
91 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|