MSey committed on
Commit
9c73c46
·
verified ·
1 Parent(s): 2b1020f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +6 -184
README.md CHANGED
@@ -11,166 +11,38 @@ pipeline_tag: token-classification
11
  We fine-tuned our base model for 71 epochs on the Ca dataset; epoch 61 showed the best results.
12
  ## Metrics
13
  seqeval entity-wise in evaluate
14
- _train_AVGf1 0.9756326545937595
15
-
16
- _train_DIAGNOSIS.avg_tokens_per_entity 6.812357501139991
17
-
18
- _train_DIAGNOSIS.entity_count 8772
19
-
20
- _train_DIAGNOSIS.f1 0.9847202499289974
21
-
22
- _train_DIAGNOSIS.precision 0.9813200498132005
23
-
24
- _train_DIAGNOSIS.recall 0.9881440948472412
25
-
26
- _train_DIAGNOSIS.token_count 59758
27
-
28
- _train_DIAGNOSTIC.avg_tokens_per_entity 5.99338106173173
29
-
30
- _train_DIAGNOSTIC.entity_count 7403
31
-
32
- _train_DIAGNOSTIC.f1 0.9729585006693441
33
-
34
- _train_DIAGNOSTIC.precision 0.9643094069258326
35
-
36
- _train_DIAGNOSTIC.recall 0.9817641496690531
37
-
38
- _train_DIAGNOSTIC.token_count 44369
39
-
40
- _train_DRUG.avg_tokens_per_entity 3.8747056052755533
41
-
42
- _train_DRUG.entity_count 4246
43
-
44
- _train_DRUG.f1 0.9928328046058043
45
-
46
- _train_DRUG.precision 0.9906213364595545
47
-
48
- _train_DRUG.recall 0.9950541686292982
49
-
50
- _train_DRUG.token_count 16452
51
-
52
- _train_MEDICAL_FINDING.avg_tokens_per_entity 8.822587975587586
53
-
54
- _train_MEDICAL_FINDING.entity_count 30804
55
-
56
- _train_MEDICAL_FINDING.f1 0.9658010684140024
57
-
58
- _train_MEDICAL_FINDING.precision 0.9603299419071156
59
-
60
- _train_MEDICAL_FINDING.recall 0.9713348915725231
61
-
62
- _train_MEDICAL_FINDING.token_count 271771
63
-
64
- _train_THERAPY.avg_tokens_per_entity 8.560322448421916
65
-
66
- _train_THERAPY.entity_count 7319
67
-
68
- _train_THERAPY.f1 0.9618506493506493
69
-
70
- _train_THERAPY.precision 0.9524447421299397
71
-
72
- _train_THERAPY.recall 0.9714441863642574
73
-
74
- _train_THERAPY.token_count 62653
75
-
76
- _train_accuracy 0.9938551197147224
77
-
78
- _train_f1 0.9709934550640488
79
-
80
- _train_loss 0.020609384402632713
81
-
82
- _train_precision 0.9651517964122382
83
-
84
- _train_recall 0.9769062585405849
85
-
86
- _train_runtime 142.8691
87
-
88
- _train_samples_per_second 229.063
89
-
90
- _train_steps_per_second 28.635
91
-
92
  eval_AVGf1 0.7889642398534424
93
 
94
- eval_DIAGNOSIS.avg_len 6.790370685982105
95
-
96
- eval_DIAGNOSIS.avg_tokens_per_entity 6.790370685982105
97
-
98
- eval_DIAGNOSIS.count 2347
99
-
100
- eval_DIAGNOSIS.entity_count 2347
101
-
102
  eval_DIAGNOSIS.f1 0.7870941224825319
103
 
104
  eval_DIAGNOSIS.precision 0.760222310440651
105
 
106
  eval_DIAGNOSIS.recall 0.815935236472092
107
 
108
- eval_DIAGNOSIS.token_count 15937
109
-
110
- eval_DIAGNOSTIC.avg_len 6.030130756111427
111
-
112
- eval_DIAGNOSTIC.avg_tokens_per_entity 6.030130756111427
113
-
114
- eval_DIAGNOSTIC.count 1759
115
-
116
- eval_DIAGNOSTIC.entity_count 1759
117
-
118
  eval_DIAGNOSTIC.f1 0.7870518994114499
119
 
120
  eval_DIAGNOSTIC.precision 0.7433046993431026
121
 
122
  eval_DIAGNOSTIC.recall 0.8362706083001705
123
 
124
- eval_DIAGNOSTIC.token_count 10607
125
-
126
- eval_DRUG.avg_len 3.9235500878734624
127
-
128
- eval_DRUG.avg_tokens_per_entity 3.9235500878734624
129
-
130
- eval_DRUG.count 1138
131
-
132
- eval_DRUG.entity_count 1138
133
-
134
  eval_DRUG.f1 0.9196581196581196
135
 
136
  eval_DRUG.precision 0.8951747088186356
137
 
138
  eval_DRUG.recall 0.945518453427065
139
 
140
- eval_DRUG.token_count 4465
141
-
142
- eval_MEDICAL_FINDING.avg_len 8.781120867768594
143
-
144
- eval_MEDICAL_FINDING.avg_tokens_per_entity 8.781120867768594
145
-
146
- eval_MEDICAL_FINDING.count 7744
147
-
148
- eval_MEDICAL_FINDING.entity_count 7744
149
-
150
  eval_MEDICAL_FINDING.f1 0.7699975080986794
151
 
152
  eval_MEDICAL_FINDING.precision 0.7438613384689456
153
 
154
  eval_MEDICAL_FINDING.recall 0.7980371900826446
155
 
156
- eval_MEDICAL_FINDING.token_count 68001
157
-
158
- eval_THERAPY.avg_len 8.44420941300899
159
-
160
- eval_THERAPY.avg_tokens_per_entity 8.44420941300899
161
-
162
- eval_THERAPY.count 1891
163
-
164
- eval_THERAPY.entity_count 1891
165
-
166
  eval_THERAPY.f1 0.6810195496164316
167
 
168
  eval_THERAPY.precision 0.64
169
 
170
  eval_THERAPY.recall 0.7276573241671074
171
 
172
- eval_THERAPY.token_count 15968
173
-
174
  eval_accuracy 0.9332097564796261
175
 
176
  eval_f1 0.7744305184135064
@@ -181,94 +53,44 @@ eval_precision 0.7437801708132195
181
 
182
  eval_recall 0.8077155722830835
183
 
184
- eval_runtime 36.8437
185
 
186
- eval_samples_per_second 222.073
187
 
188
- eval_steps_per_second 27.766
189
 
190
  test_AVGf1 0.7491200818619402
191
 
192
- test_DIAGNOSIS.avg_len 7.408243727598566
193
-
194
- test_DIAGNOSIS.avg_tokens_per_entity 7.408243727598566
195
-
196
- test_DIAGNOSIS.count 2790
197
-
198
- test_DIAGNOSIS.entity_count 2790
199
-
200
  test_DIAGNOSIS.f1 0.703534151254349
201
 
202
  test_DIAGNOSIS.precision 0.7192062897791089
203
 
204
  test_DIAGNOSIS.recall 0.6885304659498208
205
 
206
- test_DIAGNOSIS.token_count 20669
207
-
208
- test_DIAGNOSTIC.avg_len 6.136954503249767
209
-
210
- test_DIAGNOSTIC.avg_tokens_per_entity 6.136954503249767
211
-
212
- test_DIAGNOSTIC.count 2154
213
-
214
- test_DIAGNOSTIC.entity_count 2154
215
-
216
  test_DIAGNOSTIC.f1 0.7718579234972678
217
 
218
  test_DIAGNOSTIC.precision 0.7573726541554959
219
 
220
  test_DIAGNOSTIC.recall 0.786908077994429
221
 
222
- test_DIAGNOSTIC.token_count 13219
223
-
224
- test_DRUG.avg_len 3.7937931034482757
225
-
226
- test_DRUG.avg_tokens_per_entity 3.7937931034482757
227
-
228
- test_DRUG.count 1450
229
-
230
- test_DRUG.entity_count 1450
231
-
232
  test_DRUG.f1 0.9024472008045592
233
 
234
  test_DRUG.precision 0.878016960208741
235
 
236
  test_DRUG.recall 0.9282758620689655
237
 
238
- test_DRUG.token_count 5501
239
-
240
- test_MEDICAL_FINDING.avg_len 9.53191489361702
241
-
242
- test_MEDICAL_FINDING.avg_tokens_per_entity 9.53191489361702
243
-
244
- test_MEDICAL_FINDING.count 8366
245
-
246
- test_MEDICAL_FINDING.entity_count 8366
247
-
248
  test_MEDICAL_FINDING.f1 0.7280362842264404
249
 
250
  test_MEDICAL_FINDING.precision 0.6848203939745076
251
 
252
  test_MEDICAL_FINDING.recall 0.7770738704279225
253
 
254
- test_MEDICAL_FINDING.token_count 79744
255
-
256
- test_THERAPY.avg_len 8.884771802982376
257
-
258
- test_THERAPY.avg_tokens_per_entity 8.884771802982376
259
-
260
- test_THERAPY.count 2213
261
-
262
- test_THERAPY.entity_count 2213
263
-
264
  test_THERAPY.f1 0.639724849527085
265
 
266
  test_THERAPY.precision 0.6100861008610086
267
 
268
  test_THERAPY.recall 0.6723904202440126
269
 
270
- test_THERAPY.token_count 19662
271
-
272
  test_accuracy 0.9229989726085077
273
 
274
  test_f1 0.7327920332701502
@@ -279,8 +101,8 @@ test_precision 0.7048546859693045
279
 
280
  test_recall 0.7630354091792847
281
 
282
- test_runtime 42.7477
283
 
284
- test_samples_per_second 221.977
285
 
286
- test_steps_per_second 27.768
 
11
  We fine-tuned our base model for 71 epochs on the Ca dataset; epoch 61 showed the best results.
12
  ## Metrics
13
  seqeval entity-wise in evaluate
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  eval_AVGf1 0.7889642398534424
15
 
 
 
 
 
 
 
 
 
16
  eval_DIAGNOSIS.f1 0.7870941224825319
17
 
18
  eval_DIAGNOSIS.precision 0.760222310440651
19
 
20
  eval_DIAGNOSIS.recall 0.815935236472092
21
 
 
 
 
 
 
 
 
 
 
 
22
  eval_DIAGNOSTIC.f1 0.7870518994114499
23
 
24
  eval_DIAGNOSTIC.precision 0.7433046993431026
25
 
26
  eval_DIAGNOSTIC.recall 0.8362706083001705
27
 
 
 
 
 
 
 
 
 
 
 
28
  eval_DRUG.f1 0.9196581196581196
29
 
30
  eval_DRUG.precision 0.8951747088186356
31
 
32
  eval_DRUG.recall 0.945518453427065
33
 
 
 
 
 
 
 
 
 
 
 
34
  eval_MEDICAL_FINDING.f1 0.7699975080986794
35
 
36
  eval_MEDICAL_FINDING.precision 0.7438613384689456
37
 
38
  eval_MEDICAL_FINDING.recall 0.7980371900826446
39
 
 
 
 
 
 
 
 
 
 
 
40
  eval_THERAPY.f1 0.6810195496164316
41
 
42
  eval_THERAPY.precision 0.64
43
 
44
  eval_THERAPY.recall 0.7276573241671074
45
 
 
 
46
  eval_accuracy 0.9332097564796261
47
 
48
  eval_f1 0.7744305184135064
 
53
 
54
  eval_recall 0.8077155722830835
55
 
56
+ eval_runtime 50.3125
57
 
58
+ eval_samples_per_second 162.624
59
 
60
+ eval_steps_per_second 20.333
61
 
62
  test_AVGf1 0.7491200818619402
63
 
 
 
 
 
 
 
 
 
64
  test_DIAGNOSIS.f1 0.703534151254349
65
 
66
  test_DIAGNOSIS.precision 0.7192062897791089
67
 
68
  test_DIAGNOSIS.recall 0.6885304659498208
69
 
 
 
 
 
 
 
 
 
 
 
70
  test_DIAGNOSTIC.f1 0.7718579234972678
71
 
72
  test_DIAGNOSTIC.precision 0.7573726541554959
73
 
74
  test_DIAGNOSTIC.recall 0.786908077994429
75
 
 
 
 
 
 
 
 
 
 
 
76
  test_DRUG.f1 0.9024472008045592
77
 
78
  test_DRUG.precision 0.878016960208741
79
 
80
  test_DRUG.recall 0.9282758620689655
81
 
 
 
 
 
 
 
 
 
 
 
82
  test_MEDICAL_FINDING.f1 0.7280362842264404
83
 
84
  test_MEDICAL_FINDING.precision 0.6848203939745076
85
 
86
  test_MEDICAL_FINDING.recall 0.7770738704279225
87
 
 
 
 
 
 
 
 
 
 
 
88
  test_THERAPY.f1 0.639724849527085
89
 
90
  test_THERAPY.precision 0.6100861008610086
91
 
92
  test_THERAPY.recall 0.6723904202440126
93
 
 
 
94
  test_accuracy 0.9229989726085077
95
 
96
  test_f1 0.7327920332701502
 
101
 
102
  test_recall 0.7630354091792847
103
 
104
+ test_runtime 58.5022
105
 
106
+ test_samples_per_second 162.199
107
 
108
+ test_steps_per_second 20.29