SerdarHelli commited on
Commit
15de256
·
1 Parent(s): 6a33562

ThyroidTumorClassification

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 19.73,
3
- "eval_f1": 0.9312977099236641,
4
- "eval_loss": 0.5987359285354614,
5
- "eval_runtime": 0.4648,
6
- "eval_samples_per_second": 176.425,
7
- "eval_steps_per_second": 6.455,
8
- "total_flos": 1.620732679243776e+17,
9
- "train_loss": 0.8578881025314331,
10
- "train_runtime": 102.9255,
11
- "train_samples_per_second": 63.347,
12
- "train_steps_per_second": 0.389
13
  }
 
1
  {
2
+ "epoch": 30.0,
3
+ "eval_f1": 0.8837209302325582,
4
+ "eval_loss": 0.5682619214057922,
5
+ "eval_runtime": 0.6789,
6
+ "eval_samples_per_second": 139.94,
7
+ "eval_steps_per_second": 4.419,
8
+ "total_flos": 2.8570124903878656e+17,
9
+ "train_loss": 0.5013438595665826,
10
+ "train_runtime": 222.831,
11
+ "train_samples_per_second": 51.025,
12
+ "train_steps_per_second": 0.404
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 19.73,
3
- "eval_f1": 0.9312977099236641,
4
- "eval_loss": 0.5987359285354614,
5
- "eval_runtime": 0.4648,
6
- "eval_samples_per_second": 176.425,
7
- "eval_steps_per_second": 6.455
8
  }
 
1
  {
2
+ "epoch": 30.0,
3
+ "eval_f1": 0.8837209302325582,
4
+ "eval_loss": 0.5682619214057922,
5
+ "eval_runtime": 0.6789,
6
+ "eval_samples_per_second": 139.94,
7
+ "eval_steps_per_second": 4.419
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ce7c3b86954dad0996ccf49be4284947b73504f1521f15cd9a889bf12083e90
3
  size 111347349
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f5768f543feec39b661a0d3347394478b69fe2fb6010928ea157000d3c03bb2
3
  size 111347349
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 19.73,
3
- "total_flos": 1.620732679243776e+17,
4
- "train_loss": 0.8578881025314331,
5
- "train_runtime": 102.9255,
6
- "train_samples_per_second": 63.347,
7
- "train_steps_per_second": 0.389
8
  }
 
1
  {
2
+ "epoch": 30.0,
3
+ "total_flos": 2.8570124903878656e+17,
4
+ "train_loss": 0.5013438595665826,
5
+ "train_runtime": 222.831,
6
+ "train_samples_per_second": 51.025,
7
+ "train_steps_per_second": 0.404
8
  }
trainer_state.json CHANGED
@@ -1,211 +1,313 @@
1
  {
2
- "best_metric": 0.9312977099236641,
3
- "best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-36",
4
- "epoch": 19.727272727272727,
5
- "global_step": 40,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.73,
12
- "eval_f1": 0.08695652173913043,
13
- "eval_loss": 0.729124128818512,
14
- "eval_runtime": 0.5602,
15
- "eval_samples_per_second": 146.387,
16
- "eval_steps_per_second": 5.356,
17
- "step": 2
18
- },
19
- {
20
- "epoch": 1.73,
21
- "eval_f1": 0.24,
22
- "eval_loss": 0.715528666973114,
23
- "eval_runtime": 0.4576,
24
- "eval_samples_per_second": 179.212,
25
- "eval_steps_per_second": 6.557,
26
- "step": 4
27
- },
28
- {
29
- "epoch": 2.73,
30
- "eval_f1": 0.4651162790697675,
31
- "eval_loss": 0.6962855458259583,
32
- "eval_runtime": 0.4553,
33
- "eval_samples_per_second": 180.089,
34
- "eval_steps_per_second": 6.589,
35
- "step": 6
36
  },
37
  {
38
- "epoch": 3.73,
39
- "eval_f1": 0.6732673267326733,
40
- "eval_loss": 0.6805053353309631,
41
- "eval_runtime": 0.456,
42
- "eval_samples_per_second": 179.84,
43
- "eval_steps_per_second": 6.58,
44
- "step": 8
45
  },
46
  {
47
- "epoch": 4.73,
48
- "eval_f1": 0.8035714285714285,
49
- "eval_loss": 0.6671938896179199,
50
- "eval_runtime": 0.4582,
51
- "eval_samples_per_second": 178.951,
52
- "eval_steps_per_second": 6.547,
53
- "step": 10
54
  },
55
  {
56
- "epoch": 5.73,
57
- "eval_f1": 0.8666666666666666,
58
- "eval_loss": 0.6562464237213135,
59
- "eval_runtime": 0.4523,
60
- "eval_samples_per_second": 181.301,
61
- "eval_steps_per_second": 6.633,
62
  "step": 12
63
  },
64
  {
65
- "epoch": 6.73,
66
- "eval_f1": 0.8688524590163934,
67
- "eval_loss": 0.6468915343284607,
68
- "eval_runtime": 0.4563,
69
- "eval_samples_per_second": 179.688,
70
- "eval_steps_per_second": 6.574,
71
- "step": 14
72
  },
73
  {
74
- "epoch": 7.73,
75
- "eval_f1": 0.9047619047619049,
76
- "eval_loss": 0.6390055418014526,
77
- "eval_runtime": 0.4554,
78
- "eval_samples_per_second": 180.045,
79
- "eval_steps_per_second": 6.587,
80
- "step": 16
81
  },
82
  {
83
- "epoch": 8.73,
84
- "eval_f1": 0.9218749999999999,
85
- "eval_loss": 0.6321854591369629,
86
- "eval_runtime": 0.4533,
87
- "eval_samples_per_second": 180.88,
88
- "eval_steps_per_second": 6.618,
89
- "step": 18
90
  },
91
  {
92
- "epoch": 9.73,
93
- "eval_f1": 0.9218749999999999,
94
- "eval_loss": 0.6260910034179688,
95
- "eval_runtime": 0.4585,
96
- "eval_samples_per_second": 178.853,
97
- "eval_steps_per_second": 6.543,
98
- "step": 20
99
  },
100
  {
101
- "epoch": 10.73,
102
- "eval_f1": 0.9147286821705426,
103
- "eval_loss": 0.6207503080368042,
104
- "eval_runtime": 0.4613,
105
- "eval_samples_per_second": 177.741,
106
- "eval_steps_per_second": 6.503,
107
- "step": 22
108
  },
109
  {
110
- "epoch": 11.73,
111
- "eval_f1": 0.9147286821705426,
112
- "eval_loss": 0.6160098910331726,
113
- "eval_runtime": 0.4683,
114
- "eval_samples_per_second": 175.09,
115
- "eval_steps_per_second": 6.406,
116
- "step": 24
117
  },
118
  {
119
- "epoch": 12.36,
120
- "learning_rate": 4.166666666666667e-06,
121
- "loss": 0.8937,
122
- "step": 25
 
 
 
 
 
 
 
 
 
 
 
 
123
  },
124
  {
125
- "epoch": 12.73,
126
- "eval_f1": 0.9147286821705426,
127
- "eval_loss": 0.6118525862693787,
128
- "eval_runtime": 0.4721,
129
- "eval_samples_per_second": 173.678,
130
- "eval_steps_per_second": 6.354,
131
- "step": 26
132
  },
133
  {
134
- "epoch": 13.73,
135
- "eval_f1": 0.9147286821705426,
136
- "eval_loss": 0.6081259846687317,
137
- "eval_runtime": 0.4553,
138
- "eval_samples_per_second": 180.118,
139
- "eval_steps_per_second": 6.59,
140
- "step": 28
141
  },
142
  {
143
- "epoch": 14.73,
144
- "eval_f1": 0.923076923076923,
145
- "eval_loss": 0.6047901511192322,
146
- "eval_runtime": 0.4555,
147
- "eval_samples_per_second": 180.011,
148
- "eval_steps_per_second": 6.586,
149
- "step": 30
150
  },
151
  {
152
- "epoch": 15.73,
153
- "eval_f1": 0.923076923076923,
154
- "eval_loss": 0.6022080183029175,
155
- "eval_runtime": 0.4519,
156
- "eval_samples_per_second": 181.441,
157
- "eval_steps_per_second": 6.638,
158
- "step": 32
159
  },
160
  {
161
- "epoch": 16.73,
162
- "eval_f1": 0.923076923076923,
163
- "eval_loss": 0.6001817584037781,
164
- "eval_runtime": 0.4544,
165
- "eval_samples_per_second": 180.453,
166
- "eval_steps_per_second": 6.602,
167
- "step": 34
168
  },
169
  {
170
- "epoch": 17.73,
171
- "eval_f1": 0.9312977099236641,
172
- "eval_loss": 0.5987359285354614,
173
- "eval_runtime": 0.4559,
174
- "eval_samples_per_second": 179.858,
175
- "eval_steps_per_second": 6.58,
176
- "step": 36
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
177
  },
178
  {
179
- "epoch": 18.73,
180
- "eval_f1": 0.9312977099236641,
181
- "eval_loss": 0.5978376269340515,
182
- "eval_runtime": 0.4536,
183
- "eval_samples_per_second": 180.765,
184
- "eval_steps_per_second": 6.613,
185
- "step": 38
186
  },
187
  {
188
- "epoch": 19.73,
189
- "eval_f1": 0.9312977099236641,
190
- "eval_loss": 0.5974743962287903,
191
- "eval_runtime": 0.4555,
192
- "eval_samples_per_second": 180.031,
193
- "eval_steps_per_second": 6.586,
194
- "step": 40
195
  },
196
  {
197
- "epoch": 19.73,
198
- "step": 40,
199
- "total_flos": 1.620732679243776e+17,
200
- "train_loss": 0.8578881025314331,
201
- "train_runtime": 102.9255,
202
- "train_samples_per_second": 63.347,
203
- "train_steps_per_second": 0.389
204
  }
205
  ],
206
- "max_steps": 40,
207
- "num_train_epochs": 20,
208
- "total_flos": 1.620732679243776e+17,
209
  "trial_name": null,
210
  "trial_params": null
211
  }
 
1
  {
2
+ "best_metric": 0.8837209302325582,
3
+ "best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-27",
4
+ "epoch": 30.0,
5
+ "global_step": 90,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 1.0,
12
+ "eval_f1": 0.5052631578947367,
13
+ "eval_loss": 0.687919557094574,
14
+ "eval_runtime": 0.6589,
15
+ "eval_samples_per_second": 144.182,
16
+ "eval_steps_per_second": 4.553,
17
+ "step": 3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
18
  },
19
  {
20
+ "epoch": 2.0,
21
+ "eval_f1": 0.673076923076923,
22
+ "eval_loss": 0.6748365759849548,
23
+ "eval_runtime": 0.6341,
24
+ "eval_samples_per_second": 149.822,
25
+ "eval_steps_per_second": 4.731,
26
+ "step": 6
27
  },
28
  {
29
+ "epoch": 3.0,
30
+ "eval_f1": 0.8034188034188033,
31
+ "eval_loss": 0.6552020311355591,
32
+ "eval_runtime": 0.6415,
33
+ "eval_samples_per_second": 148.089,
34
+ "eval_steps_per_second": 4.676,
35
+ "step": 9
36
  },
37
  {
38
+ "epoch": 4.0,
39
+ "eval_f1": 0.88,
40
+ "eval_loss": 0.6357027888298035,
41
+ "eval_runtime": 0.6465,
42
+ "eval_samples_per_second": 146.936,
43
+ "eval_steps_per_second": 4.64,
44
  "step": 12
45
  },
46
  {
47
+ "epoch": 5.0,
48
+ "eval_f1": 0.8615384615384616,
49
+ "eval_loss": 0.6192407011985779,
50
+ "eval_runtime": 0.6387,
51
+ "eval_samples_per_second": 148.729,
52
+ "eval_steps_per_second": 4.697,
53
+ "step": 15
54
  },
55
  {
56
+ "epoch": 6.0,
57
+ "eval_f1": 0.8769230769230769,
58
+ "eval_loss": 0.604374349117279,
59
+ "eval_runtime": 0.645,
60
+ "eval_samples_per_second": 147.298,
61
+ "eval_steps_per_second": 4.652,
62
+ "step": 18
63
  },
64
  {
65
+ "epoch": 7.0,
66
+ "eval_f1": 0.8769230769230769,
67
+ "eval_loss": 0.5909456014633179,
68
+ "eval_runtime": 0.6526,
69
+ "eval_samples_per_second": 145.576,
70
+ "eval_steps_per_second": 4.597,
71
+ "step": 21
72
  },
73
  {
74
+ "epoch": 8.0,
75
+ "eval_f1": 0.8769230769230769,
76
+ "eval_loss": 0.5791701674461365,
77
+ "eval_runtime": 0.6491,
78
+ "eval_samples_per_second": 146.347,
79
+ "eval_steps_per_second": 4.621,
80
+ "step": 24
81
  },
82
  {
83
+ "epoch": 8.33,
84
+ "learning_rate": 8.024691358024692e-06,
85
+ "loss": 0.638,
86
+ "step": 25
 
 
 
87
  },
88
  {
89
+ "epoch": 9.0,
90
+ "eval_f1": 0.8837209302325582,
91
+ "eval_loss": 0.5682619214057922,
92
+ "eval_runtime": 0.6497,
93
+ "eval_samples_per_second": 146.222,
94
+ "eval_steps_per_second": 4.618,
95
+ "step": 27
96
  },
97
  {
98
+ "epoch": 10.0,
99
+ "eval_f1": 0.8837209302325582,
100
+ "eval_loss": 0.5576053261756897,
101
+ "eval_runtime": 0.653,
102
+ "eval_samples_per_second": 145.478,
103
+ "eval_steps_per_second": 4.594,
104
+ "step": 30
105
+ },
106
+ {
107
+ "epoch": 11.0,
108
+ "eval_f1": 0.8837209302325582,
109
+ "eval_loss": 0.5474461913108826,
110
+ "eval_runtime": 0.651,
111
+ "eval_samples_per_second": 145.928,
112
+ "eval_steps_per_second": 4.608,
113
+ "step": 33
114
  },
115
  {
116
+ "epoch": 12.0,
117
+ "eval_f1": 0.8837209302325582,
118
+ "eval_loss": 0.5376133322715759,
119
+ "eval_runtime": 0.6594,
120
+ "eval_samples_per_second": 144.075,
121
+ "eval_steps_per_second": 4.55,
122
+ "step": 36
123
  },
124
  {
125
+ "epoch": 13.0,
126
+ "eval_f1": 0.8837209302325582,
127
+ "eval_loss": 0.5282223224639893,
128
+ "eval_runtime": 0.6631,
129
+ "eval_samples_per_second": 143.267,
130
+ "eval_steps_per_second": 4.524,
131
+ "step": 39
132
  },
133
  {
134
+ "epoch": 14.0,
135
+ "eval_f1": 0.8837209302325582,
136
+ "eval_loss": 0.5196569561958313,
137
+ "eval_runtime": 0.6551,
138
+ "eval_samples_per_second": 145.016,
139
+ "eval_steps_per_second": 4.579,
140
+ "step": 42
141
  },
142
  {
143
+ "epoch": 15.0,
144
+ "eval_f1": 0.8837209302325582,
145
+ "eval_loss": 0.5118635296821594,
146
+ "eval_runtime": 0.6658,
147
+ "eval_samples_per_second": 142.69,
148
+ "eval_steps_per_second": 4.506,
149
+ "step": 45
150
  },
151
  {
152
+ "epoch": 16.0,
153
+ "eval_f1": 0.8837209302325582,
154
+ "eval_loss": 0.5053044557571411,
155
+ "eval_runtime": 0.6565,
156
+ "eval_samples_per_second": 144.71,
157
+ "eval_steps_per_second": 4.57,
158
+ "step": 48
159
  },
160
  {
161
+ "epoch": 16.67,
162
+ "learning_rate": 4.938271604938272e-06,
163
+ "loss": 0.4926,
164
+ "step": 50
165
+ },
166
+ {
167
+ "epoch": 17.0,
168
+ "eval_f1": 0.8837209302325582,
169
+ "eval_loss": 0.49933797121047974,
170
+ "eval_runtime": 0.6612,
171
+ "eval_samples_per_second": 143.679,
172
+ "eval_steps_per_second": 4.537,
173
+ "step": 51
174
+ },
175
+ {
176
+ "epoch": 18.0,
177
+ "eval_f1": 0.8837209302325582,
178
+ "eval_loss": 0.4940946102142334,
179
+ "eval_runtime": 0.661,
180
+ "eval_samples_per_second": 143.726,
181
+ "eval_steps_per_second": 4.539,
182
+ "step": 54
183
+ },
184
+ {
185
+ "epoch": 19.0,
186
+ "eval_f1": 0.8837209302325582,
187
+ "eval_loss": 0.4895910918712616,
188
+ "eval_runtime": 0.6623,
189
+ "eval_samples_per_second": 143.44,
190
+ "eval_steps_per_second": 4.53,
191
+ "step": 57
192
+ },
193
+ {
194
+ "epoch": 20.0,
195
+ "eval_f1": 0.8837209302325582,
196
+ "eval_loss": 0.4853971004486084,
197
+ "eval_runtime": 0.6837,
198
+ "eval_samples_per_second": 138.946,
199
+ "eval_steps_per_second": 4.388,
200
+ "step": 60
201
+ },
202
+ {
203
+ "epoch": 21.0,
204
+ "eval_f1": 0.8837209302325582,
205
+ "eval_loss": 0.48188260197639465,
206
+ "eval_runtime": 0.6669,
207
+ "eval_samples_per_second": 142.45,
208
+ "eval_steps_per_second": 4.498,
209
+ "step": 63
210
+ },
211
+ {
212
+ "epoch": 22.0,
213
+ "eval_f1": 0.8837209302325582,
214
+ "eval_loss": 0.4790306091308594,
215
+ "eval_runtime": 0.6675,
216
+ "eval_samples_per_second": 142.322,
217
+ "eval_steps_per_second": 4.494,
218
+ "step": 66
219
+ },
220
+ {
221
+ "epoch": 23.0,
222
+ "eval_f1": 0.8837209302325582,
223
+ "eval_loss": 0.47673219442367554,
224
+ "eval_runtime": 0.6755,
225
+ "eval_samples_per_second": 140.639,
226
+ "eval_steps_per_second": 4.441,
227
+ "step": 69
228
+ },
229
+ {
230
+ "epoch": 24.0,
231
+ "eval_f1": 0.8837209302325582,
232
+ "eval_loss": 0.4748006761074066,
233
+ "eval_runtime": 0.6675,
234
+ "eval_samples_per_second": 142.313,
235
+ "eval_steps_per_second": 4.494,
236
+ "step": 72
237
+ },
238
+ {
239
+ "epoch": 25.0,
240
+ "learning_rate": 1.8518518518518519e-06,
241
+ "loss": 0.4289,
242
+ "step": 75
243
+ },
244
+ {
245
+ "epoch": 25.0,
246
+ "eval_f1": 0.8837209302325582,
247
+ "eval_loss": 0.4731859564781189,
248
+ "eval_runtime": 0.6627,
249
+ "eval_samples_per_second": 143.353,
250
+ "eval_steps_per_second": 4.527,
251
+ "step": 75
252
+ },
253
+ {
254
+ "epoch": 26.0,
255
+ "eval_f1": 0.8837209302325582,
256
+ "eval_loss": 0.4718676507472992,
257
+ "eval_runtime": 0.6719,
258
+ "eval_samples_per_second": 141.397,
259
+ "eval_steps_per_second": 4.465,
260
+ "step": 78
261
+ },
262
+ {
263
+ "epoch": 27.0,
264
+ "eval_f1": 0.8837209302325582,
265
+ "eval_loss": 0.4708217680454254,
266
+ "eval_runtime": 0.68,
267
+ "eval_samples_per_second": 139.706,
268
+ "eval_steps_per_second": 4.412,
269
+ "step": 81
270
+ },
271
+ {
272
+ "epoch": 28.0,
273
+ "eval_f1": 0.8837209302325582,
274
+ "eval_loss": 0.47011542320251465,
275
+ "eval_runtime": 0.6739,
276
+ "eval_samples_per_second": 140.966,
277
+ "eval_steps_per_second": 4.452,
278
+ "step": 84
279
  },
280
  {
281
+ "epoch": 29.0,
282
+ "eval_f1": 0.8837209302325582,
283
+ "eval_loss": 0.4697326123714447,
284
+ "eval_runtime": 0.6728,
285
+ "eval_samples_per_second": 141.199,
286
+ "eval_steps_per_second": 4.459,
287
+ "step": 87
288
  },
289
  {
290
+ "epoch": 30.0,
291
+ "eval_f1": 0.8837209302325582,
292
+ "eval_loss": 0.4695647060871124,
293
+ "eval_runtime": 0.6801,
294
+ "eval_samples_per_second": 139.689,
295
+ "eval_steps_per_second": 4.411,
296
+ "step": 90
297
  },
298
  {
299
+ "epoch": 30.0,
300
+ "step": 90,
301
+ "total_flos": 2.8570124903878656e+17,
302
+ "train_loss": 0.5013438595665826,
303
+ "train_runtime": 222.831,
304
+ "train_samples_per_second": 51.025,
305
+ "train_steps_per_second": 0.404
306
  }
307
  ],
308
+ "max_steps": 90,
309
+ "num_train_epochs": 30,
310
+ "total_flos": 2.8570124903878656e+17,
311
  "trial_name": null,
312
  "trial_params": null
313
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98064b8c1615330c92e0bd8f4b34a86ff482df6adfeb93cfdfa4d377fa744a73
3
  size 3311
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6605b4550676653f6a9e7bbcb528bc7fd05170d1b839094df3e2a84195ed6b46
3
  size 3311