dvs committed on
Commit
eb4d443
1 Parent(s): e8b5ef6

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ tags:
4
+ - autotrain
5
+ - image-classification
6
+ widget:
7
+ - src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/tiger.jpg
8
+ example_title: Tiger
9
+ - src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/teapot.jpg
10
+ example_title: Teapot
11
+ - src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/palace.jpg
12
+ example_title: Palace
13
+ datasets:
14
+ - autotrain-5ozhd-efa4o/autotrain-data
15
+ ---
16
+
17
+ # Model Trained Using AutoTrain
18
+
19
+ - Problem type: Image Classification
20
+
21
+ ## Validation Metrics
22
+ loss: 0.04287773743271828
23
+
24
+ f1: 1.0
25
+
26
+ precision: 1.0
27
+
28
+ recall: 1.0
29
+
30
+ auc: 1.0
31
+
32
+ accuracy: 1.0
checkpoint-72/config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-base-patch16-224",
3
+ "_num_labels": 2,
4
+ "architectures": [
5
+ "ViTForImageClassification"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.0,
8
+ "encoder_stride": 16,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.0,
11
+ "hidden_size": 768,
12
+ "id2label": {
13
+ "0": "mulder",
14
+ "1": "scully"
15
+ },
16
+ "image_size": 224,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 3072,
19
+ "label2id": {
20
+ "mulder": 0,
21
+ "scully": 1
22
+ },
23
+ "layer_norm_eps": 1e-12,
24
+ "model_type": "vit",
25
+ "num_attention_heads": 12,
26
+ "num_channels": 3,
27
+ "num_hidden_layers": 12,
28
+ "patch_size": 16,
29
+ "problem_type": "single_label_classification",
30
+ "qkv_bias": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.37.0"
33
+ }
checkpoint-72/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:981b48030a011740f8674bba203e9161515fa357d3b4151d614e82314c6311f3
3
+ size 343223968
checkpoint-72/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c351b8d27e95707ad8b35b4baf2eca351e97f2f7b4063e7875700053d4261e2
3
+ size 686568890
checkpoint-72/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b902436ede14f21853f48e294c48e3183ef19dffb39894033493cfce466e974d
3
+ size 14244
checkpoint-72/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2c360eab626edb5c10de58a3359d614f7dd14f014dd86e743cf484d659eb801
3
+ size 1064
checkpoint-72/trainer_state.json ADDED
@@ -0,0 +1,687 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.04287773743271828,
3
+ "best_model_checkpoint": "autotrain-5ozhd-efa4o/checkpoint-72",
4
+ "epoch": 18.0,
5
+ "eval_steps": 500,
6
+ "global_step": 72,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.25,
13
+ "learning_rate": 6.25e-06,
14
+ "loss": 0.6818,
15
+ "step": 1
16
+ },
17
+ {
18
+ "epoch": 0.5,
19
+ "learning_rate": 1.25e-05,
20
+ "loss": 0.8124,
21
+ "step": 2
22
+ },
23
+ {
24
+ "epoch": 0.75,
25
+ "learning_rate": 1.8750000000000002e-05,
26
+ "loss": 0.5196,
27
+ "step": 3
28
+ },
29
+ {
30
+ "epoch": 1.0,
31
+ "learning_rate": 1.8750000000000002e-05,
32
+ "loss": 0.8215,
33
+ "step": 4
34
+ },
35
+ {
36
+ "epoch": 1.0,
37
+ "eval_accuracy": 0.7142857142857143,
38
+ "eval_auc": 0.41666666666666663,
39
+ "eval_f1": 0.75,
40
+ "eval_loss": 0.5936104655265808,
41
+ "eval_precision": 0.75,
42
+ "eval_recall": 0.75,
43
+ "eval_runtime": 0.2459,
44
+ "eval_samples_per_second": 28.47,
45
+ "eval_steps_per_second": 4.067,
46
+ "step": 4
47
+ },
48
+ {
49
+ "epoch": 1.25,
50
+ "learning_rate": 2.5e-05,
51
+ "loss": 0.9638,
52
+ "step": 5
53
+ },
54
+ {
55
+ "epoch": 1.5,
56
+ "learning_rate": 2.5e-05,
57
+ "loss": 0.659,
58
+ "step": 6
59
+ },
60
+ {
61
+ "epoch": 1.75,
62
+ "learning_rate": 3.125e-05,
63
+ "loss": 0.9674,
64
+ "step": 7
65
+ },
66
+ {
67
+ "epoch": 2.0,
68
+ "learning_rate": 3.7500000000000003e-05,
69
+ "loss": 0.9059,
70
+ "step": 8
71
+ },
72
+ {
73
+ "epoch": 2.0,
74
+ "eval_accuracy": 0.7142857142857143,
75
+ "eval_auc": 0.5,
76
+ "eval_f1": 0.75,
77
+ "eval_loss": 0.5316336750984192,
78
+ "eval_precision": 0.75,
79
+ "eval_recall": 0.75,
80
+ "eval_runtime": 0.2429,
81
+ "eval_samples_per_second": 28.813,
82
+ "eval_steps_per_second": 4.116,
83
+ "step": 8
84
+ },
85
+ {
86
+ "epoch": 2.25,
87
+ "learning_rate": 4.375e-05,
88
+ "loss": 0.7961,
89
+ "step": 9
90
+ },
91
+ {
92
+ "epoch": 2.5,
93
+ "learning_rate": 5e-05,
94
+ "loss": 0.6182,
95
+ "step": 10
96
+ },
97
+ {
98
+ "epoch": 2.75,
99
+ "learning_rate": 4.930555555555556e-05,
100
+ "loss": 0.5245,
101
+ "step": 11
102
+ },
103
+ {
104
+ "epoch": 3.0,
105
+ "learning_rate": 4.8611111111111115e-05,
106
+ "loss": 0.3528,
107
+ "step": 12
108
+ },
109
+ {
110
+ "epoch": 3.0,
111
+ "eval_accuracy": 1.0,
112
+ "eval_auc": 0.7500000000000001,
113
+ "eval_f1": 1.0,
114
+ "eval_loss": 0.4492535889148712,
115
+ "eval_precision": 1.0,
116
+ "eval_recall": 1.0,
117
+ "eval_runtime": 0.2334,
118
+ "eval_samples_per_second": 29.991,
119
+ "eval_steps_per_second": 4.284,
120
+ "step": 12
121
+ },
122
+ {
123
+ "epoch": 3.25,
124
+ "learning_rate": 4.791666666666667e-05,
125
+ "loss": 0.5171,
126
+ "step": 13
127
+ },
128
+ {
129
+ "epoch": 3.5,
130
+ "learning_rate": 4.722222222222222e-05,
131
+ "loss": 0.4058,
132
+ "step": 14
133
+ },
134
+ {
135
+ "epoch": 3.75,
136
+ "learning_rate": 4.652777777777778e-05,
137
+ "loss": 0.2961,
138
+ "step": 15
139
+ },
140
+ {
141
+ "epoch": 4.0,
142
+ "learning_rate": 4.5833333333333334e-05,
143
+ "loss": 0.6474,
144
+ "step": 16
145
+ },
146
+ {
147
+ "epoch": 4.0,
148
+ "eval_accuracy": 1.0,
149
+ "eval_auc": 0.9166666666666667,
150
+ "eval_f1": 1.0,
151
+ "eval_loss": 0.348563015460968,
152
+ "eval_precision": 1.0,
153
+ "eval_recall": 1.0,
154
+ "eval_runtime": 0.2304,
155
+ "eval_samples_per_second": 30.388,
156
+ "eval_steps_per_second": 4.341,
157
+ "step": 16
158
+ },
159
+ {
160
+ "epoch": 4.25,
161
+ "learning_rate": 4.5138888888888894e-05,
162
+ "loss": 0.244,
163
+ "step": 17
164
+ },
165
+ {
166
+ "epoch": 4.5,
167
+ "learning_rate": 4.4444444444444447e-05,
168
+ "loss": 0.2783,
169
+ "step": 18
170
+ },
171
+ {
172
+ "epoch": 4.75,
173
+ "learning_rate": 4.375e-05,
174
+ "loss": 0.3117,
175
+ "step": 19
176
+ },
177
+ {
178
+ "epoch": 5.0,
179
+ "learning_rate": 4.305555555555556e-05,
180
+ "loss": 0.178,
181
+ "step": 20
182
+ },
183
+ {
184
+ "epoch": 5.0,
185
+ "eval_accuracy": 1.0,
186
+ "eval_auc": 1.0,
187
+ "eval_f1": 1.0,
188
+ "eval_loss": 0.2634625732898712,
189
+ "eval_precision": 1.0,
190
+ "eval_recall": 1.0,
191
+ "eval_runtime": 0.2419,
192
+ "eval_samples_per_second": 28.936,
193
+ "eval_steps_per_second": 4.134,
194
+ "step": 20
195
+ },
196
+ {
197
+ "epoch": 5.25,
198
+ "learning_rate": 4.236111111111111e-05,
199
+ "loss": 0.2442,
200
+ "step": 21
201
+ },
202
+ {
203
+ "epoch": 5.5,
204
+ "learning_rate": 4.166666666666667e-05,
205
+ "loss": 0.2336,
206
+ "step": 22
207
+ },
208
+ {
209
+ "epoch": 5.75,
210
+ "learning_rate": 4.0972222222222225e-05,
211
+ "loss": 0.1733,
212
+ "step": 23
213
+ },
214
+ {
215
+ "epoch": 6.0,
216
+ "learning_rate": 4.027777777777778e-05,
217
+ "loss": 0.3612,
218
+ "step": 24
219
+ },
220
+ {
221
+ "epoch": 6.0,
222
+ "eval_accuracy": 1.0,
223
+ "eval_auc": 1.0,
224
+ "eval_f1": 1.0,
225
+ "eval_loss": 0.2078421264886856,
226
+ "eval_precision": 1.0,
227
+ "eval_recall": 1.0,
228
+ "eval_runtime": 0.23,
229
+ "eval_samples_per_second": 30.428,
230
+ "eval_steps_per_second": 4.347,
231
+ "step": 24
232
+ },
233
+ {
234
+ "epoch": 6.25,
235
+ "learning_rate": 3.958333333333333e-05,
236
+ "loss": 0.1645,
237
+ "step": 25
238
+ },
239
+ {
240
+ "epoch": 6.5,
241
+ "learning_rate": 3.888888888888889e-05,
242
+ "loss": 0.1022,
243
+ "step": 26
244
+ },
245
+ {
246
+ "epoch": 6.75,
247
+ "learning_rate": 3.8194444444444444e-05,
248
+ "loss": 0.1811,
249
+ "step": 27
250
+ },
251
+ {
252
+ "epoch": 7.0,
253
+ "learning_rate": 3.7500000000000003e-05,
254
+ "loss": 0.044,
255
+ "step": 28
256
+ },
257
+ {
258
+ "epoch": 7.0,
259
+ "eval_accuracy": 1.0,
260
+ "eval_auc": 1.0,
261
+ "eval_f1": 1.0,
262
+ "eval_loss": 0.172084242105484,
263
+ "eval_precision": 1.0,
264
+ "eval_recall": 1.0,
265
+ "eval_runtime": 0.2324,
266
+ "eval_samples_per_second": 30.126,
267
+ "eval_steps_per_second": 4.304,
268
+ "step": 28
269
+ },
270
+ {
271
+ "epoch": 7.25,
272
+ "learning_rate": 3.6805555555555556e-05,
273
+ "loss": 0.217,
274
+ "step": 29
275
+ },
276
+ {
277
+ "epoch": 7.5,
278
+ "learning_rate": 3.611111111111111e-05,
279
+ "loss": 0.1082,
280
+ "step": 30
281
+ },
282
+ {
283
+ "epoch": 7.75,
284
+ "learning_rate": 3.541666666666667e-05,
285
+ "loss": 0.1583,
286
+ "step": 31
287
+ },
288
+ {
289
+ "epoch": 8.0,
290
+ "learning_rate": 3.472222222222222e-05,
291
+ "loss": 0.3623,
292
+ "step": 32
293
+ },
294
+ {
295
+ "epoch": 8.0,
296
+ "eval_accuracy": 1.0,
297
+ "eval_auc": 1.0,
298
+ "eval_f1": 1.0,
299
+ "eval_loss": 0.1323634535074234,
300
+ "eval_precision": 1.0,
301
+ "eval_recall": 1.0,
302
+ "eval_runtime": 0.235,
303
+ "eval_samples_per_second": 29.785,
304
+ "eval_steps_per_second": 4.255,
305
+ "step": 32
306
+ },
307
+ {
308
+ "epoch": 8.25,
309
+ "learning_rate": 3.402777777777778e-05,
310
+ "loss": 0.035,
311
+ "step": 33
312
+ },
313
+ {
314
+ "epoch": 8.5,
315
+ "learning_rate": 3.3333333333333335e-05,
316
+ "loss": 0.1694,
317
+ "step": 34
318
+ },
319
+ {
320
+ "epoch": 8.75,
321
+ "learning_rate": 3.263888888888889e-05,
322
+ "loss": 0.0791,
323
+ "step": 35
324
+ },
325
+ {
326
+ "epoch": 9.0,
327
+ "learning_rate": 3.194444444444444e-05,
328
+ "loss": 0.043,
329
+ "step": 36
330
+ },
331
+ {
332
+ "epoch": 9.0,
333
+ "eval_accuracy": 1.0,
334
+ "eval_auc": 1.0,
335
+ "eval_f1": 1.0,
336
+ "eval_loss": 0.1202654168009758,
337
+ "eval_precision": 1.0,
338
+ "eval_recall": 1.0,
339
+ "eval_runtime": 0.2369,
340
+ "eval_samples_per_second": 29.552,
341
+ "eval_steps_per_second": 4.222,
342
+ "step": 36
343
+ },
344
+ {
345
+ "epoch": 9.25,
346
+ "learning_rate": 3.125e-05,
347
+ "loss": 0.1728,
348
+ "step": 37
349
+ },
350
+ {
351
+ "epoch": 9.5,
352
+ "learning_rate": 3.055555555555556e-05,
353
+ "loss": 0.2055,
354
+ "step": 38
355
+ },
356
+ {
357
+ "epoch": 9.75,
358
+ "learning_rate": 2.9861111111111113e-05,
359
+ "loss": 0.0609,
360
+ "step": 39
361
+ },
362
+ {
363
+ "epoch": 10.0,
364
+ "learning_rate": 2.916666666666667e-05,
365
+ "loss": 0.0123,
366
+ "step": 40
367
+ },
368
+ {
369
+ "epoch": 10.0,
370
+ "eval_accuracy": 1.0,
371
+ "eval_auc": 1.0,
372
+ "eval_f1": 1.0,
373
+ "eval_loss": 0.1008061096072197,
374
+ "eval_precision": 1.0,
375
+ "eval_recall": 1.0,
376
+ "eval_runtime": 0.2372,
377
+ "eval_samples_per_second": 29.514,
378
+ "eval_steps_per_second": 4.216,
379
+ "step": 40
380
+ },
381
+ {
382
+ "epoch": 10.25,
383
+ "learning_rate": 2.8472222222222223e-05,
384
+ "loss": 0.1631,
385
+ "step": 41
386
+ },
387
+ {
388
+ "epoch": 10.5,
389
+ "learning_rate": 2.777777777777778e-05,
390
+ "loss": 0.0666,
391
+ "step": 42
392
+ },
393
+ {
394
+ "epoch": 10.75,
395
+ "learning_rate": 2.7083333333333332e-05,
396
+ "loss": 0.0095,
397
+ "step": 43
398
+ },
399
+ {
400
+ "epoch": 11.0,
401
+ "learning_rate": 2.6388888888888892e-05,
402
+ "loss": 0.0165,
403
+ "step": 44
404
+ },
405
+ {
406
+ "epoch": 11.0,
407
+ "eval_accuracy": 1.0,
408
+ "eval_auc": 1.0,
409
+ "eval_f1": 1.0,
410
+ "eval_loss": 0.086181640625,
411
+ "eval_precision": 1.0,
412
+ "eval_recall": 1.0,
413
+ "eval_runtime": 0.2365,
414
+ "eval_samples_per_second": 29.599,
415
+ "eval_steps_per_second": 4.228,
416
+ "step": 44
417
+ },
418
+ {
419
+ "epoch": 11.25,
420
+ "learning_rate": 2.5694444444444445e-05,
421
+ "loss": 0.0071,
422
+ "step": 45
423
+ },
424
+ {
425
+ "epoch": 11.5,
426
+ "learning_rate": 2.5e-05,
427
+ "loss": 0.0273,
428
+ "step": 46
429
+ },
430
+ {
431
+ "epoch": 11.75,
432
+ "learning_rate": 2.4305555555555558e-05,
433
+ "loss": 0.0077,
434
+ "step": 47
435
+ },
436
+ {
437
+ "epoch": 12.0,
438
+ "learning_rate": 2.361111111111111e-05,
439
+ "loss": 0.0156,
440
+ "step": 48
441
+ },
442
+ {
443
+ "epoch": 12.0,
444
+ "eval_accuracy": 1.0,
445
+ "eval_auc": 1.0,
446
+ "eval_f1": 1.0,
447
+ "eval_loss": 0.0849238708615303,
448
+ "eval_precision": 1.0,
449
+ "eval_recall": 1.0,
450
+ "eval_runtime": 0.2379,
451
+ "eval_samples_per_second": 29.419,
452
+ "eval_steps_per_second": 4.203,
453
+ "step": 48
454
+ },
455
+ {
456
+ "epoch": 12.25,
457
+ "learning_rate": 2.2916666666666667e-05,
458
+ "loss": 0.0043,
459
+ "step": 49
460
+ },
461
+ {
462
+ "epoch": 12.5,
463
+ "learning_rate": 2.2222222222222223e-05,
464
+ "loss": 0.0472,
465
+ "step": 50
466
+ },
467
+ {
468
+ "epoch": 12.75,
469
+ "learning_rate": 2.152777777777778e-05,
470
+ "loss": 0.0095,
471
+ "step": 51
472
+ },
473
+ {
474
+ "epoch": 13.0,
475
+ "learning_rate": 2.0833333333333336e-05,
476
+ "loss": 0.0052,
477
+ "step": 52
478
+ },
479
+ {
480
+ "epoch": 13.0,
481
+ "eval_accuracy": 1.0,
482
+ "eval_auc": 1.0,
483
+ "eval_f1": 1.0,
484
+ "eval_loss": 0.07886940985918045,
485
+ "eval_precision": 1.0,
486
+ "eval_recall": 1.0,
487
+ "eval_runtime": 0.2319,
488
+ "eval_samples_per_second": 30.181,
489
+ "eval_steps_per_second": 4.312,
490
+ "step": 52
491
+ },
492
+ {
493
+ "epoch": 13.25,
494
+ "learning_rate": 2.013888888888889e-05,
495
+ "loss": 0.0147,
496
+ "step": 53
497
+ },
498
+ {
499
+ "epoch": 13.5,
500
+ "learning_rate": 1.9444444444444445e-05,
501
+ "loss": 0.0156,
502
+ "step": 54
503
+ },
504
+ {
505
+ "epoch": 13.75,
506
+ "learning_rate": 1.8750000000000002e-05,
507
+ "loss": 0.0188,
508
+ "step": 55
509
+ },
510
+ {
511
+ "epoch": 14.0,
512
+ "learning_rate": 1.8055555555555555e-05,
513
+ "loss": 0.0017,
514
+ "step": 56
515
+ },
516
+ {
517
+ "epoch": 14.0,
518
+ "eval_accuracy": 1.0,
519
+ "eval_auc": 1.0,
520
+ "eval_f1": 1.0,
521
+ "eval_loss": 0.0678296759724617,
522
+ "eval_precision": 1.0,
523
+ "eval_recall": 1.0,
524
+ "eval_runtime": 0.2316,
525
+ "eval_samples_per_second": 30.221,
526
+ "eval_steps_per_second": 4.317,
527
+ "step": 56
528
+ },
529
+ {
530
+ "epoch": 14.25,
531
+ "learning_rate": 1.736111111111111e-05,
532
+ "loss": 0.0117,
533
+ "step": 57
534
+ },
535
+ {
536
+ "epoch": 14.5,
537
+ "learning_rate": 1.6666666666666667e-05,
538
+ "loss": 0.0072,
539
+ "step": 58
540
+ },
541
+ {
542
+ "epoch": 14.75,
543
+ "learning_rate": 1.597222222222222e-05,
544
+ "loss": 0.004,
545
+ "step": 59
546
+ },
547
+ {
548
+ "epoch": 15.0,
549
+ "learning_rate": 1.527777777777778e-05,
550
+ "loss": 0.0028,
551
+ "step": 60
552
+ },
553
+ {
554
+ "epoch": 15.0,
555
+ "eval_accuracy": 1.0,
556
+ "eval_auc": 1.0,
557
+ "eval_f1": 1.0,
558
+ "eval_loss": 0.05511965602636337,
559
+ "eval_precision": 1.0,
560
+ "eval_recall": 1.0,
561
+ "eval_runtime": 0.2451,
562
+ "eval_samples_per_second": 28.561,
563
+ "eval_steps_per_second": 4.08,
564
+ "step": 60
565
+ },
566
+ {
567
+ "epoch": 15.25,
568
+ "learning_rate": 1.4583333333333335e-05,
569
+ "loss": 0.0099,
570
+ "step": 61
571
+ },
572
+ {
573
+ "epoch": 15.5,
574
+ "learning_rate": 1.388888888888889e-05,
575
+ "loss": 0.0082,
576
+ "step": 62
577
+ },
578
+ {
579
+ "epoch": 15.75,
580
+ "learning_rate": 1.3194444444444446e-05,
581
+ "loss": 0.005,
582
+ "step": 63
583
+ },
584
+ {
585
+ "epoch": 16.0,
586
+ "learning_rate": 1.25e-05,
587
+ "loss": 0.0043,
588
+ "step": 64
589
+ },
590
+ {
591
+ "epoch": 16.0,
592
+ "eval_accuracy": 1.0,
593
+ "eval_auc": 1.0,
594
+ "eval_f1": 1.0,
595
+ "eval_loss": 0.04743194580078125,
596
+ "eval_precision": 1.0,
597
+ "eval_recall": 1.0,
598
+ "eval_runtime": 0.2312,
599
+ "eval_samples_per_second": 30.271,
600
+ "eval_steps_per_second": 4.324,
601
+ "step": 64
602
+ },
603
+ {
604
+ "epoch": 16.25,
605
+ "learning_rate": 1.1805555555555555e-05,
606
+ "loss": 0.2229,
607
+ "step": 65
608
+ },
609
+ {
610
+ "epoch": 16.5,
611
+ "learning_rate": 1.1111111111111112e-05,
612
+ "loss": 0.0214,
613
+ "step": 66
614
+ },
615
+ {
616
+ "epoch": 16.75,
617
+ "learning_rate": 1.0416666666666668e-05,
618
+ "loss": 0.0079,
619
+ "step": 67
620
+ },
621
+ {
622
+ "epoch": 17.0,
623
+ "learning_rate": 9.722222222222223e-06,
624
+ "loss": 0.0022,
625
+ "step": 68
626
+ },
627
+ {
628
+ "epoch": 17.0,
629
+ "eval_accuracy": 1.0,
630
+ "eval_auc": 1.0,
631
+ "eval_f1": 1.0,
632
+ "eval_loss": 0.04407283291220665,
633
+ "eval_precision": 1.0,
634
+ "eval_recall": 1.0,
635
+ "eval_runtime": 0.231,
636
+ "eval_samples_per_second": 30.304,
637
+ "eval_steps_per_second": 4.329,
638
+ "step": 68
639
+ },
640
+ {
641
+ "epoch": 17.25,
642
+ "learning_rate": 9.027777777777777e-06,
643
+ "loss": 0.0155,
644
+ "step": 69
645
+ },
646
+ {
647
+ "epoch": 17.5,
648
+ "learning_rate": 8.333333333333334e-06,
649
+ "loss": 0.0181,
650
+ "step": 70
651
+ },
652
+ {
653
+ "epoch": 17.75,
654
+ "learning_rate": 7.63888888888889e-06,
655
+ "loss": 0.0042,
656
+ "step": 71
657
+ },
658
+ {
659
+ "epoch": 18.0,
660
+ "learning_rate": 6.944444444444445e-06,
661
+ "loss": 0.0035,
662
+ "step": 72
663
+ },
664
+ {
665
+ "epoch": 18.0,
666
+ "eval_accuracy": 1.0,
667
+ "eval_auc": 1.0,
668
+ "eval_f1": 1.0,
669
+ "eval_loss": 0.04287773743271828,
670
+ "eval_precision": 1.0,
671
+ "eval_recall": 1.0,
672
+ "eval_runtime": 0.2292,
673
+ "eval_samples_per_second": 30.539,
674
+ "eval_steps_per_second": 4.363,
675
+ "step": 72
676
+ }
677
+ ],
678
+ "logging_steps": 1,
679
+ "max_steps": 80,
680
+ "num_input_tokens_seen": 0,
681
+ "num_train_epochs": 20,
682
+ "save_steps": 500,
683
+ "total_flos": 3.766110695269171e+16,
684
+ "train_batch_size": 8,
685
+ "trial_name": null,
686
+ "trial_params": null
687
+ }
checkpoint-72/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe5c22cdb148b1741f8bacd35417ccf73ebad1b8a9b96139dfe410e06c0eea57
3
+ size 4728
config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google/vit-base-patch16-224",
3
+ "_num_labels": 2,
4
+ "architectures": [
5
+ "ViTForImageClassification"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.0,
8
+ "encoder_stride": 16,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.0,
11
+ "hidden_size": 768,
12
+ "id2label": {
13
+ "0": "mulder",
14
+ "1": "scully"
15
+ },
16
+ "image_size": 224,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 3072,
19
+ "label2id": {
20
+ "mulder": 0,
21
+ "scully": 1
22
+ },
23
+ "layer_norm_eps": 1e-12,
24
+ "model_type": "vit",
25
+ "num_attention_heads": 12,
26
+ "num_channels": 3,
27
+ "num_hidden_layers": 12,
28
+ "patch_size": 16,
29
+ "problem_type": "single_label_classification",
30
+ "qkv_bias": true,
31
+ "torch_dtype": "float32",
32
+ "transformers_version": "4.37.0"
33
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:981b48030a011740f8674bba203e9161515fa357d3b4151d614e82314c6311f3
3
+ size 343223968
preprocessor_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "do_rescale": true,
4
+ "do_resize": true,
5
+ "image_mean": [
6
+ 0.5,
7
+ 0.5,
8
+ 0.5
9
+ ],
10
+ "image_processor_type": "ViTImageProcessor",
11
+ "image_std": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "resample": 2,
17
+ "rescale_factor": 0.00392156862745098,
18
+ "size": {
19
+ "height": 224,
20
+ "width": 224
21
+ }
22
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe5c22cdb148b1741f8bacd35417ccf73ebad1b8a9b96139dfe410e06c0eea57
3
+ size 4728
training_params.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "data_path": "autotrain-5ozhd-efa4o/autotrain-data",
3
+ "model": "google/vit-base-patch16-224",
4
+ "username": "dvs",
5
+ "lr": 5e-05,
6
+ "epochs": 20,
7
+ "batch_size": 8,
8
+ "warmup_ratio": 0.1,
9
+ "gradient_accumulation": 1,
10
+ "optimizer": "adamw_torch",
11
+ "scheduler": "linear",
12
+ "weight_decay": 0.0,
13
+ "max_grad_norm": 1.0,
14
+ "seed": 42,
15
+ "train_split": "train",
16
+ "valid_split": "validation",
17
+ "logging_steps": -1,
18
+ "project_name": "autotrain-5ozhd-efa4o",
19
+ "auto_find_batch_size": false,
20
+ "mixed_precision": "fp16",
21
+ "save_total_limit": 1,
22
+ "save_strategy": "epoch",
23
+ "push_to_hub": true,
24
+ "repo_id": "dvs/autotrain-5ozhd-efa4o",
25
+ "evaluation_strategy": "epoch",
26
+ "image_column": "autotrain_image",
27
+ "target_column": "autotrain_label",
28
+ "log": "none"
29
+ }