Melo1512 committed on
Commit
193ae33
·
verified ·
1 Parent(s): 5c48706

End of training

Browse files
README.md CHANGED
@@ -23,7 +23,7 @@ model-index:
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
- value: 0.8879227053140096
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,8 +33,8 @@ should probably proofread and complete it, then remove this comment. -->
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
- - Loss: 0.3520
37
- - Accuracy: 0.8879
38
 
39
  ## Model description
40
 
 
23
  metrics:
24
  - name: Accuracy
25
  type: accuracy
26
+ value: 0.9497584541062802
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
33
 
34
  This model is a fine-tuned version of [facebook/vit-msn-small](https://huggingface.co/facebook/vit-msn-small) on the imagefolder dataset.
35
  It achieves the following results on the evaluation set:
36
+ - Loss: 0.1871
37
+ - Accuracy: 0.9498
38
 
39
  ## Model description
40
 
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 18.46153846153846,
3
+ "eval_accuracy": 0.9497584541062802,
4
+ "eval_loss": 0.1871330887079239,
5
+ "eval_runtime": 4.3162,
6
+ "eval_samples_per_second": 239.797,
7
+ "eval_steps_per_second": 3.939,
8
+ "total_flos": 2.9458314315627725e+17,
9
+ "train_loss": 0.35900469223658243,
10
+ "train_runtime": 212.0852,
11
+ "train_samples_per_second": 76.856,
12
+ "train_steps_per_second": 0.283
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 18.46153846153846,
3
+ "eval_accuracy": 0.9497584541062802,
4
+ "eval_loss": 0.1871330887079239,
5
+ "eval_runtime": 4.3162,
6
+ "eval_samples_per_second": 239.797,
7
+ "eval_steps_per_second": 3.939
8
+ }
runs/Jan14_17-38-22_c583982b4f3d/events.out.tfevents.1736876536.c583982b4f3d.215.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21caf6cc841fb69179ec969142789a3901dcdcfe6451bd8a6d89dff3e5f75a3b
3
+ size 722
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 18.46153846153846,
3
+ "total_flos": 2.9458314315627725e+17,
4
+ "train_loss": 0.35900469223658243,
5
+ "train_runtime": 212.0852,
6
+ "train_samples_per_second": 76.856,
7
+ "train_steps_per_second": 0.283
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9497584541062802,
3
+ "best_model_checkpoint": "vit-msn-small-corect_deepcleaned_dataset_lateral_flow_ivalidation/checkpoint-22",
4
+ "epoch": 18.46153846153846,
5
+ "eval_steps": 500,
6
+ "global_step": 60,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.9230769230769231,
13
+ "eval_accuracy": 0.8927536231884058,
14
+ "eval_loss": 0.3933483958244324,
15
+ "eval_runtime": 4.3694,
16
+ "eval_samples_per_second": 236.874,
17
+ "eval_steps_per_second": 3.891,
18
+ "step": 3
19
+ },
20
+ {
21
+ "epoch": 1.8461538461538463,
22
+ "eval_accuracy": 0.9188405797101449,
23
+ "eval_loss": 0.4166622459888458,
24
+ "eval_runtime": 4.2818,
25
+ "eval_samples_per_second": 241.72,
26
+ "eval_steps_per_second": 3.97,
27
+ "step": 6
28
+ },
29
+ {
30
+ "epoch": 2.769230769230769,
31
+ "eval_accuracy": 0.4966183574879227,
32
+ "eval_loss": 0.933142364025116,
33
+ "eval_runtime": 4.3066,
34
+ "eval_samples_per_second": 240.328,
35
+ "eval_steps_per_second": 3.947,
36
+ "step": 9
37
+ },
38
+ {
39
+ "epoch": 3.076923076923077,
40
+ "grad_norm": 62.32957458496094,
41
+ "learning_rate": 4.62962962962963e-05,
42
+ "loss": 0.615,
43
+ "step": 10
44
+ },
45
+ {
46
+ "epoch": 4.0,
47
+ "eval_accuracy": 0.9178743961352657,
48
+ "eval_loss": 0.3084805905818939,
49
+ "eval_runtime": 4.3796,
50
+ "eval_samples_per_second": 236.322,
51
+ "eval_steps_per_second": 3.882,
52
+ "step": 13
53
+ },
54
+ {
55
+ "epoch": 4.923076923076923,
56
+ "eval_accuracy": 0.9333333333333333,
57
+ "eval_loss": 0.22097891569137573,
58
+ "eval_runtime": 4.3446,
59
+ "eval_samples_per_second": 238.226,
60
+ "eval_steps_per_second": 3.913,
61
+ "step": 16
62
+ },
63
+ {
64
+ "epoch": 5.846153846153846,
65
+ "eval_accuracy": 0.9391304347826087,
66
+ "eval_loss": 0.21061654388904572,
67
+ "eval_runtime": 4.4485,
68
+ "eval_samples_per_second": 232.66,
69
+ "eval_steps_per_second": 3.821,
70
+ "step": 19
71
+ },
72
+ {
73
+ "epoch": 6.153846153846154,
74
+ "grad_norm": 3.9477076530456543,
75
+ "learning_rate": 3.7037037037037037e-05,
76
+ "loss": 0.3763,
77
+ "step": 20
78
+ },
79
+ {
80
+ "epoch": 6.769230769230769,
81
+ "eval_accuracy": 0.9497584541062802,
82
+ "eval_loss": 0.1871330887079239,
83
+ "eval_runtime": 4.3598,
84
+ "eval_samples_per_second": 237.396,
85
+ "eval_steps_per_second": 3.899,
86
+ "step": 22
87
+ },
88
+ {
89
+ "epoch": 8.0,
90
+ "eval_accuracy": 0.9371980676328503,
91
+ "eval_loss": 0.20427261292934418,
92
+ "eval_runtime": 4.2827,
93
+ "eval_samples_per_second": 241.673,
94
+ "eval_steps_per_second": 3.97,
95
+ "step": 26
96
+ },
97
+ {
98
+ "epoch": 8.923076923076923,
99
+ "eval_accuracy": 0.8888888888888888,
100
+ "eval_loss": 0.31205740571022034,
101
+ "eval_runtime": 4.4195,
102
+ "eval_samples_per_second": 234.192,
103
+ "eval_steps_per_second": 3.847,
104
+ "step": 29
105
+ },
106
+ {
107
+ "epoch": 9.23076923076923,
108
+ "grad_norm": 4.070008754730225,
109
+ "learning_rate": 2.777777777777778e-05,
110
+ "loss": 0.3511,
111
+ "step": 30
112
+ },
113
+ {
114
+ "epoch": 9.846153846153847,
115
+ "eval_accuracy": 0.9314009661835749,
116
+ "eval_loss": 0.20154337584972382,
117
+ "eval_runtime": 4.2969,
118
+ "eval_samples_per_second": 240.871,
119
+ "eval_steps_per_second": 3.956,
120
+ "step": 32
121
+ },
122
+ {
123
+ "epoch": 10.76923076923077,
124
+ "eval_accuracy": 0.8376811594202899,
125
+ "eval_loss": 0.44852134585380554,
126
+ "eval_runtime": 4.3709,
127
+ "eval_samples_per_second": 236.795,
128
+ "eval_steps_per_second": 3.889,
129
+ "step": 35
130
+ },
131
+ {
132
+ "epoch": 12.0,
133
+ "eval_accuracy": 0.9285024154589372,
134
+ "eval_loss": 0.24452261626720428,
135
+ "eval_runtime": 4.3262,
136
+ "eval_samples_per_second": 239.241,
137
+ "eval_steps_per_second": 3.93,
138
+ "step": 39
139
+ },
140
+ {
141
+ "epoch": 12.307692307692308,
142
+ "grad_norm": 7.704187393188477,
143
+ "learning_rate": 1.8518518518518518e-05,
144
+ "loss": 0.2962,
145
+ "step": 40
146
+ },
147
+ {
148
+ "epoch": 12.923076923076923,
149
+ "eval_accuracy": 0.9053140096618357,
150
+ "eval_loss": 0.30447185039520264,
151
+ "eval_runtime": 4.2886,
152
+ "eval_samples_per_second": 241.336,
153
+ "eval_steps_per_second": 3.964,
154
+ "step": 42
155
+ },
156
+ {
157
+ "epoch": 13.846153846153847,
158
+ "eval_accuracy": 0.8714975845410629,
159
+ "eval_loss": 0.3914734721183777,
160
+ "eval_runtime": 4.4006,
161
+ "eval_samples_per_second": 235.195,
162
+ "eval_steps_per_second": 3.863,
163
+ "step": 45
164
+ },
165
+ {
166
+ "epoch": 14.76923076923077,
167
+ "eval_accuracy": 0.893719806763285,
168
+ "eval_loss": 0.31650951504707336,
169
+ "eval_runtime": 4.327,
170
+ "eval_samples_per_second": 239.195,
171
+ "eval_steps_per_second": 3.929,
172
+ "step": 48
173
+ },
174
+ {
175
+ "epoch": 15.384615384615385,
176
+ "grad_norm": 5.901269912719727,
177
+ "learning_rate": 9.259259259259259e-06,
178
+ "loss": 0.2553,
179
+ "step": 50
180
+ },
181
+ {
182
+ "epoch": 16.0,
183
+ "eval_accuracy": 0.9082125603864735,
184
+ "eval_loss": 0.28225788474082947,
185
+ "eval_runtime": 4.4633,
186
+ "eval_samples_per_second": 231.89,
187
+ "eval_steps_per_second": 3.809,
188
+ "step": 52
189
+ },
190
+ {
191
+ "epoch": 16.923076923076923,
192
+ "eval_accuracy": 0.8869565217391304,
193
+ "eval_loss": 0.3504292070865631,
194
+ "eval_runtime": 4.37,
195
+ "eval_samples_per_second": 236.841,
196
+ "eval_steps_per_second": 3.89,
197
+ "step": 55
198
+ },
199
+ {
200
+ "epoch": 17.846153846153847,
201
+ "eval_accuracy": 0.8869565217391304,
202
+ "eval_loss": 0.36792051792144775,
203
+ "eval_runtime": 4.4082,
204
+ "eval_samples_per_second": 234.792,
205
+ "eval_steps_per_second": 3.856,
206
+ "step": 58
207
+ },
208
+ {
209
+ "epoch": 18.46153846153846,
210
+ "grad_norm": 7.85857629776001,
211
+ "learning_rate": 0.0,
212
+ "loss": 0.2601,
213
+ "step": 60
214
+ },
215
+ {
216
+ "epoch": 18.46153846153846,
217
+ "eval_accuracy": 0.8879227053140096,
218
+ "eval_loss": 0.3520191013813019,
219
+ "eval_runtime": 4.3424,
220
+ "eval_samples_per_second": 238.347,
221
+ "eval_steps_per_second": 3.915,
222
+ "step": 60
223
+ },
224
+ {
225
+ "epoch": 18.46153846153846,
226
+ "step": 60,
227
+ "total_flos": 2.9458314315627725e+17,
228
+ "train_loss": 0.35900469223658243,
229
+ "train_runtime": 212.0852,
230
+ "train_samples_per_second": 76.856,
231
+ "train_steps_per_second": 0.283
232
+ }
233
+ ],
234
+ "logging_steps": 10,
235
+ "max_steps": 60,
236
+ "num_input_tokens_seen": 0,
237
+ "num_train_epochs": 20,
238
+ "save_steps": 500,
239
+ "stateful_callbacks": {
240
+ "TrainerControl": {
241
+ "args": {
242
+ "should_epoch_stop": false,
243
+ "should_evaluate": false,
244
+ "should_log": false,
245
+ "should_save": true,
246
+ "should_training_stop": true
247
+ },
248
+ "attributes": {}
249
+ }
250
+ },
251
+ "total_flos": 2.9458314315627725e+17,
252
+ "train_batch_size": 64,
253
+ "trial_name": null,
254
+ "trial_params": null
255
+ }