Bisher commited on
Commit
e784ba7
1 Parent(s): c170167

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +8 -0
  2. train_results.json +8 -0
  3. trainer_state.json +311 -0
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 0.48959608323133413,
3
+ "total_flos": 1.6503006591246067e+18,
4
+ "train_loss": 0.018675562590360642,
5
+ "train_runtime": 8627.3162,
6
+ "train_samples_per_second": 43.148,
7
+ "train_steps_per_second": 0.071
8
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 0.48959608323133413,
3
+ "total_flos": 1.6503006591246067e+18,
4
+ "train_loss": 0.018675562590360642,
5
+ "train_runtime": 8627.3162,
6
+ "train_samples_per_second": 43.148,
7
+ "train_steps_per_second": 0.071
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,311 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.06726457399116248,
3
+ "best_model_checkpoint": "/kaggle/working/wav2vec2_ASV_deepfake_audio_detection_DF_finetune_frozen/checkpoint-50",
4
+ "epoch": 0.48959608323133413,
5
+ "eval_steps": 10,
6
+ "global_step": 100,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.04895960832313342,
13
+ "grad_norm": 77894.5078125,
14
+ "learning_rate": 4.838709677419355e-06,
15
+ "loss": 0.025,
16
+ "step": 10
17
+ },
18
+ {
19
+ "epoch": 0.04895960832313342,
20
+ "eval_EER": 0.08262155976067725,
21
+ "eval_FN": 1699,
22
+ "eval_FP": 17,
23
+ "eval_TN": 17896,
24
+ "eval_TP": 308,
25
+ "eval_accuracy": 0.9138554216867469,
26
+ "eval_auc_roc": 0.9731609967469688,
27
+ "eval_f1": 0.8847202256623079,
28
+ "eval_loss": 0.35726311802864075,
29
+ "eval_min_tDCF": 0.03291284056297015,
30
+ "eval_precision": 0.9167599198883981,
31
+ "eval_recall": 0.9138554216867469,
32
+ "eval_runtime": 546.0537,
33
+ "eval_samples_per_second": 36.48,
34
+ "eval_steps_per_second": 0.242,
35
+ "step": 10
36
+ },
37
+ {
38
+ "epoch": 0.09791921664626684,
39
+ "grad_norm": 27190.29296875,
40
+ "learning_rate": 9.67741935483871e-06,
41
+ "loss": 0.0219,
42
+ "step": 20
43
+ },
44
+ {
45
+ "epoch": 0.09791921664626684,
46
+ "eval_EER": 0.07573492775282602,
47
+ "eval_FN": 1668,
48
+ "eval_FP": 22,
49
+ "eval_TN": 17891,
50
+ "eval_TP": 339,
51
+ "eval_accuracy": 0.9151606425702812,
52
+ "eval_auc_roc": 0.9758758569313771,
53
+ "eval_f1": 0.8875379989575978,
54
+ "eval_loss": 0.3001716732978821,
55
+ "eval_min_tDCF": 0.03205938818890207,
56
+ "eval_precision": 0.917171754233548,
57
+ "eval_recall": 0.9151606425702812,
58
+ "eval_runtime": 554.4205,
59
+ "eval_samples_per_second": 35.929,
60
+ "eval_steps_per_second": 0.238,
61
+ "step": 20
62
+ },
63
+ {
64
+ "epoch": 0.14687882496940025,
65
+ "grad_norm": 95780.625,
66
+ "learning_rate": 1.4516129032258065e-05,
67
+ "loss": 0.0193,
68
+ "step": 30
69
+ },
70
+ {
71
+ "epoch": 0.14687882496940025,
72
+ "eval_EER": 0.07095405571220935,
73
+ "eval_FN": 1653,
74
+ "eval_FP": 23,
75
+ "eval_TN": 17890,
76
+ "eval_TP": 354,
77
+ "eval_accuracy": 0.915863453815261,
78
+ "eval_auc_roc": 0.9540513467197973,
79
+ "eval_f1": 0.8889310464970523,
80
+ "eval_loss": 0.3557206988334656,
81
+ "eval_min_tDCF": 0.03200446819985352,
82
+ "eval_precision": 0.9177925127856772,
83
+ "eval_recall": 0.915863453815261,
84
+ "eval_runtime": 551.47,
85
+ "eval_samples_per_second": 36.122,
86
+ "eval_steps_per_second": 0.239,
87
+ "step": 30
88
+ },
89
+ {
90
+ "epoch": 0.19583843329253367,
91
+ "grad_norm": 40466.99609375,
92
+ "learning_rate": 1.935483870967742e-05,
93
+ "loss": 0.0197,
94
+ "step": 40
95
+ },
96
+ {
97
+ "epoch": 0.19583843329253367,
98
+ "eval_EER": 0.08021923268560038,
99
+ "eval_FN": 1584,
100
+ "eval_FP": 28,
101
+ "eval_TN": 17885,
102
+ "eval_TP": 423,
103
+ "eval_accuracy": 0.9190763052208836,
104
+ "eval_auc_roc": 0.9453176234544026,
105
+ "eval_f1": 0.8951467366785592,
106
+ "eval_loss": 0.39631858468055725,
107
+ "eval_min_tDCF": 0.03254273666351324,
108
+ "eval_precision": 0.920581989378439,
109
+ "eval_recall": 0.9190763052208836,
110
+ "eval_runtime": 551.299,
111
+ "eval_samples_per_second": 36.133,
112
+ "eval_steps_per_second": 0.239,
113
+ "step": 40
114
+ },
115
+ {
116
+ "epoch": 0.24479804161566707,
117
+ "grad_norm": 28958.201171875,
118
+ "learning_rate": 2.4193548387096773e-05,
119
+ "loss": 0.0181,
120
+ "step": 50
121
+ },
122
+ {
123
+ "epoch": 0.24479804161566707,
124
+ "eval_EER": 0.06726457399116248,
125
+ "eval_FN": 1661,
126
+ "eval_FP": 22,
127
+ "eval_TN": 17891,
128
+ "eval_TP": 346,
129
+ "eval_accuracy": 0.9155120481927711,
130
+ "eval_auc_roc": 0.9793639834408634,
131
+ "eval_f1": 0.8882073263221536,
132
+ "eval_loss": 0.35242822766304016,
133
+ "eval_min_tDCF": 0.03236891446008307,
134
+ "eval_precision": 0.9175830413065126,
135
+ "eval_recall": 0.9155120481927711,
136
+ "eval_runtime": 550.223,
137
+ "eval_samples_per_second": 36.204,
138
+ "eval_steps_per_second": 0.24,
139
+ "step": 50
140
+ },
141
+ {
142
+ "epoch": 0.2937576499388005,
143
+ "grad_norm": 46908.421875,
144
+ "learning_rate": 2.903225806451613e-05,
145
+ "loss": 0.0152,
146
+ "step": 60
147
+ },
148
+ {
149
+ "epoch": 0.2937576499388005,
150
+ "eval_EER": 0.08570004982564361,
151
+ "eval_FN": 1888,
152
+ "eval_FP": 5,
153
+ "eval_TN": 17908,
154
+ "eval_TP": 119,
155
+ "eval_accuracy": 0.9049698795180723,
156
+ "eval_auc_roc": 0.9581749145672833,
157
+ "eval_f1": 0.8653571590111583,
158
+ "eval_loss": 0.5160898566246033,
159
+ "eval_min_tDCF": 0.031358433391353344,
160
+ "eval_precision": 0.9101736730881184,
161
+ "eval_recall": 0.9049698795180723,
162
+ "eval_runtime": 552.7337,
163
+ "eval_samples_per_second": 36.039,
164
+ "eval_steps_per_second": 0.239,
165
+ "step": 60
166
+ },
167
+ {
168
+ "epoch": 0.3427172582619339,
169
+ "grad_norm": 120295.6171875,
170
+ "learning_rate": 2.9563636363636365e-05,
171
+ "loss": 0.0155,
172
+ "step": 70
173
+ },
174
+ {
175
+ "epoch": 0.3427172582619339,
176
+ "eval_EER": 0.13951170901879414,
177
+ "eval_FN": 1917,
178
+ "eval_FP": 1,
179
+ "eval_TN": 17912,
180
+ "eval_TP": 90,
181
+ "eval_accuracy": 0.903714859437751,
182
+ "eval_auc_roc": 0.9383886286903336,
183
+ "eval_f1": 0.8621926152008602,
184
+ "eval_loss": 0.6375065445899963,
185
+ "eval_min_tDCF": 0.030651624856462438,
186
+ "eval_precision": 0.9119566963565227,
187
+ "eval_recall": 0.903714859437751,
188
+ "eval_runtime": 551.4752,
189
+ "eval_samples_per_second": 36.121,
190
+ "eval_steps_per_second": 0.239,
191
+ "step": 70
192
+ },
193
+ {
194
+ "epoch": 0.39167686658506734,
195
+ "grad_norm": 63272.81640625,
196
+ "learning_rate": 2.901818181818182e-05,
197
+ "loss": 0.0193,
198
+ "step": 80
199
+ },
200
+ {
201
+ "epoch": 0.39167686658506734,
202
+ "eval_EER": 0.06427503736920785,
203
+ "eval_FN": 1740,
204
+ "eval_FP": 14,
205
+ "eval_TN": 17899,
206
+ "eval_TP": 267,
207
+ "eval_accuracy": 0.9119477911646586,
208
+ "eval_auc_roc": 0.9815884175385593,
209
+ "eval_f1": 0.880759359883601,
210
+ "eval_loss": 0.35206612944602966,
211
+ "eval_min_tDCF": 0.03087150091077144,
212
+ "eval_precision": 0.9153076989953792,
213
+ "eval_recall": 0.9119477911646586,
214
+ "eval_runtime": 551.1598,
215
+ "eval_samples_per_second": 36.142,
216
+ "eval_steps_per_second": 0.239,
217
+ "step": 80
218
+ },
219
+ {
220
+ "epoch": 0.44063647490820074,
221
+ "grad_norm": 36752.71875,
222
+ "learning_rate": 2.8472727272727275e-05,
223
+ "loss": 0.0158,
224
+ "step": 90
225
+ },
226
+ {
227
+ "epoch": 0.44063647490820074,
228
+ "eval_EER": 0.061285500747384154,
229
+ "eval_FN": 1853,
230
+ "eval_FP": 7,
231
+ "eval_TN": 17906,
232
+ "eval_TP": 154,
233
+ "eval_accuracy": 0.9066265060240963,
234
+ "eval_auc_roc": 0.9839317761029052,
235
+ "eval_f1": 0.8691616005883785,
236
+ "eval_loss": 0.3774518072605133,
237
+ "eval_min_tDCF": 0.02896076260303809,
238
+ "eval_precision": 0.9112880071281149,
239
+ "eval_recall": 0.9066265060240963,
240
+ "eval_runtime": 548.348,
241
+ "eval_samples_per_second": 36.327,
242
+ "eval_steps_per_second": 0.241,
243
+ "step": 90
244
+ },
245
+ {
246
+ "epoch": 0.48959608323133413,
247
+ "grad_norm": 23041.998046875,
248
+ "learning_rate": 2.7927272727272727e-05,
249
+ "loss": 0.017,
250
+ "step": 100
251
+ },
252
+ {
253
+ "epoch": 0.48959608323133413,
254
+ "eval_EER": 0.05879422022919777,
255
+ "eval_FN": 1742,
256
+ "eval_FP": 20,
257
+ "eval_TN": 17893,
258
+ "eval_TP": 265,
259
+ "eval_accuracy": 0.9115461847389559,
260
+ "eval_auc_roc": 0.9849050903204274,
261
+ "eval_f1": 0.880346418763591,
262
+ "eval_loss": 0.4076322317123413,
263
+ "eval_min_tDCF": 0.02710664658288187,
264
+ "eval_precision": 0.9131492081469701,
265
+ "eval_recall": 0.9115461847389559,
266
+ "eval_runtime": 552.237,
267
+ "eval_samples_per_second": 36.071,
268
+ "eval_steps_per_second": 0.239,
269
+ "step": 100
270
+ },
271
+ {
272
+ "epoch": 0.48959608323133413,
273
+ "step": 100,
274
+ "total_flos": 1.6503006591246067e+18,
275
+ "train_loss": 0.018675562590360642,
276
+ "train_runtime": 8627.3162,
277
+ "train_samples_per_second": 43.148,
278
+ "train_steps_per_second": 0.071
279
+ }
280
+ ],
281
+ "logging_steps": 10,
282
+ "max_steps": 612,
283
+ "num_input_tokens_seen": 0,
284
+ "num_train_epochs": 3,
285
+ "save_steps": 50,
286
+ "stateful_callbacks": {
287
+ "EarlyStoppingCallback": {
288
+ "args": {
289
+ "early_stopping_patience": 3,
290
+ "early_stopping_threshold": 0.0
291
+ },
292
+ "attributes": {
293
+ "early_stopping_patience_counter": 0
294
+ }
295
+ },
296
+ "TrainerControl": {
297
+ "args": {
298
+ "should_epoch_stop": false,
299
+ "should_evaluate": false,
300
+ "should_log": false,
301
+ "should_save": true,
302
+ "should_training_stop": true
303
+ },
304
+ "attributes": {}
305
+ }
306
+ },
307
+ "total_flos": 1.6503006591246067e+18,
308
+ "train_batch_size": 152,
309
+ "trial_name": null,
310
+ "trial_params": null
311
+ }