detr-r101-cd45rb-all-4ah / trainer_state.json
polejowska's picture
End of training
a09a9f1
{
"best_metric": 1.596240758895874,
"best_model_checkpoint": "detr-r101-cd45rb-all-4ah\\checkpoint-46060",
"epoch": 20.0,
"global_step": 46060,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 9.0034737299175e-06,
"loss": 2.3757,
"step": 2303
},
{
"epoch": 1.0,
"eval_loss": 1.822200059890747,
"eval_runtime": 713.8422,
"eval_samples_per_second": 2.495,
"eval_steps_per_second": 0.312,
"step": 2303
},
{
"epoch": 2.0,
"learning_rate": 8.004342162396874e-06,
"loss": 2.1779,
"step": 4606
},
{
"epoch": 2.0,
"eval_loss": 1.7999826669692993,
"eval_runtime": 728.2283,
"eval_samples_per_second": 2.446,
"eval_steps_per_second": 0.306,
"step": 4606
},
{
"epoch": 3.0,
"learning_rate": 7.005210594876249e-06,
"loss": 2.1259,
"step": 6909
},
{
"epoch": 3.0,
"eval_loss": 1.73061203956604,
"eval_runtime": 745.2135,
"eval_samples_per_second": 2.39,
"eval_steps_per_second": 0.299,
"step": 6909
},
{
"epoch": 4.0,
"learning_rate": 6.005644811115936e-06,
"loss": 2.0969,
"step": 9212
},
{
"epoch": 4.0,
"eval_loss": 1.6853969097137451,
"eval_runtime": 742.3303,
"eval_samples_per_second": 2.399,
"eval_steps_per_second": 0.3,
"step": 9212
},
{
"epoch": 5.0,
"learning_rate": 5.005644811115936e-06,
"loss": 2.0699,
"step": 11515
},
{
"epoch": 5.0,
"eval_loss": 1.6933584213256836,
"eval_runtime": 218.19,
"eval_samples_per_second": 8.163,
"eval_steps_per_second": 1.022,
"step": 11515
},
{
"epoch": 6.0,
"learning_rate": 4.005644811115936e-06,
"loss": 2.0398,
"step": 13818
},
{
"epoch": 6.0,
"eval_loss": 1.6654878854751587,
"eval_runtime": 217.319,
"eval_samples_per_second": 8.195,
"eval_steps_per_second": 1.026,
"step": 13818
},
{
"epoch": 7.0,
"learning_rate": 3.005644811115936e-06,
"loss": 2.0203,
"step": 16121
},
{
"epoch": 7.0,
"eval_loss": 1.657590627670288,
"eval_runtime": 220.5653,
"eval_samples_per_second": 8.075,
"eval_steps_per_second": 1.011,
"step": 16121
},
{
"epoch": 8.0,
"learning_rate": 2.0065132435953105e-06,
"loss": 2.009,
"step": 18424
},
{
"epoch": 8.0,
"eval_loss": 1.6401054859161377,
"eval_runtime": 221.9532,
"eval_samples_per_second": 8.024,
"eval_steps_per_second": 1.005,
"step": 18424
},
{
"epoch": 9.0,
"learning_rate": 1.0069474598349978e-06,
"loss": 1.9923,
"step": 20727
},
{
"epoch": 9.0,
"eval_loss": 1.6319390535354614,
"eval_runtime": 220.4641,
"eval_samples_per_second": 8.078,
"eval_steps_per_second": 1.012,
"step": 20727
},
{
"epoch": 10.0,
"learning_rate": 7.381676074685194e-09,
"loss": 1.9802,
"step": 23030
},
{
"epoch": 10.0,
"eval_loss": 1.6264243125915527,
"eval_runtime": 219.9308,
"eval_samples_per_second": 8.098,
"eval_steps_per_second": 1.014,
"step": 23030
},
{
"epoch": 11.0,
"learning_rate": 4.503690838037343e-06,
"loss": 2.0027,
"step": 25333
},
{
"epoch": 11.0,
"eval_loss": 1.6538771390914917,
"eval_runtime": 653.5646,
"eval_samples_per_second": 2.725,
"eval_steps_per_second": 0.341,
"step": 25333
},
{
"epoch": 12.0,
"learning_rate": 4.003907946157187e-06,
"loss": 2.0005,
"step": 27636
},
{
"epoch": 12.0,
"eval_loss": 1.6563668251037598,
"eval_runtime": 217.5695,
"eval_samples_per_second": 8.186,
"eval_steps_per_second": 1.025,
"step": 27636
},
{
"epoch": 13.0,
"learning_rate": 3.50412505427703e-06,
"loss": 1.9861,
"step": 29939
},
{
"epoch": 13.0,
"eval_loss": 1.6382570266723633,
"eval_runtime": 220.9586,
"eval_samples_per_second": 8.06,
"eval_steps_per_second": 1.009,
"step": 29939
},
{
"epoch": 14.0,
"learning_rate": 3.004342162396874e-06,
"loss": 1.9778,
"step": 32242
},
{
"epoch": 14.0,
"eval_loss": 1.6245843172073364,
"eval_runtime": 765.4452,
"eval_samples_per_second": 2.327,
"eval_steps_per_second": 0.291,
"step": 32242
},
{
"epoch": 15.0,
"learning_rate": 2.504342162396874e-06,
"loss": 1.9602,
"step": 34545
},
{
"epoch": 15.0,
"eval_loss": 1.6119104623794556,
"eval_runtime": 762.5288,
"eval_samples_per_second": 2.336,
"eval_steps_per_second": 0.292,
"step": 34545
},
{
"epoch": 16.0,
"learning_rate": 2.0045592705167173e-06,
"loss": 1.9599,
"step": 36848
},
{
"epoch": 16.0,
"eval_loss": 1.6097208261489868,
"eval_runtime": 767.5249,
"eval_samples_per_second": 2.32,
"eval_steps_per_second": 0.291,
"step": 36848
},
{
"epoch": 17.0,
"learning_rate": 1.504776378636561e-06,
"loss": 1.9464,
"step": 39151
},
{
"epoch": 17.0,
"eval_loss": 1.6114660501480103,
"eval_runtime": 768.6581,
"eval_samples_per_second": 2.317,
"eval_steps_per_second": 0.29,
"step": 39151
},
{
"epoch": 18.0,
"learning_rate": 1.0052105948762484e-06,
"loss": 1.9376,
"step": 41454
},
{
"epoch": 18.0,
"eval_loss": 1.6017816066741943,
"eval_runtime": 636.6555,
"eval_samples_per_second": 2.797,
"eval_steps_per_second": 0.35,
"step": 41454
},
{
"epoch": 19.0,
"learning_rate": 5.054277029960921e-07,
"loss": 1.9273,
"step": 43757
},
{
"epoch": 19.0,
"eval_loss": 1.5967309474945068,
"eval_runtime": 741.1917,
"eval_samples_per_second": 2.403,
"eval_steps_per_second": 0.301,
"step": 43757
},
{
"epoch": 20.0,
"learning_rate": 5.644811115935737e-09,
"loss": 1.928,
"step": 46060
},
{
"epoch": 20.0,
"eval_loss": 1.596240758895874,
"eval_runtime": 718.7174,
"eval_samples_per_second": 2.478,
"eval_steps_per_second": 0.31,
"step": 46060
},
{
"epoch": 20.0,
"step": 46060,
"total_flos": 2.5644983981460485e+20,
"train_loss": 0.9813270691421515,
"train_runtime": 81506.6025,
"train_samples_per_second": 4.52,
"train_steps_per_second": 0.565
}
],
"max_steps": 46060,
"num_train_epochs": 20,
"total_flos": 2.5644983981460485e+20,
"trial_name": null,
"trial_params": null
}