|
{ |
|
"best_metric": 1.5881637334823608, |
|
"best_model_checkpoint": "detr-r50-cd45rb-all-4ah\\checkpoint-46060", |
|
"epoch": 20.0, |
|
"global_step": 46060, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.501519756838906e-06, |
|
"loss": 2.4171, |
|
"step": 2303 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 1.8409900665283203, |
|
"eval_runtime": 206.0212, |
|
"eval_samples_per_second": 8.645, |
|
"eval_steps_per_second": 1.082, |
|
"step": 2303 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 9.001953973078595e-06, |
|
"loss": 2.1862, |
|
"step": 4606 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 1.7626707553863525, |
|
"eval_runtime": 208.1902, |
|
"eval_samples_per_second": 8.555, |
|
"eval_steps_per_second": 1.071, |
|
"step": 4606 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 8.502171081198437e-06, |
|
"loss": 2.1252, |
|
"step": 6909 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 1.7528759241104126, |
|
"eval_runtime": 207.3023, |
|
"eval_samples_per_second": 8.591, |
|
"eval_steps_per_second": 1.076, |
|
"step": 6909 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 8.002171081198438e-06, |
|
"loss": 2.1065, |
|
"step": 9212 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 1.7416059970855713, |
|
"eval_runtime": 207.0434, |
|
"eval_samples_per_second": 8.602, |
|
"eval_steps_per_second": 1.077, |
|
"step": 9212 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 7.502388189318282e-06, |
|
"loss": 2.0764, |
|
"step": 11515 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 1.699079990386963, |
|
"eval_runtime": 391.8586, |
|
"eval_samples_per_second": 4.545, |
|
"eval_steps_per_second": 0.569, |
|
"step": 11515 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 7.002605297438124e-06, |
|
"loss": 2.051, |
|
"step": 13818 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_loss": 1.6862515211105347, |
|
"eval_runtime": 383.5485, |
|
"eval_samples_per_second": 4.643, |
|
"eval_steps_per_second": 0.581, |
|
"step": 13818 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 6.502822405557968e-06, |
|
"loss": 2.039, |
|
"step": 16121 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_loss": 1.6824065446853638, |
|
"eval_runtime": 379.3509, |
|
"eval_samples_per_second": 4.695, |
|
"eval_steps_per_second": 0.588, |
|
"step": 16121 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 6.002822405557969e-06, |
|
"loss": 2.0266, |
|
"step": 18424 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 1.6705697774887085, |
|
"eval_runtime": 387.7566, |
|
"eval_samples_per_second": 4.593, |
|
"eval_steps_per_second": 0.575, |
|
"step": 18424 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 5.503039513677813e-06, |
|
"loss": 2.0177, |
|
"step": 20727 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_loss": 1.6724380254745483, |
|
"eval_runtime": 388.2463, |
|
"eval_samples_per_second": 4.587, |
|
"eval_steps_per_second": 0.574, |
|
"step": 20727 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 5.003256621797655e-06, |
|
"loss": 2.006, |
|
"step": 23030 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 1.6438802480697632, |
|
"eval_runtime": 381.3527, |
|
"eval_samples_per_second": 4.67, |
|
"eval_steps_per_second": 0.585, |
|
"step": 23030 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 4.503690838037343e-06, |
|
"loss": 1.9853, |
|
"step": 25333 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_loss": 1.6503098011016846, |
|
"eval_runtime": 371.6041, |
|
"eval_samples_per_second": 4.793, |
|
"eval_steps_per_second": 0.6, |
|
"step": 25333 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 4.003690838037343e-06, |
|
"loss": 1.9794, |
|
"step": 27636 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_loss": 1.6337422132492065, |
|
"eval_runtime": 367.1164, |
|
"eval_samples_per_second": 4.851, |
|
"eval_steps_per_second": 0.607, |
|
"step": 27636 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 3.5039079461571867e-06, |
|
"loss": 1.9676, |
|
"step": 29939 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_loss": 1.6212905645370483, |
|
"eval_runtime": 384.5295, |
|
"eval_samples_per_second": 4.632, |
|
"eval_steps_per_second": 0.58, |
|
"step": 29939 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 3.004342162396874e-06, |
|
"loss": 1.9646, |
|
"step": 32242 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_loss": 1.6212937831878662, |
|
"eval_runtime": 366.0496, |
|
"eval_samples_per_second": 4.865, |
|
"eval_steps_per_second": 0.609, |
|
"step": 32242 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"learning_rate": 2.504342162396874e-06, |
|
"loss": 1.9551, |
|
"step": 34545 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_loss": 1.614364743232727, |
|
"eval_runtime": 201.7258, |
|
"eval_samples_per_second": 8.829, |
|
"eval_steps_per_second": 1.105, |
|
"step": 34545 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 2.0043421623968738e-06, |
|
"loss": 1.9448, |
|
"step": 36848 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_loss": 1.6080951690673828, |
|
"eval_runtime": 202.5165, |
|
"eval_samples_per_second": 8.794, |
|
"eval_steps_per_second": 1.101, |
|
"step": 36848 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"learning_rate": 1.504776378636561e-06, |
|
"loss": 1.9347, |
|
"step": 39151 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_loss": 1.5986374616622925, |
|
"eval_runtime": 375.2604, |
|
"eval_samples_per_second": 4.746, |
|
"eval_steps_per_second": 0.594, |
|
"step": 39151 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"learning_rate": 1.0047763786365611e-06, |
|
"loss": 1.9287, |
|
"step": 41454 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_loss": 1.5923762321472168, |
|
"eval_runtime": 382.3809, |
|
"eval_samples_per_second": 4.658, |
|
"eval_steps_per_second": 0.583, |
|
"step": 41454 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"learning_rate": 5.052105948762484e-07, |
|
"loss": 1.9177, |
|
"step": 43757 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_loss": 1.590692162513733, |
|
"eval_runtime": 371.0354, |
|
"eval_samples_per_second": 4.8, |
|
"eval_steps_per_second": 0.601, |
|
"step": 43757 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 5.210594876248372e-09, |
|
"loss": 1.9216, |
|
"step": 46060 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_loss": 1.5881637334823608, |
|
"eval_runtime": 379.3818, |
|
"eval_samples_per_second": 4.694, |
|
"eval_steps_per_second": 0.588, |
|
"step": 46060 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"step": 46060, |
|
"total_flos": 1.7606512956165125e+20, |
|
"train_loss": 2.027567579142694, |
|
"train_runtime": 94939.1754, |
|
"train_samples_per_second": 3.881, |
|
"train_steps_per_second": 0.485 |
|
} |
|
], |
|
"max_steps": 46060, |
|
"num_train_epochs": 20, |
|
"total_flos": 1.7606512956165125e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|