|
{ |
|
"best_metric": 1.647210717201233, |
|
"best_model_checkpoint": "detr-r50-cd45rb-all-1ah\\checkpoint-23030", |
|
"epoch": 10.0, |
|
"global_step": 23030, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.0034737299175e-06, |
|
"loss": 2.4098, |
|
"step": 2303 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 1.8949893712997437, |
|
"eval_runtime": 360.2555, |
|
"eval_samples_per_second": 4.944, |
|
"eval_steps_per_second": 0.619, |
|
"step": 2303 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 8.003907946157187e-06, |
|
"loss": 2.1885, |
|
"step": 4606 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 1.8040752410888672, |
|
"eval_runtime": 206.1007, |
|
"eval_samples_per_second": 8.641, |
|
"eval_steps_per_second": 1.082, |
|
"step": 4606 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 7.003907946157187e-06, |
|
"loss": 2.1283, |
|
"step": 6909 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 1.7426284551620483, |
|
"eval_runtime": 206.5714, |
|
"eval_samples_per_second": 8.622, |
|
"eval_steps_per_second": 1.08, |
|
"step": 6909 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 6.0043421623968744e-06, |
|
"loss": 2.0899, |
|
"step": 9212 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 1.7134923934936523, |
|
"eval_runtime": 206.8464, |
|
"eval_samples_per_second": 8.61, |
|
"eval_steps_per_second": 1.078, |
|
"step": 9212 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 5.004776378636561e-06, |
|
"loss": 2.0724, |
|
"step": 11515 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 1.6892552375793457, |
|
"eval_runtime": 205.7121, |
|
"eval_samples_per_second": 8.658, |
|
"eval_steps_per_second": 1.084, |
|
"step": 11515 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 4.004776378636561e-06, |
|
"loss": 2.0495, |
|
"step": 13818 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_loss": 1.691046953201294, |
|
"eval_runtime": 205.6737, |
|
"eval_samples_per_second": 8.659, |
|
"eval_steps_per_second": 1.084, |
|
"step": 13818 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3.005644811115936e-06, |
|
"loss": 2.0379, |
|
"step": 16121 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_loss": 1.6886247396469116, |
|
"eval_runtime": 372.0107, |
|
"eval_samples_per_second": 4.787, |
|
"eval_steps_per_second": 0.599, |
|
"step": 16121 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 2.0060790273556234e-06, |
|
"loss": 2.0203, |
|
"step": 18424 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 1.6616142988204956, |
|
"eval_runtime": 371.4764, |
|
"eval_samples_per_second": 4.794, |
|
"eval_steps_per_second": 0.6, |
|
"step": 18424 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 1.0065132435953105e-06, |
|
"loss": 2.0067, |
|
"step": 20727 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_loss": 1.6533863544464111, |
|
"eval_runtime": 376.2664, |
|
"eval_samples_per_second": 4.733, |
|
"eval_steps_per_second": 0.593, |
|
"step": 20727 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 6.513243595310465e-09, |
|
"loss": 1.9953, |
|
"step": 23030 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 1.647210717201233, |
|
"eval_runtime": 376.7422, |
|
"eval_samples_per_second": 4.727, |
|
"eval_steps_per_second": 0.592, |
|
"step": 23030 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 23030, |
|
"total_flos": 8.803256478082562e+19, |
|
"train_loss": 2.0998485543652303, |
|
"train_runtime": 42150.26, |
|
"train_samples_per_second": 4.37, |
|
"train_steps_per_second": 0.546 |
|
} |
|
], |
|
"max_steps": 23030, |
|
"num_train_epochs": 10, |
|
"total_flos": 8.803256478082562e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|