|
{ |
|
"best_metric": 2.070624589920044, |
|
"best_model_checkpoint": "detr-r50-cd45rb-2ah-6l\\checkpoint-23030", |
|
"epoch": 5.0, |
|
"global_step": 23030, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 8.0034737299175e-06, |
|
"loss": 3.4851, |
|
"step": 4606 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 2.4806125164031982, |
|
"eval_runtime": 237.1291, |
|
"eval_samples_per_second": 7.511, |
|
"eval_steps_per_second": 0.94, |
|
"step": 4606 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 6.004776378636562e-06, |
|
"loss": 2.995, |
|
"step": 9212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 2.2760725021362305, |
|
"eval_runtime": 207.1825, |
|
"eval_samples_per_second": 8.596, |
|
"eval_steps_per_second": 1.076, |
|
"step": 9212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 4.005644811115936e-06, |
|
"loss": 2.7717, |
|
"step": 13818 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 2.160128355026245, |
|
"eval_runtime": 205.8051, |
|
"eval_samples_per_second": 8.654, |
|
"eval_steps_per_second": 1.084, |
|
"step": 13818 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 2.0060790273556234e-06, |
|
"loss": 2.674, |
|
"step": 18424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 2.0849480628967285, |
|
"eval_runtime": 198.2919, |
|
"eval_samples_per_second": 8.982, |
|
"eval_steps_per_second": 1.125, |
|
"step": 18424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 6.513243595310465e-09, |
|
"loss": 2.6185, |
|
"step": 23030 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 2.070624589920044, |
|
"eval_runtime": 204.5209, |
|
"eval_samples_per_second": 8.708, |
|
"eval_steps_per_second": 1.09, |
|
"step": 23030 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"step": 23030, |
|
"total_flos": 4.401655508016e+19, |
|
"train_loss": 2.908882859992401, |
|
"train_runtime": 15260.3368, |
|
"train_samples_per_second": 6.036, |
|
"train_steps_per_second": 1.509 |
|
} |
|
], |
|
"max_steps": 23030, |
|
"num_train_epochs": 5, |
|
"total_flos": 4.401655508016e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|