|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 49.98039215686274, |
|
"global_step": 1250, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 3.98, |
|
"learning_rate": 3.675e-06, |
|
"loss": 20.0794, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 7.98, |
|
"learning_rate": 7.425e-06, |
|
"loss": 10.5776, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 11.98, |
|
"learning_rate": 1.1174999999999999e-05, |
|
"loss": 6.6033, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 15.98, |
|
"learning_rate": 1.4925e-05, |
|
"loss": 5.3857, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 19.98, |
|
"learning_rate": 1.8675e-05, |
|
"loss": 4.4431, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 19.98, |
|
"eval_loss": 4.144110202789307, |
|
"eval_runtime": 12.9526, |
|
"eval_samples_per_second": 26.327, |
|
"eval_steps_per_second": 3.32, |
|
"eval_wer": 1.0, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 23.98, |
|
"learning_rate": 2.2424999999999996e-05, |
|
"loss": 3.7383, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 27.98, |
|
"learning_rate": 2.6174999999999996e-05, |
|
"loss": 3.361, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 31.98, |
|
"learning_rate": 2.9925e-05, |
|
"loss": 3.2219, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 35.98, |
|
"learning_rate": 3.3675e-05, |
|
"loss": 3.104, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 39.98, |
|
"learning_rate": 3.7424999999999995e-05, |
|
"loss": 3.0399, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 39.98, |
|
"eval_loss": 2.9768528938293457, |
|
"eval_runtime": 12.8843, |
|
"eval_samples_per_second": 26.466, |
|
"eval_steps_per_second": 3.337, |
|
"eval_wer": 0.9988929889298893, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 43.98, |
|
"learning_rate": 4.1175e-05, |
|
"loss": 2.9893, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 47.98, |
|
"learning_rate": 4.4924999999999994e-05, |
|
"loss": 2.953, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 49.98, |
|
"step": 1250, |
|
"total_flos": 4.919672600088422e+18, |
|
"train_loss": 5.6772947265625, |
|
"train_runtime": 2084.0288, |
|
"train_samples_per_second": 19.434, |
|
"train_steps_per_second": 0.6 |
|
} |
|
], |
|
"max_steps": 1250, |
|
"num_train_epochs": 50, |
|
"total_flos": 4.919672600088422e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|