|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 19.99591836734694, |
|
"global_step": 2440, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 3.4127440452575684, |
|
"eval_runtime": 162.9527, |
|
"eval_samples_per_second": 6.64, |
|
"eval_steps_per_second": 0.835, |
|
"eval_wer": 1.0, |
|
"step": 122 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.9441540241241455, |
|
"eval_runtime": 163.1192, |
|
"eval_samples_per_second": 6.633, |
|
"eval_steps_per_second": 0.834, |
|
"eval_wer": 1.0, |
|
"step": 244 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.3244493212689078, |
|
"eval_loss": 1.2275432348251343, |
|
"eval_runtime": 159.0312, |
|
"eval_samples_per_second": 6.804, |
|
"eval_steps_per_second": 0.855, |
|
"eval_wer": 0.8635921622015851, |
|
"step": 366 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"learning_rate": 0.0002388, |
|
"loss": 3.9307, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.2023591638341556, |
|
"eval_loss": 0.7168374061584473, |
|
"eval_runtime": 158.5869, |
|
"eval_samples_per_second": 6.823, |
|
"eval_steps_per_second": 0.858, |
|
"eval_wer": 0.501920552341129, |
|
"step": 488 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.17312679219727137, |
|
"eval_loss": 0.617878794670105, |
|
"eval_runtime": 158.2056, |
|
"eval_samples_per_second": 6.839, |
|
"eval_steps_per_second": 0.86, |
|
"eval_wer": 0.41668692565760684, |
|
"step": 610 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.16569868368602203, |
|
"eval_loss": 0.6016563177108765, |
|
"eval_runtime": 157.9983, |
|
"eval_samples_per_second": 6.848, |
|
"eval_steps_per_second": 0.861, |
|
"eval_wer": 0.37708465016774445, |
|
"step": 732 |
|
}, |
|
{ |
|
"epoch": 6.56, |
|
"learning_rate": 0.00025391752577319586, |
|
"loss": 0.6036, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.16388987711259606, |
|
"eval_loss": 0.6307795643806458, |
|
"eval_runtime": 159.8432, |
|
"eval_samples_per_second": 6.769, |
|
"eval_steps_per_second": 0.851, |
|
"eval_wer": 0.3708610881509214, |
|
"step": 854 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.1604865775407946, |
|
"eval_loss": 0.6786409616470337, |
|
"eval_runtime": 160.9659, |
|
"eval_samples_per_second": 6.722, |
|
"eval_steps_per_second": 0.845, |
|
"eval_wer": 0.35467010259153015, |
|
"step": 976 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.15351281380865225, |
|
"eval_loss": 0.696066677570343, |
|
"eval_runtime": 165.3737, |
|
"eval_samples_per_second": 6.543, |
|
"eval_steps_per_second": 0.822, |
|
"eval_wer": 0.3348324986629066, |
|
"step": 1098 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"learning_rate": 0.00019206185567010307, |
|
"loss": 0.303, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.15007951033634373, |
|
"eval_loss": 0.713607132434845, |
|
"eval_runtime": 160.5614, |
|
"eval_samples_per_second": 6.739, |
|
"eval_steps_per_second": 0.847, |
|
"eval_wer": 0.3272961540331599, |
|
"step": 1220 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.1534270883786321, |
|
"eval_loss": 0.724854052066803, |
|
"eval_runtime": 158.4702, |
|
"eval_samples_per_second": 6.828, |
|
"eval_steps_per_second": 0.858, |
|
"eval_wer": 0.3330821218456751, |
|
"step": 1342 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.15021667102437603, |
|
"eval_loss": 0.7961975932121277, |
|
"eval_runtime": 158.6964, |
|
"eval_samples_per_second": 6.818, |
|
"eval_steps_per_second": 0.857, |
|
"eval_wer": 0.3294598142655711, |
|
"step": 1464 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.15035811798390933, |
|
"eval_loss": 0.8382342457771301, |
|
"eval_runtime": 159.3031, |
|
"eval_samples_per_second": 6.792, |
|
"eval_steps_per_second": 0.854, |
|
"eval_wer": 0.3209996596489522, |
|
"step": 1586 |
|
}, |
|
{ |
|
"epoch": 13.11, |
|
"learning_rate": 0.0001302061855670103, |
|
"loss": 0.1685, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.1506152942739699, |
|
"eval_loss": 0.8463586568832397, |
|
"eval_runtime": 159.0294, |
|
"eval_samples_per_second": 6.804, |
|
"eval_steps_per_second": 0.855, |
|
"eval_wer": 0.3242329946030048, |
|
"step": 1708 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.14896507974608128, |
|
"eval_loss": 0.9096932411193848, |
|
"eval_runtime": 162.4549, |
|
"eval_samples_per_second": 6.66, |
|
"eval_steps_per_second": 0.837, |
|
"eval_wer": 0.3218019156901833, |
|
"step": 1830 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.14725485741717853, |
|
"eval_loss": 0.963500440120697, |
|
"eval_runtime": 158.9025, |
|
"eval_samples_per_second": 6.809, |
|
"eval_steps_per_second": 0.856, |
|
"eval_wer": 0.31263674818884624, |
|
"step": 1952 |
|
}, |
|
{ |
|
"epoch": 16.39, |
|
"learning_rate": 6.835051546391752e-05, |
|
"loss": 0.1031, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.1464233207459827, |
|
"eval_loss": 0.9706696271896362, |
|
"eval_runtime": 158.7074, |
|
"eval_samples_per_second": 6.818, |
|
"eval_steps_per_second": 0.857, |
|
"eval_wer": 0.3110565468955122, |
|
"step": 2074 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.14608041902590194, |
|
"eval_loss": 1.0005509853363037, |
|
"eval_runtime": 158.0719, |
|
"eval_samples_per_second": 6.845, |
|
"eval_steps_per_second": 0.86, |
|
"eval_wer": 0.31331745028443625, |
|
"step": 2196 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.14561750170379292, |
|
"eval_loss": 1.0291253328323364, |
|
"eval_runtime": 159.3838, |
|
"eval_samples_per_second": 6.789, |
|
"eval_steps_per_second": 0.853, |
|
"eval_wer": 0.31030291243253755, |
|
"step": 2318 |
|
}, |
|
{ |
|
"epoch": 19.67, |
|
"learning_rate": 6.494845360824742e-06, |
|
"loss": 0.0629, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.1464233207459827, |
|
"eval_loss": 1.0326457023620605, |
|
"eval_runtime": 158.8998, |
|
"eval_samples_per_second": 6.809, |
|
"eval_steps_per_second": 0.856, |
|
"eval_wer": 0.31287985608012836, |
|
"step": 2440 |
|
} |
|
], |
|
"max_steps": 2440, |
|
"num_train_epochs": 20, |
|
"total_flos": 7.698957470096574e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|