|
{ |
|
"best_metric": 0.2075, |
|
"best_model_checkpoint": "/content/model_asr/checkpoint-1100", |
|
"epoch": 80.0, |
|
"global_step": 1200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 3.33, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 8.6183, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 3.33, |
|
"eval_loss": 4.025334358215332, |
|
"eval_runtime": 15.3335, |
|
"eval_samples_per_second": 31.304, |
|
"eval_steps_per_second": 3.913, |
|
"eval_wer": 1.0, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 6.67, |
|
"learning_rate": 9.6e-05, |
|
"loss": 3.2794, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 6.67, |
|
"eval_loss": 3.0245492458343506, |
|
"eval_runtime": 15.5923, |
|
"eval_samples_per_second": 30.784, |
|
"eval_steps_per_second": 3.848, |
|
"eval_wer": 1.0, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 9.956913093678348e-05, |
|
"loss": 2.9692, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 2.8865509033203125, |
|
"eval_runtime": 15.6178, |
|
"eval_samples_per_second": 30.734, |
|
"eval_steps_per_second": 3.842, |
|
"eval_wer": 1.0, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 13.33, |
|
"learning_rate": 9.813243995692098e-05, |
|
"loss": 2.8042, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 13.33, |
|
"eval_loss": 2.635584831237793, |
|
"eval_runtime": 15.4284, |
|
"eval_samples_per_second": 31.112, |
|
"eval_steps_per_second": 3.889, |
|
"eval_wer": 1.0, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 16.67, |
|
"learning_rate": 9.57159113020304e-05, |
|
"loss": 2.5114, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 16.67, |
|
"eval_loss": 2.116630792617798, |
|
"eval_runtime": 15.5962, |
|
"eval_samples_per_second": 30.777, |
|
"eval_steps_per_second": 3.847, |
|
"eval_wer": 1.0, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 9.236873852683213e-05, |
|
"loss": 1.7677, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_loss": 1.0035134553909302, |
|
"eval_runtime": 15.4247, |
|
"eval_samples_per_second": 31.119, |
|
"eval_steps_per_second": 3.89, |
|
"eval_wer": 0.89375, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 23.33, |
|
"learning_rate": 8.815906041658002e-05, |
|
"loss": 0.8802, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 23.33, |
|
"eval_loss": 0.3643040060997009, |
|
"eval_runtime": 15.6657, |
|
"eval_samples_per_second": 30.64, |
|
"eval_steps_per_second": 3.83, |
|
"eval_wer": 0.5025, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 26.67, |
|
"learning_rate": 8.31725738778896e-05, |
|
"loss": 0.4318, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 26.67, |
|
"eval_loss": 0.14456388354301453, |
|
"eval_runtime": 15.4959, |
|
"eval_samples_per_second": 30.976, |
|
"eval_steps_per_second": 3.872, |
|
"eval_wer": 0.3075, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"learning_rate": 7.751078939684885e-05, |
|
"loss": 0.2275, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_loss": 0.07944890111684799, |
|
"eval_runtime": 16.2382, |
|
"eval_samples_per_second": 29.56, |
|
"eval_steps_per_second": 3.695, |
|
"eval_wer": 0.25, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 33.33, |
|
"learning_rate": 7.128896457825364e-05, |
|
"loss": 0.1407, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 33.33, |
|
"eval_loss": 0.05435527116060257, |
|
"eval_runtime": 15.4181, |
|
"eval_samples_per_second": 31.132, |
|
"eval_steps_per_second": 3.892, |
|
"eval_wer": 0.22125, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 36.67, |
|
"learning_rate": 6.463375783314937e-05, |
|
"loss": 0.1191, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 36.67, |
|
"eval_loss": 0.046384669840335846, |
|
"eval_runtime": 15.8291, |
|
"eval_samples_per_second": 30.324, |
|
"eval_steps_per_second": 3.79, |
|
"eval_wer": 0.23375, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"learning_rate": 5.768064997883498e-05, |
|
"loss": 0.0825, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_loss": 0.03952096030116081, |
|
"eval_runtime": 15.4288, |
|
"eval_samples_per_second": 31.111, |
|
"eval_steps_per_second": 3.889, |
|
"eval_wer": 0.25625, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 43.33, |
|
"learning_rate": 5.057118624011702e-05, |
|
"loss": 0.0699, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 43.33, |
|
"eval_loss": 0.03604818880558014, |
|
"eval_runtime": 15.4828, |
|
"eval_samples_per_second": 31.002, |
|
"eval_steps_per_second": 3.875, |
|
"eval_wer": 0.2125, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 46.67, |
|
"learning_rate": 4.345009479671536e-05, |
|
"loss": 0.0592, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 46.67, |
|
"eval_loss": 0.02805432118475437, |
|
"eval_runtime": 15.5578, |
|
"eval_samples_per_second": 30.853, |
|
"eval_steps_per_second": 3.857, |
|
"eval_wer": 0.23875, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 3.646234053488574e-05, |
|
"loss": 0.0546, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_loss": 0.023771686479449272, |
|
"eval_runtime": 15.8929, |
|
"eval_samples_per_second": 30.202, |
|
"eval_steps_per_second": 3.775, |
|
"eval_wer": 0.26375, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 53.33, |
|
"learning_rate": 2.9750173980379736e-05, |
|
"loss": 0.0455, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 53.33, |
|
"eval_loss": 0.021949028596282005, |
|
"eval_runtime": 15.824, |
|
"eval_samples_per_second": 30.334, |
|
"eval_steps_per_second": 3.792, |
|
"eval_wer": 0.24125, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 56.67, |
|
"learning_rate": 2.3450235487957135e-05, |
|
"loss": 0.0391, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 56.67, |
|
"eval_loss": 0.020865805447101593, |
|
"eval_runtime": 16.0515, |
|
"eval_samples_per_second": 29.904, |
|
"eval_steps_per_second": 3.738, |
|
"eval_wer": 0.24375, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"learning_rate": 1.7690773637801294e-05, |
|
"loss": 0.0367, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_loss": 0.022958721965551376, |
|
"eval_runtime": 15.4228, |
|
"eval_samples_per_second": 31.123, |
|
"eval_steps_per_second": 3.89, |
|
"eval_wer": 0.21625, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 63.33, |
|
"learning_rate": 1.2589034464264932e-05, |
|
"loss": 0.0333, |
|
"step": 950 |
|
}, |
|
{ |
|
"epoch": 63.33, |
|
"eval_loss": 0.021822014823555946, |
|
"eval_runtime": 15.5217, |
|
"eval_samples_per_second": 30.924, |
|
"eval_steps_per_second": 3.866, |
|
"eval_wer": 0.23, |
|
"step": 950 |
|
}, |
|
{ |
|
"epoch": 66.67, |
|
"learning_rate": 8.248874664720375e-06, |
|
"loss": 0.0327, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 66.67, |
|
"eval_loss": 0.02000792883336544, |
|
"eval_runtime": 15.8435, |
|
"eval_samples_per_second": 30.296, |
|
"eval_steps_per_second": 3.787, |
|
"eval_wer": 0.21625, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"learning_rate": 4.758647376699032e-06, |
|
"loss": 0.0306, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_loss": 0.02014043927192688, |
|
"eval_runtime": 15.7796, |
|
"eval_samples_per_second": 30.419, |
|
"eval_steps_per_second": 3.802, |
|
"eval_wer": 0.21625, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 73.33, |
|
"learning_rate": 2.1894035628006517e-06, |
|
"loss": 0.0269, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 73.33, |
|
"eval_loss": 0.02098565548658371, |
|
"eval_runtime": 16.1184, |
|
"eval_samples_per_second": 29.78, |
|
"eval_steps_per_second": 3.722, |
|
"eval_wer": 0.2075, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 76.67, |
|
"learning_rate": 5.934456179888804e-07, |
|
"loss": 0.0288, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 76.67, |
|
"eval_loss": 0.021614952012896538, |
|
"eval_runtime": 15.8598, |
|
"eval_samples_per_second": 30.265, |
|
"eval_steps_per_second": 3.783, |
|
"eval_wer": 0.21625, |
|
"step": 1150 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"learning_rate": 3.262643657425679e-09, |
|
"loss": 0.0289, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_loss": 0.02152070961892605, |
|
"eval_runtime": 16.1024, |
|
"eval_samples_per_second": 29.809, |
|
"eval_steps_per_second": 3.726, |
|
"eval_wer": 0.21625, |
|
"step": 1200 |
|
} |
|
], |
|
"max_steps": 1200, |
|
"num_train_epochs": 80, |
|
"total_flos": 3.3688058529081743e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|