{ "best_metric": 0.2075, "best_model_checkpoint": "/content/model_asr/checkpoint-1100", "epoch": 80.0, "global_step": 1200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 3.33, "learning_rate": 4.600000000000001e-05, "loss": 8.6183, "step": 50 }, { "epoch": 3.33, "eval_loss": 4.025334358215332, "eval_runtime": 15.3335, "eval_samples_per_second": 31.304, "eval_steps_per_second": 3.913, "eval_wer": 1.0, "step": 50 }, { "epoch": 6.67, "learning_rate": 9.6e-05, "loss": 3.2794, "step": 100 }, { "epoch": 6.67, "eval_loss": 3.0245492458343506, "eval_runtime": 15.5923, "eval_samples_per_second": 30.784, "eval_steps_per_second": 3.848, "eval_wer": 1.0, "step": 100 }, { "epoch": 10.0, "learning_rate": 9.956913093678348e-05, "loss": 2.9692, "step": 150 }, { "epoch": 10.0, "eval_loss": 2.8865509033203125, "eval_runtime": 15.6178, "eval_samples_per_second": 30.734, "eval_steps_per_second": 3.842, "eval_wer": 1.0, "step": 150 }, { "epoch": 13.33, "learning_rate": 9.813243995692098e-05, "loss": 2.8042, "step": 200 }, { "epoch": 13.33, "eval_loss": 2.635584831237793, "eval_runtime": 15.4284, "eval_samples_per_second": 31.112, "eval_steps_per_second": 3.889, "eval_wer": 1.0, "step": 200 }, { "epoch": 16.67, "learning_rate": 9.57159113020304e-05, "loss": 2.5114, "step": 250 }, { "epoch": 16.67, "eval_loss": 2.116630792617798, "eval_runtime": 15.5962, "eval_samples_per_second": 30.777, "eval_steps_per_second": 3.847, "eval_wer": 1.0, "step": 250 }, { "epoch": 20.0, "learning_rate": 9.236873852683213e-05, "loss": 1.7677, "step": 300 }, { "epoch": 20.0, "eval_loss": 1.0035134553909302, "eval_runtime": 15.4247, "eval_samples_per_second": 31.119, "eval_steps_per_second": 3.89, "eval_wer": 0.89375, "step": 300 }, { "epoch": 23.33, "learning_rate": 8.815906041658002e-05, "loss": 0.8802, "step": 350 }, { "epoch": 23.33, "eval_loss": 0.3643040060997009, "eval_runtime": 15.6657, "eval_samples_per_second": 30.64, "eval_steps_per_second": 3.83, "eval_wer": 0.5025, "step": 350 }, { "epoch": 26.67, "learning_rate": 8.31725738778896e-05, "loss": 0.4318, "step": 400 }, { "epoch": 26.67, "eval_loss": 0.14456388354301453, "eval_runtime": 15.4959, "eval_samples_per_second": 30.976, "eval_steps_per_second": 3.872, "eval_wer": 0.3075, "step": 400 }, { "epoch": 30.0, "learning_rate": 7.751078939684885e-05, "loss": 0.2275, "step": 450 }, { "epoch": 30.0, "eval_loss": 0.07944890111684799, "eval_runtime": 16.2382, "eval_samples_per_second": 29.56, "eval_steps_per_second": 3.695, "eval_wer": 0.25, "step": 450 }, { "epoch": 33.33, "learning_rate": 7.128896457825364e-05, "loss": 0.1407, "step": 500 }, { "epoch": 33.33, "eval_loss": 0.05435527116060257, "eval_runtime": 15.4181, "eval_samples_per_second": 31.132, "eval_steps_per_second": 3.892, "eval_wer": 0.22125, "step": 500 }, { "epoch": 36.67, "learning_rate": 6.463375783314937e-05, "loss": 0.1191, "step": 550 }, { "epoch": 36.67, "eval_loss": 0.046384669840335846, "eval_runtime": 15.8291, "eval_samples_per_second": 30.324, "eval_steps_per_second": 3.79, "eval_wer": 0.23375, "step": 550 }, { "epoch": 40.0, "learning_rate": 5.768064997883498e-05, "loss": 0.0825, "step": 600 }, { "epoch": 40.0, "eval_loss": 0.03952096030116081, "eval_runtime": 15.4288, "eval_samples_per_second": 31.111, "eval_steps_per_second": 3.889, "eval_wer": 0.25625, "step": 600 }, { "epoch": 43.33, "learning_rate": 5.057118624011702e-05, "loss": 0.0699, "step": 650 }, { "epoch": 43.33, "eval_loss": 0.03604818880558014, "eval_runtime": 15.4828, "eval_samples_per_second": 31.002, "eval_steps_per_second": 3.875, "eval_wer": 0.2125, "step": 650 }, { "epoch": 46.67, "learning_rate": 4.345009479671536e-05, "loss": 0.0592, "step": 700 }, { "epoch": 46.67, "eval_loss": 0.02805432118475437, "eval_runtime": 15.5578, "eval_samples_per_second": 30.853, "eval_steps_per_second": 3.857, "eval_wer": 0.23875, "step": 700 }, { "epoch": 50.0, "learning_rate": 3.646234053488574e-05, "loss": 0.0546, "step": 750 }, { "epoch": 50.0, "eval_loss": 0.023771686479449272, "eval_runtime": 15.8929, "eval_samples_per_second": 30.202, "eval_steps_per_second": 3.775, "eval_wer": 0.26375, "step": 750 }, { "epoch": 53.33, "learning_rate": 2.9750173980379736e-05, "loss": 0.0455, "step": 800 }, { "epoch": 53.33, "eval_loss": 0.021949028596282005, "eval_runtime": 15.824, "eval_samples_per_second": 30.334, "eval_steps_per_second": 3.792, "eval_wer": 0.24125, "step": 800 }, { "epoch": 56.67, "learning_rate": 2.3450235487957135e-05, "loss": 0.0391, "step": 850 }, { "epoch": 56.67, "eval_loss": 0.020865805447101593, "eval_runtime": 16.0515, "eval_samples_per_second": 29.904, "eval_steps_per_second": 3.738, "eval_wer": 0.24375, "step": 850 }, { "epoch": 60.0, "learning_rate": 1.7690773637801294e-05, "loss": 0.0367, "step": 900 }, { "epoch": 60.0, "eval_loss": 0.022958721965551376, "eval_runtime": 15.4228, "eval_samples_per_second": 31.123, "eval_steps_per_second": 3.89, "eval_wer": 0.21625, "step": 900 }, { "epoch": 63.33, "learning_rate": 1.2589034464264932e-05, "loss": 0.0333, "step": 950 }, { "epoch": 63.33, "eval_loss": 0.021822014823555946, "eval_runtime": 15.5217, "eval_samples_per_second": 30.924, "eval_steps_per_second": 3.866, "eval_wer": 0.23, "step": 950 }, { "epoch": 66.67, "learning_rate": 8.248874664720375e-06, "loss": 0.0327, "step": 1000 }, { "epoch": 66.67, "eval_loss": 0.02000792883336544, "eval_runtime": 15.8435, "eval_samples_per_second": 30.296, "eval_steps_per_second": 3.787, "eval_wer": 0.21625, "step": 1000 }, { "epoch": 70.0, "learning_rate": 4.758647376699032e-06, "loss": 0.0306, "step": 1050 }, { "epoch": 70.0, "eval_loss": 0.02014043927192688, "eval_runtime": 15.7796, "eval_samples_per_second": 30.419, "eval_steps_per_second": 3.802, "eval_wer": 0.21625, "step": 1050 }, { "epoch": 73.33, "learning_rate": 2.1894035628006517e-06, "loss": 0.0269, "step": 1100 }, { "epoch": 73.33, "eval_loss": 0.02098565548658371, "eval_runtime": 16.1184, "eval_samples_per_second": 29.78, "eval_steps_per_second": 3.722, "eval_wer": 0.2075, "step": 1100 }, { "epoch": 76.67, "learning_rate": 5.934456179888804e-07, "loss": 0.0288, "step": 1150 }, { "epoch": 76.67, "eval_loss": 0.021614952012896538, "eval_runtime": 15.8598, "eval_samples_per_second": 30.265, "eval_steps_per_second": 3.783, "eval_wer": 0.21625, "step": 1150 }, { "epoch": 80.0, "learning_rate": 3.262643657425679e-09, "loss": 0.0289, "step": 1200 }, { "epoch": 80.0, "eval_loss": 0.02152070961892605, "eval_runtime": 16.1024, "eval_samples_per_second": 29.809, "eval_steps_per_second": 3.726, "eval_wer": 0.21625, "step": 1200 } ], "max_steps": 1200, "num_train_epochs": 80, "total_flos": 3.3688058529081743e+18, "trial_name": null, "trial_params": null }