ailabs_proj / trainer_state.json
Akashpb13's picture
Upload trainer_state.json
b2875eb
raw
history blame
8.75 kB
{
"best_metric": 0.2075,
"best_model_checkpoint": "/content/model_asr/checkpoint-1100",
"epoch": 80.0,
"global_step": 1200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 3.33,
"learning_rate": 4.600000000000001e-05,
"loss": 8.6183,
"step": 50
},
{
"epoch": 3.33,
"eval_loss": 4.025334358215332,
"eval_runtime": 15.3335,
"eval_samples_per_second": 31.304,
"eval_steps_per_second": 3.913,
"eval_wer": 1.0,
"step": 50
},
{
"epoch": 6.67,
"learning_rate": 9.6e-05,
"loss": 3.2794,
"step": 100
},
{
"epoch": 6.67,
"eval_loss": 3.0245492458343506,
"eval_runtime": 15.5923,
"eval_samples_per_second": 30.784,
"eval_steps_per_second": 3.848,
"eval_wer": 1.0,
"step": 100
},
{
"epoch": 10.0,
"learning_rate": 9.956913093678348e-05,
"loss": 2.9692,
"step": 150
},
{
"epoch": 10.0,
"eval_loss": 2.8865509033203125,
"eval_runtime": 15.6178,
"eval_samples_per_second": 30.734,
"eval_steps_per_second": 3.842,
"eval_wer": 1.0,
"step": 150
},
{
"epoch": 13.33,
"learning_rate": 9.813243995692098e-05,
"loss": 2.8042,
"step": 200
},
{
"epoch": 13.33,
"eval_loss": 2.635584831237793,
"eval_runtime": 15.4284,
"eval_samples_per_second": 31.112,
"eval_steps_per_second": 3.889,
"eval_wer": 1.0,
"step": 200
},
{
"epoch": 16.67,
"learning_rate": 9.57159113020304e-05,
"loss": 2.5114,
"step": 250
},
{
"epoch": 16.67,
"eval_loss": 2.116630792617798,
"eval_runtime": 15.5962,
"eval_samples_per_second": 30.777,
"eval_steps_per_second": 3.847,
"eval_wer": 1.0,
"step": 250
},
{
"epoch": 20.0,
"learning_rate": 9.236873852683213e-05,
"loss": 1.7677,
"step": 300
},
{
"epoch": 20.0,
"eval_loss": 1.0035134553909302,
"eval_runtime": 15.4247,
"eval_samples_per_second": 31.119,
"eval_steps_per_second": 3.89,
"eval_wer": 0.89375,
"step": 300
},
{
"epoch": 23.33,
"learning_rate": 8.815906041658002e-05,
"loss": 0.8802,
"step": 350
},
{
"epoch": 23.33,
"eval_loss": 0.3643040060997009,
"eval_runtime": 15.6657,
"eval_samples_per_second": 30.64,
"eval_steps_per_second": 3.83,
"eval_wer": 0.5025,
"step": 350
},
{
"epoch": 26.67,
"learning_rate": 8.31725738778896e-05,
"loss": 0.4318,
"step": 400
},
{
"epoch": 26.67,
"eval_loss": 0.14456388354301453,
"eval_runtime": 15.4959,
"eval_samples_per_second": 30.976,
"eval_steps_per_second": 3.872,
"eval_wer": 0.3075,
"step": 400
},
{
"epoch": 30.0,
"learning_rate": 7.751078939684885e-05,
"loss": 0.2275,
"step": 450
},
{
"epoch": 30.0,
"eval_loss": 0.07944890111684799,
"eval_runtime": 16.2382,
"eval_samples_per_second": 29.56,
"eval_steps_per_second": 3.695,
"eval_wer": 0.25,
"step": 450
},
{
"epoch": 33.33,
"learning_rate": 7.128896457825364e-05,
"loss": 0.1407,
"step": 500
},
{
"epoch": 33.33,
"eval_loss": 0.05435527116060257,
"eval_runtime": 15.4181,
"eval_samples_per_second": 31.132,
"eval_steps_per_second": 3.892,
"eval_wer": 0.22125,
"step": 500
},
{
"epoch": 36.67,
"learning_rate": 6.463375783314937e-05,
"loss": 0.1191,
"step": 550
},
{
"epoch": 36.67,
"eval_loss": 0.046384669840335846,
"eval_runtime": 15.8291,
"eval_samples_per_second": 30.324,
"eval_steps_per_second": 3.79,
"eval_wer": 0.23375,
"step": 550
},
{
"epoch": 40.0,
"learning_rate": 5.768064997883498e-05,
"loss": 0.0825,
"step": 600
},
{
"epoch": 40.0,
"eval_loss": 0.03952096030116081,
"eval_runtime": 15.4288,
"eval_samples_per_second": 31.111,
"eval_steps_per_second": 3.889,
"eval_wer": 0.25625,
"step": 600
},
{
"epoch": 43.33,
"learning_rate": 5.057118624011702e-05,
"loss": 0.0699,
"step": 650
},
{
"epoch": 43.33,
"eval_loss": 0.03604818880558014,
"eval_runtime": 15.4828,
"eval_samples_per_second": 31.002,
"eval_steps_per_second": 3.875,
"eval_wer": 0.2125,
"step": 650
},
{
"epoch": 46.67,
"learning_rate": 4.345009479671536e-05,
"loss": 0.0592,
"step": 700
},
{
"epoch": 46.67,
"eval_loss": 0.02805432118475437,
"eval_runtime": 15.5578,
"eval_samples_per_second": 30.853,
"eval_steps_per_second": 3.857,
"eval_wer": 0.23875,
"step": 700
},
{
"epoch": 50.0,
"learning_rate": 3.646234053488574e-05,
"loss": 0.0546,
"step": 750
},
{
"epoch": 50.0,
"eval_loss": 0.023771686479449272,
"eval_runtime": 15.8929,
"eval_samples_per_second": 30.202,
"eval_steps_per_second": 3.775,
"eval_wer": 0.26375,
"step": 750
},
{
"epoch": 53.33,
"learning_rate": 2.9750173980379736e-05,
"loss": 0.0455,
"step": 800
},
{
"epoch": 53.33,
"eval_loss": 0.021949028596282005,
"eval_runtime": 15.824,
"eval_samples_per_second": 30.334,
"eval_steps_per_second": 3.792,
"eval_wer": 0.24125,
"step": 800
},
{
"epoch": 56.67,
"learning_rate": 2.3450235487957135e-05,
"loss": 0.0391,
"step": 850
},
{
"epoch": 56.67,
"eval_loss": 0.020865805447101593,
"eval_runtime": 16.0515,
"eval_samples_per_second": 29.904,
"eval_steps_per_second": 3.738,
"eval_wer": 0.24375,
"step": 850
},
{
"epoch": 60.0,
"learning_rate": 1.7690773637801294e-05,
"loss": 0.0367,
"step": 900
},
{
"epoch": 60.0,
"eval_loss": 0.022958721965551376,
"eval_runtime": 15.4228,
"eval_samples_per_second": 31.123,
"eval_steps_per_second": 3.89,
"eval_wer": 0.21625,
"step": 900
},
{
"epoch": 63.33,
"learning_rate": 1.2589034464264932e-05,
"loss": 0.0333,
"step": 950
},
{
"epoch": 63.33,
"eval_loss": 0.021822014823555946,
"eval_runtime": 15.5217,
"eval_samples_per_second": 30.924,
"eval_steps_per_second": 3.866,
"eval_wer": 0.23,
"step": 950
},
{
"epoch": 66.67,
"learning_rate": 8.248874664720375e-06,
"loss": 0.0327,
"step": 1000
},
{
"epoch": 66.67,
"eval_loss": 0.02000792883336544,
"eval_runtime": 15.8435,
"eval_samples_per_second": 30.296,
"eval_steps_per_second": 3.787,
"eval_wer": 0.21625,
"step": 1000
},
{
"epoch": 70.0,
"learning_rate": 4.758647376699032e-06,
"loss": 0.0306,
"step": 1050
},
{
"epoch": 70.0,
"eval_loss": 0.02014043927192688,
"eval_runtime": 15.7796,
"eval_samples_per_second": 30.419,
"eval_steps_per_second": 3.802,
"eval_wer": 0.21625,
"step": 1050
},
{
"epoch": 73.33,
"learning_rate": 2.1894035628006517e-06,
"loss": 0.0269,
"step": 1100
},
{
"epoch": 73.33,
"eval_loss": 0.02098565548658371,
"eval_runtime": 16.1184,
"eval_samples_per_second": 29.78,
"eval_steps_per_second": 3.722,
"eval_wer": 0.2075,
"step": 1100
},
{
"epoch": 76.67,
"learning_rate": 5.934456179888804e-07,
"loss": 0.0288,
"step": 1150
},
{
"epoch": 76.67,
"eval_loss": 0.021614952012896538,
"eval_runtime": 15.8598,
"eval_samples_per_second": 30.265,
"eval_steps_per_second": 3.783,
"eval_wer": 0.21625,
"step": 1150
},
{
"epoch": 80.0,
"learning_rate": 3.262643657425679e-09,
"loss": 0.0289,
"step": 1200
},
{
"epoch": 80.0,
"eval_loss": 0.02152070961892605,
"eval_runtime": 16.1024,
"eval_samples_per_second": 29.809,
"eval_steps_per_second": 3.726,
"eval_wer": 0.21625,
"step": 1200
}
],
"max_steps": 1200,
"num_train_epochs": 80,
"total_flos": 3.3688058529081743e+18,
"trial_name": null,
"trial_params": null
}