Edresson's picture
Add checkpoints
981996c
{
"best_metric": 0.34823477268218994,
"best_model_checkpoint": "../checkpoints/Wav2Vec-voxpopuli/one-speaker/Final-paper/GT+GEN-dxg1/RU/100-epoch/checkpoint-26775",
"epoch": 72.99784777929955,
"global_step": 31025,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 1.4822134387351778e-08,
"loss": 12.3693,
"step": 1
},
{
"epoch": 0.23,
"learning_rate": 1.4525691699604743e-06,
"loss": 16.0709,
"step": 100
},
{
"epoch": 0.47,
"learning_rate": 2.9347826086956523e-06,
"loss": 15.3276,
"step": 200
},
{
"epoch": 0.7,
"learning_rate": 4.416996047430831e-06,
"loss": 12.0358,
"step": 300
},
{
"epoch": 0.94,
"learning_rate": 5.8843873517786565e-06,
"loss": 9.1409,
"step": 400
},
{
"epoch": 1.0,
"eval_loss": 6.154871940612793,
"eval_runtime": 318.3436,
"eval_samples_per_second": 26.456,
"eval_wer": 1.0,
"step": 425
},
{
"epoch": 1.18,
"learning_rate": 7.366600790513834e-06,
"loss": 7.4893,
"step": 500
},
{
"epoch": 1.41,
"learning_rate": 8.848814229249012e-06,
"loss": 6.0766,
"step": 600
},
{
"epoch": 1.65,
"learning_rate": 1.033102766798419e-05,
"loss": 5.2545,
"step": 700
},
{
"epoch": 1.88,
"learning_rate": 1.1813241106719368e-05,
"loss": 4.5575,
"step": 800
},
{
"epoch": 2.0,
"eval_loss": 3.599003553390503,
"eval_runtime": 317.6472,
"eval_samples_per_second": 26.514,
"eval_wer": 1.0,
"step": 850
},
{
"epoch": 2.12,
"learning_rate": 1.3295454545454546e-05,
"loss": 4.0577,
"step": 900
},
{
"epoch": 2.35,
"learning_rate": 1.4777667984189723e-05,
"loss": 3.5943,
"step": 1000
},
{
"epoch": 2.59,
"learning_rate": 1.6259881422924904e-05,
"loss": 3.3759,
"step": 1100
},
{
"epoch": 2.82,
"learning_rate": 1.774209486166008e-05,
"loss": 3.2785,
"step": 1200
},
{
"epoch": 3.0,
"eval_loss": 3.146242380142212,
"eval_runtime": 318.9247,
"eval_samples_per_second": 26.407,
"eval_wer": 1.0,
"step": 1275
},
{
"epoch": 3.06,
"learning_rate": 1.9224308300395258e-05,
"loss": 3.2268,
"step": 1300
},
{
"epoch": 3.29,
"learning_rate": 2.0706521739130433e-05,
"loss": 3.1416,
"step": 1400
},
{
"epoch": 3.53,
"learning_rate": 2.2188735177865615e-05,
"loss": 3.1018,
"step": 1500
},
{
"epoch": 3.76,
"learning_rate": 2.3670948616600794e-05,
"loss": 3.0594,
"step": 1600
},
{
"epoch": 4.0,
"learning_rate": 2.515316205533597e-05,
"loss": 3.0063,
"step": 1700
},
{
"epoch": 4.0,
"eval_loss": 2.9775705337524414,
"eval_runtime": 316.7007,
"eval_samples_per_second": 26.593,
"eval_wer": 1.0,
"step": 1700
},
{
"epoch": 4.23,
"learning_rate": 2.6635375494071148e-05,
"loss": 2.8872,
"step": 1800
},
{
"epoch": 4.47,
"learning_rate": 2.8117588932806323e-05,
"loss": 2.5959,
"step": 1900
},
{
"epoch": 4.7,
"learning_rate": 2.9599802371541505e-05,
"loss": 2.1892,
"step": 2000
},
{
"epoch": 4.94,
"learning_rate": 2.9945893863029945e-05,
"loss": 1.9088,
"step": 2100
},
{
"epoch": 5.0,
"eval_loss": 1.6493474245071411,
"eval_runtime": 318.4422,
"eval_samples_per_second": 26.448,
"eval_wer": 0.9566750042119724,
"step": 2125
},
{
"epoch": 5.18,
"learning_rate": 2.987177586718055e-05,
"loss": 1.6933,
"step": 2200
},
{
"epoch": 5.41,
"learning_rate": 2.979765787133116e-05,
"loss": 1.5286,
"step": 2300
},
{
"epoch": 5.65,
"learning_rate": 2.9723539875481766e-05,
"loss": 1.4406,
"step": 2400
},
{
"epoch": 5.88,
"learning_rate": 2.9649421879632374e-05,
"loss": 1.3302,
"step": 2500
},
{
"epoch": 6.0,
"eval_loss": 1.2176637649536133,
"eval_runtime": 318.9899,
"eval_samples_per_second": 26.402,
"eval_wer": 0.8561190238592035,
"step": 2550
},
{
"epoch": 6.12,
"learning_rate": 2.9575303883782986e-05,
"loss": 1.251,
"step": 2600
},
{
"epoch": 6.35,
"learning_rate": 2.950118588793359e-05,
"loss": 1.162,
"step": 2700
},
{
"epoch": 6.59,
"learning_rate": 2.94270678920842e-05,
"loss": 1.1033,
"step": 2800
},
{
"epoch": 6.82,
"learning_rate": 2.9352949896234806e-05,
"loss": 1.0447,
"step": 2900
},
{
"epoch": 7.0,
"eval_loss": 0.9863032102584839,
"eval_runtime": 317.5697,
"eval_samples_per_second": 26.52,
"eval_wer": 0.7464522232734153,
"step": 2975
},
{
"epoch": 7.06,
"learning_rate": 2.9278831900385414e-05,
"loss": 1.0038,
"step": 3000
},
{
"epoch": 7.29,
"learning_rate": 2.9204713904536022e-05,
"loss": 0.963,
"step": 3100
},
{
"epoch": 7.53,
"learning_rate": 2.913059590868663e-05,
"loss": 0.9284,
"step": 3200
},
{
"epoch": 7.76,
"learning_rate": 2.9056477912837235e-05,
"loss": 0.8925,
"step": 3300
},
{
"epoch": 8.0,
"learning_rate": 2.8982359916987847e-05,
"loss": 0.8712,
"step": 3400
},
{
"epoch": 8.0,
"eval_loss": 0.8418087363243103,
"eval_runtime": 318.12,
"eval_samples_per_second": 26.474,
"eval_wer": 0.653970269955029,
"step": 3400
},
{
"epoch": 8.23,
"learning_rate": 2.890824192113845e-05,
"loss": 0.8478,
"step": 3500
},
{
"epoch": 8.47,
"learning_rate": 2.883412392528906e-05,
"loss": 0.8175,
"step": 3600
},
{
"epoch": 8.7,
"learning_rate": 2.876000592943967e-05,
"loss": 0.8035,
"step": 3700
},
{
"epoch": 8.94,
"learning_rate": 2.8685887933590275e-05,
"loss": 0.7815,
"step": 3800
},
{
"epoch": 9.0,
"eval_loss": 0.7524622678756714,
"eval_runtime": 318.9732,
"eval_samples_per_second": 26.403,
"eval_wer": 0.5982426355283109,
"step": 3825
},
{
"epoch": 9.18,
"learning_rate": 2.8611769937740884e-05,
"loss": 0.7671,
"step": 3900
},
{
"epoch": 9.41,
"learning_rate": 2.853765194189149e-05,
"loss": 0.7474,
"step": 4000
},
{
"epoch": 9.65,
"learning_rate": 2.84635339460421e-05,
"loss": 0.7477,
"step": 4100
},
{
"epoch": 9.88,
"learning_rate": 2.8389415950192708e-05,
"loss": 0.7128,
"step": 4200
},
{
"epoch": 10.0,
"eval_loss": 0.6934680938720703,
"eval_runtime": 317.9061,
"eval_samples_per_second": 26.492,
"eval_wer": 0.5617993545962339,
"step": 4250
},
{
"epoch": 10.12,
"learning_rate": 2.8315297954343316e-05,
"loss": 0.7134,
"step": 4300
},
{
"epoch": 10.35,
"learning_rate": 2.8241179958493924e-05,
"loss": 0.7025,
"step": 4400
},
{
"epoch": 10.59,
"learning_rate": 2.8167061962644532e-05,
"loss": 0.6806,
"step": 4500
},
{
"epoch": 10.82,
"learning_rate": 2.8092943966795137e-05,
"loss": 0.6713,
"step": 4600
},
{
"epoch": 11.0,
"eval_loss": 0.6441113948822021,
"eval_runtime": 330.7931,
"eval_samples_per_second": 25.46,
"eval_wer": 0.5259781495833388,
"step": 4675
},
{
"epoch": 11.06,
"learning_rate": 2.8018825970945745e-05,
"loss": 0.6707,
"step": 4700
},
{
"epoch": 11.29,
"learning_rate": 2.7944707975096356e-05,
"loss": 0.6552,
"step": 4800
},
{
"epoch": 11.53,
"learning_rate": 2.787058997924696e-05,
"loss": 0.6435,
"step": 4900
},
{
"epoch": 11.76,
"learning_rate": 2.779647198339757e-05,
"loss": 0.632,
"step": 5000
},
{
"epoch": 12.0,
"learning_rate": 2.7722353987548177e-05,
"loss": 0.632,
"step": 5100
},
{
"epoch": 12.0,
"eval_loss": 0.6222620010375977,
"eval_runtime": 318.5241,
"eval_samples_per_second": 26.441,
"eval_wer": 0.5066678762587318,
"step": 5100
},
{
"epoch": 12.23,
"learning_rate": 2.7648235991698785e-05,
"loss": 0.6169,
"step": 5200
},
{
"epoch": 12.47,
"learning_rate": 2.7574117995849393e-05,
"loss": 0.6068,
"step": 5300
},
{
"epoch": 12.7,
"learning_rate": 2.75e-05,
"loss": 0.6036,
"step": 5400
},
{
"epoch": 12.94,
"learning_rate": 2.742588200415061e-05,
"loss": 0.5917,
"step": 5500
},
{
"epoch": 13.0,
"eval_loss": 0.5906757712364197,
"eval_runtime": 319.1883,
"eval_samples_per_second": 26.386,
"eval_wer": 0.4835214680991693,
"step": 5525
},
{
"epoch": 13.18,
"learning_rate": 2.7351764008301217e-05,
"loss": 0.5905,
"step": 5600
},
{
"epoch": 13.41,
"learning_rate": 2.7277646012451822e-05,
"loss": 0.5818,
"step": 5700
},
{
"epoch": 13.65,
"learning_rate": 2.720352801660243e-05,
"loss": 0.5737,
"step": 5800
},
{
"epoch": 13.88,
"learning_rate": 2.712941002075304e-05,
"loss": 0.5607,
"step": 5900
},
{
"epoch": 14.0,
"eval_loss": 0.5859212279319763,
"eval_runtime": 319.205,
"eval_samples_per_second": 26.384,
"eval_wer": 0.47469576599577507,
"step": 5950
},
{
"epoch": 14.12,
"learning_rate": 2.7055292024903646e-05,
"loss": 0.5661,
"step": 6000
},
{
"epoch": 14.35,
"learning_rate": 2.6981174029054254e-05,
"loss": 0.5503,
"step": 6100
},
{
"epoch": 14.59,
"learning_rate": 2.6907056033204865e-05,
"loss": 0.5517,
"step": 6200
},
{
"epoch": 14.82,
"learning_rate": 2.683293803735547e-05,
"loss": 0.544,
"step": 6300
},
{
"epoch": 15.0,
"eval_loss": 0.5427600741386414,
"eval_runtime": 317.4374,
"eval_samples_per_second": 26.531,
"eval_wer": 0.45460789777219063,
"step": 6375
},
{
"epoch": 15.06,
"learning_rate": 2.6758820041506078e-05,
"loss": 0.5377,
"step": 6400
},
{
"epoch": 15.29,
"learning_rate": 2.6684702045656686e-05,
"loss": 0.5364,
"step": 6500
},
{
"epoch": 15.53,
"learning_rate": 2.6610584049807294e-05,
"loss": 0.5207,
"step": 6600
},
{
"epoch": 15.76,
"learning_rate": 2.6536466053957902e-05,
"loss": 0.518,
"step": 6700
},
{
"epoch": 16.0,
"learning_rate": 2.6462348058108507e-05,
"loss": 0.5208,
"step": 6800
},
{
"epoch": 16.0,
"eval_loss": 0.549843966960907,
"eval_runtime": 315.364,
"eval_samples_per_second": 26.706,
"eval_wer": 0.4465857103977398,
"step": 6800
},
{
"epoch": 16.23,
"learning_rate": 2.638823006225912e-05,
"loss": 0.5157,
"step": 6900
},
{
"epoch": 16.47,
"learning_rate": 2.6314112066409726e-05,
"loss": 0.5056,
"step": 7000
},
{
"epoch": 16.7,
"learning_rate": 2.623999407056033e-05,
"loss": 0.5052,
"step": 7100
},
{
"epoch": 16.94,
"learning_rate": 2.616587607471094e-05,
"loss": 0.4979,
"step": 7200
},
{
"epoch": 17.0,
"eval_loss": 0.5181886553764343,
"eval_runtime": 316.5373,
"eval_samples_per_second": 26.607,
"eval_wer": 0.432731561280958,
"step": 7225
},
{
"epoch": 17.18,
"learning_rate": 2.609175807886155e-05,
"loss": 0.4981,
"step": 7300
},
{
"epoch": 17.41,
"learning_rate": 2.6017640083012155e-05,
"loss": 0.4886,
"step": 7400
},
{
"epoch": 17.65,
"learning_rate": 2.5943522087162763e-05,
"loss": 0.4807,
"step": 7500
},
{
"epoch": 17.88,
"learning_rate": 2.586940409131337e-05,
"loss": 0.4829,
"step": 7600
},
{
"epoch": 18.0,
"eval_loss": 0.5218132138252258,
"eval_runtime": 316.5653,
"eval_samples_per_second": 26.604,
"eval_wer": 0.42257098793431913,
"step": 7650
},
{
"epoch": 18.12,
"learning_rate": 2.579528609546398e-05,
"loss": 0.4803,
"step": 7700
},
{
"epoch": 18.35,
"learning_rate": 2.5721168099614588e-05,
"loss": 0.4731,
"step": 7800
},
{
"epoch": 18.59,
"learning_rate": 2.5647050103765192e-05,
"loss": 0.4732,
"step": 7900
},
{
"epoch": 18.82,
"learning_rate": 2.5572932107915804e-05,
"loss": 0.4667,
"step": 8000
},
{
"epoch": 19.0,
"eval_loss": 0.49254098534584045,
"eval_runtime": 314.8242,
"eval_samples_per_second": 26.751,
"eval_wer": 0.4067339718251448,
"step": 8075
},
{
"epoch": 19.06,
"learning_rate": 2.5498814112066412e-05,
"loss": 0.47,
"step": 8100
},
{
"epoch": 19.29,
"learning_rate": 2.5424696116217016e-05,
"loss": 0.4549,
"step": 8200
},
{
"epoch": 19.53,
"learning_rate": 2.5350578120367624e-05,
"loss": 0.4486,
"step": 8300
},
{
"epoch": 19.76,
"learning_rate": 2.5276460124518236e-05,
"loss": 0.4516,
"step": 8400
},
{
"epoch": 20.0,
"learning_rate": 2.520234212866884e-05,
"loss": 0.4517,
"step": 8500
},
{
"epoch": 20.0,
"eval_loss": 0.4848106801509857,
"eval_runtime": 317.0239,
"eval_samples_per_second": 26.566,
"eval_wer": 0.398400746491103,
"step": 8500
},
{
"epoch": 20.23,
"learning_rate": 2.512822413281945e-05,
"loss": 0.4469,
"step": 8600
},
{
"epoch": 20.47,
"learning_rate": 2.505410613697006e-05,
"loss": 0.441,
"step": 8700
},
{
"epoch": 20.7,
"learning_rate": 2.4979988141120665e-05,
"loss": 0.4379,
"step": 8800
},
{
"epoch": 20.94,
"learning_rate": 2.4905870145271273e-05,
"loss": 0.4372,
"step": 8900
},
{
"epoch": 21.0,
"eval_loss": 0.48364755511283875,
"eval_runtime": 316.0715,
"eval_samples_per_second": 26.646,
"eval_wer": 0.39547180570495455,
"step": 8925
},
{
"epoch": 21.18,
"learning_rate": 2.4831752149421877e-05,
"loss": 0.4374,
"step": 9000
},
{
"epoch": 21.41,
"learning_rate": 2.475763415357249e-05,
"loss": 0.4326,
"step": 9100
},
{
"epoch": 21.65,
"learning_rate": 2.4683516157723097e-05,
"loss": 0.4247,
"step": 9200
},
{
"epoch": 21.88,
"learning_rate": 2.46093981618737e-05,
"loss": 0.4277,
"step": 9300
},
{
"epoch": 22.0,
"eval_loss": 0.48058849573135376,
"eval_runtime": 319.3273,
"eval_samples_per_second": 26.374,
"eval_wer": 0.39389069607703375,
"step": 9350
},
{
"epoch": 22.12,
"learning_rate": 2.453528016602431e-05,
"loss": 0.4265,
"step": 9400
},
{
"epoch": 22.35,
"learning_rate": 2.446116217017492e-05,
"loss": 0.4147,
"step": 9500
},
{
"epoch": 22.59,
"learning_rate": 2.4387044174325526e-05,
"loss": 0.4194,
"step": 9600
},
{
"epoch": 22.82,
"learning_rate": 2.4312926178476134e-05,
"loss": 0.412,
"step": 9700
},
{
"epoch": 23.0,
"eval_loss": 0.44829100370407104,
"eval_runtime": 316.8142,
"eval_samples_per_second": 26.583,
"eval_wer": 0.3794274309560529,
"step": 9775
},
{
"epoch": 23.06,
"learning_rate": 2.4238808182626745e-05,
"loss": 0.4157,
"step": 9800
},
{
"epoch": 23.29,
"learning_rate": 2.416469018677735e-05,
"loss": 0.4051,
"step": 9900
},
{
"epoch": 23.53,
"learning_rate": 2.4090572190927958e-05,
"loss": 0.4046,
"step": 10000
},
{
"epoch": 23.76,
"learning_rate": 2.4016454195078563e-05,
"loss": 0.4003,
"step": 10100
},
{
"epoch": 24.0,
"learning_rate": 2.3942336199229174e-05,
"loss": 0.403,
"step": 10200
},
{
"epoch": 24.0,
"eval_loss": 0.45721083879470825,
"eval_runtime": 318.2524,
"eval_samples_per_second": 26.463,
"eval_wer": 0.37823511877762084,
"step": 10200
},
{
"epoch": 24.23,
"learning_rate": 2.3868218203379782e-05,
"loss": 0.3971,
"step": 10300
},
{
"epoch": 24.47,
"learning_rate": 2.3794100207530387e-05,
"loss": 0.3982,
"step": 10400
},
{
"epoch": 24.7,
"learning_rate": 2.3719982211680998e-05,
"loss": 0.3959,
"step": 10500
},
{
"epoch": 24.94,
"learning_rate": 2.3645864215831606e-05,
"loss": 0.394,
"step": 10600
},
{
"epoch": 25.0,
"eval_loss": 0.4389103055000305,
"eval_runtime": 315.649,
"eval_samples_per_second": 26.682,
"eval_wer": 0.37056284910770987,
"step": 10625
},
{
"epoch": 25.18,
"learning_rate": 2.357174621998221e-05,
"loss": 0.3935,
"step": 10700
},
{
"epoch": 25.41,
"learning_rate": 2.349762822413282e-05,
"loss": 0.3863,
"step": 10800
},
{
"epoch": 25.65,
"learning_rate": 2.342351022828343e-05,
"loss": 0.3882,
"step": 10900
},
{
"epoch": 25.88,
"learning_rate": 2.335013341239253e-05,
"loss": 0.3887,
"step": 11000
},
{
"epoch": 26.0,
"eval_loss": 0.43516942858695984,
"eval_runtime": 315.434,
"eval_samples_per_second": 26.7,
"eval_wer": 0.36394033255141844,
"step": 11050
},
{
"epoch": 26.12,
"learning_rate": 2.3276015416543136e-05,
"loss": 0.3902,
"step": 11100
},
{
"epoch": 26.35,
"learning_rate": 2.3201897420693744e-05,
"loss": 0.3858,
"step": 11200
},
{
"epoch": 26.59,
"learning_rate": 2.3127779424844355e-05,
"loss": 0.3785,
"step": 11300
},
{
"epoch": 26.82,
"learning_rate": 2.305366142899496e-05,
"loss": 0.378,
"step": 11400
},
{
"epoch": 27.0,
"eval_loss": 0.443709135055542,
"eval_runtime": 318.0942,
"eval_samples_per_second": 26.476,
"eval_wer": 0.3679967859410842,
"step": 11475
},
{
"epoch": 27.06,
"learning_rate": 2.2979543433145568e-05,
"loss": 0.3835,
"step": 11500
},
{
"epoch": 27.29,
"learning_rate": 2.2905425437296176e-05,
"loss": 0.3776,
"step": 11600
},
{
"epoch": 27.53,
"learning_rate": 2.2831307441446784e-05,
"loss": 0.3721,
"step": 11700
},
{
"epoch": 27.76,
"learning_rate": 2.2757189445597392e-05,
"loss": 0.3686,
"step": 11800
},
{
"epoch": 28.0,
"learning_rate": 2.2683071449748e-05,
"loss": 0.3711,
"step": 11900
},
{
"epoch": 28.0,
"eval_loss": 0.4321639835834503,
"eval_runtime": 315.6052,
"eval_samples_per_second": 26.685,
"eval_wer": 0.3558403856870699,
"step": 11900
},
{
"epoch": 28.23,
"learning_rate": 2.26096946338571e-05,
"loss": 0.3767,
"step": 12000
},
{
"epoch": 28.47,
"learning_rate": 2.253557663800771e-05,
"loss": 0.363,
"step": 12100
},
{
"epoch": 28.7,
"learning_rate": 2.2461458642158317e-05,
"loss": 0.3667,
"step": 12200
},
{
"epoch": 28.94,
"learning_rate": 2.2387340646308925e-05,
"loss": 0.3657,
"step": 12300
},
{
"epoch": 29.0,
"eval_loss": 0.4269185960292816,
"eval_runtime": 316.1021,
"eval_samples_per_second": 26.643,
"eval_wer": 0.3577714130195306,
"step": 12325
},
{
"epoch": 29.18,
"learning_rate": 2.2313222650459533e-05,
"loss": 0.3624,
"step": 12400
},
{
"epoch": 29.41,
"learning_rate": 2.223910465461014e-05,
"loss": 0.3575,
"step": 12500
},
{
"epoch": 29.65,
"learning_rate": 2.216498665876075e-05,
"loss": 0.349,
"step": 12600
},
{
"epoch": 29.88,
"learning_rate": 2.2090868662911354e-05,
"loss": 0.3548,
"step": 12700
},
{
"epoch": 30.0,
"eval_loss": 0.4217592477798462,
"eval_runtime": 317.2188,
"eval_samples_per_second": 26.55,
"eval_wer": 0.34779227848265315,
"step": 12750
},
{
"epoch": 30.12,
"learning_rate": 2.2016750667061965e-05,
"loss": 0.3589,
"step": 12800
},
{
"epoch": 30.35,
"learning_rate": 2.194263267121257e-05,
"loss": 0.3522,
"step": 12900
},
{
"epoch": 30.59,
"learning_rate": 2.1868514675363178e-05,
"loss": 0.3443,
"step": 13000
},
{
"epoch": 30.82,
"learning_rate": 2.1794396679513786e-05,
"loss": 0.3464,
"step": 13100
},
{
"epoch": 31.0,
"eval_loss": 0.42884036898612976,
"eval_runtime": 317.8415,
"eval_samples_per_second": 26.497,
"eval_wer": 0.3482329155920737,
"step": 13175
},
{
"epoch": 31.06,
"learning_rate": 2.1720278683664394e-05,
"loss": 0.3489,
"step": 13200
},
{
"epoch": 31.29,
"learning_rate": 2.1646160687815002e-05,
"loss": 0.3443,
"step": 13300
},
{
"epoch": 31.53,
"learning_rate": 2.157204269196561e-05,
"loss": 0.3457,
"step": 13400
},
{
"epoch": 31.76,
"learning_rate": 2.1497924696116218e-05,
"loss": 0.3514,
"step": 13500
},
{
"epoch": 32.0,
"learning_rate": 2.1423806700266826e-05,
"loss": 0.3447,
"step": 13600
},
{
"epoch": 32.0,
"eval_loss": 0.41752490401268005,
"eval_runtime": 317.3655,
"eval_samples_per_second": 26.537,
"eval_wer": 0.34579645157527766,
"step": 13600
},
{
"epoch": 32.23,
"learning_rate": 2.1349688704417434e-05,
"loss": 0.3373,
"step": 13700
},
{
"epoch": 32.47,
"learning_rate": 2.127557070856804e-05,
"loss": 0.3403,
"step": 13800
},
{
"epoch": 32.7,
"learning_rate": 2.120145271271865e-05,
"loss": 0.3418,
"step": 13900
},
{
"epoch": 32.94,
"learning_rate": 2.1127334716869255e-05,
"loss": 0.3378,
"step": 14000
},
{
"epoch": 33.0,
"eval_loss": 0.4071788787841797,
"eval_runtime": 317.9264,
"eval_samples_per_second": 26.49,
"eval_wer": 0.3422843146148961,
"step": 14025
},
{
"epoch": 33.18,
"learning_rate": 2.1053216721019863e-05,
"loss": 0.3358,
"step": 14100
},
{
"epoch": 33.41,
"learning_rate": 2.0979098725170475e-05,
"loss": 0.333,
"step": 14200
},
{
"epoch": 33.65,
"learning_rate": 2.090498072932108e-05,
"loss": 0.3339,
"step": 14300
},
{
"epoch": 33.88,
"learning_rate": 2.0830862733471687e-05,
"loss": 0.3323,
"step": 14400
},
{
"epoch": 34.0,
"eval_loss": 0.39172977209091187,
"eval_runtime": 317.2839,
"eval_samples_per_second": 26.544,
"eval_wer": 0.3331605344668939,
"step": 14450
},
{
"epoch": 34.12,
"learning_rate": 2.0756744737622295e-05,
"loss": 0.3338,
"step": 14500
},
{
"epoch": 34.35,
"learning_rate": 2.0682626741772903e-05,
"loss": 0.3286,
"step": 14600
},
{
"epoch": 34.59,
"learning_rate": 2.060850874592351e-05,
"loss": 0.3286,
"step": 14700
},
{
"epoch": 34.82,
"learning_rate": 2.053439075007412e-05,
"loss": 0.3278,
"step": 14800
},
{
"epoch": 35.0,
"eval_loss": 0.40219607949256897,
"eval_runtime": 317.0822,
"eval_samples_per_second": 26.561,
"eval_wer": 0.3327587771024222,
"step": 14875
},
{
"epoch": 35.06,
"learning_rate": 2.0460272754224724e-05,
"loss": 0.3245,
"step": 14900
},
{
"epoch": 35.29,
"learning_rate": 2.0386154758375336e-05,
"loss": 0.3184,
"step": 15000
},
{
"epoch": 35.53,
"learning_rate": 2.031203676252594e-05,
"loss": 0.3313,
"step": 15100
},
{
"epoch": 35.76,
"learning_rate": 2.023791876667655e-05,
"loss": 0.3267,
"step": 15200
},
{
"epoch": 36.0,
"learning_rate": 2.016380077082716e-05,
"loss": 0.3221,
"step": 15300
},
{
"epoch": 36.0,
"eval_loss": 0.4049491584300995,
"eval_runtime": 318.0804,
"eval_samples_per_second": 26.478,
"eval_wer": 0.33557107865372404,
"step": 15300
},
{
"epoch": 36.23,
"learning_rate": 2.0089682774977765e-05,
"loss": 0.3196,
"step": 15400
},
{
"epoch": 36.47,
"learning_rate": 2.0015564779128373e-05,
"loss": 0.3239,
"step": 15500
},
{
"epoch": 36.7,
"learning_rate": 1.994144678327898e-05,
"loss": 0.3199,
"step": 15600
},
{
"epoch": 36.94,
"learning_rate": 1.986732878742959e-05,
"loss": 0.3171,
"step": 15700
},
{
"epoch": 37.0,
"eval_loss": 0.3955913484096527,
"eval_runtime": 317.9907,
"eval_samples_per_second": 26.485,
"eval_wer": 0.33121654721945026,
"step": 15725
},
{
"epoch": 37.18,
"learning_rate": 1.9793210791580197e-05,
"loss": 0.3235,
"step": 15800
},
{
"epoch": 37.41,
"learning_rate": 1.9719092795730805e-05,
"loss": 0.3155,
"step": 15900
},
{
"epoch": 37.65,
"learning_rate": 1.9644974799881413e-05,
"loss": 0.3193,
"step": 16000
},
{
"epoch": 37.88,
"learning_rate": 1.957085680403202e-05,
"loss": 0.3128,
"step": 16100
},
{
"epoch": 38.0,
"eval_loss": 0.3912222683429718,
"eval_runtime": 317.3702,
"eval_samples_per_second": 26.537,
"eval_wer": 0.3300112751260352,
"step": 16150
},
{
"epoch": 38.12,
"learning_rate": 1.9496738808182626e-05,
"loss": 0.315,
"step": 16200
},
{
"epoch": 38.35,
"learning_rate": 1.9422620812333234e-05,
"loss": 0.3106,
"step": 16300
},
{
"epoch": 38.59,
"learning_rate": 1.9349243996442334e-05,
"loss": 0.3091,
"step": 16400
},
{
"epoch": 38.82,
"learning_rate": 1.9275867180551438e-05,
"loss": 0.3114,
"step": 16500
},
{
"epoch": 39.0,
"eval_loss": 0.40268105268478394,
"eval_runtime": 317.2535,
"eval_samples_per_second": 26.547,
"eval_wer": 0.3303352730006091,
"step": 16575
},
{
"epoch": 39.06,
"learning_rate": 1.9201749184702046e-05,
"loss": 0.3144,
"step": 16600
},
{
"epoch": 39.29,
"learning_rate": 1.9127631188852654e-05,
"loss": 0.3102,
"step": 16700
},
{
"epoch": 39.53,
"learning_rate": 1.905351319300326e-05,
"loss": 0.3098,
"step": 16800
},
{
"epoch": 39.76,
"learning_rate": 1.897939519715387e-05,
"loss": 0.3071,
"step": 16900
},
{
"epoch": 40.0,
"learning_rate": 1.890527720130448e-05,
"loss": 0.3061,
"step": 17000
},
{
"epoch": 40.0,
"eval_loss": 0.39571964740753174,
"eval_runtime": 319.4169,
"eval_samples_per_second": 26.367,
"eval_wer": 0.32423115304363603,
"step": 17000
},
{
"epoch": 40.23,
"learning_rate": 1.8831159205455083e-05,
"loss": 0.2991,
"step": 17100
},
{
"epoch": 40.47,
"learning_rate": 1.8757041209605695e-05,
"loss": 0.3006,
"step": 17200
},
{
"epoch": 40.7,
"learning_rate": 1.8682923213756303e-05,
"loss": 0.3041,
"step": 17300
},
{
"epoch": 40.94,
"learning_rate": 1.8608805217906907e-05,
"loss": 0.306,
"step": 17400
},
{
"epoch": 41.0,
"eval_loss": 0.3856252431869507,
"eval_runtime": 318.6166,
"eval_samples_per_second": 26.433,
"eval_wer": 0.322105726986431,
"step": 17425
},
{
"epoch": 41.18,
"learning_rate": 1.8534687222057515e-05,
"loss": 0.308,
"step": 17500
},
{
"epoch": 41.41,
"learning_rate": 1.8460569226208123e-05,
"loss": 0.298,
"step": 17600
},
{
"epoch": 41.65,
"learning_rate": 1.838645123035873e-05,
"loss": 0.3004,
"step": 17700
},
{
"epoch": 41.88,
"learning_rate": 1.831233323450934e-05,
"loss": 0.299,
"step": 17800
},
{
"epoch": 42.0,
"eval_loss": 0.384583979845047,
"eval_runtime": 316.4886,
"eval_samples_per_second": 26.611,
"eval_wer": 0.3222223662212776,
"step": 17850
},
{
"epoch": 42.12,
"learning_rate": 1.8238215238659944e-05,
"loss": 0.2965,
"step": 17900
},
{
"epoch": 42.35,
"learning_rate": 1.8164097242810556e-05,
"loss": 0.3002,
"step": 18000
},
{
"epoch": 42.59,
"learning_rate": 1.8089979246961164e-05,
"loss": 0.2961,
"step": 18100
},
{
"epoch": 42.82,
"learning_rate": 1.801586125111177e-05,
"loss": 0.295,
"step": 18200
},
{
"epoch": 43.0,
"eval_loss": 0.3782486915588379,
"eval_runtime": 316.5726,
"eval_samples_per_second": 26.604,
"eval_wer": 0.3191767862002825,
"step": 18275
},
{
"epoch": 43.06,
"learning_rate": 1.794174325526238e-05,
"loss": 0.2962,
"step": 18300
},
{
"epoch": 43.29,
"learning_rate": 1.7867625259412988e-05,
"loss": 0.2926,
"step": 18400
},
{
"epoch": 43.53,
"learning_rate": 1.7793507263563593e-05,
"loss": 0.2993,
"step": 18500
},
{
"epoch": 43.76,
"learning_rate": 1.77193892677142e-05,
"loss": 0.2908,
"step": 18600
},
{
"epoch": 44.0,
"learning_rate": 1.764527127186481e-05,
"loss": 0.2919,
"step": 18700
},
{
"epoch": 44.0,
"eval_loss": 0.3738417625427246,
"eval_runtime": 316.4549,
"eval_samples_per_second": 26.614,
"eval_wer": 0.3151980923005145,
"step": 18700
},
{
"epoch": 44.23,
"learning_rate": 1.7571153276015417e-05,
"loss": 0.2927,
"step": 18800
},
{
"epoch": 44.47,
"learning_rate": 1.7497035280166025e-05,
"loss": 0.2913,
"step": 18900
},
{
"epoch": 44.7,
"learning_rate": 1.7422917284316633e-05,
"loss": 0.2906,
"step": 19000
},
{
"epoch": 44.94,
"learning_rate": 1.734879928846724e-05,
"loss": 0.2837,
"step": 19100
},
{
"epoch": 45.0,
"eval_loss": 0.38119739294052124,
"eval_runtime": 317.5894,
"eval_samples_per_second": 26.519,
"eval_wer": 0.31785487487202085,
"step": 19125
},
{
"epoch": 45.18,
"learning_rate": 1.727468129261785e-05,
"loss": 0.2909,
"step": 19200
},
{
"epoch": 45.41,
"learning_rate": 1.7200563296768454e-05,
"loss": 0.2858,
"step": 19300
},
{
"epoch": 45.65,
"learning_rate": 1.7126445300919065e-05,
"loss": 0.2905,
"step": 19400
},
{
"epoch": 45.88,
"learning_rate": 1.7052327305069673e-05,
"loss": 0.2825,
"step": 19500
},
{
"epoch": 46.0,
"eval_loss": 0.38637784123420715,
"eval_runtime": 317.552,
"eval_samples_per_second": 26.522,
"eval_wer": 0.31740127784761735,
"step": 19550
},
{
"epoch": 46.12,
"learning_rate": 1.6978209309220278e-05,
"loss": 0.29,
"step": 19600
},
{
"epoch": 46.35,
"learning_rate": 1.690409131337089e-05,
"loss": 0.29,
"step": 19700
},
{
"epoch": 46.59,
"learning_rate": 1.6829973317521494e-05,
"loss": 0.2855,
"step": 19800
},
{
"epoch": 46.82,
"learning_rate": 1.6755855321672102e-05,
"loss": 0.2827,
"step": 19900
},
{
"epoch": 47.0,
"eval_loss": 0.38330715894699097,
"eval_runtime": 317.4978,
"eval_samples_per_second": 26.526,
"eval_wer": 0.3139798602921165,
"step": 19975
},
{
"epoch": 47.06,
"learning_rate": 1.668173732582271e-05,
"loss": 0.2883,
"step": 20000
},
{
"epoch": 47.29,
"learning_rate": 1.6607619329973318e-05,
"loss": 0.282,
"step": 20100
},
{
"epoch": 47.53,
"learning_rate": 1.6533501334123926e-05,
"loss": 0.2826,
"step": 20200
},
{
"epoch": 47.76,
"learning_rate": 1.6459383338274534e-05,
"loss": 0.2756,
"step": 20300
},
{
"epoch": 48.0,
"learning_rate": 1.638526534242514e-05,
"loss": 0.2849,
"step": 20400
},
{
"epoch": 48.0,
"eval_loss": 0.3806135356426239,
"eval_runtime": 317.6019,
"eval_samples_per_second": 26.517,
"eval_wer": 0.31536657119529293,
"step": 20400
},
{
"epoch": 48.23,
"learning_rate": 1.631114734657575e-05,
"loss": 0.2844,
"step": 20500
},
{
"epoch": 48.47,
"learning_rate": 1.623702935072636e-05,
"loss": 0.2808,
"step": 20600
},
{
"epoch": 48.7,
"learning_rate": 1.616365253483546e-05,
"loss": 0.2845,
"step": 20700
},
{
"epoch": 48.94,
"learning_rate": 1.6089534538986064e-05,
"loss": 0.2767,
"step": 20800
},
{
"epoch": 49.0,
"eval_loss": 0.37584495544433594,
"eval_runtime": 317.5121,
"eval_samples_per_second": 26.525,
"eval_wer": 0.3132929847980197,
"step": 20825
},
{
"epoch": 49.18,
"learning_rate": 1.6015416543136675e-05,
"loss": 0.283,
"step": 20900
},
{
"epoch": 49.41,
"learning_rate": 1.5941298547287283e-05,
"loss": 0.2801,
"step": 21000
},
{
"epoch": 49.65,
"learning_rate": 1.5867180551437888e-05,
"loss": 0.2737,
"step": 21100
},
{
"epoch": 49.88,
"learning_rate": 1.57930625555885e-05,
"loss": 0.2732,
"step": 21200
},
{
"epoch": 50.0,
"eval_loss": 0.3800816833972931,
"eval_runtime": 317.0609,
"eval_samples_per_second": 26.563,
"eval_wer": 0.31414833918689494,
"step": 21250
},
{
"epoch": 50.12,
"learning_rate": 1.5718944559739107e-05,
"loss": 0.2818,
"step": 21300
},
{
"epoch": 50.35,
"learning_rate": 1.5644826563889712e-05,
"loss": 0.2728,
"step": 21400
},
{
"epoch": 50.59,
"learning_rate": 1.557070856804032e-05,
"loss": 0.276,
"step": 21500
},
{
"epoch": 50.82,
"learning_rate": 1.5496590572190928e-05,
"loss": 0.2691,
"step": 21600
},
{
"epoch": 51.0,
"eval_loss": 0.3639204800128937,
"eval_runtime": 317.0756,
"eval_samples_per_second": 26.561,
"eval_wer": 0.30717590492606367,
"step": 21675
},
{
"epoch": 51.06,
"learning_rate": 1.5422472576341536e-05,
"loss": 0.2741,
"step": 21700
},
{
"epoch": 51.29,
"learning_rate": 1.5348354580492144e-05,
"loss": 0.2722,
"step": 21800
},
{
"epoch": 51.53,
"learning_rate": 1.527423658464275e-05,
"loss": 0.2724,
"step": 21900
},
{
"epoch": 51.76,
"learning_rate": 1.520011858879336e-05,
"loss": 0.2662,
"step": 22000
},
{
"epoch": 52.0,
"learning_rate": 1.5126000592943967e-05,
"loss": 0.2742,
"step": 22100
},
{
"epoch": 52.0,
"eval_loss": 0.36436760425567627,
"eval_runtime": 316.4547,
"eval_samples_per_second": 26.614,
"eval_wer": 0.30645014968701806,
"step": 22100
},
{
"epoch": 52.23,
"learning_rate": 1.5051882597094575e-05,
"loss": 0.2699,
"step": 22200
},
{
"epoch": 52.47,
"learning_rate": 1.4977764601245183e-05,
"loss": 0.2732,
"step": 22300
},
{
"epoch": 52.7,
"learning_rate": 1.4903646605395791e-05,
"loss": 0.2723,
"step": 22400
},
{
"epoch": 52.94,
"learning_rate": 1.4829528609546397e-05,
"loss": 0.2671,
"step": 22500
},
{
"epoch": 53.0,
"eval_loss": 0.3704889416694641,
"eval_runtime": 317.8613,
"eval_samples_per_second": 26.496,
"eval_wer": 0.3060743121525123,
"step": 22525
},
{
"epoch": 53.18,
"learning_rate": 1.4755410613697007e-05,
"loss": 0.2713,
"step": 22600
},
{
"epoch": 53.41,
"learning_rate": 1.4681292617847613e-05,
"loss": 0.2658,
"step": 22700
},
{
"epoch": 53.65,
"learning_rate": 1.4607174621998221e-05,
"loss": 0.2707,
"step": 22800
},
{
"epoch": 53.88,
"learning_rate": 1.4533797806107324e-05,
"loss": 0.2618,
"step": 22900
},
{
"epoch": 54.0,
"eval_loss": 0.3567538857460022,
"eval_runtime": 353.5118,
"eval_samples_per_second": 23.824,
"eval_wer": 0.3049986392089268,
"step": 22950
},
{
"epoch": 54.12,
"learning_rate": 1.4459679810257932e-05,
"loss": 0.2679,
"step": 23000
},
{
"epoch": 54.35,
"learning_rate": 1.4385561814408538e-05,
"loss": 0.2647,
"step": 23100
},
{
"epoch": 54.59,
"learning_rate": 1.4311443818559146e-05,
"loss": 0.2632,
"step": 23200
},
{
"epoch": 54.82,
"learning_rate": 1.4237325822709754e-05,
"loss": 0.265,
"step": 23300
},
{
"epoch": 55.0,
"eval_loss": 0.3651841878890991,
"eval_runtime": 317.4254,
"eval_samples_per_second": 26.532,
"eval_wer": 0.3071111053511489,
"step": 23375
},
{
"epoch": 55.06,
"learning_rate": 1.4163207826860362e-05,
"loss": 0.2638,
"step": 23400
},
{
"epoch": 55.29,
"learning_rate": 1.408908983101097e-05,
"loss": 0.2648,
"step": 23500
},
{
"epoch": 55.53,
"learning_rate": 1.4014971835161577e-05,
"loss": 0.264,
"step": 23600
},
{
"epoch": 55.76,
"learning_rate": 1.3940853839312186e-05,
"loss": 0.2631,
"step": 23700
},
{
"epoch": 56.0,
"learning_rate": 1.3866735843462793e-05,
"loss": 0.2655,
"step": 23800
},
{
"epoch": 56.0,
"eval_loss": 0.3658052384853363,
"eval_runtime": 316.7135,
"eval_samples_per_second": 26.592,
"eval_wer": 0.3048431202291313,
"step": 23800
},
{
"epoch": 56.23,
"learning_rate": 1.3792617847613401e-05,
"loss": 0.2635,
"step": 23900
},
{
"epoch": 56.47,
"learning_rate": 1.3718499851764009e-05,
"loss": 0.2658,
"step": 24000
},
{
"epoch": 56.7,
"learning_rate": 1.3644381855914617e-05,
"loss": 0.2683,
"step": 24100
},
{
"epoch": 56.94,
"learning_rate": 1.3570263860065223e-05,
"loss": 0.2588,
"step": 24200
},
{
"epoch": 57.0,
"eval_loss": 0.3624616861343384,
"eval_runtime": 317.8838,
"eval_samples_per_second": 26.494,
"eval_wer": 0.30356008864581846,
"step": 24225
},
{
"epoch": 57.18,
"learning_rate": 1.3496145864215831e-05,
"loss": 0.2566,
"step": 24300
},
{
"epoch": 57.41,
"learning_rate": 1.3422027868366441e-05,
"loss": 0.2575,
"step": 24400
},
{
"epoch": 57.65,
"learning_rate": 1.3347909872517047e-05,
"loss": 0.2643,
"step": 24500
},
{
"epoch": 57.88,
"learning_rate": 1.3273791876667656e-05,
"loss": 0.2585,
"step": 24600
},
{
"epoch": 58.0,
"eval_loss": 0.3619252145290375,
"eval_runtime": 317.5906,
"eval_samples_per_second": 26.518,
"eval_wer": 0.3017457005482044,
"step": 24650
},
{
"epoch": 58.12,
"learning_rate": 1.3199673880818262e-05,
"loss": 0.2616,
"step": 24700
},
{
"epoch": 58.35,
"learning_rate": 1.3125555884968872e-05,
"loss": 0.2588,
"step": 24800
},
{
"epoch": 58.59,
"learning_rate": 1.3051437889119478e-05,
"loss": 0.2606,
"step": 24900
},
{
"epoch": 58.82,
"learning_rate": 1.2977319893270086e-05,
"loss": 0.2616,
"step": 25000
},
{
"epoch": 59.0,
"eval_loss": 0.35793522000312805,
"eval_runtime": 316.6098,
"eval_samples_per_second": 26.601,
"eval_wer": 0.3006829875196019,
"step": 25075
},
{
"epoch": 59.06,
"learning_rate": 1.2903943077379188e-05,
"loss": 0.2591,
"step": 25100
},
{
"epoch": 59.29,
"learning_rate": 1.2830566261488289e-05,
"loss": 0.2606,
"step": 25200
},
{
"epoch": 59.53,
"learning_rate": 1.2756448265638897e-05,
"loss": 0.2581,
"step": 25300
},
{
"epoch": 59.76,
"learning_rate": 1.2682330269789505e-05,
"loss": 0.2574,
"step": 25400
},
{
"epoch": 60.0,
"learning_rate": 1.2608212273940113e-05,
"loss": 0.2509,
"step": 25500
},
{
"epoch": 60.0,
"eval_loss": 0.36091676354408264,
"eval_runtime": 663.9043,
"eval_samples_per_second": 12.686,
"eval_wer": 0.2987519601871412,
"step": 25500
},
{
"epoch": 60.23,
"learning_rate": 1.2534094278090721e-05,
"loss": 0.2566,
"step": 25600
},
{
"epoch": 60.47,
"learning_rate": 1.2459976282241328e-05,
"loss": 0.2556,
"step": 25700
},
{
"epoch": 60.7,
"learning_rate": 1.2385858286391937e-05,
"loss": 0.2539,
"step": 25800
},
{
"epoch": 60.94,
"learning_rate": 1.2311740290542544e-05,
"loss": 0.2538,
"step": 25900
},
{
"epoch": 61.0,
"eval_loss": 0.3586573004722595,
"eval_runtime": 317.4988,
"eval_samples_per_second": 26.526,
"eval_wer": 0.29758556783867496,
"step": 25925
},
{
"epoch": 61.18,
"learning_rate": 1.2237622294693152e-05,
"loss": 0.2589,
"step": 26000
},
{
"epoch": 61.41,
"learning_rate": 1.2163504298843758e-05,
"loss": 0.249,
"step": 26100
},
{
"epoch": 61.65,
"learning_rate": 1.2089386302994368e-05,
"loss": 0.2464,
"step": 26200
},
{
"epoch": 61.88,
"learning_rate": 1.2015268307144976e-05,
"loss": 0.2563,
"step": 26300
},
{
"epoch": 62.0,
"eval_loss": 0.3534925878047943,
"eval_runtime": 317.8014,
"eval_samples_per_second": 26.501,
"eval_wer": 0.29697645183447596,
"step": 26350
},
{
"epoch": 62.12,
"learning_rate": 1.1941150311295582e-05,
"loss": 0.2559,
"step": 26400
},
{
"epoch": 62.35,
"learning_rate": 1.1867032315446192e-05,
"loss": 0.2543,
"step": 26500
},
{
"epoch": 62.59,
"learning_rate": 1.1792914319596798e-05,
"loss": 0.2496,
"step": 26600
},
{
"epoch": 62.82,
"learning_rate": 1.1718796323747406e-05,
"loss": 0.249,
"step": 26700
},
{
"epoch": 63.0,
"eval_loss": 0.34823477268218994,
"eval_runtime": 317.6983,
"eval_samples_per_second": 26.509,
"eval_wer": 0.29906299814673215,
"step": 26775
},
{
"epoch": 63.06,
"learning_rate": 1.1644678327898013e-05,
"loss": 0.2536,
"step": 26800
},
{
"epoch": 63.29,
"learning_rate": 1.1570560332048623e-05,
"loss": 0.2481,
"step": 26900
},
{
"epoch": 63.53,
"learning_rate": 1.1496442336199229e-05,
"loss": 0.2504,
"step": 27000
},
{
"epoch": 63.76,
"learning_rate": 1.1422324340349837e-05,
"loss": 0.2482,
"step": 27100
},
{
"epoch": 64.0,
"learning_rate": 1.1348206344500445e-05,
"loss": 0.2508,
"step": 27200
},
{
"epoch": 64.0,
"eval_loss": 0.35596856474876404,
"eval_runtime": 314.8406,
"eval_samples_per_second": 26.75,
"eval_wer": 0.29501950467204935,
"step": 27200
},
{
"epoch": 64.23,
"learning_rate": 1.1274088348651053e-05,
"loss": 0.2562,
"step": 27300
},
{
"epoch": 64.47,
"learning_rate": 1.1199970352801661e-05,
"loss": 0.2504,
"step": 27400
},
{
"epoch": 64.7,
"learning_rate": 1.1125852356952268e-05,
"loss": 0.25,
"step": 27500
},
{
"epoch": 64.94,
"learning_rate": 1.1051734361102877e-05,
"loss": 0.2518,
"step": 27600
},
{
"epoch": 65.0,
"eval_loss": 0.35186004638671875,
"eval_runtime": 317.5788,
"eval_samples_per_second": 26.519,
"eval_wer": 0.2965358147250554,
"step": 27625
},
{
"epoch": 65.18,
"learning_rate": 1.0977616365253484e-05,
"loss": 0.2502,
"step": 27700
},
{
"epoch": 65.41,
"learning_rate": 1.0903498369404092e-05,
"loss": 0.2451,
"step": 27800
},
{
"epoch": 65.65,
"learning_rate": 1.0829380373554698e-05,
"loss": 0.2508,
"step": 27900
},
{
"epoch": 65.88,
"learning_rate": 1.0755262377705308e-05,
"loss": 0.248,
"step": 28000
},
{
"epoch": 66.0,
"eval_loss": 0.34826791286468506,
"eval_runtime": 315.877,
"eval_samples_per_second": 26.662,
"eval_wer": 0.2940863907932764,
"step": 28050
},
{
"epoch": 66.12,
"learning_rate": 1.0681144381855916e-05,
"loss": 0.2488,
"step": 28100
},
{
"epoch": 66.35,
"learning_rate": 1.0607026386006522e-05,
"loss": 0.2446,
"step": 28200
},
{
"epoch": 66.59,
"learning_rate": 1.053290839015713e-05,
"loss": 0.2472,
"step": 28300
},
{
"epoch": 66.82,
"learning_rate": 1.0458790394307738e-05,
"loss": 0.2427,
"step": 28400
},
{
"epoch": 67.0,
"eval_loss": 0.35498106479644775,
"eval_runtime": 315.9906,
"eval_samples_per_second": 26.653,
"eval_wer": 0.29247936133538965,
"step": 28475
},
{
"epoch": 67.06,
"learning_rate": 1.0384672398458346e-05,
"loss": 0.2519,
"step": 28500
},
{
"epoch": 67.29,
"learning_rate": 1.0310554402608953e-05,
"loss": 0.2463,
"step": 28600
},
{
"epoch": 67.53,
"learning_rate": 1.0236436406759562e-05,
"loss": 0.2406,
"step": 28700
},
{
"epoch": 67.76,
"learning_rate": 1.0162318410910169e-05,
"loss": 0.2434,
"step": 28800
},
{
"epoch": 68.0,
"learning_rate": 1.0088200415060777e-05,
"loss": 0.2439,
"step": 28900
},
{
"epoch": 68.0,
"eval_loss": 0.35530757904052734,
"eval_runtime": 316.4428,
"eval_samples_per_second": 26.615,
"eval_wer": 0.2964710151501406,
"step": 28900
},
{
"epoch": 68.23,
"learning_rate": 1.0014082419211385e-05,
"loss": 0.2444,
"step": 29000
},
{
"epoch": 68.47,
"learning_rate": 9.939964423361993e-06,
"loss": 0.2459,
"step": 29100
},
{
"epoch": 68.7,
"learning_rate": 9.865846427512601e-06,
"loss": 0.2397,
"step": 29200
},
{
"epoch": 68.94,
"learning_rate": 9.791728431663207e-06,
"loss": 0.2427,
"step": 29300
},
{
"epoch": 69.0,
"eval_loss": 0.35256123542785645,
"eval_runtime": 316.7354,
"eval_samples_per_second": 26.59,
"eval_wer": 0.29481214603232203,
"step": 29325
},
{
"epoch": 69.18,
"learning_rate": 9.717610435813815e-06,
"loss": 0.2464,
"step": 29400
},
{
"epoch": 69.41,
"learning_rate": 9.643492439964424e-06,
"loss": 0.2396,
"step": 29500
},
{
"epoch": 69.65,
"learning_rate": 9.569374444115032e-06,
"loss": 0.2441,
"step": 29600
},
{
"epoch": 69.88,
"learning_rate": 9.495256448265638e-06,
"loss": 0.2412,
"step": 29700
},
{
"epoch": 70.0,
"eval_loss": 0.356432169675827,
"eval_runtime": 316.2059,
"eval_samples_per_second": 26.635,
"eval_wer": 0.2973004497090499,
"step": 29750
},
{
"epoch": 70.12,
"learning_rate": 9.421879632374742e-06,
"loss": 0.2488,
"step": 29800
},
{
"epoch": 70.35,
"learning_rate": 9.347761636525348e-06,
"loss": 0.2348,
"step": 29900
},
{
"epoch": 70.59,
"learning_rate": 9.273643640675956e-06,
"loss": 0.2426,
"step": 30000
},
{
"epoch": 70.82,
"learning_rate": 9.199525644826563e-06,
"loss": 0.2394,
"step": 30100
},
{
"epoch": 71.0,
"eval_loss": 0.3529145419597626,
"eval_runtime": 314.7426,
"eval_samples_per_second": 26.758,
"eval_wer": 0.28974481927398554,
"step": 30175
},
{
"epoch": 71.06,
"learning_rate": 9.125407648977172e-06,
"loss": 0.2451,
"step": 30200
},
{
"epoch": 71.29,
"learning_rate": 9.051289653127779e-06,
"loss": 0.2371,
"step": 30300
},
{
"epoch": 71.53,
"learning_rate": 8.977171657278387e-06,
"loss": 0.2367,
"step": 30400
},
{
"epoch": 71.76,
"learning_rate": 8.903053661428997e-06,
"loss": 0.2417,
"step": 30500
},
{
"epoch": 72.0,
"learning_rate": 8.828935665579603e-06,
"loss": 0.247,
"step": 30600
},
{
"epoch": 72.0,
"eval_loss": 0.3524751663208008,
"eval_runtime": 316.256,
"eval_samples_per_second": 26.63,
"eval_wer": 0.2913777685618382,
"step": 30600
},
{
"epoch": 72.23,
"learning_rate": 8.754817669730211e-06,
"loss": 0.2448,
"step": 30700
},
{
"epoch": 72.47,
"learning_rate": 8.680699673880817e-06,
"loss": 0.238,
"step": 30800
},
{
"epoch": 72.7,
"learning_rate": 8.606581678031427e-06,
"loss": 0.2341,
"step": 30900
},
{
"epoch": 72.94,
"learning_rate": 8.532463682182034e-06,
"loss": 0.2371,
"step": 31000
},
{
"epoch": 73.0,
"eval_loss": 0.3488871455192566,
"eval_runtime": 316.856,
"eval_samples_per_second": 26.58,
"eval_wer": 0.28990033825378103,
"step": 31025
},
{
"epoch": 73.0,
"step": 31025,
"total_flos": 0,
"train_runtime": 465541.7438,
"train_samples_per_second": 0.091
}
],
"max_steps": 42500,
"num_train_epochs": 100,
"total_flos": 0,
"trial_name": null,
"trial_params": null
}