{ "best_metric": 0.5727322101593018, "best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-3/checkpoint-1554", "epoch": 131.0, "global_step": 1834, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.07, "learning_rate": 3e-05, "loss": 38.4524, "step": 1 }, { "epoch": 1.0, "eval_cer": 0.9586533212010919, "eval_loss": 28.540863037109375, "eval_runtime": 53.1462, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 1.0, "step": 14 }, { "epoch": 2.0, "eval_cer": 0.9618562329390354, "eval_loss": 8.314471244812012, "eval_runtime": 53.0408, "eval_samples_per_second": 10.219, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 28 }, { "epoch": 3.0, "eval_cer": 0.9618562329390354, "eval_loss": 4.788250923156738, "eval_runtime": 52.9102, "eval_samples_per_second": 10.244, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 42 }, { "epoch": 4.0, "eval_cer": 0.9618562329390354, "eval_loss": 4.076758861541748, "eval_runtime": 53.0042, "eval_samples_per_second": 10.226, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 56 }, { "epoch": 5.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.790695905685425, "eval_runtime": 52.9066, "eval_samples_per_second": 10.244, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 70 }, { "epoch": 6.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.6234583854675293, "eval_runtime": 52.8613, "eval_samples_per_second": 10.253, "eval_steps_per_second": 1.286, "eval_wer": 1.0, "step": 84 }, { "epoch": 7.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.5015854835510254, "eval_runtime": 52.9075, "eval_samples_per_second": 10.244, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 98 }, { "epoch": 7.14, "learning_rate": 2.8614285714285714e-05, "loss": 9.6862, "step": 100 }, { "epoch": 8.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.361980438232422, "eval_runtime": 52.945, "eval_samples_per_second": 10.237, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 112 }, { "epoch": 9.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.262788772583008, "eval_runtime": 53.023, "eval_samples_per_second": 10.222, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 126 }, { "epoch": 10.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.2084038257598877, "eval_runtime": 52.9601, "eval_samples_per_second": 10.234, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 140 }, { "epoch": 11.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.1405389308929443, "eval_runtime": 52.9576, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 154 }, { "epoch": 12.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.1096060276031494, "eval_runtime": 52.9571, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 168 }, { "epoch": 13.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.094794511795044, "eval_runtime": 53.0065, "eval_samples_per_second": 10.225, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 182 }, { "epoch": 14.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0671029090881348, "eval_runtime": 52.99, "eval_samples_per_second": 10.228, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 196 }, { "epoch": 14.29, "learning_rate": 2.7185714285714287e-05, "loss": 3.0986, "step": 200 }, { "epoch": 15.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0809550285339355, "eval_runtime": 52.9614, "eval_samples_per_second": 10.234, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 210 }, { "epoch": 16.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0577237606048584, "eval_runtime": 52.9744, "eval_samples_per_second": 10.231, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 224 }, { "epoch": 17.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0414350032806396, "eval_runtime": 52.9471, "eval_samples_per_second": 10.237, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 238 }, { "epoch": 18.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.039754629135132, "eval_runtime": 52.9536, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 252 }, { "epoch": 19.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0336570739746094, "eval_runtime": 52.9861, "eval_samples_per_second": 10.229, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 266 }, { "epoch": 20.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.025843381881714, "eval_runtime": 53.0011, "eval_samples_per_second": 10.226, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 280 }, { "epoch": 21.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0206263065338135, "eval_runtime": 52.9519, "eval_samples_per_second": 10.236, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 294 }, { "epoch": 21.43, "learning_rate": 2.5757142857142857e-05, "loss": 2.9619, "step": 300 }, { "epoch": 22.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.018939256668091, "eval_runtime": 52.9394, "eval_samples_per_second": 10.238, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 308 }, { "epoch": 23.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0166780948638916, "eval_runtime": 52.9637, "eval_samples_per_second": 10.233, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 322 }, { "epoch": 24.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.006849527359009, "eval_runtime": 52.9579, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 336 }, { "epoch": 25.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.001568555831909, "eval_runtime": 52.976, "eval_samples_per_second": 10.231, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 350 }, { "epoch": 26.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0053274631500244, "eval_runtime": 53.0349, "eval_samples_per_second": 10.22, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 364 }, { "epoch": 27.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.002009868621826, "eval_runtime": 52.9483, "eval_samples_per_second": 10.236, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 378 }, { "epoch": 28.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.00075626373291, "eval_runtime": 53.0974, "eval_samples_per_second": 10.208, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 392 }, { "epoch": 28.57, "learning_rate": 2.432857142857143e-05, "loss": 2.9276, "step": 400 }, { "epoch": 29.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9920263290405273, "eval_runtime": 53.6317, "eval_samples_per_second": 10.106, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 406 }, { "epoch": 30.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9916112422943115, "eval_runtime": 52.9892, "eval_samples_per_second": 10.228, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 420 }, { "epoch": 31.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.993955373764038, "eval_runtime": 53.0308, "eval_samples_per_second": 10.22, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 434 }, { "epoch": 32.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.985051155090332, "eval_runtime": 52.9796, "eval_samples_per_second": 10.23, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 448 }, { "epoch": 33.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9817941188812256, "eval_runtime": 52.9663, "eval_samples_per_second": 10.233, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 462 }, { "epoch": 34.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9794976711273193, "eval_runtime": 53.0874, "eval_samples_per_second": 10.21, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 476 }, { "epoch": 35.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.973381757736206, "eval_runtime": 52.9719, "eval_samples_per_second": 10.232, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 490 }, { "epoch": 35.71, "learning_rate": 2.29e-05, "loss": 2.9141, "step": 500 }, { "epoch": 36.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.954444169998169, "eval_runtime": 52.9904, "eval_samples_per_second": 10.228, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 504 }, { "epoch": 37.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9253017902374268, "eval_runtime": 52.9492, "eval_samples_per_second": 10.236, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 518 }, { "epoch": 38.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.849879264831543, "eval_runtime": 53.141, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 1.0, "step": 532 }, { "epoch": 39.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.800652503967285, "eval_runtime": 53.0816, "eval_samples_per_second": 10.211, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 546 }, { "epoch": 40.0, "eval_cer": 0.9602183803457689, "eval_loss": 2.773822784423828, "eval_runtime": 53.357, "eval_samples_per_second": 10.158, "eval_steps_per_second": 1.274, "eval_wer": 1.0, "step": 560 }, { "epoch": 41.0, "eval_cer": 0.9604367606915377, "eval_loss": 2.699044942855835, "eval_runtime": 53.0987, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 574 }, { "epoch": 42.0, "eval_cer": 0.9327024567788899, "eval_loss": 2.5829148292541504, "eval_runtime": 52.9511, "eval_samples_per_second": 10.236, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 588 }, { "epoch": 42.86, "learning_rate": 2.1471428571428574e-05, "loss": 2.7541, "step": 600 }, { "epoch": 43.0, "eval_cer": 0.8496087352138307, "eval_loss": 2.4752373695373535, "eval_runtime": 53.6351, "eval_samples_per_second": 10.105, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 602 }, { "epoch": 44.0, "eval_cer": 0.708498635122839, "eval_loss": 2.2684857845306396, "eval_runtime": 53.0701, "eval_samples_per_second": 10.213, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 616 }, { "epoch": 45.0, "eval_cer": 0.6326114649681529, "eval_loss": 2.102912187576294, "eval_runtime": 53.098, "eval_samples_per_second": 10.208, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 630 }, { "epoch": 46.0, "eval_cer": 0.5549044585987262, "eval_loss": 1.8554308414459229, "eval_runtime": 53.0602, "eval_samples_per_second": 10.215, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 644 }, { "epoch": 47.0, "eval_cer": 0.47395814376706097, "eval_loss": 1.6462159156799316, "eval_runtime": 53.1159, "eval_samples_per_second": 10.204, "eval_steps_per_second": 1.28, "eval_wer": 0.9995936611133686, "step": 658 }, { "epoch": 48.0, "eval_cer": 0.428098271155596, "eval_loss": 1.460442066192627, "eval_runtime": 53.1598, "eval_samples_per_second": 10.196, "eval_steps_per_second": 1.279, "eval_wer": 0.9987809833401057, "step": 672 }, { "epoch": 49.0, "eval_cer": 0.3805277525022748, "eval_loss": 1.2930712699890137, "eval_runtime": 53.1092, "eval_samples_per_second": 10.205, "eval_steps_per_second": 1.28, "eval_wer": 0.981511580658269, "step": 686 }, { "epoch": 50.0, "learning_rate": 2.004285714285714e-05, "loss": 1.9662, "step": 700 }, { "epoch": 50.0, "eval_cer": 0.34424021838034574, "eval_loss": 1.1677709817886353, "eval_runtime": 53.2327, "eval_samples_per_second": 10.182, "eval_steps_per_second": 1.277, "eval_wer": 0.9246241365298659, "step": 700 }, { "epoch": 51.0, "eval_cer": 0.29747042766151044, "eval_loss": 1.0561025142669678, "eval_runtime": 53.203, "eval_samples_per_second": 10.187, "eval_steps_per_second": 1.278, "eval_wer": 0.778138967899228, "step": 714 }, { "epoch": 52.0, "eval_cer": 0.24178343949044587, "eval_loss": 0.9993860721588135, "eval_runtime": 53.1277, "eval_samples_per_second": 10.202, "eval_steps_per_second": 1.28, "eval_wer": 0.5709061357171882, "step": 728 }, { "epoch": 53.0, "eval_cer": 0.22114649681528661, "eval_loss": 0.8893789052963257, "eval_runtime": 53.2214, "eval_samples_per_second": 10.184, "eval_steps_per_second": 1.278, "eval_wer": 0.5040633888663145, "step": 742 }, { "epoch": 54.0, "eval_cer": 0.21881710646041858, "eval_loss": 0.8921266198158264, "eval_runtime": 53.1697, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.49207639171068673, "step": 756 }, { "epoch": 55.0, "eval_cer": 0.21281164695177435, "eval_loss": 0.8739840388298035, "eval_runtime": 53.6319, "eval_samples_per_second": 10.106, "eval_steps_per_second": 1.268, "eval_wer": 0.4717594473791142, "step": 770 }, { "epoch": 56.0, "eval_cer": 0.20764331210191084, "eval_loss": 0.8273698091506958, "eval_runtime": 53.0587, "eval_samples_per_second": 10.215, "eval_steps_per_second": 1.282, "eval_wer": 0.45550589191385615, "step": 784 }, { "epoch": 57.0, "eval_cer": 0.20833484986351228, "eval_loss": 0.8199306726455688, "eval_runtime": 53.6361, "eval_samples_per_second": 10.105, "eval_steps_per_second": 1.268, "eval_wer": 0.44920763917106865, "step": 798 }, { "epoch": 57.14, "learning_rate": 1.8614285714285715e-05, "loss": 1.0586, "step": 800 }, { "epoch": 58.0, "eval_cer": 0.20687898089171974, "eval_loss": 0.7865574955940247, "eval_runtime": 53.1251, "eval_samples_per_second": 10.202, "eval_steps_per_second": 1.28, "eval_wer": 0.4463632669646485, "step": 812 }, { "epoch": 59.0, "eval_cer": 0.2026933575978162, "eval_loss": 0.7334416508674622, "eval_runtime": 53.189, "eval_samples_per_second": 10.19, "eval_steps_per_second": 1.278, "eval_wer": 0.4329540837058106, "step": 826 }, { "epoch": 60.0, "eval_cer": 0.2037852593266606, "eval_loss": 0.7200602293014526, "eval_runtime": 53.2175, "eval_samples_per_second": 10.185, "eval_steps_per_second": 1.278, "eval_wer": 0.43945550589191384, "step": 840 }, { "epoch": 61.0, "eval_cer": 0.200582347588717, "eval_loss": 0.7093716263771057, "eval_runtime": 53.0938, "eval_samples_per_second": 10.208, "eval_steps_per_second": 1.281, "eval_wer": 0.4266558309630232, "step": 854 }, { "epoch": 62.0, "eval_cer": 0.19854413102820745, "eval_loss": 0.6839061379432678, "eval_runtime": 53.0803, "eval_samples_per_second": 10.211, "eval_steps_per_second": 1.281, "eval_wer": 0.42503047541649736, "step": 868 }, { "epoch": 63.0, "eval_cer": 0.195705186533212, "eval_loss": 0.6769891977310181, "eval_runtime": 53.0971, "eval_samples_per_second": 10.208, "eval_steps_per_second": 1.281, "eval_wer": 0.41609101991060543, "step": 882 }, { "epoch": 64.0, "eval_cer": 0.19828935395814376, "eval_loss": 0.6982135772705078, "eval_runtime": 53.1485, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 0.4205607476635514, "step": 896 }, { "epoch": 64.29, "learning_rate": 1.7185714285714285e-05, "loss": 0.7351, "step": 900 }, { "epoch": 65.0, "eval_cer": 0.19963603275705186, "eval_loss": 0.693848192691803, "eval_runtime": 53.0652, "eval_samples_per_second": 10.214, "eval_steps_per_second": 1.281, "eval_wer": 0.42503047541649736, "step": 910 }, { "epoch": 66.0, "eval_cer": 0.19879890809827117, "eval_loss": 0.695080041885376, "eval_runtime": 53.1168, "eval_samples_per_second": 10.204, "eval_steps_per_second": 1.28, "eval_wer": 0.4171068671271841, "step": 924 }, { "epoch": 67.0, "eval_cer": 0.1967242948134668, "eval_loss": 0.6676416397094727, "eval_runtime": 53.1815, "eval_samples_per_second": 10.192, "eval_steps_per_second": 1.279, "eval_wer": 0.4108086143843966, "step": 938 }, { "epoch": 68.0, "eval_cer": 0.19552320291173794, "eval_loss": 0.6553406715393066, "eval_runtime": 53.145, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 0.4051198699715563, "step": 952 }, { "epoch": 69.0, "eval_cer": 0.19534121929026388, "eval_loss": 0.6544891595840454, "eval_runtime": 53.1125, "eval_samples_per_second": 10.205, "eval_steps_per_second": 1.28, "eval_wer": 0.3998374644453474, "step": 966 }, { "epoch": 70.0, "eval_cer": 0.19333939945404913, "eval_loss": 0.638877272605896, "eval_runtime": 53.0484, "eval_samples_per_second": 10.217, "eval_steps_per_second": 1.282, "eval_wer": 0.39780577001219014, "step": 980 }, { "epoch": 71.0, "eval_cer": 0.19250227479526844, "eval_loss": 0.6450415849685669, "eval_runtime": 53.2149, "eval_samples_per_second": 10.185, "eval_steps_per_second": 1.278, "eval_wer": 0.39577407557903294, "step": 994 }, { "epoch": 71.43, "learning_rate": 1.5757142857142858e-05, "loss": 0.5758, "step": 1000 }, { "epoch": 72.0, "eval_cer": 0.19308462238398544, "eval_loss": 0.6343913078308105, "eval_runtime": 53.0867, "eval_samples_per_second": 10.21, "eval_steps_per_second": 1.281, "eval_wer": 0.3963835839089801, "step": 1008 }, { "epoch": 73.0, "eval_cer": 0.1913375796178344, "eval_loss": 0.6251675486564636, "eval_runtime": 53.3018, "eval_samples_per_second": 10.169, "eval_steps_per_second": 1.276, "eval_wer": 0.39089800893945553, "step": 1022 }, { "epoch": 74.0, "eval_cer": 0.1892265696087352, "eval_loss": 0.621448278427124, "eval_runtime": 53.1841, "eval_samples_per_second": 10.191, "eval_steps_per_second": 1.279, "eval_wer": 0.3866314506298253, "step": 1036 }, { "epoch": 75.0, "eval_cer": 0.18980891719745224, "eval_loss": 0.614743173122406, "eval_runtime": 53.1447, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 0.3852092645266152, "step": 1050 }, { "epoch": 76.0, "eval_cer": 0.1908644222020018, "eval_loss": 0.6253055930137634, "eval_runtime": 53.142, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 0.38480292563998375, "step": 1064 }, { "epoch": 77.0, "eval_cer": 0.19228389444949953, "eval_loss": 0.6244810223579407, "eval_runtime": 53.6784, "eval_samples_per_second": 10.097, "eval_steps_per_second": 1.267, "eval_wer": 0.3884599756196668, "step": 1078 }, { "epoch": 78.0, "eval_cer": 0.1897361237488626, "eval_loss": 0.5956248044967651, "eval_runtime": 53.1231, "eval_samples_per_second": 10.203, "eval_steps_per_second": 1.28, "eval_wer": 0.3854124339699309, "step": 1092 }, { "epoch": 78.57, "learning_rate": 1.4328571428571428e-05, "loss": 0.5238, "step": 1100 }, { "epoch": 79.0, "eval_cer": 0.18817106460418562, "eval_loss": 0.6082769632339478, "eval_runtime": 53.1516, "eval_samples_per_second": 10.197, "eval_steps_per_second": 1.279, "eval_wer": 0.3841934173100366, "step": 1106 }, { "epoch": 80.0, "eval_cer": 0.18871701546860783, "eval_loss": 0.6062718629837036, "eval_runtime": 53.1003, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.38399024786672087, "step": 1120 }, { "epoch": 81.0, "eval_cer": 0.18828025477707006, "eval_loss": 0.6067720055580139, "eval_runtime": 53.1024, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.3797236895570906, "step": 1134 }, { "epoch": 82.0, "eval_cer": 0.18806187443130118, "eval_loss": 0.6015568375587463, "eval_runtime": 53.1272, "eval_samples_per_second": 10.202, "eval_steps_per_second": 1.28, "eval_wer": 0.3803331978870378, "step": 1148 }, { "epoch": 83.0, "eval_cer": 0.18933575978161965, "eval_loss": 0.6118575930595398, "eval_runtime": 53.1719, "eval_samples_per_second": 10.193, "eval_steps_per_second": 1.279, "eval_wer": 0.3783015034538805, "step": 1162 }, { "epoch": 84.0, "eval_cer": 0.18740673339399455, "eval_loss": 0.5936925411224365, "eval_runtime": 53.1145, "eval_samples_per_second": 10.204, "eval_steps_per_second": 1.28, "eval_wer": 0.3772856562373019, "step": 1176 }, { "epoch": 85.0, "eval_cer": 0.1870427661510464, "eval_loss": 0.5894333124160767, "eval_runtime": 53.1189, "eval_samples_per_second": 10.204, "eval_steps_per_second": 1.28, "eval_wer": 0.3756603006907761, "step": 1190 }, { "epoch": 85.71, "learning_rate": 1.29e-05, "loss": 0.4655, "step": 1200 }, { "epoch": 86.0, "eval_cer": 0.18787989080982712, "eval_loss": 0.6003877520561218, "eval_runtime": 53.1193, "eval_samples_per_second": 10.203, "eval_steps_per_second": 1.28, "eval_wer": 0.3754571312474604, "step": 1204 }, { "epoch": 87.0, "eval_cer": 0.18762511373976343, "eval_loss": 0.5948131084442139, "eval_runtime": 53.1566, "eval_samples_per_second": 10.196, "eval_steps_per_second": 1.279, "eval_wer": 0.3748476229175132, "step": 1218 }, { "epoch": 88.0, "eval_cer": 0.18857142857142858, "eval_loss": 0.5988134145736694, "eval_runtime": 53.1572, "eval_samples_per_second": 10.196, "eval_steps_per_second": 1.279, "eval_wer": 0.3768793173506705, "step": 1232 }, { "epoch": 89.0, "eval_cer": 0.1867515923566879, "eval_loss": 0.5889683961868286, "eval_runtime": 53.2403, "eval_samples_per_second": 10.18, "eval_steps_per_second": 1.277, "eval_wer": 0.3734254368143031, "step": 1246 }, { "epoch": 90.0, "eval_cer": 0.18806187443130118, "eval_loss": 0.6008641719818115, "eval_runtime": 53.1831, "eval_samples_per_second": 10.191, "eval_steps_per_second": 1.279, "eval_wer": 0.3730190979276717, "step": 1260 }, { "epoch": 91.0, "eval_cer": 0.18817106460418562, "eval_loss": 0.5979772210121155, "eval_runtime": 53.2005, "eval_samples_per_second": 10.188, "eval_steps_per_second": 1.278, "eval_wer": 0.3722064201544088, "step": 1274 }, { "epoch": 92.0, "eval_cer": 0.1867879890809827, "eval_loss": 0.5938224792480469, "eval_runtime": 53.1011, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.3715969118244616, "step": 1288 }, { "epoch": 92.86, "learning_rate": 1.1471428571428572e-05, "loss": 0.4249, "step": 1300 }, { "epoch": 93.0, "eval_cer": 0.1864604185623294, "eval_loss": 0.5928549766540527, "eval_runtime": 53.1157, "eval_samples_per_second": 10.204, "eval_steps_per_second": 1.28, "eval_wer": 0.3724095895977245, "step": 1302 }, { "epoch": 94.0, "eval_cer": 0.185950864422202, "eval_loss": 0.5924369096755981, "eval_runtime": 53.2099, "eval_samples_per_second": 10.186, "eval_steps_per_second": 1.278, "eval_wer": 0.36793986184477856, "step": 1316 }, { "epoch": 95.0, "eval_cer": 0.18587807097361236, "eval_loss": 0.58665531873703, "eval_runtime": 53.2364, "eval_samples_per_second": 10.181, "eval_steps_per_second": 1.277, "eval_wer": 0.3695652173913043, "step": 1330 }, { "epoch": 96.0, "eval_cer": 0.1867879890809827, "eval_loss": 0.5969748497009277, "eval_runtime": 53.1096, "eval_samples_per_second": 10.205, "eval_steps_per_second": 1.28, "eval_wer": 0.3715969118244616, "step": 1344 }, { "epoch": 97.0, "eval_cer": 0.1856960873521383, "eval_loss": 0.5795917510986328, "eval_runtime": 53.6685, "eval_samples_per_second": 10.099, "eval_steps_per_second": 1.267, "eval_wer": 0.36895570906135716, "step": 1358 }, { "epoch": 98.0, "eval_cer": 0.18496815286624205, "eval_loss": 0.5856068134307861, "eval_runtime": 53.0879, "eval_samples_per_second": 10.209, "eval_steps_per_second": 1.281, "eval_wer": 0.3644859813084112, "step": 1372 }, { "epoch": 99.0, "eval_cer": 0.1861692447679709, "eval_loss": 0.5871953368186951, "eval_runtime": 53.649, "eval_samples_per_second": 10.103, "eval_steps_per_second": 1.267, "eval_wer": 0.3667208451848842, "step": 1386 }, { "epoch": 100.0, "learning_rate": 1.0042857142857144e-05, "loss": 0.3738, "step": 1400 }, { "epoch": 100.0, "eval_cer": 0.18613284804367608, "eval_loss": 0.5910260677337646, "eval_runtime": 53.1405, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 0.36793986184477856, "step": 1400 }, { "epoch": 101.0, "eval_cer": 0.18420382165605095, "eval_loss": 0.5777124762535095, "eval_runtime": 53.6, "eval_samples_per_second": 10.112, "eval_steps_per_second": 1.269, "eval_wer": 0.36631450629825274, "step": 1414 }, { "epoch": 102.0, "eval_cer": 0.1856960873521383, "eval_loss": 0.5909616351127625, "eval_runtime": 53.2098, "eval_samples_per_second": 10.186, "eval_steps_per_second": 1.278, "eval_wer": 0.36387647297846404, "step": 1428 }, { "epoch": 103.0, "eval_cer": 0.18453139217470427, "eval_loss": 0.5758861899375916, "eval_runtime": 53.1517, "eval_samples_per_second": 10.197, "eval_steps_per_second": 1.279, "eval_wer": 0.3610321007720439, "step": 1442 }, { "epoch": 104.0, "eval_cer": 0.18493175614194723, "eval_loss": 0.5818917155265808, "eval_runtime": 53.1789, "eval_samples_per_second": 10.192, "eval_steps_per_second": 1.279, "eval_wer": 0.3634701340918326, "step": 1456 }, { "epoch": 105.0, "eval_cer": 0.1848589626933576, "eval_loss": 0.5803173184394836, "eval_runtime": 53.1693, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.3622511174319382, "step": 1470 }, { "epoch": 106.0, "eval_cer": 0.18467697907188352, "eval_loss": 0.5861043930053711, "eval_runtime": 53.2812, "eval_samples_per_second": 10.172, "eval_steps_per_second": 1.276, "eval_wer": 0.36286062576188544, "step": 1484 }, { "epoch": 107.0, "eval_cer": 0.18496815286624205, "eval_loss": 0.5844627022743225, "eval_runtime": 53.1253, "eval_samples_per_second": 10.202, "eval_steps_per_second": 1.28, "eval_wer": 0.3650954896383584, "step": 1498 }, { "epoch": 107.14, "learning_rate": 8.614285714285714e-06, "loss": 0.3563, "step": 1500 }, { "epoch": 108.0, "eval_cer": 0.18471337579617833, "eval_loss": 0.5820903182029724, "eval_runtime": 53.1043, "eval_samples_per_second": 10.206, "eval_steps_per_second": 1.28, "eval_wer": 0.3632669646485169, "step": 1512 }, { "epoch": 109.0, "eval_cer": 0.18453139217470427, "eval_loss": 0.5792232751846313, "eval_runtime": 53.0873, "eval_samples_per_second": 10.21, "eval_steps_per_second": 1.281, "eval_wer": 0.36265745631856966, "step": 1526 }, { "epoch": 110.0, "eval_cer": 0.1843494085532302, "eval_loss": 0.5829302668571472, "eval_runtime": 53.0492, "eval_samples_per_second": 10.217, "eval_steps_per_second": 1.282, "eval_wer": 0.36143843965867534, "step": 1540 }, { "epoch": 111.0, "eval_cer": 0.18318471337579617, "eval_loss": 0.5727322101593018, "eval_runtime": 53.1308, "eval_samples_per_second": 10.201, "eval_steps_per_second": 1.28, "eval_wer": 0.35920357578220236, "step": 1554 }, { "epoch": 112.0, "eval_cer": 0.18416742493175614, "eval_loss": 0.575890064239502, "eval_runtime": 53.1222, "eval_samples_per_second": 10.203, "eval_steps_per_second": 1.28, "eval_wer": 0.36286062576188544, "step": 1568 }, { "epoch": 113.0, "eval_cer": 0.18471337579617833, "eval_loss": 0.5798218250274658, "eval_runtime": 53.0903, "eval_samples_per_second": 10.209, "eval_steps_per_second": 1.281, "eval_wer": 0.3596099146688338, "step": 1582 }, { "epoch": 114.0, "eval_cer": 0.18504094631483167, "eval_loss": 0.5879067182540894, "eval_runtime": 53.1424, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 0.3596099146688338, "step": 1596 }, { "epoch": 114.29, "learning_rate": 7.185714285714286e-06, "loss": 0.345, "step": 1600 }, { "epoch": 115.0, "eval_cer": 0.1840218380345769, "eval_loss": 0.5758743286132812, "eval_runtime": 53.0762, "eval_samples_per_second": 10.212, "eval_steps_per_second": 1.281, "eval_wer": 0.36143843965867534, "step": 1610 }, { "epoch": 116.0, "eval_cer": 0.1840582347588717, "eval_loss": 0.5808991193771362, "eval_runtime": 53.1924, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.36042259244209673, "step": 1624 }, { "epoch": 117.0, "eval_cer": 0.1826751592356688, "eval_loss": 0.5791444778442383, "eval_runtime": 53.1076, "eval_samples_per_second": 10.206, "eval_steps_per_second": 1.28, "eval_wer": 0.35778138967899226, "step": 1638 }, { "epoch": 118.0, "eval_cer": 0.18354868061874433, "eval_loss": 0.5796310305595398, "eval_runtime": 53.2195, "eval_samples_per_second": 10.184, "eval_steps_per_second": 1.278, "eval_wer": 0.36001625355546524, "step": 1652 }, { "epoch": 119.0, "eval_cer": 0.18496815286624205, "eval_loss": 0.5885907411575317, "eval_runtime": 53.1, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.36387647297846404, "step": 1666 }, { "epoch": 120.0, "eval_cer": 0.18289353958143767, "eval_loss": 0.5753579139709473, "eval_runtime": 53.1652, "eval_samples_per_second": 10.195, "eval_steps_per_second": 1.279, "eval_wer": 0.36021942299878096, "step": 1680 }, { "epoch": 121.0, "eval_cer": 0.18387625113739764, "eval_loss": 0.5874112248420715, "eval_runtime": 53.1394, "eval_samples_per_second": 10.2, "eval_steps_per_second": 1.28, "eval_wer": 0.3594067452255181, "step": 1694 }, { "epoch": 121.43, "learning_rate": 5.7571428571428574e-06, "loss": 0.3369, "step": 1700 }, { "epoch": 122.0, "eval_cer": 0.18383985441310283, "eval_loss": 0.5810351371765137, "eval_runtime": 53.1776, "eval_samples_per_second": 10.192, "eval_steps_per_second": 1.279, "eval_wer": 0.36021942299878096, "step": 1708 }, { "epoch": 123.0, "eval_cer": 0.18453139217470427, "eval_loss": 0.5847538709640503, "eval_runtime": 53.195, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.3594067452255181, "step": 1722 }, { "epoch": 124.0, "eval_cer": 0.18340309372156505, "eval_loss": 0.5764136910438538, "eval_runtime": 53.0869, "eval_samples_per_second": 10.21, "eval_steps_per_second": 1.281, "eval_wer": 0.35757822023567654, "step": 1736 }, { "epoch": 125.0, "eval_cer": 0.18409463148316652, "eval_loss": 0.5837183594703674, "eval_runtime": 53.2211, "eval_samples_per_second": 10.184, "eval_steps_per_second": 1.278, "eval_wer": 0.35757822023567654, "step": 1750 }, { "epoch": 126.0, "eval_cer": 0.18354868061874433, "eval_loss": 0.5778501629829407, "eval_runtime": 53.1674, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.3571718813490451, "step": 1764 }, { "epoch": 127.0, "eval_cer": 0.1840218380345769, "eval_loss": 0.5837158560752869, "eval_runtime": 53.7242, "eval_samples_per_second": 10.089, "eval_steps_per_second": 1.266, "eval_wer": 0.3583908980089395, "step": 1778 }, { "epoch": 128.0, "eval_cer": 0.18391264786169245, "eval_loss": 0.5836318135261536, "eval_runtime": 53.1001, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.3573750507923608, "step": 1792 }, { "epoch": 128.57, "learning_rate": 4.328571428571429e-06, "loss": 0.3268, "step": 1800 }, { "epoch": 129.0, "eval_cer": 0.18307552320291173, "eval_loss": 0.5775274634361267, "eval_runtime": 53.1, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.3563592035757822, "step": 1806 }, { "epoch": 130.0, "eval_cer": 0.18394904458598726, "eval_loss": 0.5831055641174316, "eval_runtime": 53.1352, "eval_samples_per_second": 10.2, "eval_steps_per_second": 1.28, "eval_wer": 0.35900040633888664, "step": 1820 }, { "epoch": 131.0, "eval_cer": 0.18380345768880801, "eval_loss": 0.5862288475036621, "eval_runtime": 53.6233, "eval_samples_per_second": 10.108, "eval_steps_per_second": 1.268, "eval_wer": 0.35778138967899226, "step": 1834 }, { "epoch": 131.0, "step": 1834, "total_flos": 1.636975334282897e+19, "train_loss": 1.7576082530172468, "train_runtime": 27670.5914, "train_samples_per_second": 2.429, "train_steps_per_second": 0.076 } ], "max_steps": 2100, "num_train_epochs": 150, "total_flos": 1.636975334282897e+19, "trial_name": null, "trial_params": null }