diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,23785 @@ +{ + "best_metric": 0.09579244742265228, + "best_model_checkpoint": "./wav2vec2-large-xlsr-53-german-cv9/checkpoint-117381", + "epoch": 32.999859451862264, + "global_step": 117381, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.01, + "learning_rate": 1.686814731515322e-07, + "loss": 12.2823, + "step": 30 + }, + { + "epoch": 0.02, + "learning_rate": 3.3174023053134664e-07, + "loss": 12.8864, + "step": 60 + }, + { + "epoch": 0.03, + "learning_rate": 5.004217036828789e-07, + "loss": 11.7331, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 6.691031768344111e-07, + "loss": 12.8009, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 8.377846499859433e-07, + "loss": 12.1084, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 1.0064661231374754e-06, + "loss": 12.08, + "step": 180 + }, + { + "epoch": 0.06, + "learning_rate": 1.1751475962890077e-06, + "loss": 12.5185, + "step": 210 + }, + { + "epoch": 0.07, + "learning_rate": 1.3382063536688221e-06, + "loss": 11.5036, + "step": 240 + }, + { + "epoch": 0.08, + "learning_rate": 1.5068878268203542e-06, + "loss": 12.2999, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 1.6699465842001688e-06, + "loss": 11.3572, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 1.838628057351701e-06, + "loss": 10.856, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 2.007309530503233e-06, + "loss": 10.7287, + "step": 360 + }, + { + "epoch": 0.11, + "learning_rate": 2.1759910036547654e-06, + "loss": 9.3588, + "step": 390 + }, + { + "epoch": 0.12, + "learning_rate": 2.3446724768062973e-06, + "loss": 9.3074, + "step": 420 + }, + { + "epoch": 0.13, + "learning_rate": 2.5133539499578296e-06, + "loss": 8.1078, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 2.682035423109362e-06, + "loss": 7.0939, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 2.850716896260894e-06, + "loss": 6.2733, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 3.0193983694124264e-06, + "loss": 5.3202, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 3.1880798425639583e-06, + "loss": 5.0092, + "step": 570 + }, + { + "epoch": 0.17, + "learning_rate": 3.3567613157154906e-06, + "loss": 4.4977, + "step": 600 + }, + { + "epoch": 0.18, + "learning_rate": 3.525442788867023e-06, + "loss": 4.201, + "step": 630 + }, + { + "epoch": 0.19, + "learning_rate": 3.694124262018555e-06, + "loss": 4.019, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 3.8628057351700874e-06, + "loss": 3.7649, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.03148720832162e-06, + "loss": 3.7088, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.200168681473152e-06, + "loss": 3.5882, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.368850154624684e-06, + "loss": 3.4896, + "step": 780 + }, + { + "epoch": 0.23, + "learning_rate": 4.5375316277762166e-06, + "loss": 3.4466, + "step": 810 + }, + { + "epoch": 0.24, + "learning_rate": 4.706213100927748e-06, + "loss": 3.3378, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.87489457407928e-06, + "loss": 3.3351, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 5.043576047230813e-06, + "loss": 3.2781, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 5.212257520382345e-06, + "loss": 3.2183, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 5.380938993533877e-06, + "loss": 3.2128, + "step": 960 + }, + { + "epoch": 0.28, + "learning_rate": 5.5496204666854094e-06, + "loss": 3.1512, + "step": 990 + }, + { + "epoch": 0.29, + "learning_rate": 5.718301939836942e-06, + "loss": 3.1617, + "step": 1020 + }, + { + "epoch": 0.3, + "learning_rate": 5.886983412988474e-06, + "loss": 3.1274, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 6.0556648861400054e-06, + "loss": 3.0881, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 6.224346359291538e-06, + "loss": 3.098, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 6.39302783244307e-06, + "loss": 3.0544, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 6.561709305594603e-06, + "loss": 3.0735, + "step": 1170 + }, + { + "epoch": 0.34, + "learning_rate": 6.7303907787461346e-06, + "loss": 3.0573, + "step": 1200 + }, + { + "epoch": 0.35, + "learning_rate": 6.899072251897668e-06, + "loss": 3.0233, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 7.067753725049199e-06, + "loss": 3.0445, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 7.236435198200732e-06, + "loss": 3.0156, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 7.405116671352264e-06, + "loss": 3.0256, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 7.573798144503795e-06, + "loss": 3.0266, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 7.742479617655327e-06, + "loss": 2.9992, + "step": 1380 + }, + { + "epoch": 0.4, + "learning_rate": 7.91116109080686e-06, + "loss": 3.0169, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 8.079842563958392e-06, + "loss": 2.9879, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 8.248524037109924e-06, + "loss": 3.0014, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 8.417205510261457e-06, + "loss": 3.0054, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 8.585886983412989e-06, + "loss": 2.9833, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 8.754568456564521e-06, + "loss": 3.0009, + "step": 1560 + }, + { + "epoch": 0.45, + "learning_rate": 8.923249929716053e-06, + "loss": 2.9731, + "step": 1590 + }, + { + "epoch": 0.46, + "learning_rate": 9.091931402867586e-06, + "loss": 2.9975, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 9.260612876019118e-06, + "loss": 2.997, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 9.42929434917065e-06, + "loss": 2.9667, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 9.597975822322183e-06, + "loss": 2.9925, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 9.766657295473715e-06, + "loss": 2.9607, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 9.935338768625247e-06, + "loss": 2.9754, + "step": 1770 + }, + { + "epoch": 0.51, + "learning_rate": 1.010402024177678e-05, + "loss": 2.9615, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 1.0272701714928312e-05, + "loss": 2.9534, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 1.0441383188079842e-05, + "loss": 2.9674, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 1.0610064661231375e-05, + "loss": 2.9443, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 1.0778746134382907e-05, + "loss": 2.9559, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 1.0947427607534439e-05, + "loss": 2.9475, + "step": 1950 + }, + { + "epoch": 0.56, + "learning_rate": 1.1116109080685971e-05, + "loss": 2.94, + "step": 1980 + }, + { + "epoch": 0.57, + "learning_rate": 1.1284790553837504e-05, + "loss": 2.9509, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 1.1453472026989036e-05, + "loss": 2.9327, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 1.1622153500140568e-05, + "loss": 2.9454, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 1.17908349732921e-05, + "loss": 2.9409, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 1.1959516446443633e-05, + "loss": 2.9342, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 1.2128197919595165e-05, + "loss": 2.9434, + "step": 2160 + }, + { + "epoch": 0.62, + "learning_rate": 1.2296879392746697e-05, + "loss": 2.9311, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 1.246556086589823e-05, + "loss": 2.939, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 1.2634242339049762e-05, + "loss": 2.9328, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 1.2802923812201296e-05, + "loss": 2.929, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 1.2971605285352825e-05, + "loss": 2.9352, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 1.3140286758504359e-05, + "loss": 2.9237, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 1.3308968231655891e-05, + "loss": 2.9313, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 1.3477649704807422e-05, + "loss": 2.9168, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 1.3646331177958954e-05, + "loss": 2.9164, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 1.3815012651110488e-05, + "loss": 2.9112, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 1.398369412426202e-05, + "loss": 2.8939, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 1.415237559741355e-05, + "loss": 2.893, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 1.4321057070565083e-05, + "loss": 2.8611, + "step": 2550 + }, + { + "epoch": 0.73, + "learning_rate": 1.4489738543716615e-05, + "loss": 2.8146, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 1.465842001686815e-05, + "loss": 2.7328, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 1.482710149001968e-05, + "loss": 2.5982, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 1.4995782963171212e-05, + "loss": 2.4667, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 1.5164464436322745e-05, + "loss": 2.237, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 1.533314590947428e-05, + "loss": 2.0234, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 1.5501827382625807e-05, + "loss": 1.7856, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 1.567050885577734e-05, + "loss": 1.4936, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 1.5839190328928875e-05, + "loss": 1.3168, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 1.6007871802080408e-05, + "loss": 1.1575, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 1.6176553275231937e-05, + "loss": 1.0244, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 1.634523474838347e-05, + "loss": 0.9434, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 1.6513916221535004e-05, + "loss": 0.8609, + "step": 2940 + }, + { + "epoch": 0.83, + "learning_rate": 1.6682597694686533e-05, + "loss": 0.8089, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 1.6851279167838066e-05, + "loss": 0.7682, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 1.7019960640989598e-05, + "loss": 0.7005, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 1.718864211414113e-05, + "loss": 0.691, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 1.7357323587292663e-05, + "loss": 0.6244, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 1.7526005060444195e-05, + "loss": 0.6426, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 1.7694686533595727e-05, + "loss": 0.6254, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 1.786336800674726e-05, + "loss": 0.5489, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 1.803204947989879e-05, + "loss": 0.5744, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 1.8200730953050324e-05, + "loss": 0.5247, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 1.8369412426201856e-05, + "loss": 0.5261, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 1.853809389935339e-05, + "loss": 0.5122, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 1.870677537250492e-05, + "loss": 0.4845, + "step": 3330 + }, + { + "epoch": 0.94, + "learning_rate": 1.8875456845656453e-05, + "loss": 0.5051, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 1.9044138318807985e-05, + "loss": 0.4715, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 1.9212819791959518e-05, + "loss": 0.484, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 1.938150126511105e-05, + "loss": 0.4563, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 1.9550182738262582e-05, + "loss": 0.4204, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 1.9718864211414114e-05, + "loss": 0.4372, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 1.9887545684565643e-05, + "loss": 0.4129, + "step": 3540 + }, + { + "epoch": 1.0, + "eval_loss": 0.30152174830436707, + "eval_runtime": 623.0811, + "eval_samples_per_second": 25.732, + "eval_steps_per_second": 0.806, + "eval_wer": 0.24989423116291132, + "step": 3557 + }, + { + "epoch": 1.0, + "learning_rate": 2.005622715771718e-05, + "loss": 0.4449, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.022490863086871e-05, + "loss": 0.4039, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.0393590104020244e-05, + "loss": 0.418, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.0562271577171773e-05, + "loss": 0.4121, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.0730953050323308e-05, + "loss": 0.3687, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.089963452347484e-05, + "loss": 0.383, + "step": 3720 + }, + { + "epoch": 1.05, + "learning_rate": 2.1068315996626373e-05, + "loss": 0.3786, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.12369974697779e-05, + "loss": 0.3714, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.1405678942929437e-05, + "loss": 0.3948, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.157436041608097e-05, + "loss": 0.334, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.1743041889232502e-05, + "loss": 0.3746, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.191172336238403e-05, + "loss": 0.3451, + "step": 3900 + }, + { + "epoch": 1.1, + "learning_rate": 2.2080404835535563e-05, + "loss": 0.3487, + "step": 3930 + }, + { + "epoch": 1.11, + "learning_rate": 2.22490863086871e-05, + "loss": 0.3646, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.2417767781838628e-05, + "loss": 0.3259, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 2.258644925499016e-05, + "loss": 0.3539, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 2.2755130728141692e-05, + "loss": 0.3308, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 2.2923812201293228e-05, + "loss": 0.3477, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 2.3092493674444757e-05, + "loss": 0.3484, + "step": 4110 + }, + { + "epoch": 1.16, + "learning_rate": 2.326117514759629e-05, + "loss": 0.3045, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 2.342985662074782e-05, + "loss": 0.3454, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 2.3598538093899357e-05, + "loss": 0.3136, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 2.3767219567050886e-05, + "loss": 0.3281, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 2.3935901040202418e-05, + "loss": 0.3355, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 2.410458251335395e-05, + "loss": 0.2986, + "step": 4290 + }, + { + "epoch": 1.21, + "learning_rate": 2.4273263986505486e-05, + "loss": 0.3142, + "step": 4320 + }, + { + "epoch": 1.22, + "learning_rate": 2.4441945459657015e-05, + "loss": 0.2982, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 2.4610626932808547e-05, + "loss": 0.3141, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 2.477930840596008e-05, + "loss": 0.315, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 2.4947989879111612e-05, + "loss": 0.2788, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 2.5116671352263144e-05, + "loss": 0.315, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 2.5285352825414676e-05, + "loss": 0.2849, + "step": 4500 + }, + { + "epoch": 1.27, + "learning_rate": 2.545403429856621e-05, + "loss": 0.2895, + "step": 4530 + }, + { + "epoch": 1.28, + "learning_rate": 2.562271577171774e-05, + "loss": 0.3063, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 2.5791397244869277e-05, + "loss": 0.2696, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 2.5960078718020802e-05, + "loss": 0.2898, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 2.6128760191172335e-05, + "loss": 0.2863, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 2.629744166432387e-05, + "loss": 0.2812, + "step": 4680 + }, + { + "epoch": 1.32, + "learning_rate": 2.6466123137475402e-05, + "loss": 0.3064, + "step": 4710 + }, + { + "epoch": 1.33, + "learning_rate": 2.6634804610626935e-05, + "loss": 0.2684, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 2.6803486083778467e-05, + "loss": 0.2983, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 2.697216755693e-05, + "loss": 0.2669, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 2.714084903008153e-05, + "loss": 0.2748, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 2.730953050323306e-05, + "loss": 0.295, + "step": 4860 + }, + { + "epoch": 1.37, + "learning_rate": 2.7478211976384593e-05, + "loss": 0.2643, + "step": 4890 + }, + { + "epoch": 1.38, + "learning_rate": 2.7646893449536125e-05, + "loss": 0.2695, + "step": 4920 + }, + { + "epoch": 1.39, + "learning_rate": 2.781557492268766e-05, + "loss": 0.2522, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 2.7984256395839193e-05, + "loss": 0.2639, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 2.8152937868990725e-05, + "loss": 0.2784, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 2.8321619342142258e-05, + "loss": 0.2378, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 2.8490300815293786e-05, + "loss": 0.2685, + "step": 5070 + }, + { + "epoch": 1.43, + "learning_rate": 2.865898228844532e-05, + "loss": 0.2423, + "step": 5100 + }, + { + "epoch": 1.44, + "learning_rate": 2.882766376159685e-05, + "loss": 0.2529, + "step": 5130 + }, + { + "epoch": 1.45, + "learning_rate": 2.8996345234748383e-05, + "loss": 0.2808, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 2.916502670789992e-05, + "loss": 0.2333, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 2.933370818105145e-05, + "loss": 0.2647, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 2.9502389654202984e-05, + "loss": 0.2424, + "step": 5250 + }, + { + "epoch": 1.48, + "learning_rate": 2.9671071127354516e-05, + "loss": 0.2479, + "step": 5280 + }, + { + "epoch": 1.49, + "learning_rate": 2.9839752600506045e-05, + "loss": 0.2717, + "step": 5310 + }, + { + "epoch": 1.5, + "learning_rate": 3.0008434073657577e-05, + "loss": 0.2188, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 3.017711554680911e-05, + "loss": 0.258, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 3.034579701996064e-05, + "loss": 0.2504, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 3.0514478493112174e-05, + "loss": 0.2478, + "step": 5430 + }, + { + "epoch": 1.53, + "learning_rate": 3.068315996626371e-05, + "loss": 0.2725, + "step": 5460 + }, + { + "epoch": 1.54, + "learning_rate": 3.085184143941524e-05, + "loss": 0.2233, + "step": 5490 + }, + { + "epoch": 1.55, + "learning_rate": 3.1020522912566774e-05, + "loss": 0.2592, + "step": 5520 + }, + { + "epoch": 1.56, + "learning_rate": 3.11892043857183e-05, + "loss": 0.231, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 3.135788585886983e-05, + "loss": 0.2413, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 3.1526567332021364e-05, + "loss": 0.2557, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 3.16952488051729e-05, + "loss": 0.2252, + "step": 5640 + }, + { + "epoch": 1.59, + "learning_rate": 3.1863930278324436e-05, + "loss": 0.2532, + "step": 5670 + }, + { + "epoch": 1.6, + "learning_rate": 3.203261175147597e-05, + "loss": 0.2228, + "step": 5700 + }, + { + "epoch": 1.61, + "learning_rate": 3.22012932246275e-05, + "loss": 0.2448, + "step": 5730 + }, + { + "epoch": 1.62, + "learning_rate": 3.2369974697779026e-05, + "loss": 0.2447, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 3.253865617093056e-05, + "loss": 0.212, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.270733764408209e-05, + "loss": 0.2454, + "step": 5820 + }, + { + "epoch": 1.64, + "learning_rate": 3.287601911723362e-05, + "loss": 0.2195, + "step": 5850 + }, + { + "epoch": 1.65, + "learning_rate": 3.3044700590385155e-05, + "loss": 0.2381, + "step": 5880 + }, + { + "epoch": 1.66, + "learning_rate": 3.3213382063536694e-05, + "loss": 0.2493, + "step": 5910 + }, + { + "epoch": 1.67, + "learning_rate": 3.3382063536688226e-05, + "loss": 0.2076, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.355074500983976e-05, + "loss": 0.2393, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 3.3719426482991284e-05, + "loss": 0.2199, + "step": 6000 + }, + { + "epoch": 1.7, + "learning_rate": 3.3888107956142816e-05, + "loss": 0.222, + "step": 6030 + }, + { + "epoch": 1.7, + "learning_rate": 3.405678942929435e-05, + "loss": 0.2496, + "step": 6060 + }, + { + "epoch": 1.71, + "learning_rate": 3.422547090244588e-05, + "loss": 0.2088, + "step": 6090 + }, + { + "epoch": 1.72, + "learning_rate": 3.439415237559741e-05, + "loss": 0.2253, + "step": 6120 + }, + { + "epoch": 1.73, + "learning_rate": 3.456283384874895e-05, + "loss": 0.2095, + "step": 6150 + }, + { + "epoch": 1.74, + "learning_rate": 3.4731515321900484e-05, + "loss": 0.213, + "step": 6180 + }, + { + "epoch": 1.75, + "learning_rate": 3.490019679505201e-05, + "loss": 0.2355, + "step": 6210 + }, + { + "epoch": 1.75, + "learning_rate": 3.506887826820354e-05, + "loss": 0.2123, + "step": 6240 + }, + { + "epoch": 1.76, + "learning_rate": 3.5237559741355074e-05, + "loss": 0.2308, + "step": 6270 + }, + { + "epoch": 1.77, + "learning_rate": 3.540624121450661e-05, + "loss": 0.2101, + "step": 6300 + }, + { + "epoch": 1.78, + "learning_rate": 3.557492268765814e-05, + "loss": 0.2167, + "step": 6330 + }, + { + "epoch": 1.79, + "learning_rate": 3.574360416080967e-05, + "loss": 0.2397, + "step": 6360 + }, + { + "epoch": 1.8, + "learning_rate": 3.5912285633961204e-05, + "loss": 0.1999, + "step": 6390 + }, + { + "epoch": 1.8, + "learning_rate": 3.608096710711274e-05, + "loss": 0.2222, + "step": 6420 + }, + { + "epoch": 1.81, + "learning_rate": 3.624964858026427e-05, + "loss": 0.2063, + "step": 6450 + }, + { + "epoch": 1.82, + "learning_rate": 3.64183300534158e-05, + "loss": 0.2067, + "step": 6480 + }, + { + "epoch": 1.83, + "learning_rate": 3.658701152656733e-05, + "loss": 0.2246, + "step": 6510 + }, + { + "epoch": 1.84, + "learning_rate": 3.6755692999718865e-05, + "loss": 0.1943, + "step": 6540 + }, + { + "epoch": 1.85, + "learning_rate": 3.69243744728704e-05, + "loss": 0.2244, + "step": 6570 + }, + { + "epoch": 1.86, + "learning_rate": 3.709305594602193e-05, + "loss": 0.2056, + "step": 6600 + }, + { + "epoch": 1.86, + "learning_rate": 3.726173741917346e-05, + "loss": 0.2057, + "step": 6630 + }, + { + "epoch": 1.87, + "learning_rate": 3.7430418892324994e-05, + "loss": 0.2234, + "step": 6660 + }, + { + "epoch": 1.88, + "learning_rate": 3.7599100365476526e-05, + "loss": 0.1853, + "step": 6690 + }, + { + "epoch": 1.89, + "learning_rate": 3.776778183862806e-05, + "loss": 0.2223, + "step": 6720 + }, + { + "epoch": 1.9, + "learning_rate": 3.793646331177959e-05, + "loss": 0.2018, + "step": 6750 + }, + { + "epoch": 1.91, + "learning_rate": 3.810514478493112e-05, + "loss": 0.2041, + "step": 6780 + }, + { + "epoch": 1.91, + "learning_rate": 3.8273826258082656e-05, + "loss": 0.2263, + "step": 6810 + }, + { + "epoch": 1.92, + "learning_rate": 3.844250773123419e-05, + "loss": 0.1908, + "step": 6840 + }, + { + "epoch": 1.93, + "learning_rate": 3.861118920438572e-05, + "loss": 0.218, + "step": 6870 + }, + { + "epoch": 1.94, + "learning_rate": 3.877987067753725e-05, + "loss": 0.1993, + "step": 6900 + }, + { + "epoch": 1.95, + "learning_rate": 3.8948552150688785e-05, + "loss": 0.2047, + "step": 6930 + }, + { + "epoch": 1.96, + "learning_rate": 3.911723362384032e-05, + "loss": 0.2235, + "step": 6960 + }, + { + "epoch": 1.97, + "learning_rate": 3.928591509699185e-05, + "loss": 0.1838, + "step": 6990 + }, + { + "epoch": 1.97, + "learning_rate": 3.945459657014338e-05, + "loss": 0.2098, + "step": 7020 + }, + { + "epoch": 1.98, + "learning_rate": 3.9623278043294914e-05, + "loss": 0.1947, + "step": 7050 + }, + { + "epoch": 1.99, + "learning_rate": 3.9791959516446446e-05, + "loss": 0.203, + "step": 7080 + }, + { + "epoch": 2.0, + "learning_rate": 3.996064098959797e-05, + "loss": 0.2121, + "step": 7110 + }, + { + "epoch": 2.0, + "eval_loss": 0.15964379906654358, + "eval_runtime": 627.5077, + "eval_samples_per_second": 25.55, + "eval_steps_per_second": 0.8, + "eval_wer": 0.15666753101415254, + "step": 7114 + }, + { + "epoch": 2.01, + "learning_rate": 4.012932246274951e-05, + "loss": 0.1881, + "step": 7140 + }, + { + "epoch": 2.02, + "learning_rate": 4.029800393590104e-05, + "loss": 0.2157, + "step": 7170 + }, + { + "epoch": 2.02, + "learning_rate": 4.0466685409052575e-05, + "loss": 0.1762, + "step": 7200 + }, + { + "epoch": 2.03, + "learning_rate": 4.063536688220411e-05, + "loss": 0.193, + "step": 7230 + }, + { + "epoch": 2.04, + "learning_rate": 4.080404835535564e-05, + "loss": 0.1967, + "step": 7260 + }, + { + "epoch": 2.05, + "learning_rate": 4.097272982850717e-05, + "loss": 0.1824, + "step": 7290 + }, + { + "epoch": 2.06, + "learning_rate": 4.1141411301658704e-05, + "loss": 0.2006, + "step": 7320 + }, + { + "epoch": 2.07, + "learning_rate": 4.131009277481023e-05, + "loss": 0.1734, + "step": 7350 + }, + { + "epoch": 2.07, + "learning_rate": 4.147877424796177e-05, + "loss": 0.2023, + "step": 7380 + }, + { + "epoch": 2.08, + "learning_rate": 4.16474557211133e-05, + "loss": 0.1827, + "step": 7410 + }, + { + "epoch": 2.09, + "learning_rate": 4.1816137194264834e-05, + "loss": 0.1903, + "step": 7440 + }, + { + "epoch": 2.1, + "learning_rate": 4.1984818667416366e-05, + "loss": 0.2175, + "step": 7470 + }, + { + "epoch": 2.11, + "learning_rate": 4.21535001405679e-05, + "loss": 0.1789, + "step": 7500 + }, + { + "epoch": 2.12, + "learning_rate": 4.232218161371943e-05, + "loss": 0.2071, + "step": 7530 + }, + { + "epoch": 2.13, + "learning_rate": 4.249086308687096e-05, + "loss": 0.1964, + "step": 7560 + }, + { + "epoch": 2.13, + "learning_rate": 4.265954456002249e-05, + "loss": 0.1821, + "step": 7590 + }, + { + "epoch": 2.14, + "learning_rate": 4.282822603317402e-05, + "loss": 0.2075, + "step": 7620 + }, + { + "epoch": 2.15, + "learning_rate": 4.299690750632556e-05, + "loss": 0.1699, + "step": 7650 + }, + { + "epoch": 2.16, + "learning_rate": 4.316558897947709e-05, + "loss": 0.1778, + "step": 7680 + }, + { + "epoch": 2.17, + "learning_rate": 4.3334270452628624e-05, + "loss": 0.191, + "step": 7710 + }, + { + "epoch": 2.18, + "learning_rate": 4.3502951925780156e-05, + "loss": 0.1773, + "step": 7740 + }, + { + "epoch": 2.18, + "learning_rate": 4.367163339893169e-05, + "loss": 0.202, + "step": 7770 + }, + { + "epoch": 2.19, + "learning_rate": 4.3840314872083214e-05, + "loss": 0.1645, + "step": 7800 + }, + { + "epoch": 2.2, + "learning_rate": 4.4008996345234746e-05, + "loss": 0.1896, + "step": 7830 + }, + { + "epoch": 2.21, + "learning_rate": 4.417767781838628e-05, + "loss": 0.1864, + "step": 7860 + }, + { + "epoch": 2.22, + "learning_rate": 4.434635929153782e-05, + "loss": 0.1854, + "step": 7890 + }, + { + "epoch": 2.23, + "learning_rate": 4.451504076468935e-05, + "loss": 0.1959, + "step": 7920 + }, + { + "epoch": 2.23, + "learning_rate": 4.468372223784088e-05, + "loss": 0.1658, + "step": 7950 + }, + { + "epoch": 2.24, + "learning_rate": 4.4852403710992415e-05, + "loss": 0.1884, + "step": 7980 + }, + { + "epoch": 2.25, + "learning_rate": 4.502108518414395e-05, + "loss": 0.1841, + "step": 8010 + }, + { + "epoch": 2.26, + "learning_rate": 4.518976665729547e-05, + "loss": 0.1774, + "step": 8040 + }, + { + "epoch": 2.27, + "learning_rate": 4.5358448130447005e-05, + "loss": 0.1997, + "step": 8070 + }, + { + "epoch": 2.28, + "learning_rate": 4.552712960359854e-05, + "loss": 0.1656, + "step": 8100 + }, + { + "epoch": 2.29, + "learning_rate": 4.569581107675007e-05, + "loss": 0.1964, + "step": 8130 + }, + { + "epoch": 2.29, + "learning_rate": 4.586449254990161e-05, + "loss": 0.1807, + "step": 8160 + }, + { + "epoch": 2.3, + "learning_rate": 4.603317402305314e-05, + "loss": 0.1777, + "step": 8190 + }, + { + "epoch": 2.31, + "learning_rate": 4.620185549620467e-05, + "loss": 0.1921, + "step": 8220 + }, + { + "epoch": 2.32, + "learning_rate": 4.63705369693562e-05, + "loss": 0.1708, + "step": 8250 + }, + { + "epoch": 2.33, + "learning_rate": 4.653921844250773e-05, + "loss": 0.1743, + "step": 8280 + }, + { + "epoch": 2.34, + "learning_rate": 4.670789991565926e-05, + "loss": 0.1758, + "step": 8310 + }, + { + "epoch": 2.34, + "learning_rate": 4.6876581388810795e-05, + "loss": 0.1789, + "step": 8340 + }, + { + "epoch": 2.35, + "learning_rate": 4.704526286196233e-05, + "loss": 0.1953, + "step": 8370 + }, + { + "epoch": 2.36, + "learning_rate": 4.7213944335113867e-05, + "loss": 0.1648, + "step": 8400 + }, + { + "epoch": 2.37, + "learning_rate": 4.73826258082654e-05, + "loss": 0.1803, + "step": 8430 + }, + { + "epoch": 2.38, + "learning_rate": 4.755130728141693e-05, + "loss": 0.1767, + "step": 8460 + }, + { + "epoch": 2.39, + "learning_rate": 4.771998875456846e-05, + "loss": 0.1703, + "step": 8490 + }, + { + "epoch": 2.4, + "learning_rate": 4.788867022771999e-05, + "loss": 0.1928, + "step": 8520 + }, + { + "epoch": 2.4, + "learning_rate": 4.805735170087152e-05, + "loss": 0.1645, + "step": 8550 + }, + { + "epoch": 2.41, + "learning_rate": 4.8226033174023054e-05, + "loss": 0.1894, + "step": 8580 + }, + { + "epoch": 2.42, + "learning_rate": 4.8394714647174586e-05, + "loss": 0.1749, + "step": 8610 + }, + { + "epoch": 2.43, + "learning_rate": 4.856339612032612e-05, + "loss": 0.1707, + "step": 8640 + }, + { + "epoch": 2.44, + "learning_rate": 4.873207759347766e-05, + "loss": 0.1834, + "step": 8670 + }, + { + "epoch": 2.45, + "learning_rate": 4.890075906662918e-05, + "loss": 0.1675, + "step": 8700 + }, + { + "epoch": 2.45, + "learning_rate": 4.9069440539780715e-05, + "loss": 0.1894, + "step": 8730 + }, + { + "epoch": 2.46, + "learning_rate": 4.923812201293225e-05, + "loss": 0.1742, + "step": 8760 + }, + { + "epoch": 2.47, + "learning_rate": 4.940680348608378e-05, + "loss": 0.1704, + "step": 8790 + }, + { + "epoch": 2.48, + "learning_rate": 4.957548495923531e-05, + "loss": 0.1758, + "step": 8820 + }, + { + "epoch": 2.49, + "learning_rate": 4.9744166432386844e-05, + "loss": 0.1603, + "step": 8850 + }, + { + "epoch": 2.5, + "learning_rate": 4.9912847905538376e-05, + "loss": 0.18, + "step": 8880 + }, + { + "epoch": 2.5, + "learning_rate": 5.008152937868991e-05, + "loss": 0.1695, + "step": 8910 + }, + { + "epoch": 2.51, + "learning_rate": 5.025021085184144e-05, + "loss": 0.1637, + "step": 8940 + }, + { + "epoch": 2.52, + "learning_rate": 5.041889232499297e-05, + "loss": 0.1739, + "step": 8970 + }, + { + "epoch": 2.53, + "learning_rate": 5.0587573798144506e-05, + "loss": 0.1587, + "step": 9000 + }, + { + "epoch": 2.54, + "learning_rate": 5.075625527129604e-05, + "loss": 0.1834, + "step": 9030 + }, + { + "epoch": 2.55, + "learning_rate": 5.092493674444757e-05, + "loss": 0.1678, + "step": 9060 + }, + { + "epoch": 2.56, + "learning_rate": 5.10936182175991e-05, + "loss": 0.166, + "step": 9090 + }, + { + "epoch": 2.56, + "learning_rate": 5.1262299690750635e-05, + "loss": 0.1821, + "step": 9120 + }, + { + "epoch": 2.57, + "learning_rate": 5.143098116390217e-05, + "loss": 0.1633, + "step": 9150 + }, + { + "epoch": 2.58, + "learning_rate": 5.1599662637053706e-05, + "loss": 0.1758, + "step": 9180 + }, + { + "epoch": 2.59, + "learning_rate": 5.176834411020524e-05, + "loss": 0.1663, + "step": 9210 + }, + { + "epoch": 2.6, + "learning_rate": 5.193702558335677e-05, + "loss": 0.1625, + "step": 9240 + }, + { + "epoch": 2.61, + "learning_rate": 5.210570705650829e-05, + "loss": 0.1889, + "step": 9270 + }, + { + "epoch": 2.61, + "learning_rate": 5.227438852965982e-05, + "loss": 0.1523, + "step": 9300 + }, + { + "epoch": 2.62, + "learning_rate": 5.2443070002811354e-05, + "loss": 0.1687, + "step": 9330 + }, + { + "epoch": 2.63, + "learning_rate": 5.2611751475962886e-05, + "loss": 0.1646, + "step": 9360 + }, + { + "epoch": 2.64, + "learning_rate": 5.2780432949114425e-05, + "loss": 0.1666, + "step": 9390 + }, + { + "epoch": 2.65, + "learning_rate": 5.294911442226596e-05, + "loss": 0.1743, + "step": 9420 + }, + { + "epoch": 2.66, + "learning_rate": 5.311779589541749e-05, + "loss": 0.1561, + "step": 9450 + }, + { + "epoch": 2.67, + "learning_rate": 5.328647736856902e-05, + "loss": 0.1784, + "step": 9480 + }, + { + "epoch": 2.67, + "learning_rate": 5.3455158841720554e-05, + "loss": 0.1673, + "step": 9510 + }, + { + "epoch": 2.68, + "learning_rate": 5.3623840314872087e-05, + "loss": 0.1732, + "step": 9540 + }, + { + "epoch": 2.69, + "learning_rate": 5.379252178802362e-05, + "loss": 0.1679, + "step": 9570 + }, + { + "epoch": 2.7, + "learning_rate": 5.396120326117515e-05, + "loss": 0.1542, + "step": 9600 + }, + { + "epoch": 2.71, + "learning_rate": 5.4129884734326683e-05, + "loss": 0.1692, + "step": 9630 + }, + { + "epoch": 2.72, + "learning_rate": 5.4298566207478216e-05, + "loss": 0.1589, + "step": 9660 + }, + { + "epoch": 2.72, + "learning_rate": 5.4467247680629755e-05, + "loss": 0.1563, + "step": 9690 + }, + { + "epoch": 2.73, + "learning_rate": 5.463592915378129e-05, + "loss": 0.1766, + "step": 9720 + }, + { + "epoch": 2.74, + "learning_rate": 5.4804610626932806e-05, + "loss": 0.1475, + "step": 9750 + }, + { + "epoch": 2.75, + "learning_rate": 5.497329210008434e-05, + "loss": 0.1816, + "step": 9780 + }, + { + "epoch": 2.76, + "learning_rate": 5.514197357323587e-05, + "loss": 0.1729, + "step": 9810 + }, + { + "epoch": 2.77, + "learning_rate": 5.53106550463874e-05, + "loss": 0.1575, + "step": 9840 + }, + { + "epoch": 2.77, + "learning_rate": 5.5479336519538935e-05, + "loss": 0.1817, + "step": 9870 + }, + { + "epoch": 2.78, + "learning_rate": 5.5648017992690474e-05, + "loss": 0.1444, + "step": 9900 + }, + { + "epoch": 2.79, + "learning_rate": 5.5816699465842006e-05, + "loss": 0.1692, + "step": 9930 + }, + { + "epoch": 2.8, + "learning_rate": 5.598538093899354e-05, + "loss": 0.1668, + "step": 9960 + }, + { + "epoch": 2.81, + "learning_rate": 5.615406241214507e-05, + "loss": 0.1577, + "step": 9990 + }, + { + "epoch": 2.82, + "learning_rate": 5.63227438852966e-05, + "loss": 0.1751, + "step": 10020 + }, + { + "epoch": 2.83, + "learning_rate": 5.6491425358448135e-05, + "loss": 0.1488, + "step": 10050 + }, + { + "epoch": 2.83, + "learning_rate": 5.666010683159967e-05, + "loss": 0.1676, + "step": 10080 + }, + { + "epoch": 2.84, + "learning_rate": 5.68287883047512e-05, + "loss": 0.1643, + "step": 10110 + }, + { + "epoch": 2.85, + "learning_rate": 5.699746977790273e-05, + "loss": 0.1543, + "step": 10140 + }, + { + "epoch": 2.86, + "learning_rate": 5.7166151251054265e-05, + "loss": 0.1774, + "step": 10170 + }, + { + "epoch": 2.87, + "learning_rate": 5.733483272420579e-05, + "loss": 0.1443, + "step": 10200 + }, + { + "epoch": 2.88, + "learning_rate": 5.750351419735732e-05, + "loss": 0.1646, + "step": 10230 + }, + { + "epoch": 2.88, + "learning_rate": 5.7672195670508855e-05, + "loss": 0.1643, + "step": 10260 + }, + { + "epoch": 2.89, + "learning_rate": 5.784087714366039e-05, + "loss": 0.155, + "step": 10290 + }, + { + "epoch": 2.9, + "learning_rate": 5.800955861681192e-05, + "loss": 0.1762, + "step": 10320 + }, + { + "epoch": 2.91, + "learning_rate": 5.817824008996345e-05, + "loss": 0.1512, + "step": 10350 + }, + { + "epoch": 2.92, + "learning_rate": 5.8346921563114984e-05, + "loss": 0.1664, + "step": 10380 + }, + { + "epoch": 2.93, + "learning_rate": 5.851560303626652e-05, + "loss": 0.1529, + "step": 10410 + }, + { + "epoch": 2.93, + "learning_rate": 5.8684284509418055e-05, + "loss": 0.1604, + "step": 10440 + }, + { + "epoch": 2.94, + "learning_rate": 5.885296598256959e-05, + "loss": 0.1697, + "step": 10470 + }, + { + "epoch": 2.95, + "learning_rate": 5.902164745572112e-05, + "loss": 0.1388, + "step": 10500 + }, + { + "epoch": 2.96, + "learning_rate": 5.919032892887265e-05, + "loss": 0.1636, + "step": 10530 + }, + { + "epoch": 2.97, + "learning_rate": 5.9359010402024184e-05, + "loss": 0.1558, + "step": 10560 + }, + { + "epoch": 2.98, + "learning_rate": 5.9527691875175717e-05, + "loss": 0.1585, + "step": 10590 + }, + { + "epoch": 2.99, + "learning_rate": 5.969637334832725e-05, + "loss": 0.1678, + "step": 10620 + }, + { + "epoch": 2.99, + "learning_rate": 5.9865054821478774e-05, + "loss": 0.1455, + "step": 10650 + }, + { + "epoch": 3.0, + "eval_loss": 0.13774625957012177, + "eval_runtime": 628.643, + "eval_samples_per_second": 25.504, + "eval_steps_per_second": 0.799, + "eval_wer": 0.1353977590654129, + "step": 10671 + }, + { + "epoch": 3.0, + "learning_rate": 6.003373629463031e-05, + "loss": 0.1738, + "step": 10680 + }, + { + "epoch": 3.01, + "learning_rate": 6.020241776778184e-05, + "loss": 0.1472, + "step": 10710 + }, + { + "epoch": 3.02, + "learning_rate": 6.037109924093337e-05, + "loss": 0.1587, + "step": 10740 + }, + { + "epoch": 3.03, + "learning_rate": 6.0539780714084903e-05, + "loss": 0.1587, + "step": 10770 + }, + { + "epoch": 3.04, + "learning_rate": 6.0708462187236436e-05, + "loss": 0.1487, + "step": 10800 + }, + { + "epoch": 3.04, + "learning_rate": 6.087714366038797e-05, + "loss": 0.1543, + "step": 10830 + }, + { + "epoch": 3.05, + "learning_rate": 6.104582513353951e-05, + "loss": 0.1412, + "step": 10860 + }, + { + "epoch": 3.06, + "learning_rate": 6.121450660669103e-05, + "loss": 0.1551, + "step": 10890 + }, + { + "epoch": 3.07, + "learning_rate": 6.138318807984257e-05, + "loss": 0.1595, + "step": 10920 + }, + { + "epoch": 3.08, + "learning_rate": 6.15518695529941e-05, + "loss": 0.1491, + "step": 10950 + }, + { + "epoch": 3.09, + "learning_rate": 6.172055102614564e-05, + "loss": 0.1575, + "step": 10980 + }, + { + "epoch": 3.1, + "learning_rate": 6.188923249929716e-05, + "loss": 0.1436, + "step": 11010 + }, + { + "epoch": 3.1, + "learning_rate": 6.20579139724487e-05, + "loss": 0.1531, + "step": 11040 + }, + { + "epoch": 3.11, + "learning_rate": 6.222659544560024e-05, + "loss": 0.1581, + "step": 11070 + }, + { + "epoch": 3.12, + "learning_rate": 6.239527691875175e-05, + "loss": 0.1305, + "step": 11100 + }, + { + "epoch": 3.13, + "learning_rate": 6.256395839190329e-05, + "loss": 0.1692, + "step": 11130 + }, + { + "epoch": 3.14, + "learning_rate": 6.273263986505482e-05, + "loss": 0.1425, + "step": 11160 + }, + { + "epoch": 3.15, + "learning_rate": 6.290132133820636e-05, + "loss": 0.1494, + "step": 11190 + }, + { + "epoch": 3.15, + "learning_rate": 6.307000281135788e-05, + "loss": 0.1584, + "step": 11220 + }, + { + "epoch": 3.16, + "learning_rate": 6.323868428450942e-05, + "loss": 0.1428, + "step": 11250 + }, + { + "epoch": 3.17, + "learning_rate": 6.340736575766096e-05, + "loss": 0.163, + "step": 11280 + }, + { + "epoch": 3.18, + "learning_rate": 6.357604723081248e-05, + "loss": 0.1385, + "step": 11310 + }, + { + "epoch": 3.19, + "learning_rate": 6.374472870396402e-05, + "loss": 0.147, + "step": 11340 + }, + { + "epoch": 3.2, + "learning_rate": 6.391341017711555e-05, + "loss": 0.1579, + "step": 11370 + }, + { + "epoch": 3.2, + "learning_rate": 6.408209165026709e-05, + "loss": 0.1411, + "step": 11400 + }, + { + "epoch": 3.21, + "learning_rate": 6.425077312341861e-05, + "loss": 0.1604, + "step": 11430 + }, + { + "epoch": 3.22, + "learning_rate": 6.441945459657015e-05, + "loss": 0.1443, + "step": 11460 + }, + { + "epoch": 3.23, + "learning_rate": 6.458813606972168e-05, + "loss": 0.1461, + "step": 11490 + }, + { + "epoch": 3.24, + "learning_rate": 6.475681754287322e-05, + "loss": 0.1501, + "step": 11520 + }, + { + "epoch": 3.25, + "learning_rate": 6.492549901602474e-05, + "loss": 0.1332, + "step": 11550 + }, + { + "epoch": 3.26, + "learning_rate": 6.509418048917627e-05, + "loss": 0.1569, + "step": 11580 + }, + { + "epoch": 3.26, + "learning_rate": 6.526286196232781e-05, + "loss": 0.1349, + "step": 11610 + }, + { + "epoch": 3.27, + "learning_rate": 6.543154343547933e-05, + "loss": 0.1458, + "step": 11640 + }, + { + "epoch": 3.28, + "learning_rate": 6.560022490863087e-05, + "loss": 0.1578, + "step": 11670 + }, + { + "epoch": 3.29, + "learning_rate": 6.57689063817824e-05, + "loss": 0.1379, + "step": 11700 + }, + { + "epoch": 3.3, + "learning_rate": 6.593758785493394e-05, + "loss": 0.1585, + "step": 11730 + }, + { + "epoch": 3.31, + "learning_rate": 6.610626932808546e-05, + "loss": 0.138, + "step": 11760 + }, + { + "epoch": 3.31, + "learning_rate": 6.6274950801237e-05, + "loss": 0.1526, + "step": 11790 + }, + { + "epoch": 3.32, + "learning_rate": 6.644363227438854e-05, + "loss": 0.157, + "step": 11820 + }, + { + "epoch": 3.33, + "learning_rate": 6.661231374754007e-05, + "loss": 0.1379, + "step": 11850 + }, + { + "epoch": 3.34, + "learning_rate": 6.67809952206916e-05, + "loss": 0.1561, + "step": 11880 + }, + { + "epoch": 3.35, + "learning_rate": 6.694967669384313e-05, + "loss": 0.1351, + "step": 11910 + }, + { + "epoch": 3.36, + "learning_rate": 6.711835816699467e-05, + "loss": 0.1455, + "step": 11940 + }, + { + "epoch": 3.37, + "learning_rate": 6.72870396401462e-05, + "loss": 0.1473, + "step": 11970 + }, + { + "epoch": 3.37, + "learning_rate": 6.745572111329772e-05, + "loss": 0.1342, + "step": 12000 + }, + { + "epoch": 3.38, + "learning_rate": 6.762440258644926e-05, + "loss": 0.1529, + "step": 12030 + }, + { + "epoch": 3.39, + "learning_rate": 6.779308405960078e-05, + "loss": 0.138, + "step": 12060 + }, + { + "epoch": 3.4, + "learning_rate": 6.796176553275232e-05, + "loss": 0.1462, + "step": 12090 + }, + { + "epoch": 3.41, + "learning_rate": 6.813044700590385e-05, + "loss": 0.1569, + "step": 12120 + }, + { + "epoch": 3.42, + "learning_rate": 6.829912847905539e-05, + "loss": 0.1276, + "step": 12150 + }, + { + "epoch": 3.42, + "learning_rate": 6.846780995220691e-05, + "loss": 0.1538, + "step": 12180 + }, + { + "epoch": 3.43, + "learning_rate": 6.863649142535845e-05, + "loss": 0.1323, + "step": 12210 + }, + { + "epoch": 3.44, + "learning_rate": 6.880517289850998e-05, + "loss": 0.1457, + "step": 12240 + }, + { + "epoch": 3.45, + "learning_rate": 6.897385437166152e-05, + "loss": 0.1473, + "step": 12270 + }, + { + "epoch": 3.46, + "learning_rate": 6.914253584481306e-05, + "loss": 0.14, + "step": 12300 + }, + { + "epoch": 3.47, + "learning_rate": 6.931121731796458e-05, + "loss": 0.1591, + "step": 12330 + }, + { + "epoch": 3.47, + "learning_rate": 6.947989879111612e-05, + "loss": 0.1314, + "step": 12360 + }, + { + "epoch": 3.48, + "learning_rate": 6.964858026426765e-05, + "loss": 0.1424, + "step": 12390 + }, + { + "epoch": 3.49, + "learning_rate": 6.981726173741919e-05, + "loss": 0.1491, + "step": 12420 + }, + { + "epoch": 3.5, + "learning_rate": 6.99859432105707e-05, + "loss": 0.1307, + "step": 12450 + }, + { + "epoch": 3.51, + "learning_rate": 7.015462468372224e-05, + "loss": 0.1511, + "step": 12480 + }, + { + "epoch": 3.52, + "learning_rate": 7.032330615687378e-05, + "loss": 0.1432, + "step": 12510 + }, + { + "epoch": 3.53, + "learning_rate": 7.04919876300253e-05, + "loss": 0.152, + "step": 12540 + }, + { + "epoch": 3.53, + "learning_rate": 7.066066910317684e-05, + "loss": 0.1535, + "step": 12570 + }, + { + "epoch": 3.54, + "learning_rate": 7.082935057632837e-05, + "loss": 0.1311, + "step": 12600 + }, + { + "epoch": 3.55, + "learning_rate": 7.09980320494799e-05, + "loss": 0.1493, + "step": 12630 + }, + { + "epoch": 3.56, + "learning_rate": 7.116671352263143e-05, + "loss": 0.1343, + "step": 12660 + }, + { + "epoch": 3.57, + "learning_rate": 7.133539499578297e-05, + "loss": 0.1404, + "step": 12690 + }, + { + "epoch": 3.58, + "learning_rate": 7.15040764689345e-05, + "loss": 0.1464, + "step": 12720 + }, + { + "epoch": 3.58, + "learning_rate": 7.167275794208603e-05, + "loss": 0.1255, + "step": 12750 + }, + { + "epoch": 3.59, + "learning_rate": 7.184143941523756e-05, + "loss": 0.1548, + "step": 12780 + }, + { + "epoch": 3.6, + "learning_rate": 7.20101208883891e-05, + "loss": 0.1306, + "step": 12810 + }, + { + "epoch": 3.61, + "learning_rate": 7.217880236154064e-05, + "loss": 0.144, + "step": 12840 + }, + { + "epoch": 3.62, + "learning_rate": 7.234748383469216e-05, + "loss": 0.1428, + "step": 12870 + }, + { + "epoch": 3.63, + "learning_rate": 7.251616530784369e-05, + "loss": 0.132, + "step": 12900 + }, + { + "epoch": 3.63, + "learning_rate": 7.268484678099521e-05, + "loss": 0.146, + "step": 12930 + }, + { + "epoch": 3.64, + "learning_rate": 7.285352825414675e-05, + "loss": 0.135, + "step": 12960 + }, + { + "epoch": 3.65, + "learning_rate": 7.302220972729828e-05, + "loss": 0.1459, + "step": 12990 + }, + { + "epoch": 3.66, + "learning_rate": 7.319089120044982e-05, + "loss": 0.1482, + "step": 13020 + }, + { + "epoch": 3.67, + "learning_rate": 7.335957267360136e-05, + "loss": 0.1349, + "step": 13050 + }, + { + "epoch": 3.68, + "learning_rate": 7.352825414675288e-05, + "loss": 0.1419, + "step": 13080 + }, + { + "epoch": 3.69, + "learning_rate": 7.369693561990442e-05, + "loss": 0.137, + "step": 13110 + }, + { + "epoch": 3.69, + "learning_rate": 7.386561709305595e-05, + "loss": 0.1477, + "step": 13140 + }, + { + "epoch": 3.7, + "learning_rate": 7.403429856620749e-05, + "loss": 0.1484, + "step": 13170 + }, + { + "epoch": 3.71, + "learning_rate": 7.419735732358729e-05, + "loss": 0.1337, + "step": 13200 + }, + { + "epoch": 3.72, + "learning_rate": 7.436603879673882e-05, + "loss": 0.1481, + "step": 13230 + }, + { + "epoch": 3.73, + "learning_rate": 7.453472026989036e-05, + "loss": 0.1271, + "step": 13260 + }, + { + "epoch": 3.74, + "learning_rate": 7.470340174304189e-05, + "loss": 0.1405, + "step": 13290 + }, + { + "epoch": 3.74, + "learning_rate": 7.487208321619343e-05, + "loss": 0.1385, + "step": 13320 + }, + { + "epoch": 3.75, + "learning_rate": 7.504076468934495e-05, + "loss": 0.1286, + "step": 13350 + }, + { + "epoch": 3.76, + "learning_rate": 7.520944616249649e-05, + "loss": 0.1471, + "step": 13380 + }, + { + "epoch": 3.77, + "learning_rate": 7.537812763564802e-05, + "loss": 0.1327, + "step": 13410 + }, + { + "epoch": 3.78, + "learning_rate": 7.554680910879956e-05, + "loss": 0.1433, + "step": 13440 + }, + { + "epoch": 3.79, + "learning_rate": 7.571549058195108e-05, + "loss": 0.1452, + "step": 13470 + }, + { + "epoch": 3.8, + "learning_rate": 7.588417205510262e-05, + "loss": 0.1322, + "step": 13500 + }, + { + "epoch": 3.8, + "learning_rate": 7.605285352825415e-05, + "loss": 0.1502, + "step": 13530 + }, + { + "epoch": 3.81, + "learning_rate": 7.622153500140569e-05, + "loss": 0.1287, + "step": 13560 + }, + { + "epoch": 3.82, + "learning_rate": 7.639021647455723e-05, + "loss": 0.1398, + "step": 13590 + }, + { + "epoch": 3.83, + "learning_rate": 7.655889794770875e-05, + "loss": 0.151, + "step": 13620 + }, + { + "epoch": 3.84, + "learning_rate": 7.672757942086028e-05, + "loss": 0.1299, + "step": 13650 + }, + { + "epoch": 3.85, + "learning_rate": 7.68962608940118e-05, + "loss": 0.1452, + "step": 13680 + }, + { + "epoch": 3.85, + "learning_rate": 7.706494236716334e-05, + "loss": 0.1324, + "step": 13710 + }, + { + "epoch": 3.86, + "learning_rate": 7.723362384031487e-05, + "loss": 0.1426, + "step": 13740 + }, + { + "epoch": 3.87, + "learning_rate": 7.74023053134664e-05, + "loss": 0.1505, + "step": 13770 + }, + { + "epoch": 3.88, + "learning_rate": 7.757098678661794e-05, + "loss": 0.1359, + "step": 13800 + }, + { + "epoch": 3.89, + "learning_rate": 7.773966825976947e-05, + "loss": 0.1563, + "step": 13830 + }, + { + "epoch": 3.9, + "learning_rate": 7.790834973292101e-05, + "loss": 0.1286, + "step": 13860 + }, + { + "epoch": 3.9, + "learning_rate": 7.807703120607253e-05, + "loss": 0.1375, + "step": 13890 + }, + { + "epoch": 3.91, + "learning_rate": 7.824571267922407e-05, + "loss": 0.1508, + "step": 13920 + }, + { + "epoch": 3.92, + "learning_rate": 7.84143941523756e-05, + "loss": 0.1322, + "step": 13950 + }, + { + "epoch": 3.93, + "learning_rate": 7.858307562552714e-05, + "loss": 0.1438, + "step": 13980 + }, + { + "epoch": 3.94, + "learning_rate": 7.875175709867866e-05, + "loss": 0.1308, + "step": 14010 + }, + { + "epoch": 3.95, + "learning_rate": 7.89204385718302e-05, + "loss": 0.1372, + "step": 14040 + }, + { + "epoch": 3.96, + "learning_rate": 7.908912004498173e-05, + "loss": 0.1504, + "step": 14070 + }, + { + "epoch": 3.96, + "learning_rate": 7.925780151813325e-05, + "loss": 0.1307, + "step": 14100 + }, + { + "epoch": 3.97, + "learning_rate": 7.942648299128479e-05, + "loss": 0.141, + "step": 14130 + }, + { + "epoch": 3.98, + "learning_rate": 7.959516446443632e-05, + "loss": 0.1327, + "step": 14160 + }, + { + "epoch": 3.99, + "learning_rate": 7.976384593758786e-05, + "loss": 0.1374, + "step": 14190 + }, + { + "epoch": 4.0, + "learning_rate": 7.993252741073938e-05, + "loss": 0.1436, + "step": 14220 + }, + { + "epoch": 4.0, + "eval_loss": 0.13012589514255524, + "eval_runtime": 625.1324, + "eval_samples_per_second": 25.647, + "eval_steps_per_second": 0.803, + "eval_wer": 0.12817818295961678, + "step": 14228 + }, + { + "epoch": 4.01, + "learning_rate": 8.010120888389092e-05, + "loss": 0.1245, + "step": 14250 + }, + { + "epoch": 4.01, + "learning_rate": 8.026989035704246e-05, + "loss": 0.1439, + "step": 14280 + }, + { + "epoch": 4.02, + "learning_rate": 8.043857183019399e-05, + "loss": 0.1188, + "step": 14310 + }, + { + "epoch": 4.03, + "learning_rate": 8.060725330334553e-05, + "loss": 0.1393, + "step": 14340 + }, + { + "epoch": 4.04, + "learning_rate": 8.077593477649705e-05, + "loss": 0.1295, + "step": 14370 + }, + { + "epoch": 4.05, + "learning_rate": 8.094461624964859e-05, + "loss": 0.1367, + "step": 14400 + }, + { + "epoch": 4.06, + "learning_rate": 8.111329772280012e-05, + "loss": 0.1476, + "step": 14430 + }, + { + "epoch": 4.07, + "learning_rate": 8.128197919595165e-05, + "loss": 0.1218, + "step": 14460 + }, + { + "epoch": 4.07, + "learning_rate": 8.145066066910318e-05, + "loss": 0.1414, + "step": 14490 + }, + { + "epoch": 4.08, + "learning_rate": 8.161934214225472e-05, + "loss": 0.1294, + "step": 14520 + }, + { + "epoch": 4.09, + "learning_rate": 8.178802361540624e-05, + "loss": 0.1356, + "step": 14550 + }, + { + "epoch": 4.1, + "learning_rate": 8.195670508855777e-05, + "loss": 0.1385, + "step": 14580 + }, + { + "epoch": 4.11, + "learning_rate": 8.212538656170931e-05, + "loss": 0.1148, + "step": 14610 + }, + { + "epoch": 4.12, + "learning_rate": 8.229406803486083e-05, + "loss": 0.143, + "step": 14640 + }, + { + "epoch": 4.12, + "learning_rate": 8.246274950801237e-05, + "loss": 0.1218, + "step": 14670 + }, + { + "epoch": 4.13, + "learning_rate": 8.26314309811639e-05, + "loss": 0.1396, + "step": 14700 + }, + { + "epoch": 4.14, + "learning_rate": 8.280011245431544e-05, + "loss": 0.1485, + "step": 14730 + }, + { + "epoch": 4.15, + "learning_rate": 8.296879392746696e-05, + "loss": 0.1223, + "step": 14760 + }, + { + "epoch": 4.16, + "learning_rate": 8.31374754006185e-05, + "loss": 0.1386, + "step": 14790 + }, + { + "epoch": 4.17, + "learning_rate": 8.330615687377004e-05, + "loss": 0.1233, + "step": 14820 + }, + { + "epoch": 4.17, + "learning_rate": 8.347483834692157e-05, + "loss": 0.1244, + "step": 14850 + }, + { + "epoch": 4.18, + "learning_rate": 8.36435198200731e-05, + "loss": 0.1429, + "step": 14880 + }, + { + "epoch": 4.19, + "learning_rate": 8.381220129322463e-05, + "loss": 0.1153, + "step": 14910 + }, + { + "epoch": 4.2, + "learning_rate": 8.398088276637617e-05, + "loss": 0.1345, + "step": 14940 + }, + { + "epoch": 4.21, + "learning_rate": 8.41495642395277e-05, + "loss": 0.1261, + "step": 14970 + }, + { + "epoch": 4.22, + "learning_rate": 8.431824571267924e-05, + "loss": 0.1281, + "step": 15000 + }, + { + "epoch": 4.23, + "learning_rate": 8.448692718583076e-05, + "loss": 0.1434, + "step": 15030 + }, + { + "epoch": 4.23, + "learning_rate": 8.465560865898229e-05, + "loss": 0.1189, + "step": 15060 + }, + { + "epoch": 4.24, + "learning_rate": 8.482429013213383e-05, + "loss": 0.1377, + "step": 15090 + }, + { + "epoch": 4.25, + "learning_rate": 8.499297160528535e-05, + "loss": 0.1259, + "step": 15120 + }, + { + "epoch": 4.26, + "learning_rate": 8.516165307843689e-05, + "loss": 0.1236, + "step": 15150 + }, + { + "epoch": 4.27, + "learning_rate": 8.533033455158842e-05, + "loss": 0.1369, + "step": 15180 + }, + { + "epoch": 4.28, + "learning_rate": 8.549901602473995e-05, + "loss": 0.1149, + "step": 15210 + }, + { + "epoch": 4.28, + "learning_rate": 8.566769749789148e-05, + "loss": 0.1368, + "step": 15240 + }, + { + "epoch": 4.29, + "learning_rate": 8.583637897104302e-05, + "loss": 0.1288, + "step": 15270 + }, + { + "epoch": 4.3, + "learning_rate": 8.600506044419455e-05, + "loss": 0.1219, + "step": 15300 + }, + { + "epoch": 4.31, + "learning_rate": 8.617374191734608e-05, + "loss": 0.139, + "step": 15330 + }, + { + "epoch": 4.32, + "learning_rate": 8.634242339049762e-05, + "loss": 0.116, + "step": 15360 + }, + { + "epoch": 4.33, + "learning_rate": 8.651110486364915e-05, + "loss": 0.1371, + "step": 15390 + }, + { + "epoch": 4.34, + "learning_rate": 8.667978633680069e-05, + "loss": 0.1161, + "step": 15420 + }, + { + "epoch": 4.34, + "learning_rate": 8.684846780995221e-05, + "loss": 0.1289, + "step": 15450 + }, + { + "epoch": 4.35, + "learning_rate": 8.701714928310374e-05, + "loss": 0.1379, + "step": 15480 + }, + { + "epoch": 4.36, + "learning_rate": 8.718583075625528e-05, + "loss": 0.1205, + "step": 15510 + }, + { + "epoch": 4.37, + "learning_rate": 8.73545122294068e-05, + "loss": 0.1332, + "step": 15540 + }, + { + "epoch": 4.38, + "learning_rate": 8.752319370255834e-05, + "loss": 0.1217, + "step": 15570 + }, + { + "epoch": 4.39, + "learning_rate": 8.769187517570987e-05, + "loss": 0.1257, + "step": 15600 + }, + { + "epoch": 4.39, + "learning_rate": 8.786055664886141e-05, + "loss": 0.1427, + "step": 15630 + }, + { + "epoch": 4.4, + "learning_rate": 8.802923812201293e-05, + "loss": 0.1179, + "step": 15660 + }, + { + "epoch": 4.41, + "learning_rate": 8.819791959516447e-05, + "loss": 0.1446, + "step": 15690 + }, + { + "epoch": 4.42, + "learning_rate": 8.8366601068316e-05, + "loss": 0.1253, + "step": 15720 + }, + { + "epoch": 4.43, + "learning_rate": 8.853528254146754e-05, + "loss": 0.1275, + "step": 15750 + }, + { + "epoch": 4.44, + "learning_rate": 8.870396401461906e-05, + "loss": 0.145, + "step": 15780 + }, + { + "epoch": 4.44, + "learning_rate": 8.88726454877706e-05, + "loss": 0.115, + "step": 15810 + }, + { + "epoch": 4.45, + "learning_rate": 8.904132696092214e-05, + "loss": 0.1337, + "step": 15840 + }, + { + "epoch": 4.46, + "learning_rate": 8.921000843407367e-05, + "loss": 0.1186, + "step": 15870 + }, + { + "epoch": 4.47, + "learning_rate": 8.93786899072252e-05, + "loss": 0.1335, + "step": 15900 + }, + { + "epoch": 4.48, + "learning_rate": 8.954737138037672e-05, + "loss": 0.1424, + "step": 15930 + }, + { + "epoch": 4.49, + "learning_rate": 8.971605285352826e-05, + "loss": 0.1137, + "step": 15960 + }, + { + "epoch": 4.5, + "learning_rate": 8.988473432667978e-05, + "loss": 0.1335, + "step": 15990 + }, + { + "epoch": 4.5, + "learning_rate": 9.005341579983132e-05, + "loss": 0.1251, + "step": 16020 + }, + { + "epoch": 4.51, + "learning_rate": 9.022209727298286e-05, + "loss": 0.1289, + "step": 16050 + }, + { + "epoch": 4.52, + "learning_rate": 9.039077874613438e-05, + "loss": 0.1452, + "step": 16080 + }, + { + "epoch": 4.53, + "learning_rate": 9.055946021928592e-05, + "loss": 0.1185, + "step": 16110 + }, + { + "epoch": 4.54, + "learning_rate": 9.072814169243745e-05, + "loss": 0.1337, + "step": 16140 + }, + { + "epoch": 4.55, + "learning_rate": 9.089682316558899e-05, + "loss": 0.1189, + "step": 16170 + }, + { + "epoch": 4.55, + "learning_rate": 9.10598819229688e-05, + "loss": 0.1336, + "step": 16200 + }, + { + "epoch": 4.56, + "learning_rate": 9.122856339612033e-05, + "loss": 0.1361, + "step": 16230 + }, + { + "epoch": 4.57, + "learning_rate": 9.139724486927187e-05, + "loss": 0.1131, + "step": 16260 + }, + { + "epoch": 4.58, + "learning_rate": 9.156592634242339e-05, + "loss": 0.1351, + "step": 16290 + }, + { + "epoch": 4.59, + "learning_rate": 9.173460781557493e-05, + "loss": 0.1209, + "step": 16320 + }, + { + "epoch": 4.6, + "learning_rate": 9.190328928872646e-05, + "loss": 0.1382, + "step": 16350 + }, + { + "epoch": 4.6, + "learning_rate": 9.2071970761878e-05, + "loss": 0.1471, + "step": 16380 + }, + { + "epoch": 4.61, + "learning_rate": 9.224065223502952e-05, + "loss": 0.1148, + "step": 16410 + }, + { + "epoch": 4.62, + "learning_rate": 9.240933370818106e-05, + "loss": 0.1442, + "step": 16440 + }, + { + "epoch": 4.63, + "learning_rate": 9.257801518133258e-05, + "loss": 0.1244, + "step": 16470 + }, + { + "epoch": 4.64, + "learning_rate": 9.274669665448412e-05, + "loss": 0.1324, + "step": 16500 + }, + { + "epoch": 4.65, + "learning_rate": 9.291537812763565e-05, + "loss": 0.1369, + "step": 16530 + }, + { + "epoch": 4.66, + "learning_rate": 9.308405960078719e-05, + "loss": 0.1125, + "step": 16560 + }, + { + "epoch": 4.66, + "learning_rate": 9.325274107393873e-05, + "loss": 0.1342, + "step": 16590 + }, + { + "epoch": 4.67, + "learning_rate": 9.342142254709025e-05, + "loss": 0.1169, + "step": 16620 + }, + { + "epoch": 4.68, + "learning_rate": 9.359010402024179e-05, + "loss": 0.131, + "step": 16650 + }, + { + "epoch": 4.69, + "learning_rate": 9.37587854933933e-05, + "loss": 0.1433, + "step": 16680 + }, + { + "epoch": 4.7, + "learning_rate": 9.392746696654484e-05, + "loss": 0.1083, + "step": 16710 + }, + { + "epoch": 4.71, + "learning_rate": 9.409614843969637e-05, + "loss": 0.141, + "step": 16740 + }, + { + "epoch": 4.71, + "learning_rate": 9.426482991284791e-05, + "loss": 0.1252, + "step": 16770 + }, + { + "epoch": 4.72, + "learning_rate": 9.443351138599945e-05, + "loss": 0.1307, + "step": 16800 + }, + { + "epoch": 4.73, + "learning_rate": 9.460219285915097e-05, + "loss": 0.1423, + "step": 16830 + }, + { + "epoch": 4.74, + "learning_rate": 9.477087433230251e-05, + "loss": 0.1153, + "step": 16860 + }, + { + "epoch": 4.75, + "learning_rate": 9.493955580545404e-05, + "loss": 0.1344, + "step": 16890 + }, + { + "epoch": 4.76, + "learning_rate": 9.510823727860558e-05, + "loss": 0.1187, + "step": 16920 + }, + { + "epoch": 4.77, + "learning_rate": 9.52769187517571e-05, + "loss": 0.1296, + "step": 16950 + }, + { + "epoch": 4.77, + "learning_rate": 9.544560022490864e-05, + "loss": 0.1412, + "step": 16980 + }, + { + "epoch": 4.78, + "learning_rate": 9.561428169806017e-05, + "loss": 0.117, + "step": 17010 + }, + { + "epoch": 4.79, + "learning_rate": 9.57829631712117e-05, + "loss": 0.1399, + "step": 17040 + }, + { + "epoch": 4.8, + "learning_rate": 9.595164464436323e-05, + "loss": 0.1281, + "step": 17070 + }, + { + "epoch": 4.81, + "learning_rate": 9.612032611751477e-05, + "loss": 0.1314, + "step": 17100 + }, + { + "epoch": 4.82, + "learning_rate": 9.62890075906663e-05, + "loss": 0.1426, + "step": 17130 + }, + { + "epoch": 4.82, + "learning_rate": 9.645768906381782e-05, + "loss": 0.1215, + "step": 17160 + }, + { + "epoch": 4.83, + "learning_rate": 9.662637053696936e-05, + "loss": 0.1377, + "step": 17190 + }, + { + "epoch": 4.84, + "learning_rate": 9.679505201012088e-05, + "loss": 0.1169, + "step": 17220 + }, + { + "epoch": 4.85, + "learning_rate": 9.696373348327242e-05, + "loss": 0.1264, + "step": 17250 + }, + { + "epoch": 4.86, + "learning_rate": 9.713241495642396e-05, + "loss": 0.1354, + "step": 17280 + }, + { + "epoch": 4.87, + "learning_rate": 9.730109642957549e-05, + "loss": 0.1142, + "step": 17310 + }, + { + "epoch": 4.87, + "learning_rate": 9.746977790272703e-05, + "loss": 0.1394, + "step": 17340 + }, + { + "epoch": 4.88, + "learning_rate": 9.763845937587855e-05, + "loss": 0.1206, + "step": 17370 + }, + { + "epoch": 4.89, + "learning_rate": 9.780714084903009e-05, + "loss": 0.1298, + "step": 17400 + }, + { + "epoch": 4.9, + "learning_rate": 9.797582232218162e-05, + "loss": 0.1363, + "step": 17430 + }, + { + "epoch": 4.91, + "learning_rate": 9.814450379533316e-05, + "loss": 0.1116, + "step": 17460 + }, + { + "epoch": 4.92, + "learning_rate": 9.831318526848468e-05, + "loss": 0.1366, + "step": 17490 + }, + { + "epoch": 4.93, + "learning_rate": 9.848186674163622e-05, + "loss": 0.1215, + "step": 17520 + }, + { + "epoch": 4.93, + "learning_rate": 9.865054821478775e-05, + "loss": 0.1261, + "step": 17550 + }, + { + "epoch": 4.94, + "learning_rate": 9.881922968793927e-05, + "loss": 0.1375, + "step": 17580 + }, + { + "epoch": 4.95, + "learning_rate": 9.898791116109081e-05, + "loss": 0.117, + "step": 17610 + }, + { + "epoch": 4.96, + "learning_rate": 9.915096991847062e-05, + "loss": 0.1364, + "step": 17640 + }, + { + "epoch": 4.97, + "learning_rate": 9.931965139162216e-05, + "loss": 0.122, + "step": 17670 + }, + { + "epoch": 4.98, + "learning_rate": 9.948833286477369e-05, + "loss": 0.1229, + "step": 17700 + }, + { + "epoch": 4.98, + "learning_rate": 9.965701433792523e-05, + "loss": 0.1445, + "step": 17730 + }, + { + "epoch": 4.99, + "learning_rate": 9.982569581107675e-05, + "loss": 0.1144, + "step": 17760 + }, + { + "epoch": 5.0, + "eval_loss": 0.12248270958662033, + "eval_runtime": 627.1117, + "eval_samples_per_second": 25.566, + "eval_steps_per_second": 0.8, + "eval_wer": 0.12450015694730665, + "step": 17785 + }, + { + "epoch": 5.0, + "learning_rate": 9.999437728422829e-05, + "loss": 0.1411, + "step": 17790 + }, + { + "epoch": 5.01, + "learning_rate": 9.998188236029113e-05, + "loss": 0.1146, + "step": 17820 + }, + { + "epoch": 5.02, + "learning_rate": 9.996313997438541e-05, + "loss": 0.1221, + "step": 17850 + }, + { + "epoch": 5.03, + "learning_rate": 9.99443975884797e-05, + "loss": 0.1168, + "step": 17880 + }, + { + "epoch": 5.04, + "learning_rate": 9.992565520257396e-05, + "loss": 0.1176, + "step": 17910 + }, + { + "epoch": 5.04, + "learning_rate": 9.990691281666823e-05, + "loss": 0.1309, + "step": 17940 + }, + { + "epoch": 5.05, + "learning_rate": 9.988817043076251e-05, + "loss": 0.1072, + "step": 17970 + }, + { + "epoch": 5.06, + "learning_rate": 9.986942804485678e-05, + "loss": 0.1279, + "step": 18000 + }, + { + "epoch": 5.07, + "learning_rate": 9.985068565895106e-05, + "loss": 0.1234, + "step": 18030 + }, + { + "epoch": 5.08, + "learning_rate": 9.983194327304533e-05, + "loss": 0.121, + "step": 18060 + }, + { + "epoch": 5.09, + "learning_rate": 9.98132008871396e-05, + "loss": 0.1344, + "step": 18090 + }, + { + "epoch": 5.09, + "learning_rate": 9.979445850123387e-05, + "loss": 0.1082, + "step": 18120 + }, + { + "epoch": 5.1, + "learning_rate": 9.977571611532816e-05, + "loss": 0.1277, + "step": 18150 + }, + { + "epoch": 5.11, + "learning_rate": 9.975697372942244e-05, + "loss": 0.1176, + "step": 18180 + }, + { + "epoch": 5.12, + "learning_rate": 9.97382313435167e-05, + "loss": 0.1147, + "step": 18210 + }, + { + "epoch": 5.13, + "learning_rate": 9.971948895761097e-05, + "loss": 0.1317, + "step": 18240 + }, + { + "epoch": 5.14, + "learning_rate": 9.970074657170525e-05, + "loss": 0.1043, + "step": 18270 + }, + { + "epoch": 5.14, + "learning_rate": 9.968200418579953e-05, + "loss": 0.1252, + "step": 18300 + }, + { + "epoch": 5.15, + "learning_rate": 9.96632617998938e-05, + "loss": 0.1184, + "step": 18330 + }, + { + "epoch": 5.16, + "learning_rate": 9.964451941398807e-05, + "loss": 0.1156, + "step": 18360 + }, + { + "epoch": 5.17, + "learning_rate": 9.962577702808235e-05, + "loss": 0.1261, + "step": 18390 + }, + { + "epoch": 5.18, + "learning_rate": 9.960703464217662e-05, + "loss": 0.1075, + "step": 18420 + }, + { + "epoch": 5.19, + "learning_rate": 9.95882922562709e-05, + "loss": 0.1218, + "step": 18450 + }, + { + "epoch": 5.2, + "learning_rate": 9.956954987036516e-05, + "loss": 0.1193, + "step": 18480 + }, + { + "epoch": 5.2, + "learning_rate": 9.955080748445945e-05, + "loss": 0.1216, + "step": 18510 + }, + { + "epoch": 5.21, + "learning_rate": 9.953206509855371e-05, + "loss": 0.1381, + "step": 18540 + }, + { + "epoch": 5.22, + "learning_rate": 9.9513322712648e-05, + "loss": 0.1051, + "step": 18570 + }, + { + "epoch": 5.23, + "learning_rate": 9.949458032674227e-05, + "loss": 0.1266, + "step": 18600 + }, + { + "epoch": 5.24, + "learning_rate": 9.947583794083654e-05, + "loss": 0.1243, + "step": 18630 + }, + { + "epoch": 5.25, + "learning_rate": 9.945709555493081e-05, + "loss": 0.1207, + "step": 18660 + }, + { + "epoch": 5.25, + "learning_rate": 9.943835316902509e-05, + "loss": 0.1342, + "step": 18690 + }, + { + "epoch": 5.26, + "learning_rate": 9.941961078311937e-05, + "loss": 0.1095, + "step": 18720 + }, + { + "epoch": 5.27, + "learning_rate": 9.940086839721363e-05, + "loss": 0.1304, + "step": 18750 + }, + { + "epoch": 5.28, + "learning_rate": 9.93821260113079e-05, + "loss": 0.1147, + "step": 18780 + }, + { + "epoch": 5.29, + "learning_rate": 9.936338362540219e-05, + "loss": 0.1176, + "step": 18810 + }, + { + "epoch": 5.3, + "learning_rate": 9.934464123949645e-05, + "loss": 0.129, + "step": 18840 + }, + { + "epoch": 5.3, + "learning_rate": 9.932589885359074e-05, + "loss": 0.103, + "step": 18870 + }, + { + "epoch": 5.31, + "learning_rate": 9.9307156467685e-05, + "loss": 0.1184, + "step": 18900 + }, + { + "epoch": 5.32, + "learning_rate": 9.928841408177928e-05, + "loss": 0.1172, + "step": 18930 + }, + { + "epoch": 5.33, + "learning_rate": 9.926967169587355e-05, + "loss": 0.1195, + "step": 18960 + }, + { + "epoch": 5.34, + "learning_rate": 9.925092930996783e-05, + "loss": 0.126, + "step": 18990 + }, + { + "epoch": 5.35, + "learning_rate": 9.923218692406211e-05, + "loss": 0.1127, + "step": 19020 + }, + { + "epoch": 5.36, + "learning_rate": 9.921344453815638e-05, + "loss": 0.1259, + "step": 19050 + }, + { + "epoch": 5.36, + "learning_rate": 9.919470215225065e-05, + "loss": 0.1195, + "step": 19080 + }, + { + "epoch": 5.37, + "learning_rate": 9.917595976634493e-05, + "loss": 0.1089, + "step": 19110 + }, + { + "epoch": 5.38, + "learning_rate": 9.915721738043921e-05, + "loss": 0.1389, + "step": 19140 + }, + { + "epoch": 5.39, + "learning_rate": 9.913847499453346e-05, + "loss": 0.1102, + "step": 19170 + }, + { + "epoch": 5.4, + "learning_rate": 9.911973260862774e-05, + "loss": 0.1206, + "step": 19200 + }, + { + "epoch": 5.41, + "learning_rate": 9.910099022272203e-05, + "loss": 0.1193, + "step": 19230 + }, + { + "epoch": 5.41, + "learning_rate": 9.90822478368163e-05, + "loss": 0.1218, + "step": 19260 + }, + { + "epoch": 5.42, + "learning_rate": 9.906350545091057e-05, + "loss": 0.1265, + "step": 19290 + }, + { + "epoch": 5.43, + "learning_rate": 9.904476306500484e-05, + "loss": 0.1105, + "step": 19320 + }, + { + "epoch": 5.44, + "learning_rate": 9.902602067909912e-05, + "loss": 0.1318, + "step": 19350 + }, + { + "epoch": 5.45, + "learning_rate": 9.900727829319339e-05, + "loss": 0.121, + "step": 19380 + }, + { + "epoch": 5.46, + "learning_rate": 9.898853590728767e-05, + "loss": 0.1148, + "step": 19410 + }, + { + "epoch": 5.47, + "learning_rate": 9.896979352138195e-05, + "loss": 0.1305, + "step": 19440 + }, + { + "epoch": 5.47, + "learning_rate": 9.895105113547622e-05, + "loss": 0.1039, + "step": 19470 + }, + { + "epoch": 5.48, + "learning_rate": 9.893230874957049e-05, + "loss": 0.1283, + "step": 19500 + }, + { + "epoch": 5.49, + "learning_rate": 9.891356636366477e-05, + "loss": 0.1151, + "step": 19530 + }, + { + "epoch": 5.5, + "learning_rate": 9.889482397775905e-05, + "loss": 0.121, + "step": 19560 + }, + { + "epoch": 5.51, + "learning_rate": 9.88760815918533e-05, + "loss": 0.1295, + "step": 19590 + }, + { + "epoch": 5.52, + "learning_rate": 9.885733920594758e-05, + "loss": 0.1097, + "step": 19620 + }, + { + "epoch": 5.52, + "learning_rate": 9.883922156623871e-05, + "loss": 0.1259, + "step": 19650 + }, + { + "epoch": 5.53, + "learning_rate": 9.882047918033299e-05, + "loss": 0.1212, + "step": 19680 + }, + { + "epoch": 5.54, + "learning_rate": 9.880173679442727e-05, + "loss": 0.1193, + "step": 19710 + }, + { + "epoch": 5.55, + "learning_rate": 9.878299440852154e-05, + "loss": 0.1309, + "step": 19740 + }, + { + "epoch": 5.56, + "learning_rate": 9.876425202261582e-05, + "loss": 0.1048, + "step": 19770 + }, + { + "epoch": 5.57, + "learning_rate": 9.874550963671009e-05, + "loss": 0.1282, + "step": 19800 + }, + { + "epoch": 5.57, + "learning_rate": 9.872676725080437e-05, + "loss": 0.1152, + "step": 19830 + }, + { + "epoch": 5.58, + "learning_rate": 9.870802486489864e-05, + "loss": 0.1177, + "step": 19860 + }, + { + "epoch": 5.59, + "learning_rate": 9.868928247899292e-05, + "loss": 0.1279, + "step": 19890 + }, + { + "epoch": 5.6, + "learning_rate": 9.867054009308719e-05, + "loss": 0.1092, + "step": 19920 + }, + { + "epoch": 5.61, + "learning_rate": 9.865179770718145e-05, + "loss": 0.1178, + "step": 19950 + }, + { + "epoch": 5.62, + "learning_rate": 9.863305532127573e-05, + "loss": 0.1149, + "step": 19980 + }, + { + "epoch": 5.63, + "learning_rate": 9.861431293537001e-05, + "loss": 0.1173, + "step": 20010 + }, + { + "epoch": 5.63, + "learning_rate": 9.859557054946428e-05, + "loss": 0.1246, + "step": 20040 + }, + { + "epoch": 5.64, + "learning_rate": 9.857682816355855e-05, + "loss": 0.1084, + "step": 20070 + }, + { + "epoch": 5.65, + "learning_rate": 9.855808577765283e-05, + "loss": 0.125, + "step": 20100 + }, + { + "epoch": 5.66, + "learning_rate": 9.853934339174711e-05, + "loss": 0.1209, + "step": 20130 + }, + { + "epoch": 5.67, + "learning_rate": 9.852060100584138e-05, + "loss": 0.1118, + "step": 20160 + }, + { + "epoch": 5.68, + "learning_rate": 9.850185861993566e-05, + "loss": 0.1235, + "step": 20190 + }, + { + "epoch": 5.68, + "learning_rate": 9.848311623402993e-05, + "loss": 0.1085, + "step": 20220 + }, + { + "epoch": 5.69, + "learning_rate": 9.846437384812421e-05, + "loss": 0.1163, + "step": 20250 + }, + { + "epoch": 5.7, + "learning_rate": 9.844563146221848e-05, + "loss": 0.1152, + "step": 20280 + }, + { + "epoch": 5.71, + "learning_rate": 9.842688907631276e-05, + "loss": 0.1136, + "step": 20310 + }, + { + "epoch": 5.72, + "learning_rate": 9.840814669040702e-05, + "loss": 0.1284, + "step": 20340 + }, + { + "epoch": 5.73, + "learning_rate": 9.838940430450129e-05, + "loss": 0.1105, + "step": 20370 + }, + { + "epoch": 5.74, + "learning_rate": 9.837066191859557e-05, + "loss": 0.1203, + "step": 20400 + }, + { + "epoch": 5.74, + "learning_rate": 9.835191953268985e-05, + "loss": 0.1209, + "step": 20430 + }, + { + "epoch": 5.75, + "learning_rate": 9.833317714678413e-05, + "loss": 0.1164, + "step": 20460 + }, + { + "epoch": 5.76, + "learning_rate": 9.831443476087839e-05, + "loss": 0.1279, + "step": 20490 + }, + { + "epoch": 5.77, + "learning_rate": 9.829569237497267e-05, + "loss": 0.1042, + "step": 20520 + }, + { + "epoch": 5.78, + "learning_rate": 9.827694998906695e-05, + "loss": 0.1151, + "step": 20550 + }, + { + "epoch": 5.79, + "learning_rate": 9.825820760316122e-05, + "loss": 0.1168, + "step": 20580 + }, + { + "epoch": 5.79, + "learning_rate": 9.82394652172555e-05, + "loss": 0.1163, + "step": 20610 + }, + { + "epoch": 5.8, + "learning_rate": 9.822072283134977e-05, + "loss": 0.1276, + "step": 20640 + }, + { + "epoch": 5.81, + "learning_rate": 9.820198044544405e-05, + "loss": 0.1113, + "step": 20670 + }, + { + "epoch": 5.82, + "learning_rate": 9.818323805953831e-05, + "loss": 0.1254, + "step": 20700 + }, + { + "epoch": 5.83, + "learning_rate": 9.81644956736326e-05, + "loss": 0.1181, + "step": 20730 + }, + { + "epoch": 5.84, + "learning_rate": 9.814575328772686e-05, + "loss": 0.1087, + "step": 20760 + }, + { + "epoch": 5.84, + "learning_rate": 9.812701090182113e-05, + "loss": 0.128, + "step": 20790 + }, + { + "epoch": 5.85, + "learning_rate": 9.810826851591541e-05, + "loss": 0.1078, + "step": 20820 + }, + { + "epoch": 5.86, + "learning_rate": 9.808952613000969e-05, + "loss": 0.1185, + "step": 20850 + }, + { + "epoch": 5.87, + "learning_rate": 9.807078374410397e-05, + "loss": 0.1132, + "step": 20880 + }, + { + "epoch": 5.88, + "learning_rate": 9.805204135819823e-05, + "loss": 0.1106, + "step": 20910 + }, + { + "epoch": 5.89, + "learning_rate": 9.803329897229251e-05, + "loss": 0.133, + "step": 20940 + }, + { + "epoch": 5.9, + "learning_rate": 9.801455658638679e-05, + "loss": 0.1055, + "step": 20970 + }, + { + "epoch": 5.9, + "learning_rate": 9.799581420048106e-05, + "loss": 0.1229, + "step": 21000 + }, + { + "epoch": 5.91, + "learning_rate": 9.797707181457534e-05, + "loss": 0.1156, + "step": 21030 + }, + { + "epoch": 5.92, + "learning_rate": 9.79583294286696e-05, + "loss": 0.1154, + "step": 21060 + }, + { + "epoch": 5.93, + "learning_rate": 9.793958704276389e-05, + "loss": 0.1361, + "step": 21090 + }, + { + "epoch": 5.94, + "learning_rate": 9.792084465685815e-05, + "loss": 0.1038, + "step": 21120 + }, + { + "epoch": 5.95, + "learning_rate": 9.790210227095243e-05, + "loss": 0.1232, + "step": 21150 + }, + { + "epoch": 5.95, + "learning_rate": 9.78833598850467e-05, + "loss": 0.1156, + "step": 21180 + }, + { + "epoch": 5.96, + "learning_rate": 9.786461749914098e-05, + "loss": 0.1133, + "step": 21210 + }, + { + "epoch": 5.97, + "learning_rate": 9.784587511323525e-05, + "loss": 0.1224, + "step": 21240 + }, + { + "epoch": 5.98, + "learning_rate": 9.782713272732953e-05, + "loss": 0.1007, + "step": 21270 + }, + { + "epoch": 5.99, + "learning_rate": 9.780839034142381e-05, + "loss": 0.1266, + "step": 21300 + }, + { + "epoch": 6.0, + "learning_rate": 9.778964795551807e-05, + "loss": 0.1219, + "step": 21330 + }, + { + "epoch": 6.0, + "eval_loss": 0.125444233417511, + "eval_runtime": 626.7572, + "eval_samples_per_second": 25.581, + "eval_steps_per_second": 0.801, + "eval_wer": 0.12082895473093773, + "step": 21342 + }, + { + "epoch": 6.01, + "learning_rate": 9.777090556961235e-05, + "loss": 0.1218, + "step": 21360 + }, + { + "epoch": 6.01, + "learning_rate": 9.775216318370663e-05, + "loss": 0.1176, + "step": 21390 + }, + { + "epoch": 6.02, + "learning_rate": 9.77334207978009e-05, + "loss": 0.1088, + "step": 21420 + }, + { + "epoch": 6.03, + "learning_rate": 9.771467841189518e-05, + "loss": 0.1211, + "step": 21450 + }, + { + "epoch": 6.04, + "learning_rate": 9.769593602598944e-05, + "loss": 0.103, + "step": 21480 + }, + { + "epoch": 6.05, + "learning_rate": 9.767719364008372e-05, + "loss": 0.1174, + "step": 21510 + }, + { + "epoch": 6.06, + "learning_rate": 9.765845125417799e-05, + "loss": 0.1166, + "step": 21540 + }, + { + "epoch": 6.06, + "learning_rate": 9.763970886827227e-05, + "loss": 0.1097, + "step": 21570 + }, + { + "epoch": 6.07, + "learning_rate": 9.762096648236654e-05, + "loss": 0.1197, + "step": 21600 + }, + { + "epoch": 6.08, + "learning_rate": 9.760222409646082e-05, + "loss": 0.101, + "step": 21630 + }, + { + "epoch": 6.09, + "learning_rate": 9.758348171055509e-05, + "loss": 0.1148, + "step": 21660 + }, + { + "epoch": 6.1, + "learning_rate": 9.756473932464937e-05, + "loss": 0.1132, + "step": 21690 + }, + { + "epoch": 6.11, + "learning_rate": 9.754599693874365e-05, + "loss": 0.1092, + "step": 21720 + }, + { + "epoch": 6.11, + "learning_rate": 9.75272545528379e-05, + "loss": 0.1224, + "step": 21750 + }, + { + "epoch": 6.12, + "learning_rate": 9.750851216693219e-05, + "loss": 0.1093, + "step": 21780 + }, + { + "epoch": 6.13, + "learning_rate": 9.748976978102647e-05, + "loss": 0.1147, + "step": 21810 + }, + { + "epoch": 6.14, + "learning_rate": 9.747102739512073e-05, + "loss": 0.1112, + "step": 21840 + }, + { + "epoch": 6.15, + "learning_rate": 9.745228500921501e-05, + "loss": 0.1098, + "step": 21870 + }, + { + "epoch": 6.16, + "learning_rate": 9.743354262330928e-05, + "loss": 0.1251, + "step": 21900 + }, + { + "epoch": 6.17, + "learning_rate": 9.741480023740356e-05, + "loss": 0.1047, + "step": 21930 + }, + { + "epoch": 6.17, + "learning_rate": 9.739605785149783e-05, + "loss": 0.1153, + "step": 21960 + }, + { + "epoch": 6.18, + "learning_rate": 9.737731546559211e-05, + "loss": 0.1176, + "step": 21990 + }, + { + "epoch": 6.19, + "learning_rate": 9.735857307968638e-05, + "loss": 0.1144, + "step": 22020 + }, + { + "epoch": 6.2, + "learning_rate": 9.733983069378066e-05, + "loss": 0.1197, + "step": 22050 + }, + { + "epoch": 6.21, + "learning_rate": 9.732108830787493e-05, + "loss": 0.1081, + "step": 22080 + }, + { + "epoch": 6.22, + "learning_rate": 9.730234592196921e-05, + "loss": 0.1182, + "step": 22110 + }, + { + "epoch": 6.22, + "learning_rate": 9.728360353606349e-05, + "loss": 0.1163, + "step": 22140 + }, + { + "epoch": 6.23, + "learning_rate": 9.726486115015774e-05, + "loss": 0.1116, + "step": 22170 + }, + { + "epoch": 6.24, + "learning_rate": 9.724611876425202e-05, + "loss": 0.128, + "step": 22200 + }, + { + "epoch": 6.25, + "learning_rate": 9.72273763783463e-05, + "loss": 0.1085, + "step": 22230 + }, + { + "epoch": 6.26, + "learning_rate": 9.720863399244057e-05, + "loss": 0.1119, + "step": 22260 + }, + { + "epoch": 6.27, + "learning_rate": 9.718989160653485e-05, + "loss": 0.1225, + "step": 22290 + }, + { + "epoch": 6.27, + "learning_rate": 9.717114922062912e-05, + "loss": 0.1034, + "step": 22320 + }, + { + "epoch": 6.28, + "learning_rate": 9.71524068347234e-05, + "loss": 0.1188, + "step": 22350 + }, + { + "epoch": 6.29, + "learning_rate": 9.713366444881767e-05, + "loss": 0.104, + "step": 22380 + }, + { + "epoch": 6.3, + "learning_rate": 9.711492206291195e-05, + "loss": 0.1139, + "step": 22410 + }, + { + "epoch": 6.31, + "learning_rate": 9.709617967700622e-05, + "loss": 0.1144, + "step": 22440 + }, + { + "epoch": 6.32, + "learning_rate": 9.70774372911005e-05, + "loss": 0.106, + "step": 22470 + }, + { + "epoch": 6.33, + "learning_rate": 9.705869490519477e-05, + "loss": 0.1213, + "step": 22500 + }, + { + "epoch": 6.33, + "learning_rate": 9.703995251928905e-05, + "loss": 0.1006, + "step": 22530 + }, + { + "epoch": 6.34, + "learning_rate": 9.702121013338333e-05, + "loss": 0.1111, + "step": 22560 + }, + { + "epoch": 6.35, + "learning_rate": 9.700246774747758e-05, + "loss": 0.1114, + "step": 22590 + }, + { + "epoch": 6.36, + "learning_rate": 9.698372536157186e-05, + "loss": 0.1058, + "step": 22620 + }, + { + "epoch": 6.37, + "learning_rate": 9.696498297566614e-05, + "loss": 0.1228, + "step": 22650 + }, + { + "epoch": 6.38, + "learning_rate": 9.694624058976041e-05, + "loss": 0.1041, + "step": 22680 + }, + { + "epoch": 6.38, + "learning_rate": 9.692749820385469e-05, + "loss": 0.1129, + "step": 22710 + }, + { + "epoch": 6.39, + "learning_rate": 9.690875581794896e-05, + "loss": 0.1166, + "step": 22740 + }, + { + "epoch": 6.4, + "learning_rate": 9.689001343204324e-05, + "loss": 0.1027, + "step": 22770 + }, + { + "epoch": 6.41, + "learning_rate": 9.687127104613751e-05, + "loss": 0.1201, + "step": 22800 + }, + { + "epoch": 6.42, + "learning_rate": 9.685252866023179e-05, + "loss": 0.1033, + "step": 22830 + }, + { + "epoch": 6.43, + "learning_rate": 9.683378627432606e-05, + "loss": 0.1159, + "step": 22860 + }, + { + "epoch": 6.44, + "learning_rate": 9.681504388842034e-05, + "loss": 0.1184, + "step": 22890 + }, + { + "epoch": 6.44, + "learning_rate": 9.67963015025146e-05, + "loss": 0.1047, + "step": 22920 + }, + { + "epoch": 6.45, + "learning_rate": 9.677755911660889e-05, + "loss": 0.1189, + "step": 22950 + }, + { + "epoch": 6.46, + "learning_rate": 9.675881673070317e-05, + "loss": 0.1022, + "step": 22980 + }, + { + "epoch": 6.47, + "learning_rate": 9.674007434479742e-05, + "loss": 0.1202, + "step": 23010 + }, + { + "epoch": 6.48, + "learning_rate": 9.67213319588917e-05, + "loss": 0.12, + "step": 23040 + }, + { + "epoch": 6.49, + "learning_rate": 9.670258957298598e-05, + "loss": 0.1041, + "step": 23070 + }, + { + "epoch": 6.49, + "learning_rate": 9.668384718708025e-05, + "loss": 0.1231, + "step": 23100 + }, + { + "epoch": 6.5, + "learning_rate": 9.666510480117452e-05, + "loss": 0.103, + "step": 23130 + }, + { + "epoch": 6.51, + "learning_rate": 9.66463624152688e-05, + "loss": 0.1197, + "step": 23160 + }, + { + "epoch": 6.52, + "learning_rate": 9.662762002936308e-05, + "loss": 0.1136, + "step": 23190 + }, + { + "epoch": 6.53, + "learning_rate": 9.660887764345735e-05, + "loss": 0.105, + "step": 23220 + }, + { + "epoch": 6.54, + "learning_rate": 9.659013525755163e-05, + "loss": 0.1207, + "step": 23250 + }, + { + "epoch": 6.54, + "learning_rate": 9.65713928716459e-05, + "loss": 0.1041, + "step": 23280 + }, + { + "epoch": 6.55, + "learning_rate": 9.655265048574018e-05, + "loss": 0.1146, + "step": 23310 + }, + { + "epoch": 6.56, + "learning_rate": 9.653390809983444e-05, + "loss": 0.1191, + "step": 23340 + }, + { + "epoch": 6.57, + "learning_rate": 9.651516571392872e-05, + "loss": 0.1014, + "step": 23370 + }, + { + "epoch": 6.58, + "learning_rate": 9.6496423328023e-05, + "loss": 0.1168, + "step": 23400 + }, + { + "epoch": 6.59, + "learning_rate": 9.647768094211726e-05, + "loss": 0.1076, + "step": 23430 + }, + { + "epoch": 6.6, + "learning_rate": 9.645893855621154e-05, + "loss": 0.1125, + "step": 23460 + }, + { + "epoch": 6.6, + "learning_rate": 9.644019617030582e-05, + "loss": 0.1171, + "step": 23490 + }, + { + "epoch": 6.61, + "learning_rate": 9.64214537844001e-05, + "loss": 0.1105, + "step": 23520 + }, + { + "epoch": 6.62, + "learning_rate": 9.640271139849436e-05, + "loss": 0.1239, + "step": 23550 + }, + { + "epoch": 6.63, + "learning_rate": 9.638396901258864e-05, + "loss": 0.1027, + "step": 23580 + }, + { + "epoch": 6.64, + "learning_rate": 9.636522662668292e-05, + "loss": 0.117, + "step": 23610 + }, + { + "epoch": 6.65, + "learning_rate": 9.634648424077719e-05, + "loss": 0.1105, + "step": 23640 + }, + { + "epoch": 6.65, + "learning_rate": 9.632774185487147e-05, + "loss": 0.1073, + "step": 23670 + }, + { + "epoch": 6.66, + "learning_rate": 9.630899946896573e-05, + "loss": 0.1228, + "step": 23700 + }, + { + "epoch": 6.67, + "learning_rate": 9.629025708306001e-05, + "loss": 0.1066, + "step": 23730 + }, + { + "epoch": 6.68, + "learning_rate": 9.627213944335114e-05, + "loss": 0.1145, + "step": 23760 + }, + { + "epoch": 6.69, + "learning_rate": 9.625339705744541e-05, + "loss": 0.1163, + "step": 23790 + }, + { + "epoch": 6.7, + "learning_rate": 9.623527941773655e-05, + "loss": 0.1052, + "step": 23820 + }, + { + "epoch": 6.7, + "learning_rate": 9.621653703183082e-05, + "loss": 0.1171, + "step": 23850 + }, + { + "epoch": 6.71, + "learning_rate": 9.61977946459251e-05, + "loss": 0.1045, + "step": 23880 + }, + { + "epoch": 6.72, + "learning_rate": 9.617905226001938e-05, + "loss": 0.1056, + "step": 23910 + }, + { + "epoch": 6.73, + "learning_rate": 9.616030987411365e-05, + "loss": 0.115, + "step": 23940 + }, + { + "epoch": 6.74, + "learning_rate": 9.614156748820791e-05, + "loss": 0.1036, + "step": 23970 + }, + { + "epoch": 6.75, + "learning_rate": 9.61228251023022e-05, + "loss": 0.1216, + "step": 24000 + }, + { + "epoch": 6.76, + "learning_rate": 9.610408271639648e-05, + "loss": 0.1045, + "step": 24030 + }, + { + "epoch": 6.76, + "learning_rate": 9.608534033049074e-05, + "loss": 0.1125, + "step": 24060 + }, + { + "epoch": 6.77, + "learning_rate": 9.606659794458501e-05, + "loss": 0.1166, + "step": 24090 + }, + { + "epoch": 6.78, + "learning_rate": 9.604785555867929e-05, + "loss": 0.1079, + "step": 24120 + }, + { + "epoch": 6.79, + "learning_rate": 9.602911317277356e-05, + "loss": 0.123, + "step": 24150 + }, + { + "epoch": 6.8, + "learning_rate": 9.601037078686784e-05, + "loss": 0.104, + "step": 24180 + }, + { + "epoch": 6.81, + "learning_rate": 9.599162840096212e-05, + "loss": 0.1192, + "step": 24210 + }, + { + "epoch": 6.81, + "learning_rate": 9.597288601505639e-05, + "loss": 0.1106, + "step": 24240 + }, + { + "epoch": 6.82, + "learning_rate": 9.595414362915066e-05, + "loss": 0.11, + "step": 24270 + }, + { + "epoch": 6.83, + "learning_rate": 9.593540124324494e-05, + "loss": 0.1188, + "step": 24300 + }, + { + "epoch": 6.84, + "learning_rate": 9.591665885733922e-05, + "loss": 0.1059, + "step": 24330 + }, + { + "epoch": 6.85, + "learning_rate": 9.589791647143349e-05, + "loss": 0.1184, + "step": 24360 + }, + { + "epoch": 6.86, + "learning_rate": 9.587917408552775e-05, + "loss": 0.1098, + "step": 24390 + }, + { + "epoch": 6.87, + "learning_rate": 9.586043169962203e-05, + "loss": 0.1039, + "step": 24420 + }, + { + "epoch": 6.87, + "learning_rate": 9.584168931371632e-05, + "loss": 0.1155, + "step": 24450 + }, + { + "epoch": 6.88, + "learning_rate": 9.582294692781058e-05, + "loss": 0.1036, + "step": 24480 + }, + { + "epoch": 6.89, + "learning_rate": 9.580420454190485e-05, + "loss": 0.1124, + "step": 24510 + }, + { + "epoch": 6.9, + "learning_rate": 9.578546215599913e-05, + "loss": 0.1142, + "step": 24540 + }, + { + "epoch": 6.91, + "learning_rate": 9.57667197700934e-05, + "loss": 0.1034, + "step": 24570 + }, + { + "epoch": 6.92, + "learning_rate": 9.574797738418768e-05, + "loss": 0.1178, + "step": 24600 + }, + { + "epoch": 6.92, + "learning_rate": 9.572923499828196e-05, + "loss": 0.105, + "step": 24630 + }, + { + "epoch": 6.93, + "learning_rate": 9.571049261237623e-05, + "loss": 0.1113, + "step": 24660 + }, + { + "epoch": 6.94, + "learning_rate": 9.56917502264705e-05, + "loss": 0.1224, + "step": 24690 + }, + { + "epoch": 6.95, + "learning_rate": 9.567300784056478e-05, + "loss": 0.1039, + "step": 24720 + }, + { + "epoch": 6.96, + "learning_rate": 9.565426545465906e-05, + "loss": 0.1194, + "step": 24750 + }, + { + "epoch": 6.97, + "learning_rate": 9.563552306875332e-05, + "loss": 0.104, + "step": 24780 + }, + { + "epoch": 6.97, + "learning_rate": 9.561678068284759e-05, + "loss": 0.1157, + "step": 24810 + }, + { + "epoch": 6.98, + "learning_rate": 9.559803829694187e-05, + "loss": 0.1143, + "step": 24840 + }, + { + "epoch": 6.99, + "learning_rate": 9.557929591103615e-05, + "loss": 0.104, + "step": 24870 + }, + { + "epoch": 7.0, + "eval_loss": 0.11984840035438538, + "eval_runtime": 626.0548, + "eval_samples_per_second": 25.61, + "eval_steps_per_second": 0.802, + "eval_wer": 0.1232309309022423, + "step": 24899 + }, + { + "epoch": 7.0, + "learning_rate": 9.556055352513042e-05, + "loss": 0.1258, + "step": 24900 + }, + { + "epoch": 7.01, + "learning_rate": 9.554181113922469e-05, + "loss": 0.0959, + "step": 24930 + }, + { + "epoch": 7.02, + "learning_rate": 9.552306875331897e-05, + "loss": 0.1123, + "step": 24960 + }, + { + "epoch": 7.03, + "learning_rate": 9.550432636741324e-05, + "loss": 0.1, + "step": 24990 + }, + { + "epoch": 7.03, + "learning_rate": 9.548558398150752e-05, + "loss": 0.1059, + "step": 25020 + }, + { + "epoch": 7.04, + "learning_rate": 9.546684159560179e-05, + "loss": 0.1174, + "step": 25050 + }, + { + "epoch": 7.05, + "learning_rate": 9.544809920969607e-05, + "loss": 0.0959, + "step": 25080 + }, + { + "epoch": 7.06, + "learning_rate": 9.542935682379033e-05, + "loss": 0.1112, + "step": 25110 + }, + { + "epoch": 7.07, + "learning_rate": 9.541061443788461e-05, + "loss": 0.1046, + "step": 25140 + }, + { + "epoch": 7.08, + "learning_rate": 9.53918720519789e-05, + "loss": 0.11, + "step": 25170 + }, + { + "epoch": 7.08, + "learning_rate": 9.537312966607316e-05, + "loss": 0.117, + "step": 25200 + }, + { + "epoch": 7.09, + "learning_rate": 9.535438728016743e-05, + "loss": 0.0927, + "step": 25230 + }, + { + "epoch": 7.1, + "learning_rate": 9.533564489426171e-05, + "loss": 0.1123, + "step": 25260 + }, + { + "epoch": 7.11, + "learning_rate": 9.531690250835599e-05, + "loss": 0.0996, + "step": 25290 + }, + { + "epoch": 7.12, + "learning_rate": 9.529816012245026e-05, + "loss": 0.1092, + "step": 25320 + }, + { + "epoch": 7.13, + "learning_rate": 9.527941773654453e-05, + "loss": 0.1121, + "step": 25350 + }, + { + "epoch": 7.14, + "learning_rate": 9.526067535063881e-05, + "loss": 0.0937, + "step": 25380 + }, + { + "epoch": 7.14, + "learning_rate": 9.524193296473309e-05, + "loss": 0.1096, + "step": 25410 + }, + { + "epoch": 7.15, + "learning_rate": 9.522319057882736e-05, + "loss": 0.1018, + "step": 25440 + }, + { + "epoch": 7.16, + "learning_rate": 9.520444819292162e-05, + "loss": 0.1078, + "step": 25470 + }, + { + "epoch": 7.17, + "learning_rate": 9.51857058070159e-05, + "loss": 0.115, + "step": 25500 + }, + { + "epoch": 7.18, + "learning_rate": 9.516696342111017e-05, + "loss": 0.0936, + "step": 25530 + }, + { + "epoch": 7.19, + "learning_rate": 9.514822103520445e-05, + "loss": 0.1174, + "step": 25560 + }, + { + "epoch": 7.19, + "learning_rate": 9.512947864929873e-05, + "loss": 0.1086, + "step": 25590 + }, + { + "epoch": 7.2, + "learning_rate": 9.5110736263393e-05, + "loss": 0.1098, + "step": 25620 + }, + { + "epoch": 7.21, + "learning_rate": 9.509199387748727e-05, + "loss": 0.1126, + "step": 25650 + }, + { + "epoch": 7.22, + "learning_rate": 9.507325149158155e-05, + "loss": 0.0935, + "step": 25680 + }, + { + "epoch": 7.23, + "learning_rate": 9.505450910567583e-05, + "loss": 0.1122, + "step": 25710 + }, + { + "epoch": 7.24, + "learning_rate": 9.50357667197701e-05, + "loss": 0.1018, + "step": 25740 + }, + { + "epoch": 7.24, + "learning_rate": 9.501702433386437e-05, + "loss": 0.1102, + "step": 25770 + }, + { + "epoch": 7.25, + "learning_rate": 9.499828194795865e-05, + "loss": 0.1164, + "step": 25800 + }, + { + "epoch": 7.26, + "learning_rate": 9.497953956205293e-05, + "loss": 0.092, + "step": 25830 + }, + { + "epoch": 7.27, + "learning_rate": 9.49607971761472e-05, + "loss": 0.1108, + "step": 25860 + }, + { + "epoch": 7.28, + "learning_rate": 9.494205479024146e-05, + "loss": 0.0969, + "step": 25890 + }, + { + "epoch": 7.29, + "learning_rate": 9.492331240433574e-05, + "loss": 0.1029, + "step": 25920 + }, + { + "epoch": 7.3, + "learning_rate": 9.490457001843001e-05, + "loss": 0.1139, + "step": 25950 + }, + { + "epoch": 7.3, + "learning_rate": 9.488582763252429e-05, + "loss": 0.0978, + "step": 25980 + }, + { + "epoch": 7.31, + "learning_rate": 9.486708524661857e-05, + "loss": 0.1136, + "step": 26010 + }, + { + "epoch": 7.32, + "learning_rate": 9.484834286071284e-05, + "loss": 0.0996, + "step": 26040 + }, + { + "epoch": 7.33, + "learning_rate": 9.482960047480711e-05, + "loss": 0.1053, + "step": 26070 + }, + { + "epoch": 7.34, + "learning_rate": 9.481085808890139e-05, + "loss": 0.1142, + "step": 26100 + }, + { + "epoch": 7.35, + "learning_rate": 9.479211570299567e-05, + "loss": 0.0979, + "step": 26130 + }, + { + "epoch": 7.35, + "learning_rate": 9.477337331708994e-05, + "loss": 0.1102, + "step": 26160 + }, + { + "epoch": 7.36, + "learning_rate": 9.47546309311842e-05, + "loss": 0.1011, + "step": 26190 + }, + { + "epoch": 7.37, + "learning_rate": 9.473588854527849e-05, + "loss": 0.1068, + "step": 26220 + }, + { + "epoch": 7.38, + "learning_rate": 9.471714615937277e-05, + "loss": 0.1188, + "step": 26250 + }, + { + "epoch": 7.39, + "learning_rate": 9.469840377346703e-05, + "loss": 0.0927, + "step": 26280 + }, + { + "epoch": 7.4, + "learning_rate": 9.46796613875613e-05, + "loss": 0.1174, + "step": 26310 + }, + { + "epoch": 7.41, + "learning_rate": 9.466091900165558e-05, + "loss": 0.0982, + "step": 26340 + }, + { + "epoch": 7.41, + "learning_rate": 9.464217661574985e-05, + "loss": 0.1112, + "step": 26370 + }, + { + "epoch": 7.42, + "learning_rate": 9.462405897604099e-05, + "loss": 0.1149, + "step": 26400 + }, + { + "epoch": 7.43, + "learning_rate": 9.460531659013526e-05, + "loss": 0.0922, + "step": 26430 + }, + { + "epoch": 7.44, + "learning_rate": 9.458657420422954e-05, + "loss": 0.1148, + "step": 26460 + }, + { + "epoch": 7.45, + "learning_rate": 9.456783181832382e-05, + "loss": 0.1004, + "step": 26490 + }, + { + "epoch": 7.46, + "learning_rate": 9.454908943241809e-05, + "loss": 0.1057, + "step": 26520 + }, + { + "epoch": 7.46, + "learning_rate": 9.453034704651235e-05, + "loss": 0.1195, + "step": 26550 + }, + { + "epoch": 7.47, + "learning_rate": 9.451160466060664e-05, + "loss": 0.095, + "step": 26580 + }, + { + "epoch": 7.48, + "learning_rate": 9.449286227470092e-05, + "loss": 0.1192, + "step": 26610 + }, + { + "epoch": 7.49, + "learning_rate": 9.447411988879517e-05, + "loss": 0.1084, + "step": 26640 + }, + { + "epoch": 7.5, + "learning_rate": 9.445537750288945e-05, + "loss": 0.1083, + "step": 26670 + }, + { + "epoch": 7.51, + "learning_rate": 9.443663511698373e-05, + "loss": 0.1119, + "step": 26700 + }, + { + "epoch": 7.51, + "learning_rate": 9.4417892731078e-05, + "loss": 0.096, + "step": 26730 + }, + { + "epoch": 7.52, + "learning_rate": 9.439915034517228e-05, + "loss": 0.1226, + "step": 26760 + }, + { + "epoch": 7.53, + "learning_rate": 9.438040795926655e-05, + "loss": 0.099, + "step": 26790 + }, + { + "epoch": 7.54, + "learning_rate": 9.436166557336083e-05, + "loss": 0.1103, + "step": 26820 + }, + { + "epoch": 7.55, + "learning_rate": 9.43429231874551e-05, + "loss": 0.1186, + "step": 26850 + }, + { + "epoch": 7.56, + "learning_rate": 9.432418080154938e-05, + "loss": 0.0976, + "step": 26880 + }, + { + "epoch": 7.57, + "learning_rate": 9.430543841564366e-05, + "loss": 0.1112, + "step": 26910 + }, + { + "epoch": 7.57, + "learning_rate": 9.428669602973793e-05, + "loss": 0.1035, + "step": 26940 + }, + { + "epoch": 7.58, + "learning_rate": 9.42679536438322e-05, + "loss": 0.1073, + "step": 26970 + }, + { + "epoch": 7.59, + "learning_rate": 9.424921125792647e-05, + "loss": 0.1147, + "step": 27000 + }, + { + "epoch": 7.6, + "learning_rate": 9.423046887202076e-05, + "loss": 0.0989, + "step": 27030 + }, + { + "epoch": 7.61, + "learning_rate": 9.421172648611501e-05, + "loss": 0.1166, + "step": 27060 + }, + { + "epoch": 7.62, + "learning_rate": 9.419298410020929e-05, + "loss": 0.0969, + "step": 27090 + }, + { + "epoch": 7.62, + "learning_rate": 9.417424171430357e-05, + "loss": 0.1039, + "step": 27120 + }, + { + "epoch": 7.63, + "learning_rate": 9.415549932839784e-05, + "loss": 0.1216, + "step": 27150 + }, + { + "epoch": 7.64, + "learning_rate": 9.413675694249212e-05, + "loss": 0.0946, + "step": 27180 + }, + { + "epoch": 7.65, + "learning_rate": 9.411801455658639e-05, + "loss": 0.1187, + "step": 27210 + }, + { + "epoch": 7.66, + "learning_rate": 9.409927217068067e-05, + "loss": 0.1028, + "step": 27240 + }, + { + "epoch": 7.67, + "learning_rate": 9.408052978477494e-05, + "loss": 0.1044, + "step": 27270 + }, + { + "epoch": 7.67, + "learning_rate": 9.406178739886922e-05, + "loss": 0.1126, + "step": 27300 + }, + { + "epoch": 7.68, + "learning_rate": 9.40430450129635e-05, + "loss": 0.0944, + "step": 27330 + }, + { + "epoch": 7.69, + "learning_rate": 9.402430262705776e-05, + "loss": 0.1097, + "step": 27360 + }, + { + "epoch": 7.7, + "learning_rate": 9.400556024115203e-05, + "loss": 0.1006, + "step": 27390 + }, + { + "epoch": 7.71, + "learning_rate": 9.398681785524631e-05, + "loss": 0.1033, + "step": 27420 + }, + { + "epoch": 7.72, + "learning_rate": 9.39680754693406e-05, + "loss": 0.1064, + "step": 27450 + }, + { + "epoch": 7.73, + "learning_rate": 9.394933308343485e-05, + "loss": 0.0932, + "step": 27480 + }, + { + "epoch": 7.73, + "learning_rate": 9.393059069752913e-05, + "loss": 0.1108, + "step": 27510 + }, + { + "epoch": 7.74, + "learning_rate": 9.391184831162341e-05, + "loss": 0.0994, + "step": 27540 + }, + { + "epoch": 7.75, + "learning_rate": 9.389310592571768e-05, + "loss": 0.1026, + "step": 27570 + }, + { + "epoch": 7.76, + "learning_rate": 9.387436353981196e-05, + "loss": 0.1104, + "step": 27600 + }, + { + "epoch": 7.77, + "learning_rate": 9.385562115390623e-05, + "loss": 0.0941, + "step": 27630 + }, + { + "epoch": 7.78, + "learning_rate": 9.383687876800051e-05, + "loss": 0.1146, + "step": 27660 + }, + { + "epoch": 7.78, + "learning_rate": 9.381813638209477e-05, + "loss": 0.106, + "step": 27690 + }, + { + "epoch": 7.79, + "learning_rate": 9.379939399618906e-05, + "loss": 0.1102, + "step": 27720 + }, + { + "epoch": 7.8, + "learning_rate": 9.378065161028334e-05, + "loss": 0.108, + "step": 27750 + }, + { + "epoch": 7.81, + "learning_rate": 9.37619092243776e-05, + "loss": 0.0949, + "step": 27780 + }, + { + "epoch": 7.82, + "learning_rate": 9.374316683847187e-05, + "loss": 0.1134, + "step": 27810 + }, + { + "epoch": 7.83, + "learning_rate": 9.372442445256615e-05, + "loss": 0.0981, + "step": 27840 + }, + { + "epoch": 7.84, + "learning_rate": 9.370568206666043e-05, + "loss": 0.1079, + "step": 27870 + }, + { + "epoch": 7.84, + "learning_rate": 9.368693968075469e-05, + "loss": 0.1165, + "step": 27900 + }, + { + "epoch": 7.85, + "learning_rate": 9.366819729484897e-05, + "loss": 0.0959, + "step": 27930 + }, + { + "epoch": 7.86, + "learning_rate": 9.364945490894325e-05, + "loss": 0.1193, + "step": 27960 + }, + { + "epoch": 7.87, + "learning_rate": 9.363071252303752e-05, + "loss": 0.1038, + "step": 27990 + }, + { + "epoch": 7.88, + "learning_rate": 9.36119701371318e-05, + "loss": 0.1072, + "step": 28020 + }, + { + "epoch": 7.89, + "learning_rate": 9.359322775122606e-05, + "loss": 0.1191, + "step": 28050 + }, + { + "epoch": 7.89, + "learning_rate": 9.357448536532035e-05, + "loss": 0.0997, + "step": 28080 + }, + { + "epoch": 7.9, + "learning_rate": 9.355574297941461e-05, + "loss": 0.1102, + "step": 28110 + }, + { + "epoch": 7.91, + "learning_rate": 9.35370005935089e-05, + "loss": 0.1058, + "step": 28140 + }, + { + "epoch": 7.92, + "learning_rate": 9.351825820760317e-05, + "loss": 0.0983, + "step": 28170 + }, + { + "epoch": 7.93, + "learning_rate": 9.349951582169744e-05, + "loss": 0.1127, + "step": 28200 + }, + { + "epoch": 7.94, + "learning_rate": 9.348077343579171e-05, + "loss": 0.0877, + "step": 28230 + }, + { + "epoch": 7.94, + "learning_rate": 9.346203104988599e-05, + "loss": 0.1073, + "step": 28260 + }, + { + "epoch": 7.95, + "learning_rate": 9.344328866398027e-05, + "loss": 0.0968, + "step": 28290 + }, + { + "epoch": 7.96, + "learning_rate": 9.342454627807453e-05, + "loss": 0.1089, + "step": 28320 + }, + { + "epoch": 7.97, + "learning_rate": 9.34058038921688e-05, + "loss": 0.1091, + "step": 28350 + }, + { + "epoch": 7.98, + "learning_rate": 9.338706150626309e-05, + "loss": 0.09, + "step": 28380 + }, + { + "epoch": 7.99, + "learning_rate": 9.336831912035735e-05, + "loss": 0.1115, + "step": 28410 + }, + { + "epoch": 8.0, + "learning_rate": 9.334957673445164e-05, + "loss": 0.1016, + "step": 28440 + }, + { + "epoch": 8.0, + "eval_loss": 0.11488943547010422, + "eval_runtime": 627.1988, + "eval_samples_per_second": 25.563, + "eval_steps_per_second": 0.8, + "eval_wer": 0.11741023296439343, + "step": 28456 + }, + { + "epoch": 8.0, + "learning_rate": 9.33308343485459e-05, + "loss": 0.1083, + "step": 28470 + }, + { + "epoch": 8.01, + "learning_rate": 9.331209196264018e-05, + "loss": 0.0995, + "step": 28500 + }, + { + "epoch": 8.02, + "learning_rate": 9.329334957673445e-05, + "loss": 0.1002, + "step": 28530 + }, + { + "epoch": 8.03, + "learning_rate": 9.327523193702559e-05, + "loss": 0.1104, + "step": 28560 + }, + { + "epoch": 8.04, + "learning_rate": 9.325648955111986e-05, + "loss": 0.0921, + "step": 28590 + }, + { + "epoch": 8.05, + "learning_rate": 9.323774716521414e-05, + "loss": 0.1051, + "step": 28620 + }, + { + "epoch": 8.05, + "learning_rate": 9.321900477930841e-05, + "loss": 0.0953, + "step": 28650 + }, + { + "epoch": 8.06, + "learning_rate": 9.320026239340268e-05, + "loss": 0.1033, + "step": 28680 + }, + { + "epoch": 8.07, + "learning_rate": 9.318214475369382e-05, + "loss": 0.1058, + "step": 28710 + }, + { + "epoch": 8.08, + "learning_rate": 9.316340236778808e-05, + "loss": 0.092, + "step": 28740 + }, + { + "epoch": 8.09, + "learning_rate": 9.314465998188237e-05, + "loss": 0.1034, + "step": 28770 + }, + { + "epoch": 8.1, + "learning_rate": 9.312591759597665e-05, + "loss": 0.098, + "step": 28800 + }, + { + "epoch": 8.11, + "learning_rate": 9.310717521007091e-05, + "loss": 0.1031, + "step": 28830 + }, + { + "epoch": 8.11, + "learning_rate": 9.308843282416518e-05, + "loss": 0.1135, + "step": 28860 + }, + { + "epoch": 8.12, + "learning_rate": 9.306969043825946e-05, + "loss": 0.0926, + "step": 28890 + }, + { + "epoch": 8.13, + "learning_rate": 9.305094805235374e-05, + "loss": 0.1015, + "step": 28920 + }, + { + "epoch": 8.14, + "learning_rate": 9.303220566644801e-05, + "loss": 0.0998, + "step": 28950 + }, + { + "epoch": 8.15, + "learning_rate": 9.301346328054228e-05, + "loss": 0.0955, + "step": 28980 + }, + { + "epoch": 8.16, + "learning_rate": 9.299472089463656e-05, + "loss": 0.108, + "step": 29010 + }, + { + "epoch": 8.16, + "learning_rate": 9.297597850873083e-05, + "loss": 0.0934, + "step": 29040 + }, + { + "epoch": 8.17, + "learning_rate": 9.295723612282511e-05, + "loss": 0.1025, + "step": 29070 + }, + { + "epoch": 8.18, + "learning_rate": 9.293849373691939e-05, + "loss": 0.097, + "step": 29100 + }, + { + "epoch": 8.19, + "learning_rate": 9.291975135101366e-05, + "loss": 0.1069, + "step": 29130 + }, + { + "epoch": 8.2, + "learning_rate": 9.290100896510792e-05, + "loss": 0.1104, + "step": 29160 + }, + { + "epoch": 8.21, + "learning_rate": 9.28822665792022e-05, + "loss": 0.0895, + "step": 29190 + }, + { + "epoch": 8.21, + "learning_rate": 9.286352419329648e-05, + "loss": 0.1026, + "step": 29220 + }, + { + "epoch": 8.22, + "learning_rate": 9.284478180739075e-05, + "loss": 0.0924, + "step": 29250 + }, + { + "epoch": 8.23, + "learning_rate": 9.282603942148502e-05, + "loss": 0.0973, + "step": 29280 + }, + { + "epoch": 8.24, + "learning_rate": 9.28072970355793e-05, + "loss": 0.1098, + "step": 29310 + }, + { + "epoch": 8.25, + "learning_rate": 9.278855464967358e-05, + "loss": 0.0942, + "step": 29340 + }, + { + "epoch": 8.26, + "learning_rate": 9.276981226376785e-05, + "loss": 0.1048, + "step": 29370 + }, + { + "epoch": 8.27, + "learning_rate": 9.275106987786212e-05, + "loss": 0.0945, + "step": 29400 + }, + { + "epoch": 8.27, + "learning_rate": 9.27323274919564e-05, + "loss": 0.0995, + "step": 29430 + }, + { + "epoch": 8.28, + "learning_rate": 9.271358510605066e-05, + "loss": 0.1078, + "step": 29460 + }, + { + "epoch": 8.29, + "learning_rate": 9.269484272014495e-05, + "loss": 0.0921, + "step": 29490 + }, + { + "epoch": 8.3, + "learning_rate": 9.267610033423923e-05, + "loss": 0.1061, + "step": 29520 + }, + { + "epoch": 8.31, + "learning_rate": 9.26573579483335e-05, + "loss": 0.1074, + "step": 29550 + }, + { + "epoch": 8.32, + "learning_rate": 9.263861556242776e-05, + "loss": 0.1011, + "step": 29580 + }, + { + "epoch": 8.32, + "learning_rate": 9.261987317652204e-05, + "loss": 0.1112, + "step": 29610 + }, + { + "epoch": 8.33, + "learning_rate": 9.260113079061632e-05, + "loss": 0.0914, + "step": 29640 + }, + { + "epoch": 8.34, + "learning_rate": 9.258238840471059e-05, + "loss": 0.1067, + "step": 29670 + }, + { + "epoch": 8.35, + "learning_rate": 9.256364601880486e-05, + "loss": 0.0999, + "step": 29700 + }, + { + "epoch": 8.36, + "learning_rate": 9.254490363289914e-05, + "loss": 0.1004, + "step": 29730 + }, + { + "epoch": 8.37, + "learning_rate": 9.252616124699342e-05, + "loss": 0.1104, + "step": 29760 + }, + { + "epoch": 8.37, + "learning_rate": 9.250741886108769e-05, + "loss": 0.0894, + "step": 29790 + }, + { + "epoch": 8.38, + "learning_rate": 9.248867647518196e-05, + "loss": 0.1061, + "step": 29820 + }, + { + "epoch": 8.39, + "learning_rate": 9.246993408927624e-05, + "loss": 0.0998, + "step": 29850 + }, + { + "epoch": 8.4, + "learning_rate": 9.24511917033705e-05, + "loss": 0.1022, + "step": 29880 + }, + { + "epoch": 8.41, + "learning_rate": 9.243244931746478e-05, + "loss": 0.1088, + "step": 29910 + }, + { + "epoch": 8.42, + "learning_rate": 9.241370693155907e-05, + "loss": 0.0886, + "step": 29940 + }, + { + "epoch": 8.43, + "learning_rate": 9.239496454565333e-05, + "loss": 0.1035, + "step": 29970 + }, + { + "epoch": 8.43, + "learning_rate": 9.23762221597476e-05, + "loss": 0.1044, + "step": 30000 + }, + { + "epoch": 8.44, + "learning_rate": 9.235747977384188e-05, + "loss": 0.1073, + "step": 30030 + }, + { + "epoch": 8.45, + "learning_rate": 9.233873738793616e-05, + "loss": 0.108, + "step": 30060 + }, + { + "epoch": 8.46, + "learning_rate": 9.231999500203043e-05, + "loss": 0.0909, + "step": 30090 + }, + { + "epoch": 8.47, + "learning_rate": 9.23012526161247e-05, + "loss": 0.105, + "step": 30120 + }, + { + "epoch": 8.48, + "learning_rate": 9.228251023021898e-05, + "loss": 0.1061, + "step": 30150 + }, + { + "epoch": 8.48, + "learning_rate": 9.226376784431326e-05, + "loss": 0.0993, + "step": 30180 + }, + { + "epoch": 8.49, + "learning_rate": 9.224502545840753e-05, + "loss": 0.1154, + "step": 30210 + }, + { + "epoch": 8.5, + "learning_rate": 9.22262830725018e-05, + "loss": 0.0923, + "step": 30240 + }, + { + "epoch": 8.51, + "learning_rate": 9.220754068659607e-05, + "loss": 0.1011, + "step": 30270 + }, + { + "epoch": 8.52, + "learning_rate": 9.218879830069036e-05, + "loss": 0.0979, + "step": 30300 + }, + { + "epoch": 8.53, + "learning_rate": 9.217005591478462e-05, + "loss": 0.1008, + "step": 30330 + }, + { + "epoch": 8.54, + "learning_rate": 9.21513135288789e-05, + "loss": 0.1122, + "step": 30360 + }, + { + "epoch": 8.54, + "learning_rate": 9.213257114297317e-05, + "loss": 0.0901, + "step": 30390 + }, + { + "epoch": 8.55, + "learning_rate": 9.211382875706744e-05, + "loss": 0.105, + "step": 30420 + }, + { + "epoch": 8.56, + "learning_rate": 9.209508637116172e-05, + "loss": 0.1004, + "step": 30450 + }, + { + "epoch": 8.57, + "learning_rate": 9.2076343985256e-05, + "loss": 0.1007, + "step": 30480 + }, + { + "epoch": 8.58, + "learning_rate": 9.205760159935027e-05, + "loss": 0.1087, + "step": 30510 + }, + { + "epoch": 8.59, + "learning_rate": 9.203885921344454e-05, + "loss": 0.089, + "step": 30540 + }, + { + "epoch": 8.59, + "learning_rate": 9.202011682753882e-05, + "loss": 0.1043, + "step": 30570 + }, + { + "epoch": 8.6, + "learning_rate": 9.20013744416331e-05, + "loss": 0.0993, + "step": 30600 + }, + { + "epoch": 8.61, + "learning_rate": 9.198263205572736e-05, + "loss": 0.1034, + "step": 30630 + }, + { + "epoch": 8.62, + "learning_rate": 9.196388966982163e-05, + "loss": 0.1131, + "step": 30660 + }, + { + "epoch": 8.63, + "learning_rate": 9.194514728391591e-05, + "loss": 0.0932, + "step": 30690 + }, + { + "epoch": 8.64, + "learning_rate": 9.19264048980102e-05, + "loss": 0.1048, + "step": 30720 + }, + { + "epoch": 8.64, + "learning_rate": 9.190766251210446e-05, + "loss": 0.0999, + "step": 30750 + }, + { + "epoch": 8.65, + "learning_rate": 9.188892012619874e-05, + "loss": 0.0966, + "step": 30780 + }, + { + "epoch": 8.66, + "learning_rate": 9.187017774029301e-05, + "loss": 0.1145, + "step": 30810 + }, + { + "epoch": 8.67, + "learning_rate": 9.185143535438728e-05, + "loss": 0.091, + "step": 30840 + }, + { + "epoch": 8.68, + "learning_rate": 9.183269296848156e-05, + "loss": 0.1044, + "step": 30870 + }, + { + "epoch": 8.69, + "learning_rate": 9.181395058257584e-05, + "loss": 0.1011, + "step": 30900 + }, + { + "epoch": 8.7, + "learning_rate": 9.179520819667011e-05, + "loss": 0.1018, + "step": 30930 + }, + { + "epoch": 8.7, + "learning_rate": 9.177646581076437e-05, + "loss": 0.1124, + "step": 30960 + }, + { + "epoch": 8.71, + "learning_rate": 9.175772342485866e-05, + "loss": 0.0898, + "step": 30990 + }, + { + "epoch": 8.72, + "learning_rate": 9.173898103895294e-05, + "loss": 0.1051, + "step": 31020 + }, + { + "epoch": 8.73, + "learning_rate": 9.17202386530472e-05, + "loss": 0.0969, + "step": 31050 + }, + { + "epoch": 8.74, + "learning_rate": 9.170149626714147e-05, + "loss": 0.104, + "step": 31080 + }, + { + "epoch": 8.75, + "learning_rate": 9.168275388123575e-05, + "loss": 0.1103, + "step": 31110 + }, + { + "epoch": 8.75, + "learning_rate": 9.166401149533003e-05, + "loss": 0.0957, + "step": 31140 + }, + { + "epoch": 8.76, + "learning_rate": 9.16452691094243e-05, + "loss": 0.1092, + "step": 31170 + }, + { + "epoch": 8.77, + "learning_rate": 9.162652672351858e-05, + "loss": 0.0989, + "step": 31200 + }, + { + "epoch": 8.78, + "learning_rate": 9.160778433761285e-05, + "loss": 0.1058, + "step": 31230 + }, + { + "epoch": 8.79, + "learning_rate": 9.158904195170712e-05, + "loss": 0.1142, + "step": 31260 + }, + { + "epoch": 8.8, + "learning_rate": 9.15702995658014e-05, + "loss": 0.0938, + "step": 31290 + }, + { + "epoch": 8.81, + "learning_rate": 9.155155717989568e-05, + "loss": 0.1088, + "step": 31320 + }, + { + "epoch": 8.81, + "learning_rate": 9.153281479398995e-05, + "loss": 0.097, + "step": 31350 + }, + { + "epoch": 8.82, + "learning_rate": 9.151407240808421e-05, + "loss": 0.1025, + "step": 31380 + }, + { + "epoch": 8.83, + "learning_rate": 9.14953300221785e-05, + "loss": 0.1101, + "step": 31410 + }, + { + "epoch": 8.84, + "learning_rate": 9.147658763627277e-05, + "loss": 0.0961, + "step": 31440 + }, + { + "epoch": 8.85, + "learning_rate": 9.145784525036704e-05, + "loss": 0.1039, + "step": 31470 + }, + { + "epoch": 8.86, + "learning_rate": 9.143910286446131e-05, + "loss": 0.0936, + "step": 31500 + }, + { + "epoch": 8.86, + "learning_rate": 9.142036047855559e-05, + "loss": 0.1052, + "step": 31530 + }, + { + "epoch": 8.87, + "learning_rate": 9.140161809264987e-05, + "loss": 0.1137, + "step": 31560 + }, + { + "epoch": 8.88, + "learning_rate": 9.138287570674414e-05, + "loss": 0.0901, + "step": 31590 + }, + { + "epoch": 8.89, + "learning_rate": 9.136413332083842e-05, + "loss": 0.1114, + "step": 31620 + }, + { + "epoch": 8.9, + "learning_rate": 9.134539093493269e-05, + "loss": 0.1087, + "step": 31650 + }, + { + "epoch": 8.91, + "learning_rate": 9.132664854902695e-05, + "loss": 0.0996, + "step": 31680 + }, + { + "epoch": 8.91, + "learning_rate": 9.130790616312124e-05, + "loss": 0.1099, + "step": 31710 + }, + { + "epoch": 8.92, + "learning_rate": 9.128916377721552e-05, + "loss": 0.0931, + "step": 31740 + }, + { + "epoch": 8.93, + "learning_rate": 9.127042139130978e-05, + "loss": 0.1089, + "step": 31770 + }, + { + "epoch": 8.94, + "learning_rate": 9.125167900540405e-05, + "loss": 0.0992, + "step": 31800 + }, + { + "epoch": 8.95, + "learning_rate": 9.123293661949833e-05, + "loss": 0.0979, + "step": 31830 + }, + { + "epoch": 8.96, + "learning_rate": 9.121419423359261e-05, + "loss": 0.1147, + "step": 31860 + }, + { + "epoch": 8.97, + "learning_rate": 9.119545184768688e-05, + "loss": 0.0898, + "step": 31890 + }, + { + "epoch": 8.97, + "learning_rate": 9.117670946178115e-05, + "loss": 0.11, + "step": 31920 + }, + { + "epoch": 8.98, + "learning_rate": 9.115796707587543e-05, + "loss": 0.1, + "step": 31950 + }, + { + "epoch": 8.99, + "learning_rate": 9.113922468996971e-05, + "loss": 0.0993, + "step": 31980 + }, + { + "epoch": 9.0, + "learning_rate": 9.112048230406398e-05, + "loss": 0.1093, + "step": 32010 + }, + { + "epoch": 9.0, + "eval_loss": 0.1185522973537445, + "eval_runtime": 627.341, + "eval_samples_per_second": 25.557, + "eval_steps_per_second": 0.8, + "eval_wer": 0.11861122105004572, + "step": 32013 + }, + { + "epoch": 9.01, + "learning_rate": 9.110173991815826e-05, + "loss": 0.0927, + "step": 32040 + }, + { + "epoch": 9.02, + "learning_rate": 9.108299753225253e-05, + "loss": 0.1062, + "step": 32070 + }, + { + "epoch": 9.02, + "learning_rate": 9.10642551463468e-05, + "loss": 0.0905, + "step": 32100 + }, + { + "epoch": 9.03, + "learning_rate": 9.104551276044107e-05, + "loss": 0.0989, + "step": 32130 + }, + { + "epoch": 9.04, + "learning_rate": 9.102677037453536e-05, + "loss": 0.0978, + "step": 32160 + }, + { + "epoch": 9.05, + "learning_rate": 9.100802798862962e-05, + "loss": 0.0939, + "step": 32190 + }, + { + "epoch": 9.06, + "learning_rate": 9.098928560272389e-05, + "loss": 0.1024, + "step": 32220 + }, + { + "epoch": 9.07, + "learning_rate": 9.097054321681817e-05, + "loss": 0.0957, + "step": 32250 + }, + { + "epoch": 9.08, + "learning_rate": 9.095180083091245e-05, + "loss": 0.1051, + "step": 32280 + }, + { + "epoch": 9.08, + "learning_rate": 9.093305844500672e-05, + "loss": 0.1007, + "step": 32310 + }, + { + "epoch": 9.09, + "learning_rate": 9.091431605910099e-05, + "loss": 0.0893, + "step": 32340 + }, + { + "epoch": 9.1, + "learning_rate": 9.089557367319527e-05, + "loss": 0.1098, + "step": 32370 + }, + { + "epoch": 9.11, + "learning_rate": 9.087683128728955e-05, + "loss": 0.0906, + "step": 32400 + }, + { + "epoch": 9.12, + "learning_rate": 9.085808890138382e-05, + "loss": 0.0999, + "step": 32430 + }, + { + "epoch": 9.13, + "learning_rate": 9.08393465154781e-05, + "loss": 0.0995, + "step": 32460 + }, + { + "epoch": 9.13, + "learning_rate": 9.082060412957236e-05, + "loss": 0.096, + "step": 32490 + }, + { + "epoch": 9.14, + "learning_rate": 9.080186174366663e-05, + "loss": 0.1018, + "step": 32520 + }, + { + "epoch": 9.15, + "learning_rate": 9.078311935776091e-05, + "loss": 0.0923, + "step": 32550 + }, + { + "epoch": 9.16, + "learning_rate": 9.07643769718552e-05, + "loss": 0.1083, + "step": 32580 + }, + { + "epoch": 9.17, + "learning_rate": 9.074563458594946e-05, + "loss": 0.1014, + "step": 32610 + }, + { + "epoch": 9.18, + "learning_rate": 9.072689220004373e-05, + "loss": 0.0928, + "step": 32640 + }, + { + "epoch": 9.18, + "learning_rate": 9.070814981413801e-05, + "loss": 0.1015, + "step": 32670 + }, + { + "epoch": 9.19, + "learning_rate": 9.068940742823229e-05, + "loss": 0.087, + "step": 32700 + }, + { + "epoch": 9.2, + "learning_rate": 9.067066504232656e-05, + "loss": 0.0975, + "step": 32730 + }, + { + "epoch": 9.21, + "learning_rate": 9.065192265642083e-05, + "loss": 0.1041, + "step": 32760 + }, + { + "epoch": 9.22, + "learning_rate": 9.063380501671197e-05, + "loss": 0.0955, + "step": 32790 + }, + { + "epoch": 9.23, + "learning_rate": 9.061506263080623e-05, + "loss": 0.1057, + "step": 32820 + }, + { + "epoch": 9.24, + "learning_rate": 9.059632024490052e-05, + "loss": 0.0912, + "step": 32850 + }, + { + "epoch": 9.24, + "learning_rate": 9.057757785899478e-05, + "loss": 0.1005, + "step": 32880 + }, + { + "epoch": 9.25, + "learning_rate": 9.055883547308906e-05, + "loss": 0.0988, + "step": 32910 + }, + { + "epoch": 9.26, + "learning_rate": 9.054009308718333e-05, + "loss": 0.0931, + "step": 32940 + }, + { + "epoch": 9.27, + "learning_rate": 9.052135070127761e-05, + "loss": 0.0993, + "step": 32970 + }, + { + "epoch": 9.28, + "learning_rate": 9.050260831537188e-05, + "loss": 0.0924, + "step": 33000 + }, + { + "epoch": 9.29, + "learning_rate": 9.048386592946616e-05, + "loss": 0.1019, + "step": 33030 + }, + { + "epoch": 9.29, + "learning_rate": 9.046512354356044e-05, + "loss": 0.1037, + "step": 33060 + }, + { + "epoch": 9.3, + "learning_rate": 9.044638115765471e-05, + "loss": 0.0935, + "step": 33090 + }, + { + "epoch": 9.31, + "learning_rate": 9.042763877174898e-05, + "loss": 0.1092, + "step": 33120 + }, + { + "epoch": 9.32, + "learning_rate": 9.040889638584326e-05, + "loss": 0.0934, + "step": 33150 + }, + { + "epoch": 9.33, + "learning_rate": 9.039015399993754e-05, + "loss": 0.0979, + "step": 33180 + }, + { + "epoch": 9.34, + "learning_rate": 9.03714116140318e-05, + "loss": 0.0993, + "step": 33210 + }, + { + "epoch": 9.34, + "learning_rate": 9.035266922812607e-05, + "loss": 0.097, + "step": 33240 + }, + { + "epoch": 9.35, + "learning_rate": 9.033392684222035e-05, + "loss": 0.1051, + "step": 33270 + }, + { + "epoch": 9.36, + "learning_rate": 9.031518445631462e-05, + "loss": 0.0935, + "step": 33300 + }, + { + "epoch": 9.37, + "learning_rate": 9.02964420704089e-05, + "loss": 0.1072, + "step": 33330 + }, + { + "epoch": 9.38, + "learning_rate": 9.027769968450317e-05, + "loss": 0.0984, + "step": 33360 + }, + { + "epoch": 9.39, + "learning_rate": 9.025895729859745e-05, + "loss": 0.0939, + "step": 33390 + }, + { + "epoch": 9.4, + "learning_rate": 9.024021491269172e-05, + "loss": 0.1067, + "step": 33420 + }, + { + "epoch": 9.4, + "learning_rate": 9.0221472526786e-05, + "loss": 0.0906, + "step": 33450 + }, + { + "epoch": 9.41, + "learning_rate": 9.020273014088028e-05, + "loss": 0.1041, + "step": 33480 + }, + { + "epoch": 9.42, + "learning_rate": 9.018398775497455e-05, + "loss": 0.1022, + "step": 33510 + }, + { + "epoch": 9.43, + "learning_rate": 9.016524536906881e-05, + "loss": 0.0975, + "step": 33540 + }, + { + "epoch": 9.44, + "learning_rate": 9.01465029831631e-05, + "loss": 0.1084, + "step": 33570 + }, + { + "epoch": 9.45, + "learning_rate": 9.012776059725738e-05, + "loss": 0.0915, + "step": 33600 + }, + { + "epoch": 9.45, + "learning_rate": 9.010901821135164e-05, + "loss": 0.1043, + "step": 33630 + }, + { + "epoch": 9.46, + "learning_rate": 9.009027582544591e-05, + "loss": 0.1025, + "step": 33660 + }, + { + "epoch": 9.47, + "learning_rate": 9.007153343954019e-05, + "loss": 0.0935, + "step": 33690 + }, + { + "epoch": 9.48, + "learning_rate": 9.005279105363446e-05, + "loss": 0.1033, + "step": 33720 + }, + { + "epoch": 9.49, + "learning_rate": 9.003404866772874e-05, + "loss": 0.0919, + "step": 33750 + }, + { + "epoch": 9.5, + "learning_rate": 9.001530628182301e-05, + "loss": 0.1023, + "step": 33780 + }, + { + "epoch": 9.51, + "learning_rate": 8.999656389591729e-05, + "loss": 0.1017, + "step": 33810 + }, + { + "epoch": 9.51, + "learning_rate": 8.997782151001156e-05, + "loss": 0.0952, + "step": 33840 + }, + { + "epoch": 9.52, + "learning_rate": 8.995907912410584e-05, + "loss": 0.1087, + "step": 33870 + }, + { + "epoch": 9.53, + "learning_rate": 8.994033673820012e-05, + "loss": 0.0983, + "step": 33900 + }, + { + "epoch": 9.54, + "learning_rate": 8.992159435229439e-05, + "loss": 0.1104, + "step": 33930 + }, + { + "epoch": 9.55, + "learning_rate": 8.990285196638865e-05, + "loss": 0.1017, + "step": 33960 + }, + { + "epoch": 9.56, + "learning_rate": 8.988410958048293e-05, + "loss": 0.0936, + "step": 33990 + }, + { + "epoch": 9.56, + "learning_rate": 8.986536719457722e-05, + "loss": 0.1063, + "step": 34020 + }, + { + "epoch": 9.57, + "learning_rate": 8.984662480867148e-05, + "loss": 0.0896, + "step": 34050 + }, + { + "epoch": 9.58, + "learning_rate": 8.982788242276575e-05, + "loss": 0.1027, + "step": 34080 + }, + { + "epoch": 9.59, + "learning_rate": 8.980976478305688e-05, + "loss": 0.1027, + "step": 34110 + }, + { + "epoch": 9.6, + "learning_rate": 8.979102239715116e-05, + "loss": 0.0974, + "step": 34140 + }, + { + "epoch": 9.61, + "learning_rate": 8.977228001124544e-05, + "loss": 0.1036, + "step": 34170 + }, + { + "epoch": 9.61, + "learning_rate": 8.975353762533971e-05, + "loss": 0.0923, + "step": 34200 + }, + { + "epoch": 9.62, + "learning_rate": 8.973479523943399e-05, + "loss": 0.1057, + "step": 34230 + }, + { + "epoch": 9.63, + "learning_rate": 8.971605285352826e-05, + "loss": 0.1012, + "step": 34260 + }, + { + "epoch": 9.64, + "learning_rate": 8.969731046762254e-05, + "loss": 0.0945, + "step": 34290 + }, + { + "epoch": 9.65, + "learning_rate": 8.96785680817168e-05, + "loss": 0.1056, + "step": 34320 + }, + { + "epoch": 9.66, + "learning_rate": 8.965982569581108e-05, + "loss": 0.0922, + "step": 34350 + }, + { + "epoch": 9.67, + "learning_rate": 8.964108330990537e-05, + "loss": 0.1059, + "step": 34380 + }, + { + "epoch": 9.67, + "learning_rate": 8.962234092399962e-05, + "loss": 0.0943, + "step": 34410 + }, + { + "epoch": 9.68, + "learning_rate": 8.96035985380939e-05, + "loss": 0.0954, + "step": 34440 + }, + { + "epoch": 9.69, + "learning_rate": 8.958485615218818e-05, + "loss": 0.1035, + "step": 34470 + }, + { + "epoch": 9.7, + "learning_rate": 8.956611376628246e-05, + "loss": 0.0901, + "step": 34500 + }, + { + "epoch": 9.71, + "learning_rate": 8.954737138037672e-05, + "loss": 0.1006, + "step": 34530 + }, + { + "epoch": 9.72, + "learning_rate": 8.9528628994471e-05, + "loss": 0.1073, + "step": 34560 + }, + { + "epoch": 9.72, + "learning_rate": 8.950988660856528e-05, + "loss": 0.0976, + "step": 34590 + }, + { + "epoch": 9.73, + "learning_rate": 8.949114422265955e-05, + "loss": 0.1036, + "step": 34620 + }, + { + "epoch": 9.74, + "learning_rate": 8.947240183675383e-05, + "loss": 0.0879, + "step": 34650 + }, + { + "epoch": 9.75, + "learning_rate": 8.94536594508481e-05, + "loss": 0.1058, + "step": 34680 + }, + { + "epoch": 9.76, + "learning_rate": 8.943491706494237e-05, + "loss": 0.1025, + "step": 34710 + }, + { + "epoch": 9.77, + "learning_rate": 8.941617467903664e-05, + "loss": 0.0967, + "step": 34740 + }, + { + "epoch": 9.77, + "learning_rate": 8.939743229313092e-05, + "loss": 0.1017, + "step": 34770 + }, + { + "epoch": 9.78, + "learning_rate": 8.93786899072252e-05, + "loss": 0.0916, + "step": 34800 + }, + { + "epoch": 9.79, + "learning_rate": 8.935994752131946e-05, + "loss": 0.1, + "step": 34830 + }, + { + "epoch": 9.8, + "learning_rate": 8.934120513541374e-05, + "loss": 0.0976, + "step": 34860 + }, + { + "epoch": 9.81, + "learning_rate": 8.932246274950802e-05, + "loss": 0.0907, + "step": 34890 + }, + { + "epoch": 9.82, + "learning_rate": 8.93037203636023e-05, + "loss": 0.1056, + "step": 34920 + }, + { + "epoch": 9.83, + "learning_rate": 8.928497797769655e-05, + "loss": 0.0882, + "step": 34950 + }, + { + "epoch": 9.83, + "learning_rate": 8.926623559179084e-05, + "loss": 0.104, + "step": 34980 + }, + { + "epoch": 9.84, + "learning_rate": 8.924749320588512e-05, + "loss": 0.1025, + "step": 35010 + }, + { + "epoch": 9.85, + "learning_rate": 8.922875081997938e-05, + "loss": 0.0919, + "step": 35040 + }, + { + "epoch": 9.86, + "learning_rate": 8.921000843407367e-05, + "loss": 0.1067, + "step": 35070 + }, + { + "epoch": 9.87, + "learning_rate": 8.919126604816793e-05, + "loss": 0.087, + "step": 35100 + }, + { + "epoch": 9.88, + "learning_rate": 8.917252366226221e-05, + "loss": 0.1095, + "step": 35130 + }, + { + "epoch": 9.88, + "learning_rate": 8.915378127635648e-05, + "loss": 0.1009, + "step": 35160 + }, + { + "epoch": 9.89, + "learning_rate": 8.913503889045076e-05, + "loss": 0.0953, + "step": 35190 + }, + { + "epoch": 9.9, + "learning_rate": 8.911629650454504e-05, + "loss": 0.1059, + "step": 35220 + }, + { + "epoch": 9.91, + "learning_rate": 8.909755411863931e-05, + "loss": 0.0921, + "step": 35250 + }, + { + "epoch": 9.92, + "learning_rate": 8.907881173273358e-05, + "loss": 0.1019, + "step": 35280 + }, + { + "epoch": 9.93, + "learning_rate": 8.906006934682786e-05, + "loss": 0.0956, + "step": 35310 + }, + { + "epoch": 9.94, + "learning_rate": 8.904132696092214e-05, + "loss": 0.0957, + "step": 35340 + }, + { + "epoch": 9.94, + "learning_rate": 8.90225845750164e-05, + "loss": 0.1062, + "step": 35370 + }, + { + "epoch": 9.95, + "learning_rate": 8.900384218911067e-05, + "loss": 0.0928, + "step": 35400 + }, + { + "epoch": 9.96, + "learning_rate": 8.898509980320496e-05, + "loss": 0.1012, + "step": 35430 + }, + { + "epoch": 9.97, + "learning_rate": 8.896635741729922e-05, + "loss": 0.099, + "step": 35460 + }, + { + "epoch": 9.98, + "learning_rate": 8.89476150313935e-05, + "loss": 0.0986, + "step": 35490 + }, + { + "epoch": 9.99, + "learning_rate": 8.892887264548777e-05, + "loss": 0.1049, + "step": 35520 + }, + { + "epoch": 9.99, + "learning_rate": 8.891013025958205e-05, + "loss": 0.0858, + "step": 35550 + }, + { + "epoch": 10.0, + "eval_loss": 0.11820485442876816, + "eval_runtime": 629.5769, + "eval_samples_per_second": 25.466, + "eval_steps_per_second": 0.797, + "eval_wer": 0.1163866635732125, + "step": 35570 + }, + { + "epoch": 10.0, + "learning_rate": 8.889138787367632e-05, + "loss": 0.1056, + "step": 35580 + }, + { + "epoch": 10.01, + "learning_rate": 8.88726454877706e-05, + "loss": 0.0896, + "step": 35610 + }, + { + "epoch": 10.02, + "learning_rate": 8.885390310186488e-05, + "loss": 0.0959, + "step": 35640 + }, + { + "epoch": 10.03, + "learning_rate": 8.883516071595915e-05, + "loss": 0.1004, + "step": 35670 + }, + { + "epoch": 10.04, + "learning_rate": 8.881641833005342e-05, + "loss": 0.0846, + "step": 35700 + }, + { + "epoch": 10.04, + "learning_rate": 8.87976759441477e-05, + "loss": 0.1042, + "step": 35730 + }, + { + "epoch": 10.05, + "learning_rate": 8.877893355824198e-05, + "loss": 0.0917, + "step": 35760 + }, + { + "epoch": 10.06, + "learning_rate": 8.876019117233623e-05, + "loss": 0.1016, + "step": 35790 + }, + { + "epoch": 10.07, + "learning_rate": 8.874144878643051e-05, + "loss": 0.1079, + "step": 35820 + }, + { + "epoch": 10.08, + "learning_rate": 8.87227064005248e-05, + "loss": 0.0842, + "step": 35850 + }, + { + "epoch": 10.09, + "learning_rate": 8.870396401461906e-05, + "loss": 0.0951, + "step": 35880 + }, + { + "epoch": 10.1, + "learning_rate": 8.868522162871334e-05, + "loss": 0.0838, + "step": 35910 + }, + { + "epoch": 10.1, + "learning_rate": 8.866647924280761e-05, + "loss": 0.0944, + "step": 35940 + }, + { + "epoch": 10.11, + "learning_rate": 8.864773685690189e-05, + "loss": 0.1084, + "step": 35970 + }, + { + "epoch": 10.12, + "learning_rate": 8.862899447099616e-05, + "loss": 0.0872, + "step": 36000 + }, + { + "epoch": 10.13, + "learning_rate": 8.861025208509044e-05, + "loss": 0.0977, + "step": 36030 + }, + { + "epoch": 10.14, + "learning_rate": 8.859150969918472e-05, + "loss": 0.0863, + "step": 36060 + }, + { + "epoch": 10.15, + "learning_rate": 8.857276731327899e-05, + "loss": 0.0936, + "step": 36090 + }, + { + "epoch": 10.15, + "learning_rate": 8.855402492737326e-05, + "loss": 0.0998, + "step": 36120 + }, + { + "epoch": 10.16, + "learning_rate": 8.853528254146754e-05, + "loss": 0.0858, + "step": 36150 + }, + { + "epoch": 10.17, + "learning_rate": 8.851654015556182e-05, + "loss": 0.0964, + "step": 36180 + }, + { + "epoch": 10.18, + "learning_rate": 8.849779776965607e-05, + "loss": 0.0884, + "step": 36210 + }, + { + "epoch": 10.19, + "learning_rate": 8.847905538375035e-05, + "loss": 0.0993, + "step": 36240 + }, + { + "epoch": 10.2, + "learning_rate": 8.846031299784463e-05, + "loss": 0.1069, + "step": 36270 + }, + { + "epoch": 10.21, + "learning_rate": 8.84415706119389e-05, + "loss": 0.0834, + "step": 36300 + }, + { + "epoch": 10.21, + "learning_rate": 8.842282822603318e-05, + "loss": 0.1038, + "step": 36330 + }, + { + "epoch": 10.22, + "learning_rate": 8.840408584012745e-05, + "loss": 0.0878, + "step": 36360 + }, + { + "epoch": 10.23, + "learning_rate": 8.838534345422173e-05, + "loss": 0.0933, + "step": 36390 + }, + { + "epoch": 10.24, + "learning_rate": 8.8366601068316e-05, + "loss": 0.1074, + "step": 36420 + }, + { + "epoch": 10.25, + "learning_rate": 8.834785868241028e-05, + "loss": 0.085, + "step": 36450 + }, + { + "epoch": 10.26, + "learning_rate": 8.832911629650455e-05, + "loss": 0.1005, + "step": 36480 + }, + { + "epoch": 10.26, + "learning_rate": 8.831037391059883e-05, + "loss": 0.0899, + "step": 36510 + }, + { + "epoch": 10.27, + "learning_rate": 8.82916315246931e-05, + "loss": 0.0978, + "step": 36540 + }, + { + "epoch": 10.28, + "learning_rate": 8.827288913878737e-05, + "loss": 0.1049, + "step": 36570 + }, + { + "epoch": 10.29, + "learning_rate": 8.825414675288166e-05, + "loss": 0.0886, + "step": 36600 + }, + { + "epoch": 10.3, + "learning_rate": 8.823540436697591e-05, + "loss": 0.1042, + "step": 36630 + }, + { + "epoch": 10.31, + "learning_rate": 8.821666198107019e-05, + "loss": 0.0913, + "step": 36660 + }, + { + "epoch": 10.31, + "learning_rate": 8.819791959516447e-05, + "loss": 0.0982, + "step": 36690 + }, + { + "epoch": 10.32, + "learning_rate": 8.817917720925874e-05, + "loss": 0.1019, + "step": 36720 + }, + { + "epoch": 10.33, + "learning_rate": 8.816043482335302e-05, + "loss": 0.0887, + "step": 36750 + }, + { + "epoch": 10.34, + "learning_rate": 8.814169243744729e-05, + "loss": 0.1025, + "step": 36780 + }, + { + "epoch": 10.35, + "learning_rate": 8.812295005154157e-05, + "loss": 0.0927, + "step": 36810 + }, + { + "epoch": 10.36, + "learning_rate": 8.810420766563584e-05, + "loss": 0.0999, + "step": 36840 + }, + { + "epoch": 10.37, + "learning_rate": 8.808546527973012e-05, + "loss": 0.1032, + "step": 36870 + }, + { + "epoch": 10.37, + "learning_rate": 8.806672289382438e-05, + "loss": 0.0854, + "step": 36900 + }, + { + "epoch": 10.38, + "learning_rate": 8.804798050791866e-05, + "loss": 0.0997, + "step": 36930 + }, + { + "epoch": 10.39, + "learning_rate": 8.802923812201293e-05, + "loss": 0.0915, + "step": 36960 + }, + { + "epoch": 10.4, + "learning_rate": 8.801049573610721e-05, + "loss": 0.0953, + "step": 36990 + }, + { + "epoch": 10.41, + "learning_rate": 8.79917533502015e-05, + "loss": 0.1097, + "step": 37020 + }, + { + "epoch": 10.42, + "learning_rate": 8.797301096429575e-05, + "loss": 0.0804, + "step": 37050 + }, + { + "epoch": 10.42, + "learning_rate": 8.795426857839003e-05, + "loss": 0.1011, + "step": 37080 + }, + { + "epoch": 10.43, + "learning_rate": 8.793552619248431e-05, + "loss": 0.0904, + "step": 37110 + }, + { + "epoch": 10.44, + "learning_rate": 8.791678380657858e-05, + "loss": 0.0983, + "step": 37140 + }, + { + "epoch": 10.45, + "learning_rate": 8.789804142067286e-05, + "loss": 0.1082, + "step": 37170 + }, + { + "epoch": 10.46, + "learning_rate": 8.787929903476713e-05, + "loss": 0.082, + "step": 37200 + }, + { + "epoch": 10.47, + "learning_rate": 8.786055664886141e-05, + "loss": 0.1019, + "step": 37230 + }, + { + "epoch": 10.48, + "learning_rate": 8.784181426295567e-05, + "loss": 0.0875, + "step": 37260 + }, + { + "epoch": 10.48, + "learning_rate": 8.782307187704996e-05, + "loss": 0.0968, + "step": 37290 + }, + { + "epoch": 10.49, + "learning_rate": 8.780432949114422e-05, + "loss": 0.106, + "step": 37320 + }, + { + "epoch": 10.5, + "learning_rate": 8.77855871052385e-05, + "loss": 0.0803, + "step": 37350 + }, + { + "epoch": 10.51, + "learning_rate": 8.776684471933277e-05, + "loss": 0.1021, + "step": 37380 + }, + { + "epoch": 10.52, + "learning_rate": 8.774810233342705e-05, + "loss": 0.0858, + "step": 37410 + }, + { + "epoch": 10.53, + "learning_rate": 8.772935994752133e-05, + "loss": 0.0954, + "step": 37440 + }, + { + "epoch": 10.53, + "learning_rate": 8.771061756161559e-05, + "loss": 0.1046, + "step": 37470 + }, + { + "epoch": 10.54, + "learning_rate": 8.769187517570987e-05, + "loss": 0.087, + "step": 37500 + }, + { + "epoch": 10.55, + "learning_rate": 8.767313278980415e-05, + "loss": 0.097, + "step": 37530 + }, + { + "epoch": 10.56, + "learning_rate": 8.765439040389843e-05, + "loss": 0.0873, + "step": 37560 + }, + { + "epoch": 10.57, + "learning_rate": 8.76356480179927e-05, + "loss": 0.0994, + "step": 37590 + }, + { + "epoch": 10.58, + "learning_rate": 8.761690563208696e-05, + "loss": 0.1015, + "step": 37620 + }, + { + "epoch": 10.58, + "learning_rate": 8.759816324618125e-05, + "loss": 0.0864, + "step": 37650 + }, + { + "epoch": 10.59, + "learning_rate": 8.757942086027551e-05, + "loss": 0.1043, + "step": 37680 + }, + { + "epoch": 10.6, + "learning_rate": 8.75606784743698e-05, + "loss": 0.0927, + "step": 37710 + }, + { + "epoch": 10.61, + "learning_rate": 8.754193608846406e-05, + "loss": 0.098, + "step": 37740 + }, + { + "epoch": 10.62, + "learning_rate": 8.752319370255834e-05, + "loss": 0.1059, + "step": 37770 + }, + { + "epoch": 10.63, + "learning_rate": 8.750445131665261e-05, + "loss": 0.0854, + "step": 37800 + }, + { + "epoch": 10.64, + "learning_rate": 8.748570893074689e-05, + "loss": 0.1, + "step": 37830 + }, + { + "epoch": 10.64, + "learning_rate": 8.746696654484117e-05, + "loss": 0.0915, + "step": 37860 + }, + { + "epoch": 10.65, + "learning_rate": 8.744822415893543e-05, + "loss": 0.1021, + "step": 37890 + }, + { + "epoch": 10.66, + "learning_rate": 8.74294817730297e-05, + "loss": 0.1063, + "step": 37920 + }, + { + "epoch": 10.67, + "learning_rate": 8.741073938712399e-05, + "loss": 0.0844, + "step": 37950 + }, + { + "epoch": 10.68, + "learning_rate": 8.739199700121827e-05, + "loss": 0.1025, + "step": 37980 + }, + { + "epoch": 10.69, + "learning_rate": 8.737325461531254e-05, + "loss": 0.0892, + "step": 38010 + }, + { + "epoch": 10.69, + "learning_rate": 8.73545122294068e-05, + "loss": 0.0979, + "step": 38040 + }, + { + "epoch": 10.7, + "learning_rate": 8.733576984350108e-05, + "loss": 0.107, + "step": 38070 + }, + { + "epoch": 10.71, + "learning_rate": 8.731702745759535e-05, + "loss": 0.0868, + "step": 38100 + }, + { + "epoch": 10.72, + "learning_rate": 8.729828507168963e-05, + "loss": 0.1055, + "step": 38130 + }, + { + "epoch": 10.73, + "learning_rate": 8.72795426857839e-05, + "loss": 0.0902, + "step": 38160 + }, + { + "epoch": 10.74, + "learning_rate": 8.726080029987818e-05, + "loss": 0.0985, + "step": 38190 + }, + { + "epoch": 10.74, + "learning_rate": 8.724205791397245e-05, + "loss": 0.1018, + "step": 38220 + }, + { + "epoch": 10.75, + "learning_rate": 8.722331552806673e-05, + "loss": 0.0856, + "step": 38250 + }, + { + "epoch": 10.76, + "learning_rate": 8.720457314216101e-05, + "loss": 0.1081, + "step": 38280 + }, + { + "epoch": 10.77, + "learning_rate": 8.718583075625528e-05, + "loss": 0.0907, + "step": 38310 + }, + { + "epoch": 10.78, + "learning_rate": 8.716708837034955e-05, + "loss": 0.0984, + "step": 38340 + }, + { + "epoch": 10.79, + "learning_rate": 8.714834598444383e-05, + "loss": 0.0994, + "step": 38370 + }, + { + "epoch": 10.8, + "learning_rate": 8.712960359853811e-05, + "loss": 0.0851, + "step": 38400 + }, + { + "epoch": 10.8, + "learning_rate": 8.711086121263237e-05, + "loss": 0.104, + "step": 38430 + }, + { + "epoch": 10.81, + "learning_rate": 8.709211882672664e-05, + "loss": 0.0864, + "step": 38460 + }, + { + "epoch": 10.82, + "learning_rate": 8.707337644082092e-05, + "loss": 0.0923, + "step": 38490 + }, + { + "epoch": 10.83, + "learning_rate": 8.705463405491519e-05, + "loss": 0.1031, + "step": 38520 + }, + { + "epoch": 10.84, + "learning_rate": 8.703589166900947e-05, + "loss": 0.0839, + "step": 38550 + }, + { + "epoch": 10.85, + "learning_rate": 8.701714928310374e-05, + "loss": 0.0953, + "step": 38580 + }, + { + "epoch": 10.85, + "learning_rate": 8.699840689719802e-05, + "loss": 0.0898, + "step": 38610 + }, + { + "epoch": 10.86, + "learning_rate": 8.697966451129229e-05, + "loss": 0.0942, + "step": 38640 + }, + { + "epoch": 10.87, + "learning_rate": 8.696092212538657e-05, + "loss": 0.1079, + "step": 38670 + }, + { + "epoch": 10.88, + "learning_rate": 8.694217973948085e-05, + "loss": 0.0842, + "step": 38700 + }, + { + "epoch": 10.89, + "learning_rate": 8.692343735357512e-05, + "loss": 0.1018, + "step": 38730 + }, + { + "epoch": 10.9, + "learning_rate": 8.690469496766938e-05, + "loss": 0.0843, + "step": 38760 + }, + { + "epoch": 10.91, + "learning_rate": 8.688595258176366e-05, + "loss": 0.1039, + "step": 38790 + }, + { + "epoch": 10.91, + "learning_rate": 8.686721019585795e-05, + "loss": 0.1033, + "step": 38820 + }, + { + "epoch": 10.92, + "learning_rate": 8.684846780995221e-05, + "loss": 0.0854, + "step": 38850 + }, + { + "epoch": 10.93, + "learning_rate": 8.682972542404648e-05, + "loss": 0.1018, + "step": 38880 + }, + { + "epoch": 10.94, + "learning_rate": 8.681098303814076e-05, + "loss": 0.0897, + "step": 38910 + }, + { + "epoch": 10.95, + "learning_rate": 8.679224065223503e-05, + "loss": 0.1007, + "step": 38940 + }, + { + "epoch": 10.96, + "learning_rate": 8.677349826632931e-05, + "loss": 0.1023, + "step": 38970 + }, + { + "epoch": 10.96, + "learning_rate": 8.675475588042358e-05, + "loss": 0.0866, + "step": 39000 + }, + { + "epoch": 10.97, + "learning_rate": 8.673663824071472e-05, + "loss": 0.1016, + "step": 39030 + }, + { + "epoch": 10.98, + "learning_rate": 8.671789585480899e-05, + "loss": 0.0893, + "step": 39060 + }, + { + "epoch": 10.99, + "learning_rate": 8.669915346890327e-05, + "loss": 0.0963, + "step": 39090 + }, + { + "epoch": 11.0, + "learning_rate": 8.668041108299753e-05, + "loss": 0.102, + "step": 39120 + }, + { + "epoch": 11.0, + "eval_loss": 0.11905849725008011, + "eval_runtime": 629.8349, + "eval_samples_per_second": 25.456, + "eval_steps_per_second": 0.797, + "eval_wer": 0.11857710207033968, + "step": 39127 + }, + { + "epoch": 11.01, + "learning_rate": 8.666166869709182e-05, + "loss": 0.0842, + "step": 39150 + }, + { + "epoch": 11.01, + "learning_rate": 8.66429263111861e-05, + "loss": 0.1001, + "step": 39180 + }, + { + "epoch": 11.02, + "learning_rate": 8.662418392528035e-05, + "loss": 0.0859, + "step": 39210 + }, + { + "epoch": 11.03, + "learning_rate": 8.660544153937463e-05, + "loss": 0.1002, + "step": 39240 + }, + { + "epoch": 11.04, + "learning_rate": 8.658669915346891e-05, + "loss": 0.0933, + "step": 39270 + }, + { + "epoch": 11.05, + "learning_rate": 8.656795676756318e-05, + "loss": 0.0919, + "step": 39300 + }, + { + "epoch": 11.06, + "learning_rate": 8.654921438165745e-05, + "loss": 0.0992, + "step": 39330 + }, + { + "epoch": 11.07, + "learning_rate": 8.653047199575173e-05, + "loss": 0.081, + "step": 39360 + }, + { + "epoch": 11.07, + "learning_rate": 8.651172960984601e-05, + "loss": 0.0935, + "step": 39390 + }, + { + "epoch": 11.08, + "learning_rate": 8.649298722394028e-05, + "loss": 0.0815, + "step": 39420 + }, + { + "epoch": 11.09, + "learning_rate": 8.647424483803456e-05, + "loss": 0.0923, + "step": 39450 + }, + { + "epoch": 11.1, + "learning_rate": 8.645550245212882e-05, + "loss": 0.0969, + "step": 39480 + }, + { + "epoch": 11.11, + "learning_rate": 8.64367600662231e-05, + "loss": 0.0873, + "step": 39510 + }, + { + "epoch": 11.12, + "learning_rate": 8.641801768031737e-05, + "loss": 0.0961, + "step": 39540 + }, + { + "epoch": 11.12, + "learning_rate": 8.639927529441165e-05, + "loss": 0.0933, + "step": 39570 + }, + { + "epoch": 11.13, + "learning_rate": 8.638053290850593e-05, + "loss": 0.0972, + "step": 39600 + }, + { + "epoch": 11.14, + "learning_rate": 8.636179052260019e-05, + "loss": 0.1017, + "step": 39630 + }, + { + "epoch": 11.15, + "learning_rate": 8.634304813669447e-05, + "loss": 0.0847, + "step": 39660 + }, + { + "epoch": 11.16, + "learning_rate": 8.632430575078875e-05, + "loss": 0.0971, + "step": 39690 + }, + { + "epoch": 11.17, + "learning_rate": 8.630556336488302e-05, + "loss": 0.09, + "step": 39720 + }, + { + "epoch": 11.18, + "learning_rate": 8.628682097897729e-05, + "loss": 0.0889, + "step": 39750 + }, + { + "epoch": 11.18, + "learning_rate": 8.626807859307157e-05, + "loss": 0.1016, + "step": 39780 + }, + { + "epoch": 11.19, + "learning_rate": 8.624933620716585e-05, + "loss": 0.0859, + "step": 39810 + }, + { + "epoch": 11.2, + "learning_rate": 8.623059382126011e-05, + "loss": 0.1014, + "step": 39840 + }, + { + "epoch": 11.21, + "learning_rate": 8.62118514353544e-05, + "loss": 0.0945, + "step": 39870 + }, + { + "epoch": 11.22, + "learning_rate": 8.619310904944866e-05, + "loss": 0.0887, + "step": 39900 + }, + { + "epoch": 11.23, + "learning_rate": 8.617436666354294e-05, + "loss": 0.0987, + "step": 39930 + }, + { + "epoch": 11.23, + "learning_rate": 8.615562427763721e-05, + "loss": 0.0808, + "step": 39960 + }, + { + "epoch": 11.24, + "learning_rate": 8.613688189173149e-05, + "loss": 0.1018, + "step": 39990 + }, + { + "epoch": 11.25, + "learning_rate": 8.611813950582577e-05, + "loss": 0.0971, + "step": 40020 + }, + { + "epoch": 11.26, + "learning_rate": 8.609939711992003e-05, + "loss": 0.0955, + "step": 40050 + }, + { + "epoch": 11.27, + "learning_rate": 8.608065473401431e-05, + "loss": 0.1036, + "step": 40080 + }, + { + "epoch": 11.28, + "learning_rate": 8.606191234810859e-05, + "loss": 0.0821, + "step": 40110 + }, + { + "epoch": 11.28, + "learning_rate": 8.604316996220286e-05, + "loss": 0.097, + "step": 40140 + }, + { + "epoch": 11.29, + "learning_rate": 8.602442757629712e-05, + "loss": 0.0943, + "step": 40170 + }, + { + "epoch": 11.3, + "learning_rate": 8.60056851903914e-05, + "loss": 0.0939, + "step": 40200 + }, + { + "epoch": 11.31, + "learning_rate": 8.598694280448569e-05, + "loss": 0.1064, + "step": 40230 + }, + { + "epoch": 11.32, + "learning_rate": 8.596820041857995e-05, + "loss": 0.0813, + "step": 40260 + }, + { + "epoch": 11.33, + "learning_rate": 8.594945803267423e-05, + "loss": 0.0943, + "step": 40290 + }, + { + "epoch": 11.34, + "learning_rate": 8.59307156467685e-05, + "loss": 0.0898, + "step": 40320 + }, + { + "epoch": 11.34, + "learning_rate": 8.591197326086278e-05, + "loss": 0.0902, + "step": 40350 + }, + { + "epoch": 11.35, + "learning_rate": 8.589323087495705e-05, + "loss": 0.1028, + "step": 40380 + }, + { + "epoch": 11.36, + "learning_rate": 8.587448848905133e-05, + "loss": 0.0828, + "step": 40410 + }, + { + "epoch": 11.37, + "learning_rate": 8.585574610314561e-05, + "loss": 0.0964, + "step": 40440 + }, + { + "epoch": 11.38, + "learning_rate": 8.583700371723987e-05, + "loss": 0.089, + "step": 40470 + }, + { + "epoch": 11.39, + "learning_rate": 8.581826133133415e-05, + "loss": 0.0955, + "step": 40500 + }, + { + "epoch": 11.39, + "learning_rate": 8.579951894542843e-05, + "loss": 0.1037, + "step": 40530 + }, + { + "epoch": 11.4, + "learning_rate": 8.57807765595227e-05, + "loss": 0.0833, + "step": 40560 + }, + { + "epoch": 11.41, + "learning_rate": 8.576203417361696e-05, + "loss": 0.0963, + "step": 40590 + }, + { + "epoch": 11.42, + "learning_rate": 8.574329178771124e-05, + "loss": 0.0885, + "step": 40620 + }, + { + "epoch": 11.43, + "learning_rate": 8.572454940180552e-05, + "loss": 0.0929, + "step": 40650 + }, + { + "epoch": 11.44, + "learning_rate": 8.570580701589979e-05, + "loss": 0.1005, + "step": 40680 + }, + { + "epoch": 11.44, + "learning_rate": 8.568706462999407e-05, + "loss": 0.083, + "step": 40710 + }, + { + "epoch": 11.45, + "learning_rate": 8.566832224408834e-05, + "loss": 0.0974, + "step": 40740 + }, + { + "epoch": 11.46, + "learning_rate": 8.564957985818262e-05, + "loss": 0.0894, + "step": 40770 + }, + { + "epoch": 11.47, + "learning_rate": 8.563083747227689e-05, + "loss": 0.0891, + "step": 40800 + }, + { + "epoch": 11.48, + "learning_rate": 8.561209508637117e-05, + "loss": 0.0977, + "step": 40830 + }, + { + "epoch": 11.49, + "learning_rate": 8.559335270046544e-05, + "loss": 0.0794, + "step": 40860 + }, + { + "epoch": 11.5, + "learning_rate": 8.55746103145597e-05, + "loss": 0.0966, + "step": 40890 + }, + { + "epoch": 11.5, + "learning_rate": 8.555586792865399e-05, + "loss": 0.0915, + "step": 40920 + }, + { + "epoch": 11.51, + "learning_rate": 8.553712554274827e-05, + "loss": 0.091, + "step": 40950 + }, + { + "epoch": 11.52, + "learning_rate": 8.551838315684255e-05, + "loss": 0.1046, + "step": 40980 + }, + { + "epoch": 11.53, + "learning_rate": 8.54996407709368e-05, + "loss": 0.0763, + "step": 41010 + }, + { + "epoch": 11.54, + "learning_rate": 8.548152313122794e-05, + "loss": 0.1007, + "step": 41040 + }, + { + "epoch": 11.55, + "learning_rate": 8.546278074532221e-05, + "loss": 0.0859, + "step": 41070 + }, + { + "epoch": 11.55, + "learning_rate": 8.544403835941649e-05, + "loss": 0.0962, + "step": 41100 + }, + { + "epoch": 11.56, + "learning_rate": 8.542529597351077e-05, + "loss": 0.1012, + "step": 41130 + }, + { + "epoch": 11.57, + "learning_rate": 8.540655358760504e-05, + "loss": 0.0849, + "step": 41160 + }, + { + "epoch": 11.58, + "learning_rate": 8.538781120169932e-05, + "loss": 0.0986, + "step": 41190 + }, + { + "epoch": 11.59, + "learning_rate": 8.536906881579359e-05, + "loss": 0.0927, + "step": 41220 + }, + { + "epoch": 11.6, + "learning_rate": 8.535032642988785e-05, + "loss": 0.0907, + "step": 41250 + }, + { + "epoch": 11.61, + "learning_rate": 8.533158404398214e-05, + "loss": 0.1029, + "step": 41280 + }, + { + "epoch": 11.61, + "learning_rate": 8.531284165807642e-05, + "loss": 0.0873, + "step": 41310 + }, + { + "epoch": 11.62, + "learning_rate": 8.529409927217068e-05, + "loss": 0.1019, + "step": 41340 + }, + { + "epoch": 11.63, + "learning_rate": 8.527535688626495e-05, + "loss": 0.0907, + "step": 41370 + }, + { + "epoch": 11.64, + "learning_rate": 8.525661450035923e-05, + "loss": 0.0963, + "step": 41400 + }, + { + "epoch": 11.65, + "learning_rate": 8.523787211445351e-05, + "loss": 0.1014, + "step": 41430 + }, + { + "epoch": 11.66, + "learning_rate": 8.521912972854778e-05, + "loss": 0.083, + "step": 41460 + }, + { + "epoch": 11.66, + "learning_rate": 8.520038734264205e-05, + "loss": 0.0959, + "step": 41490 + }, + { + "epoch": 11.67, + "learning_rate": 8.518164495673633e-05, + "loss": 0.0912, + "step": 41520 + }, + { + "epoch": 11.68, + "learning_rate": 8.516290257083061e-05, + "loss": 0.0932, + "step": 41550 + }, + { + "epoch": 11.69, + "learning_rate": 8.514416018492488e-05, + "loss": 0.1018, + "step": 41580 + }, + { + "epoch": 11.7, + "learning_rate": 8.512541779901915e-05, + "loss": 0.0815, + "step": 41610 + }, + { + "epoch": 11.71, + "learning_rate": 8.510667541311343e-05, + "loss": 0.0983, + "step": 41640 + }, + { + "epoch": 11.71, + "learning_rate": 8.50879330272077e-05, + "loss": 0.0904, + "step": 41670 + }, + { + "epoch": 11.72, + "learning_rate": 8.506919064130197e-05, + "loss": 0.095, + "step": 41700 + }, + { + "epoch": 11.73, + "learning_rate": 8.505044825539626e-05, + "loss": 0.1045, + "step": 41730 + }, + { + "epoch": 11.74, + "learning_rate": 8.503170586949052e-05, + "loss": 0.0825, + "step": 41760 + }, + { + "epoch": 11.75, + "learning_rate": 8.501358822978166e-05, + "loss": 0.0984, + "step": 41790 + }, + { + "epoch": 11.76, + "learning_rate": 8.499484584387593e-05, + "loss": 0.0876, + "step": 41820 + }, + { + "epoch": 11.77, + "learning_rate": 8.49761034579702e-05, + "loss": 0.0913, + "step": 41850 + }, + { + "epoch": 11.77, + "learning_rate": 8.495736107206448e-05, + "loss": 0.1007, + "step": 41880 + }, + { + "epoch": 11.78, + "learning_rate": 8.493861868615876e-05, + "loss": 0.0851, + "step": 41910 + }, + { + "epoch": 11.79, + "learning_rate": 8.491987630025303e-05, + "loss": 0.0994, + "step": 41940 + }, + { + "epoch": 11.8, + "learning_rate": 8.49011339143473e-05, + "loss": 0.0858, + "step": 41970 + }, + { + "epoch": 11.81, + "learning_rate": 8.488239152844158e-05, + "loss": 0.0924, + "step": 42000 + }, + { + "epoch": 11.82, + "learning_rate": 8.486364914253584e-05, + "loss": 0.1027, + "step": 42030 + }, + { + "epoch": 11.82, + "learning_rate": 8.484490675663012e-05, + "loss": 0.0808, + "step": 42060 + }, + { + "epoch": 11.83, + "learning_rate": 8.482678911692125e-05, + "loss": 0.0959, + "step": 42090 + }, + { + "epoch": 11.84, + "learning_rate": 8.480804673101553e-05, + "loss": 0.0849, + "step": 42120 + }, + { + "epoch": 11.85, + "learning_rate": 8.47893043451098e-05, + "loss": 0.0916, + "step": 42150 + }, + { + "epoch": 11.86, + "learning_rate": 8.477056195920408e-05, + "loss": 0.101, + "step": 42180 + }, + { + "epoch": 11.87, + "learning_rate": 8.475181957329835e-05, + "loss": 0.085, + "step": 42210 + }, + { + "epoch": 11.88, + "learning_rate": 8.473307718739263e-05, + "loss": 0.0929, + "step": 42240 + }, + { + "epoch": 11.88, + "learning_rate": 8.471433480148691e-05, + "loss": 0.0869, + "step": 42270 + }, + { + "epoch": 11.89, + "learning_rate": 8.469559241558116e-05, + "loss": 0.0961, + "step": 42300 + }, + { + "epoch": 11.9, + "learning_rate": 8.467685002967545e-05, + "loss": 0.098, + "step": 42330 + }, + { + "epoch": 11.91, + "learning_rate": 8.465810764376973e-05, + "loss": 0.0841, + "step": 42360 + }, + { + "epoch": 11.92, + "learning_rate": 8.4639365257864e-05, + "loss": 0.0983, + "step": 42390 + }, + { + "epoch": 11.93, + "learning_rate": 8.462062287195826e-05, + "loss": 0.0851, + "step": 42420 + }, + { + "epoch": 11.93, + "learning_rate": 8.460188048605254e-05, + "loss": 0.0933, + "step": 42450 + }, + { + "epoch": 11.94, + "learning_rate": 8.458313810014682e-05, + "loss": 0.0984, + "step": 42480 + }, + { + "epoch": 11.95, + "learning_rate": 8.456439571424109e-05, + "loss": 0.0844, + "step": 42510 + }, + { + "epoch": 11.96, + "learning_rate": 8.454565332833537e-05, + "loss": 0.096, + "step": 42540 + }, + { + "epoch": 11.97, + "learning_rate": 8.452691094242964e-05, + "loss": 0.0872, + "step": 42570 + }, + { + "epoch": 11.98, + "learning_rate": 8.450816855652392e-05, + "loss": 0.0938, + "step": 42600 + }, + { + "epoch": 11.98, + "learning_rate": 8.448942617061819e-05, + "loss": 0.1016, + "step": 42630 + }, + { + "epoch": 11.99, + "learning_rate": 8.447068378471247e-05, + "loss": 0.0834, + "step": 42660 + }, + { + "epoch": 12.0, + "eval_loss": 0.1160648763179779, + "eval_runtime": 629.8644, + "eval_samples_per_second": 25.455, + "eval_steps_per_second": 0.797, + "eval_wer": 0.10961745799953598, + "step": 42684 + }, + { + "epoch": 12.0, + "learning_rate": 8.445194139880675e-05, + "loss": 0.1065, + "step": 42690 + }, + { + "epoch": 12.01, + "learning_rate": 8.4433199012901e-05, + "loss": 0.0817, + "step": 42720 + }, + { + "epoch": 12.02, + "learning_rate": 8.441445662699528e-05, + "loss": 0.0949, + "step": 42750 + }, + { + "epoch": 12.03, + "learning_rate": 8.439571424108957e-05, + "loss": 0.0901, + "step": 42780 + }, + { + "epoch": 12.04, + "learning_rate": 8.437697185518383e-05, + "loss": 0.0852, + "step": 42810 + }, + { + "epoch": 12.04, + "learning_rate": 8.43582294692781e-05, + "loss": 0.095, + "step": 42840 + }, + { + "epoch": 12.05, + "learning_rate": 8.433948708337238e-05, + "loss": 0.0805, + "step": 42870 + }, + { + "epoch": 12.06, + "learning_rate": 8.432074469746666e-05, + "loss": 0.094, + "step": 42900 + }, + { + "epoch": 12.07, + "learning_rate": 8.430200231156093e-05, + "loss": 0.0886, + "step": 42930 + }, + { + "epoch": 12.08, + "learning_rate": 8.428325992565521e-05, + "loss": 0.0873, + "step": 42960 + }, + { + "epoch": 12.09, + "learning_rate": 8.426451753974948e-05, + "loss": 0.0949, + "step": 42990 + }, + { + "epoch": 12.09, + "learning_rate": 8.424577515384376e-05, + "loss": 0.0842, + "step": 43020 + }, + { + "epoch": 12.1, + "learning_rate": 8.422703276793803e-05, + "loss": 0.0899, + "step": 43050 + }, + { + "epoch": 12.11, + "learning_rate": 8.420829038203231e-05, + "loss": 0.0871, + "step": 43080 + }, + { + "epoch": 12.12, + "learning_rate": 8.418954799612657e-05, + "loss": 0.0824, + "step": 43110 + }, + { + "epoch": 12.13, + "learning_rate": 8.417080561022084e-05, + "loss": 0.0907, + "step": 43140 + }, + { + "epoch": 12.14, + "learning_rate": 8.415206322431512e-05, + "loss": 0.0786, + "step": 43170 + }, + { + "epoch": 12.15, + "learning_rate": 8.41333208384094e-05, + "loss": 0.0969, + "step": 43200 + }, + { + "epoch": 12.15, + "learning_rate": 8.411457845250369e-05, + "loss": 0.0896, + "step": 43230 + }, + { + "epoch": 12.16, + "learning_rate": 8.409583606659794e-05, + "loss": 0.0874, + "step": 43260 + }, + { + "epoch": 12.17, + "learning_rate": 8.407709368069222e-05, + "loss": 0.0962, + "step": 43290 + }, + { + "epoch": 12.18, + "learning_rate": 8.40583512947865e-05, + "loss": 0.0849, + "step": 43320 + }, + { + "epoch": 12.19, + "learning_rate": 8.403960890888077e-05, + "loss": 0.0933, + "step": 43350 + }, + { + "epoch": 12.2, + "learning_rate": 8.402086652297505e-05, + "loss": 0.0884, + "step": 43380 + }, + { + "epoch": 12.2, + "learning_rate": 8.400212413706932e-05, + "loss": 0.0829, + "step": 43410 + }, + { + "epoch": 12.21, + "learning_rate": 8.39833817511636e-05, + "loss": 0.0994, + "step": 43440 + }, + { + "epoch": 12.22, + "learning_rate": 8.396463936525787e-05, + "loss": 0.0825, + "step": 43470 + }, + { + "epoch": 12.23, + "learning_rate": 8.394589697935215e-05, + "loss": 0.0958, + "step": 43500 + }, + { + "epoch": 12.24, + "learning_rate": 8.392715459344641e-05, + "loss": 0.0949, + "step": 43530 + }, + { + "epoch": 12.25, + "learning_rate": 8.390841220754068e-05, + "loss": 0.0913, + "step": 43560 + }, + { + "epoch": 12.25, + "learning_rate": 8.388966982163496e-05, + "loss": 0.1043, + "step": 43590 + }, + { + "epoch": 12.26, + "learning_rate": 8.387092743572924e-05, + "loss": 0.0779, + "step": 43620 + }, + { + "epoch": 12.27, + "learning_rate": 8.385218504982352e-05, + "loss": 0.0942, + "step": 43650 + }, + { + "epoch": 12.28, + "learning_rate": 8.383344266391778e-05, + "loss": 0.0872, + "step": 43680 + }, + { + "epoch": 12.29, + "learning_rate": 8.381470027801206e-05, + "loss": 0.086, + "step": 43710 + }, + { + "epoch": 12.3, + "learning_rate": 8.379595789210634e-05, + "loss": 0.0961, + "step": 43740 + }, + { + "epoch": 12.31, + "learning_rate": 8.377721550620061e-05, + "loss": 0.0819, + "step": 43770 + }, + { + "epoch": 12.31, + "learning_rate": 8.375847312029489e-05, + "loss": 0.0947, + "step": 43800 + }, + { + "epoch": 12.32, + "learning_rate": 8.373973073438916e-05, + "loss": 0.0934, + "step": 43830 + }, + { + "epoch": 12.33, + "learning_rate": 8.372098834848344e-05, + "loss": 0.0897, + "step": 43860 + }, + { + "epoch": 12.34, + "learning_rate": 8.37022459625777e-05, + "loss": 0.1006, + "step": 43890 + }, + { + "epoch": 12.35, + "learning_rate": 8.368350357667198e-05, + "loss": 0.081, + "step": 43920 + }, + { + "epoch": 12.36, + "learning_rate": 8.366476119076625e-05, + "loss": 0.1011, + "step": 43950 + }, + { + "epoch": 12.36, + "learning_rate": 8.364601880486053e-05, + "loss": 0.0887, + "step": 43980 + }, + { + "epoch": 12.37, + "learning_rate": 8.36272764189548e-05, + "loss": 0.0867, + "step": 44010 + }, + { + "epoch": 12.38, + "learning_rate": 8.360853403304908e-05, + "loss": 0.0979, + "step": 44040 + }, + { + "epoch": 12.39, + "learning_rate": 8.358979164714336e-05, + "loss": 0.0821, + "step": 44070 + }, + { + "epoch": 12.4, + "learning_rate": 8.357104926123762e-05, + "loss": 0.0944, + "step": 44100 + }, + { + "epoch": 12.41, + "learning_rate": 8.35523068753319e-05, + "loss": 0.0895, + "step": 44130 + }, + { + "epoch": 12.41, + "learning_rate": 8.353356448942618e-05, + "loss": 0.0874, + "step": 44160 + }, + { + "epoch": 12.42, + "learning_rate": 8.351482210352045e-05, + "loss": 0.0974, + "step": 44190 + }, + { + "epoch": 12.43, + "learning_rate": 8.349607971761473e-05, + "loss": 0.0825, + "step": 44220 + }, + { + "epoch": 12.44, + "learning_rate": 8.3477337331709e-05, + "loss": 0.0979, + "step": 44250 + }, + { + "epoch": 12.45, + "learning_rate": 8.345859494580327e-05, + "loss": 0.094, + "step": 44280 + }, + { + "epoch": 12.46, + "learning_rate": 8.343985255989754e-05, + "loss": 0.0857, + "step": 44310 + }, + { + "epoch": 12.47, + "learning_rate": 8.342111017399182e-05, + "loss": 0.0988, + "step": 44340 + }, + { + "epoch": 12.47, + "learning_rate": 8.340236778808609e-05, + "loss": 0.0818, + "step": 44370 + }, + { + "epoch": 12.48, + "learning_rate": 8.338362540218037e-05, + "loss": 0.0924, + "step": 44400 + }, + { + "epoch": 12.49, + "learning_rate": 8.336488301627464e-05, + "loss": 0.0896, + "step": 44430 + }, + { + "epoch": 12.5, + "learning_rate": 8.334614063036892e-05, + "loss": 0.0871, + "step": 44460 + }, + { + "epoch": 12.51, + "learning_rate": 8.33273982444632e-05, + "loss": 0.0974, + "step": 44490 + }, + { + "epoch": 12.52, + "learning_rate": 8.330865585855745e-05, + "loss": 0.0854, + "step": 44520 + }, + { + "epoch": 12.52, + "learning_rate": 8.328991347265174e-05, + "loss": 0.0928, + "step": 44550 + }, + { + "epoch": 12.53, + "learning_rate": 8.327117108674602e-05, + "loss": 0.0895, + "step": 44580 + }, + { + "epoch": 12.54, + "learning_rate": 8.325242870084028e-05, + "loss": 0.0887, + "step": 44610 + }, + { + "epoch": 12.55, + "learning_rate": 8.323368631493457e-05, + "loss": 0.0931, + "step": 44640 + }, + { + "epoch": 12.56, + "learning_rate": 8.321494392902883e-05, + "loss": 0.0804, + "step": 44670 + }, + { + "epoch": 12.57, + "learning_rate": 8.319620154312311e-05, + "loss": 0.0916, + "step": 44700 + }, + { + "epoch": 12.58, + "learning_rate": 8.317745915721738e-05, + "loss": 0.0901, + "step": 44730 + }, + { + "epoch": 12.58, + "learning_rate": 8.315871677131166e-05, + "loss": 0.0874, + "step": 44760 + }, + { + "epoch": 12.59, + "learning_rate": 8.313997438540593e-05, + "loss": 0.0987, + "step": 44790 + }, + { + "epoch": 12.6, + "learning_rate": 8.312123199950021e-05, + "loss": 0.0831, + "step": 44820 + }, + { + "epoch": 12.61, + "learning_rate": 8.310248961359448e-05, + "loss": 0.0897, + "step": 44850 + }, + { + "epoch": 12.62, + "learning_rate": 8.308374722768876e-05, + "loss": 0.0943, + "step": 44880 + }, + { + "epoch": 12.63, + "learning_rate": 8.306500484178304e-05, + "loss": 0.0872, + "step": 44910 + }, + { + "epoch": 12.63, + "learning_rate": 8.30462624558773e-05, + "loss": 0.0944, + "step": 44940 + }, + { + "epoch": 12.64, + "learning_rate": 8.302752006997157e-05, + "loss": 0.081, + "step": 44970 + }, + { + "epoch": 12.65, + "learning_rate": 8.300877768406586e-05, + "loss": 0.0945, + "step": 45000 + }, + { + "epoch": 12.66, + "learning_rate": 8.299003529816012e-05, + "loss": 0.0957, + "step": 45030 + }, + { + "epoch": 12.67, + "learning_rate": 8.29712929122544e-05, + "loss": 0.086, + "step": 45060 + }, + { + "epoch": 12.68, + "learning_rate": 8.295255052634867e-05, + "loss": 0.0991, + "step": 45090 + }, + { + "epoch": 12.68, + "learning_rate": 8.293380814044295e-05, + "loss": 0.0807, + "step": 45120 + }, + { + "epoch": 12.69, + "learning_rate": 8.291506575453722e-05, + "loss": 0.0939, + "step": 45150 + }, + { + "epoch": 12.7, + "learning_rate": 8.28963233686315e-05, + "loss": 0.0891, + "step": 45180 + }, + { + "epoch": 12.71, + "learning_rate": 8.287758098272577e-05, + "loss": 0.0857, + "step": 45210 + }, + { + "epoch": 12.72, + "learning_rate": 8.285883859682005e-05, + "loss": 0.097, + "step": 45240 + }, + { + "epoch": 12.73, + "learning_rate": 8.284009621091432e-05, + "loss": 0.0795, + "step": 45270 + }, + { + "epoch": 12.74, + "learning_rate": 8.28213538250086e-05, + "loss": 0.0904, + "step": 45300 + }, + { + "epoch": 12.74, + "learning_rate": 8.280261143910288e-05, + "loss": 0.0901, + "step": 45330 + }, + { + "epoch": 12.75, + "learning_rate": 8.278386905319713e-05, + "loss": 0.0861, + "step": 45360 + }, + { + "epoch": 12.76, + "learning_rate": 8.276512666729141e-05, + "loss": 0.1011, + "step": 45390 + }, + { + "epoch": 12.77, + "learning_rate": 8.27463842813857e-05, + "loss": 0.081, + "step": 45420 + }, + { + "epoch": 12.78, + "learning_rate": 8.272764189547996e-05, + "loss": 0.0884, + "step": 45450 + }, + { + "epoch": 12.79, + "learning_rate": 8.270889950957424e-05, + "loss": 0.09, + "step": 45480 + }, + { + "epoch": 12.79, + "learning_rate": 8.269015712366851e-05, + "loss": 0.0878, + "step": 45510 + }, + { + "epoch": 12.8, + "learning_rate": 8.267141473776279e-05, + "loss": 0.1015, + "step": 45540 + }, + { + "epoch": 12.81, + "learning_rate": 8.265267235185706e-05, + "loss": 0.0795, + "step": 45570 + }, + { + "epoch": 12.82, + "learning_rate": 8.263392996595134e-05, + "loss": 0.0869, + "step": 45600 + }, + { + "epoch": 12.83, + "learning_rate": 8.261518758004561e-05, + "loss": 0.0932, + "step": 45630 + }, + { + "epoch": 12.84, + "learning_rate": 8.259644519413989e-05, + "loss": 0.0875, + "step": 45660 + }, + { + "epoch": 12.84, + "learning_rate": 8.257770280823416e-05, + "loss": 0.0951, + "step": 45690 + }, + { + "epoch": 12.85, + "learning_rate": 8.255896042232844e-05, + "loss": 0.0784, + "step": 45720 + }, + { + "epoch": 12.86, + "learning_rate": 8.254021803642272e-05, + "loss": 0.0984, + "step": 45750 + }, + { + "epoch": 12.87, + "learning_rate": 8.252147565051697e-05, + "loss": 0.0858, + "step": 45780 + }, + { + "epoch": 12.88, + "learning_rate": 8.250273326461125e-05, + "loss": 0.0857, + "step": 45810 + }, + { + "epoch": 12.89, + "learning_rate": 8.248399087870553e-05, + "loss": 0.0948, + "step": 45840 + }, + { + "epoch": 12.9, + "learning_rate": 8.24652484927998e-05, + "loss": 0.0873, + "step": 45870 + }, + { + "epoch": 12.9, + "learning_rate": 8.244650610689408e-05, + "loss": 0.0934, + "step": 45900 + }, + { + "epoch": 12.91, + "learning_rate": 8.242776372098835e-05, + "loss": 0.0895, + "step": 45930 + }, + { + "epoch": 12.92, + "learning_rate": 8.240902133508263e-05, + "loss": 0.0874, + "step": 45960 + }, + { + "epoch": 12.93, + "learning_rate": 8.23902789491769e-05, + "loss": 0.097, + "step": 45990 + }, + { + "epoch": 12.94, + "learning_rate": 8.237153656327118e-05, + "loss": 0.0841, + "step": 46020 + }, + { + "epoch": 12.95, + "learning_rate": 8.235279417736545e-05, + "loss": 0.0915, + "step": 46050 + }, + { + "epoch": 12.95, + "learning_rate": 8.233405179145973e-05, + "loss": 0.0909, + "step": 46080 + }, + { + "epoch": 12.96, + "learning_rate": 8.2315309405554e-05, + "loss": 0.0887, + "step": 46110 + }, + { + "epoch": 12.97, + "learning_rate": 8.229656701964827e-05, + "loss": 0.0965, + "step": 46140 + }, + { + "epoch": 12.98, + "learning_rate": 8.227782463374256e-05, + "loss": 0.0817, + "step": 46170 + }, + { + "epoch": 12.99, + "learning_rate": 8.225908224783681e-05, + "loss": 0.093, + "step": 46200 + }, + { + "epoch": 13.0, + "learning_rate": 8.224033986193109e-05, + "loss": 0.0916, + "step": 46230 + }, + { + "epoch": 13.0, + "eval_loss": 0.11473153531551361, + "eval_runtime": 629.489, + "eval_samples_per_second": 25.47, + "eval_steps_per_second": 0.797, + "eval_wer": 0.11070926535012897, + "step": 46241 + }, + { + "epoch": 13.01, + "learning_rate": 8.222159747602537e-05, + "loss": 0.0861, + "step": 46260 + }, + { + "epoch": 13.01, + "learning_rate": 8.220285509011965e-05, + "loss": 0.0928, + "step": 46290 + }, + { + "epoch": 13.02, + "learning_rate": 8.218411270421392e-05, + "loss": 0.0836, + "step": 46320 + }, + { + "epoch": 13.03, + "learning_rate": 8.216537031830819e-05, + "loss": 0.0949, + "step": 46350 + }, + { + "epoch": 13.04, + "learning_rate": 8.214662793240247e-05, + "loss": 0.0837, + "step": 46380 + }, + { + "epoch": 13.05, + "learning_rate": 8.212788554649674e-05, + "loss": 0.087, + "step": 46410 + }, + { + "epoch": 13.06, + "learning_rate": 8.210914316059102e-05, + "loss": 0.0893, + "step": 46440 + }, + { + "epoch": 13.06, + "learning_rate": 8.209040077468528e-05, + "loss": 0.0818, + "step": 46470 + }, + { + "epoch": 13.07, + "learning_rate": 8.207165838877957e-05, + "loss": 0.0956, + "step": 46500 + }, + { + "epoch": 13.08, + "learning_rate": 8.205291600287383e-05, + "loss": 0.0796, + "step": 46530 + }, + { + "epoch": 13.09, + "learning_rate": 8.203417361696811e-05, + "loss": 0.0904, + "step": 46560 + }, + { + "epoch": 13.1, + "learning_rate": 8.20154312310624e-05, + "loss": 0.0931, + "step": 46590 + }, + { + "epoch": 13.11, + "learning_rate": 8.199668884515665e-05, + "loss": 0.0782, + "step": 46620 + }, + { + "epoch": 13.11, + "learning_rate": 8.197794645925093e-05, + "loss": 0.0967, + "step": 46650 + }, + { + "epoch": 13.12, + "learning_rate": 8.195920407334521e-05, + "loss": 0.0818, + "step": 46680 + }, + { + "epoch": 13.13, + "learning_rate": 8.194046168743949e-05, + "loss": 0.0818, + "step": 46710 + }, + { + "epoch": 13.14, + "learning_rate": 8.192171930153375e-05, + "loss": 0.0909, + "step": 46740 + }, + { + "epoch": 13.15, + "learning_rate": 8.190297691562803e-05, + "loss": 0.081, + "step": 46770 + }, + { + "epoch": 13.16, + "learning_rate": 8.188423452972231e-05, + "loss": 0.0946, + "step": 46800 + }, + { + "epoch": 13.17, + "learning_rate": 8.186549214381657e-05, + "loss": 0.0831, + "step": 46830 + }, + { + "epoch": 13.17, + "learning_rate": 8.184674975791086e-05, + "loss": 0.0902, + "step": 46860 + }, + { + "epoch": 13.18, + "learning_rate": 8.182800737200512e-05, + "loss": 0.0988, + "step": 46890 + }, + { + "epoch": 13.19, + "learning_rate": 8.18092649860994e-05, + "loss": 0.0827, + "step": 46920 + }, + { + "epoch": 13.2, + "learning_rate": 8.179052260019367e-05, + "loss": 0.0959, + "step": 46950 + }, + { + "epoch": 13.21, + "learning_rate": 8.177178021428795e-05, + "loss": 0.0779, + "step": 46980 + }, + { + "epoch": 13.22, + "learning_rate": 8.175303782838223e-05, + "loss": 0.0918, + "step": 47010 + }, + { + "epoch": 13.22, + "learning_rate": 8.17342954424765e-05, + "loss": 0.0885, + "step": 47040 + }, + { + "epoch": 13.23, + "learning_rate": 8.171555305657077e-05, + "loss": 0.0809, + "step": 47070 + }, + { + "epoch": 13.24, + "learning_rate": 8.169681067066505e-05, + "loss": 0.0892, + "step": 47100 + }, + { + "epoch": 13.25, + "learning_rate": 8.167806828475933e-05, + "loss": 0.0831, + "step": 47130 + }, + { + "epoch": 13.26, + "learning_rate": 8.165932589885358e-05, + "loss": 0.091, + "step": 47160 + }, + { + "epoch": 13.27, + "learning_rate": 8.164058351294786e-05, + "loss": 0.0906, + "step": 47190 + }, + { + "epoch": 13.28, + "learning_rate": 8.162184112704215e-05, + "loss": 0.076, + "step": 47220 + }, + { + "epoch": 13.28, + "learning_rate": 8.160309874113641e-05, + "loss": 0.0933, + "step": 47250 + }, + { + "epoch": 13.29, + "learning_rate": 8.15843563552307e-05, + "loss": 0.0812, + "step": 47280 + }, + { + "epoch": 13.3, + "learning_rate": 8.156561396932496e-05, + "loss": 0.088, + "step": 47310 + }, + { + "epoch": 13.31, + "learning_rate": 8.154687158341924e-05, + "loss": 0.0907, + "step": 47340 + }, + { + "epoch": 13.32, + "learning_rate": 8.152812919751351e-05, + "loss": 0.0826, + "step": 47370 + }, + { + "epoch": 13.33, + "learning_rate": 8.150938681160779e-05, + "loss": 0.0933, + "step": 47400 + }, + { + "epoch": 13.33, + "learning_rate": 8.149064442570207e-05, + "loss": 0.0832, + "step": 47430 + }, + { + "epoch": 13.34, + "learning_rate": 8.147190203979634e-05, + "loss": 0.0882, + "step": 47460 + }, + { + "epoch": 13.35, + "learning_rate": 8.14531596538906e-05, + "loss": 0.0929, + "step": 47490 + }, + { + "epoch": 13.36, + "learning_rate": 8.143441726798489e-05, + "loss": 0.0805, + "step": 47520 + }, + { + "epoch": 13.37, + "learning_rate": 8.141629962827602e-05, + "loss": 0.0915, + "step": 47550 + }, + { + "epoch": 13.38, + "learning_rate": 8.13975572423703e-05, + "loss": 0.0825, + "step": 47580 + }, + { + "epoch": 13.38, + "learning_rate": 8.137881485646456e-05, + "loss": 0.0881, + "step": 47610 + }, + { + "epoch": 13.39, + "learning_rate": 8.136007247055883e-05, + "loss": 0.0948, + "step": 47640 + }, + { + "epoch": 13.4, + "learning_rate": 8.134133008465311e-05, + "loss": 0.079, + "step": 47670 + }, + { + "epoch": 13.41, + "learning_rate": 8.132258769874739e-05, + "loss": 0.0912, + "step": 47700 + }, + { + "epoch": 13.42, + "learning_rate": 8.130384531284166e-05, + "loss": 0.0813, + "step": 47730 + }, + { + "epoch": 13.43, + "learning_rate": 8.128510292693594e-05, + "loss": 0.0904, + "step": 47760 + }, + { + "epoch": 13.44, + "learning_rate": 8.126636054103021e-05, + "loss": 0.0906, + "step": 47790 + }, + { + "epoch": 13.44, + "learning_rate": 8.124761815512449e-05, + "loss": 0.081, + "step": 47820 + }, + { + "epoch": 13.45, + "learning_rate": 8.122887576921876e-05, + "loss": 0.0943, + "step": 47850 + }, + { + "epoch": 13.46, + "learning_rate": 8.121013338331304e-05, + "loss": 0.0856, + "step": 47880 + }, + { + "epoch": 13.47, + "learning_rate": 8.11913909974073e-05, + "loss": 0.0926, + "step": 47910 + }, + { + "epoch": 13.48, + "learning_rate": 8.117264861150157e-05, + "loss": 0.0904, + "step": 47940 + }, + { + "epoch": 13.49, + "learning_rate": 8.115390622559585e-05, + "loss": 0.0777, + "step": 47970 + }, + { + "epoch": 13.49, + "learning_rate": 8.113516383969013e-05, + "loss": 0.0937, + "step": 48000 + }, + { + "epoch": 13.5, + "learning_rate": 8.11164214537844e-05, + "loss": 0.0818, + "step": 48030 + }, + { + "epoch": 13.51, + "learning_rate": 8.109767906787867e-05, + "loss": 0.0923, + "step": 48060 + }, + { + "epoch": 13.52, + "learning_rate": 8.107893668197295e-05, + "loss": 0.0971, + "step": 48090 + }, + { + "epoch": 13.53, + "learning_rate": 8.106019429606723e-05, + "loss": 0.0824, + "step": 48120 + }, + { + "epoch": 13.54, + "learning_rate": 8.10414519101615e-05, + "loss": 0.0986, + "step": 48150 + }, + { + "epoch": 13.55, + "learning_rate": 8.102270952425578e-05, + "loss": 0.0822, + "step": 48180 + }, + { + "epoch": 13.55, + "learning_rate": 8.100396713835005e-05, + "loss": 0.0884, + "step": 48210 + }, + { + "epoch": 13.56, + "learning_rate": 8.098522475244433e-05, + "loss": 0.0895, + "step": 48240 + }, + { + "epoch": 13.57, + "learning_rate": 8.09664823665386e-05, + "loss": 0.0801, + "step": 48270 + }, + { + "epoch": 13.58, + "learning_rate": 8.094773998063288e-05, + "loss": 0.0971, + "step": 48300 + }, + { + "epoch": 13.59, + "learning_rate": 8.092899759472714e-05, + "loss": 0.0858, + "step": 48330 + }, + { + "epoch": 13.6, + "learning_rate": 8.091025520882141e-05, + "loss": 0.0889, + "step": 48360 + }, + { + "epoch": 13.6, + "learning_rate": 8.089151282291569e-05, + "loss": 0.0944, + "step": 48390 + }, + { + "epoch": 13.61, + "learning_rate": 8.087277043700997e-05, + "loss": 0.0848, + "step": 48420 + }, + { + "epoch": 13.62, + "learning_rate": 8.085402805110424e-05, + "loss": 0.0897, + "step": 48450 + }, + { + "epoch": 13.63, + "learning_rate": 8.083528566519851e-05, + "loss": 0.0812, + "step": 48480 + }, + { + "epoch": 13.64, + "learning_rate": 8.081654327929279e-05, + "loss": 0.0942, + "step": 48510 + }, + { + "epoch": 13.65, + "learning_rate": 8.079780089338707e-05, + "loss": 0.0925, + "step": 48540 + }, + { + "epoch": 13.65, + "learning_rate": 8.077905850748134e-05, + "loss": 0.0806, + "step": 48570 + }, + { + "epoch": 13.66, + "learning_rate": 8.076031612157562e-05, + "loss": 0.091, + "step": 48600 + }, + { + "epoch": 13.67, + "learning_rate": 8.074157373566989e-05, + "loss": 0.0816, + "step": 48630 + }, + { + "epoch": 13.68, + "learning_rate": 8.072283134976417e-05, + "loss": 0.0859, + "step": 48660 + }, + { + "epoch": 13.69, + "learning_rate": 8.070408896385843e-05, + "loss": 0.0956, + "step": 48690 + }, + { + "epoch": 13.7, + "learning_rate": 8.068534657795272e-05, + "loss": 0.0816, + "step": 48720 + }, + { + "epoch": 13.71, + "learning_rate": 8.066660419204698e-05, + "loss": 0.0919, + "step": 48750 + }, + { + "epoch": 13.71, + "learning_rate": 8.064786180614125e-05, + "loss": 0.0798, + "step": 48780 + }, + { + "epoch": 13.72, + "learning_rate": 8.062911942023553e-05, + "loss": 0.0891, + "step": 48810 + }, + { + "epoch": 13.73, + "learning_rate": 8.061037703432981e-05, + "loss": 0.0939, + "step": 48840 + }, + { + "epoch": 13.74, + "learning_rate": 8.059163464842408e-05, + "loss": 0.0796, + "step": 48870 + }, + { + "epoch": 13.75, + "learning_rate": 8.057289226251835e-05, + "loss": 0.0913, + "step": 48900 + }, + { + "epoch": 13.76, + "learning_rate": 8.055414987661263e-05, + "loss": 0.0841, + "step": 48930 + }, + { + "epoch": 13.76, + "learning_rate": 8.053540749070691e-05, + "loss": 0.0827, + "step": 48960 + }, + { + "epoch": 13.77, + "learning_rate": 8.051666510480118e-05, + "loss": 0.0944, + "step": 48990 + }, + { + "epoch": 13.78, + "learning_rate": 8.049792271889546e-05, + "loss": 0.0816, + "step": 49020 + }, + { + "epoch": 13.79, + "learning_rate": 8.047918033298972e-05, + "loss": 0.0923, + "step": 49050 + }, + { + "epoch": 13.8, + "learning_rate": 8.0460437947084e-05, + "loss": 0.0796, + "step": 49080 + }, + { + "epoch": 13.81, + "learning_rate": 8.044169556117827e-05, + "loss": 0.0896, + "step": 49110 + }, + { + "epoch": 13.81, + "learning_rate": 8.042295317527255e-05, + "loss": 0.091, + "step": 49140 + }, + { + "epoch": 13.82, + "learning_rate": 8.040421078936682e-05, + "loss": 0.0853, + "step": 49170 + }, + { + "epoch": 13.83, + "learning_rate": 8.038546840346109e-05, + "loss": 0.0954, + "step": 49200 + }, + { + "epoch": 13.84, + "learning_rate": 8.036672601755537e-05, + "loss": 0.084, + "step": 49230 + }, + { + "epoch": 13.85, + "learning_rate": 8.034798363164965e-05, + "loss": 0.0951, + "step": 49260 + }, + { + "epoch": 13.86, + "learning_rate": 8.032924124574392e-05, + "loss": 0.0924, + "step": 49290 + }, + { + "epoch": 13.87, + "learning_rate": 8.031049885983819e-05, + "loss": 0.0813, + "step": 49320 + }, + { + "epoch": 13.87, + "learning_rate": 8.029175647393247e-05, + "loss": 0.0953, + "step": 49350 + }, + { + "epoch": 13.88, + "learning_rate": 8.027301408802675e-05, + "loss": 0.0834, + "step": 49380 + }, + { + "epoch": 13.89, + "learning_rate": 8.025427170212101e-05, + "loss": 0.0869, + "step": 49410 + }, + { + "epoch": 13.9, + "learning_rate": 8.02355293162153e-05, + "loss": 0.0927, + "step": 49440 + }, + { + "epoch": 13.91, + "learning_rate": 8.021678693030956e-05, + "loss": 0.0817, + "step": 49470 + }, + { + "epoch": 13.92, + "learning_rate": 8.019804454440384e-05, + "loss": 0.0902, + "step": 49500 + }, + { + "epoch": 13.92, + "learning_rate": 8.017930215849811e-05, + "loss": 0.0805, + "step": 49530 + }, + { + "epoch": 13.93, + "learning_rate": 8.016055977259239e-05, + "loss": 0.0897, + "step": 49560 + }, + { + "epoch": 13.94, + "learning_rate": 8.014181738668666e-05, + "loss": 0.0919, + "step": 49590 + }, + { + "epoch": 13.95, + "learning_rate": 8.012307500078093e-05, + "loss": 0.0787, + "step": 49620 + }, + { + "epoch": 13.96, + "learning_rate": 8.010433261487521e-05, + "loss": 0.0947, + "step": 49650 + }, + { + "epoch": 13.97, + "learning_rate": 8.008559022896949e-05, + "loss": 0.0821, + "step": 49680 + }, + { + "epoch": 13.98, + "learning_rate": 8.006684784306377e-05, + "loss": 0.0905, + "step": 49710 + }, + { + "epoch": 13.98, + "learning_rate": 8.004810545715802e-05, + "loss": 0.0873, + "step": 49740 + }, + { + "epoch": 13.99, + "learning_rate": 8.00293630712523e-05, + "loss": 0.0811, + "step": 49770 + }, + { + "epoch": 14.0, + "eval_loss": 0.1173907220363617, + "eval_runtime": 631.7038, + "eval_samples_per_second": 25.381, + "eval_steps_per_second": 0.795, + "eval_wer": 0.11362302621702401, + "step": 49798 + }, + { + "epoch": 14.0, + "learning_rate": 8.001062068534659e-05, + "loss": 0.1005, + "step": 49800 + }, + { + "epoch": 14.01, + "learning_rate": 7.999187829944085e-05, + "loss": 0.0736, + "step": 49830 + }, + { + "epoch": 14.02, + "learning_rate": 7.997313591353513e-05, + "loss": 0.0886, + "step": 49860 + }, + { + "epoch": 14.03, + "learning_rate": 7.99543935276294e-05, + "loss": 0.0771, + "step": 49890 + }, + { + "epoch": 14.03, + "learning_rate": 7.993565114172368e-05, + "loss": 0.0816, + "step": 49920 + }, + { + "epoch": 14.04, + "learning_rate": 7.991690875581795e-05, + "loss": 0.0934, + "step": 49950 + }, + { + "epoch": 14.05, + "learning_rate": 7.989816636991223e-05, + "loss": 0.0765, + "step": 49980 + }, + { + "epoch": 14.06, + "learning_rate": 7.98794239840065e-05, + "loss": 0.0926, + "step": 50010 + }, + { + "epoch": 14.07, + "learning_rate": 7.986130634429764e-05, + "loss": 0.0839, + "step": 50040 + }, + { + "epoch": 14.08, + "learning_rate": 7.984256395839191e-05, + "loss": 0.0827, + "step": 50070 + }, + { + "epoch": 14.08, + "learning_rate": 7.982382157248617e-05, + "loss": 0.0953, + "step": 50100 + }, + { + "epoch": 14.09, + "learning_rate": 7.980507918658046e-05, + "loss": 0.0752, + "step": 50130 + }, + { + "epoch": 14.1, + "learning_rate": 7.978633680067474e-05, + "loss": 0.0905, + "step": 50160 + }, + { + "epoch": 14.11, + "learning_rate": 7.9767594414769e-05, + "loss": 0.0793, + "step": 50190 + }, + { + "epoch": 14.12, + "learning_rate": 7.974885202886327e-05, + "loss": 0.0884, + "step": 50220 + }, + { + "epoch": 14.13, + "learning_rate": 7.973010964295755e-05, + "loss": 0.0951, + "step": 50250 + }, + { + "epoch": 14.14, + "learning_rate": 7.971136725705183e-05, + "loss": 0.0748, + "step": 50280 + }, + { + "epoch": 14.14, + "learning_rate": 7.96926248711461e-05, + "loss": 0.0875, + "step": 50310 + }, + { + "epoch": 14.15, + "learning_rate": 7.967388248524037e-05, + "loss": 0.0817, + "step": 50340 + }, + { + "epoch": 14.16, + "learning_rate": 7.965514009933465e-05, + "loss": 0.0817, + "step": 50370 + }, + { + "epoch": 14.17, + "learning_rate": 7.963639771342892e-05, + "loss": 0.091, + "step": 50400 + }, + { + "epoch": 14.18, + "learning_rate": 7.96176553275232e-05, + "loss": 0.0767, + "step": 50430 + }, + { + "epoch": 14.19, + "learning_rate": 7.959891294161748e-05, + "loss": 0.09, + "step": 50460 + }, + { + "epoch": 14.19, + "learning_rate": 7.958017055571175e-05, + "loss": 0.0803, + "step": 50490 + }, + { + "epoch": 14.2, + "learning_rate": 7.956142816980601e-05, + "loss": 0.0905, + "step": 50520 + }, + { + "epoch": 14.21, + "learning_rate": 7.95426857839003e-05, + "loss": 0.0886, + "step": 50550 + }, + { + "epoch": 14.22, + "learning_rate": 7.952394339799458e-05, + "loss": 0.077, + "step": 50580 + }, + { + "epoch": 14.23, + "learning_rate": 7.950520101208884e-05, + "loss": 0.0931, + "step": 50610 + }, + { + "epoch": 14.24, + "learning_rate": 7.948645862618311e-05, + "loss": 0.083, + "step": 50640 + }, + { + "epoch": 14.25, + "learning_rate": 7.946771624027739e-05, + "loss": 0.088, + "step": 50670 + }, + { + "epoch": 14.25, + "learning_rate": 7.944897385437167e-05, + "loss": 0.0911, + "step": 50700 + }, + { + "epoch": 14.26, + "learning_rate": 7.943023146846594e-05, + "loss": 0.0779, + "step": 50730 + }, + { + "epoch": 14.27, + "learning_rate": 7.94114890825602e-05, + "loss": 0.0882, + "step": 50760 + }, + { + "epoch": 14.28, + "learning_rate": 7.939274669665449e-05, + "loss": 0.081, + "step": 50790 + }, + { + "epoch": 14.29, + "learning_rate": 7.937400431074877e-05, + "loss": 0.08, + "step": 50820 + }, + { + "epoch": 14.3, + "learning_rate": 7.935526192484304e-05, + "loss": 0.0957, + "step": 50850 + }, + { + "epoch": 14.3, + "learning_rate": 7.933651953893732e-05, + "loss": 0.0756, + "step": 50880 + }, + { + "epoch": 14.31, + "learning_rate": 7.931777715303158e-05, + "loss": 0.0878, + "step": 50910 + }, + { + "epoch": 14.32, + "learning_rate": 7.929903476712585e-05, + "loss": 0.0808, + "step": 50940 + }, + { + "epoch": 14.33, + "learning_rate": 7.928029238122013e-05, + "loss": 0.0871, + "step": 50970 + }, + { + "epoch": 14.34, + "learning_rate": 7.926154999531441e-05, + "loss": 0.089, + "step": 51000 + }, + { + "epoch": 14.35, + "learning_rate": 7.924280760940868e-05, + "loss": 0.0732, + "step": 51030 + }, + { + "epoch": 14.35, + "learning_rate": 7.922406522350295e-05, + "loss": 0.0866, + "step": 51060 + }, + { + "epoch": 14.36, + "learning_rate": 7.920532283759723e-05, + "loss": 0.084, + "step": 51090 + }, + { + "epoch": 14.37, + "learning_rate": 7.918658045169151e-05, + "loss": 0.0905, + "step": 51120 + }, + { + "epoch": 14.38, + "learning_rate": 7.916783806578578e-05, + "loss": 0.0965, + "step": 51150 + }, + { + "epoch": 14.39, + "learning_rate": 7.914909567988005e-05, + "loss": 0.0761, + "step": 51180 + }, + { + "epoch": 14.4, + "learning_rate": 7.913035329397433e-05, + "loss": 0.0914, + "step": 51210 + }, + { + "epoch": 14.41, + "learning_rate": 7.911161090806861e-05, + "loss": 0.0851, + "step": 51240 + }, + { + "epoch": 14.41, + "learning_rate": 7.909286852216287e-05, + "loss": 0.0879, + "step": 51270 + }, + { + "epoch": 14.42, + "learning_rate": 7.907412613625716e-05, + "loss": 0.0961, + "step": 51300 + }, + { + "epoch": 14.43, + "learning_rate": 7.905538375035142e-05, + "loss": 0.0748, + "step": 51330 + }, + { + "epoch": 14.44, + "learning_rate": 7.903664136444569e-05, + "loss": 0.0873, + "step": 51360 + }, + { + "epoch": 14.45, + "learning_rate": 7.901789897853997e-05, + "loss": 0.081, + "step": 51390 + }, + { + "epoch": 14.46, + "learning_rate": 7.899915659263425e-05, + "loss": 0.0856, + "step": 51420 + }, + { + "epoch": 14.46, + "learning_rate": 7.898041420672852e-05, + "loss": 0.0935, + "step": 51450 + }, + { + "epoch": 14.47, + "learning_rate": 7.896167182082279e-05, + "loss": 0.0782, + "step": 51480 + }, + { + "epoch": 14.48, + "learning_rate": 7.894292943491707e-05, + "loss": 0.0931, + "step": 51510 + }, + { + "epoch": 14.49, + "learning_rate": 7.892418704901135e-05, + "loss": 0.083, + "step": 51540 + }, + { + "epoch": 14.5, + "learning_rate": 7.890544466310562e-05, + "loss": 0.084, + "step": 51570 + }, + { + "epoch": 14.51, + "learning_rate": 7.888670227719988e-05, + "loss": 0.097, + "step": 51600 + }, + { + "epoch": 14.51, + "learning_rate": 7.886795989129416e-05, + "loss": 0.0767, + "step": 51630 + }, + { + "epoch": 14.52, + "learning_rate": 7.884921750538845e-05, + "loss": 0.0904, + "step": 51660 + }, + { + "epoch": 14.53, + "learning_rate": 7.883047511948271e-05, + "loss": 0.078, + "step": 51690 + }, + { + "epoch": 14.54, + "learning_rate": 7.8811732733577e-05, + "loss": 0.0922, + "step": 51720 + }, + { + "epoch": 14.55, + "learning_rate": 7.879299034767126e-05, + "loss": 0.0937, + "step": 51750 + }, + { + "epoch": 14.56, + "learning_rate": 7.877424796176553e-05, + "loss": 0.079, + "step": 51780 + }, + { + "epoch": 14.57, + "learning_rate": 7.875550557585981e-05, + "loss": 0.0961, + "step": 51810 + }, + { + "epoch": 14.57, + "learning_rate": 7.873676318995409e-05, + "loss": 0.0843, + "step": 51840 + }, + { + "epoch": 14.58, + "learning_rate": 7.871802080404836e-05, + "loss": 0.0878, + "step": 51870 + }, + { + "epoch": 14.59, + "learning_rate": 7.869927841814263e-05, + "loss": 0.094, + "step": 51900 + }, + { + "epoch": 14.6, + "learning_rate": 7.868053603223691e-05, + "loss": 0.0784, + "step": 51930 + }, + { + "epoch": 14.61, + "learning_rate": 7.866179364633119e-05, + "loss": 0.0955, + "step": 51960 + }, + { + "epoch": 14.62, + "learning_rate": 7.864305126042546e-05, + "loss": 0.0821, + "step": 51990 + }, + { + "epoch": 14.62, + "learning_rate": 7.862430887451972e-05, + "loss": 0.089, + "step": 52020 + }, + { + "epoch": 14.63, + "learning_rate": 7.8605566488614e-05, + "loss": 0.0965, + "step": 52050 + }, + { + "epoch": 14.64, + "learning_rate": 7.858682410270828e-05, + "loss": 0.0806, + "step": 52080 + }, + { + "epoch": 14.65, + "learning_rate": 7.856808171680255e-05, + "loss": 0.0959, + "step": 52110 + }, + { + "epoch": 14.66, + "learning_rate": 7.854933933089683e-05, + "loss": 0.0791, + "step": 52140 + }, + { + "epoch": 14.67, + "learning_rate": 7.85305969449911e-05, + "loss": 0.0813, + "step": 52170 + }, + { + "epoch": 14.68, + "learning_rate": 7.851185455908537e-05, + "loss": 0.0952, + "step": 52200 + }, + { + "epoch": 14.68, + "learning_rate": 7.849311217317965e-05, + "loss": 0.0775, + "step": 52230 + }, + { + "epoch": 14.69, + "learning_rate": 7.847436978727393e-05, + "loss": 0.0922, + "step": 52260 + }, + { + "epoch": 14.7, + "learning_rate": 7.84556274013682e-05, + "loss": 0.0799, + "step": 52290 + }, + { + "epoch": 14.71, + "learning_rate": 7.843688501546246e-05, + "loss": 0.0875, + "step": 52320 + }, + { + "epoch": 14.72, + "learning_rate": 7.84187673757536e-05, + "loss": 0.095, + "step": 52350 + }, + { + "epoch": 14.73, + "learning_rate": 7.840002498984787e-05, + "loss": 0.0759, + "step": 52380 + }, + { + "epoch": 14.73, + "learning_rate": 7.838128260394215e-05, + "loss": 0.0883, + "step": 52410 + }, + { + "epoch": 14.74, + "learning_rate": 7.836254021803643e-05, + "loss": 0.0788, + "step": 52440 + }, + { + "epoch": 14.75, + "learning_rate": 7.83437978321307e-05, + "loss": 0.0862, + "step": 52470 + }, + { + "epoch": 14.76, + "learning_rate": 7.832505544622497e-05, + "loss": 0.0953, + "step": 52500 + }, + { + "epoch": 14.77, + "learning_rate": 7.830631306031925e-05, + "loss": 0.0753, + "step": 52530 + }, + { + "epoch": 14.78, + "learning_rate": 7.828757067441352e-05, + "loss": 0.0885, + "step": 52560 + }, + { + "epoch": 14.78, + "learning_rate": 7.82688282885078e-05, + "loss": 0.0845, + "step": 52590 + }, + { + "epoch": 14.79, + "learning_rate": 7.825008590260208e-05, + "loss": 0.0848, + "step": 52620 + }, + { + "epoch": 14.8, + "learning_rate": 7.823134351669635e-05, + "loss": 0.0943, + "step": 52650 + }, + { + "epoch": 14.81, + "learning_rate": 7.821260113079061e-05, + "loss": 0.0713, + "step": 52680 + }, + { + "epoch": 14.82, + "learning_rate": 7.81938587448849e-05, + "loss": 0.0952, + "step": 52710 + }, + { + "epoch": 14.83, + "learning_rate": 7.817511635897918e-05, + "loss": 0.0814, + "step": 52740 + }, + { + "epoch": 14.84, + "learning_rate": 7.815637397307344e-05, + "loss": 0.0847, + "step": 52770 + }, + { + "epoch": 14.84, + "learning_rate": 7.813763158716771e-05, + "loss": 0.0882, + "step": 52800 + }, + { + "epoch": 14.85, + "learning_rate": 7.811888920126199e-05, + "loss": 0.0745, + "step": 52830 + }, + { + "epoch": 14.86, + "learning_rate": 7.810014681535627e-05, + "loss": 0.086, + "step": 52860 + }, + { + "epoch": 14.87, + "learning_rate": 7.808140442945054e-05, + "loss": 0.082, + "step": 52890 + }, + { + "epoch": 14.88, + "learning_rate": 7.806266204354481e-05, + "loss": 0.087, + "step": 52920 + }, + { + "epoch": 14.89, + "learning_rate": 7.804391965763909e-05, + "loss": 0.0939, + "step": 52950 + }, + { + "epoch": 14.89, + "learning_rate": 7.802517727173336e-05, + "loss": 0.0783, + "step": 52980 + }, + { + "epoch": 14.9, + "learning_rate": 7.800643488582764e-05, + "loss": 0.0911, + "step": 53010 + }, + { + "epoch": 14.91, + "learning_rate": 7.79876924999219e-05, + "loss": 0.0812, + "step": 53040 + }, + { + "epoch": 14.92, + "learning_rate": 7.796895011401619e-05, + "loss": 0.0883, + "step": 53070 + }, + { + "epoch": 14.93, + "learning_rate": 7.795020772811045e-05, + "loss": 0.0946, + "step": 53100 + }, + { + "epoch": 14.94, + "learning_rate": 7.793146534220473e-05, + "loss": 0.08, + "step": 53130 + }, + { + "epoch": 14.95, + "learning_rate": 7.791272295629902e-05, + "loss": 0.0946, + "step": 53160 + }, + { + "epoch": 14.95, + "learning_rate": 7.789398057039328e-05, + "loss": 0.0825, + "step": 53190 + }, + { + "epoch": 14.96, + "learning_rate": 7.787523818448755e-05, + "loss": 0.0829, + "step": 53220 + }, + { + "epoch": 14.97, + "learning_rate": 7.785649579858183e-05, + "loss": 0.0883, + "step": 53250 + }, + { + "epoch": 14.98, + "learning_rate": 7.783775341267611e-05, + "loss": 0.0762, + "step": 53280 + }, + { + "epoch": 14.99, + "learning_rate": 7.781901102677038e-05, + "loss": 0.0883, + "step": 53310 + }, + { + "epoch": 15.0, + "learning_rate": 7.780026864086465e-05, + "loss": 0.0814, + "step": 53340 + }, + { + "epoch": 15.0, + "eval_loss": 0.11322180926799774, + "eval_runtime": 632.5147, + "eval_samples_per_second": 25.348, + "eval_steps_per_second": 0.794, + "eval_wer": 0.111405292536132, + "step": 53355 + }, + { + "epoch": 15.0, + "learning_rate": 7.778152625495893e-05, + "loss": 0.0883, + "step": 53370 + }, + { + "epoch": 15.01, + "learning_rate": 7.77627838690532e-05, + "loss": 0.0827, + "step": 53400 + }, + { + "epoch": 15.02, + "learning_rate": 7.774404148314748e-05, + "loss": 0.0796, + "step": 53430 + }, + { + "epoch": 15.03, + "learning_rate": 7.772529909724174e-05, + "loss": 0.0921, + "step": 53460 + }, + { + "epoch": 15.04, + "learning_rate": 7.770655671133602e-05, + "loss": 0.0729, + "step": 53490 + }, + { + "epoch": 15.05, + "learning_rate": 7.768781432543029e-05, + "loss": 0.0852, + "step": 53520 + }, + { + "epoch": 15.05, + "learning_rate": 7.766907193952457e-05, + "loss": 0.0831, + "step": 53550 + }, + { + "epoch": 15.06, + "learning_rate": 7.765032955361885e-05, + "loss": 0.0817, + "step": 53580 + }, + { + "epoch": 15.07, + "learning_rate": 7.763158716771312e-05, + "loss": 0.0898, + "step": 53610 + }, + { + "epoch": 15.08, + "learning_rate": 7.761284478180739e-05, + "loss": 0.0737, + "step": 53640 + }, + { + "epoch": 15.09, + "learning_rate": 7.759410239590167e-05, + "loss": 0.0815, + "step": 53670 + }, + { + "epoch": 15.1, + "learning_rate": 7.757536000999595e-05, + "loss": 0.08, + "step": 53700 + }, + { + "epoch": 15.11, + "learning_rate": 7.755661762409022e-05, + "loss": 0.0801, + "step": 53730 + }, + { + "epoch": 15.11, + "learning_rate": 7.753787523818449e-05, + "loss": 0.0874, + "step": 53760 + }, + { + "epoch": 15.12, + "learning_rate": 7.751913285227877e-05, + "loss": 0.0756, + "step": 53790 + }, + { + "epoch": 15.13, + "learning_rate": 7.750039046637303e-05, + "loss": 0.0854, + "step": 53820 + }, + { + "epoch": 15.14, + "learning_rate": 7.748164808046732e-05, + "loss": 0.0827, + "step": 53850 + }, + { + "epoch": 15.15, + "learning_rate": 7.746290569456158e-05, + "loss": 0.0835, + "step": 53880 + }, + { + "epoch": 15.16, + "learning_rate": 7.744416330865586e-05, + "loss": 0.0916, + "step": 53910 + }, + { + "epoch": 15.16, + "learning_rate": 7.742542092275013e-05, + "loss": 0.0763, + "step": 53940 + }, + { + "epoch": 15.17, + "learning_rate": 7.740667853684441e-05, + "loss": 0.0874, + "step": 53970 + }, + { + "epoch": 15.18, + "learning_rate": 7.738793615093869e-05, + "loss": 0.0863, + "step": 54000 + }, + { + "epoch": 15.19, + "learning_rate": 7.736919376503296e-05, + "loss": 0.0826, + "step": 54030 + }, + { + "epoch": 15.2, + "learning_rate": 7.735045137912723e-05, + "loss": 0.0904, + "step": 54060 + }, + { + "epoch": 15.21, + "learning_rate": 7.733170899322151e-05, + "loss": 0.0751, + "step": 54090 + }, + { + "epoch": 15.22, + "learning_rate": 7.731296660731579e-05, + "loss": 0.0875, + "step": 54120 + }, + { + "epoch": 15.22, + "learning_rate": 7.729422422141006e-05, + "loss": 0.0827, + "step": 54150 + }, + { + "epoch": 15.23, + "learning_rate": 7.727548183550432e-05, + "loss": 0.0795, + "step": 54180 + }, + { + "epoch": 15.24, + "learning_rate": 7.72567394495986e-05, + "loss": 0.098, + "step": 54210 + }, + { + "epoch": 15.25, + "learning_rate": 7.723799706369289e-05, + "loss": 0.0755, + "step": 54240 + }, + { + "epoch": 15.26, + "learning_rate": 7.721925467778715e-05, + "loss": 0.0872, + "step": 54270 + }, + { + "epoch": 15.27, + "learning_rate": 7.720051229188142e-05, + "loss": 0.0763, + "step": 54300 + }, + { + "epoch": 15.27, + "learning_rate": 7.71817699059757e-05, + "loss": 0.0825, + "step": 54330 + }, + { + "epoch": 15.28, + "learning_rate": 7.716302752006997e-05, + "loss": 0.0878, + "step": 54360 + }, + { + "epoch": 15.29, + "learning_rate": 7.714428513416425e-05, + "loss": 0.0728, + "step": 54390 + }, + { + "epoch": 15.3, + "learning_rate": 7.712554274825853e-05, + "loss": 0.0811, + "step": 54420 + }, + { + "epoch": 15.31, + "learning_rate": 7.71068003623528e-05, + "loss": 0.0822, + "step": 54450 + }, + { + "epoch": 15.32, + "learning_rate": 7.708805797644707e-05, + "loss": 0.0817, + "step": 54480 + }, + { + "epoch": 15.32, + "learning_rate": 7.706931559054135e-05, + "loss": 0.0834, + "step": 54510 + }, + { + "epoch": 15.33, + "learning_rate": 7.705057320463563e-05, + "loss": 0.069, + "step": 54540 + }, + { + "epoch": 15.34, + "learning_rate": 7.70318308187299e-05, + "loss": 0.0891, + "step": 54570 + }, + { + "epoch": 15.35, + "learning_rate": 7.701308843282416e-05, + "loss": 0.084, + "step": 54600 + }, + { + "epoch": 15.36, + "learning_rate": 7.699434604691844e-05, + "loss": 0.0767, + "step": 54630 + }, + { + "epoch": 15.37, + "learning_rate": 7.697560366101272e-05, + "loss": 0.0847, + "step": 54660 + }, + { + "epoch": 15.38, + "learning_rate": 7.695686127510699e-05, + "loss": 0.072, + "step": 54690 + }, + { + "epoch": 15.38, + "learning_rate": 7.693811888920126e-05, + "loss": 0.0833, + "step": 54720 + }, + { + "epoch": 15.39, + "learning_rate": 7.691937650329554e-05, + "loss": 0.0797, + "step": 54750 + }, + { + "epoch": 15.4, + "learning_rate": 7.690063411738981e-05, + "loss": 0.0854, + "step": 54780 + }, + { + "epoch": 15.41, + "learning_rate": 7.688189173148409e-05, + "loss": 0.0862, + "step": 54810 + }, + { + "epoch": 15.42, + "learning_rate": 7.686314934557837e-05, + "loss": 0.075, + "step": 54840 + }, + { + "epoch": 15.43, + "learning_rate": 7.684440695967264e-05, + "loss": 0.0875, + "step": 54870 + }, + { + "epoch": 15.43, + "learning_rate": 7.68256645737669e-05, + "loss": 0.0819, + "step": 54900 + }, + { + "epoch": 15.44, + "learning_rate": 7.680692218786119e-05, + "loss": 0.0798, + "step": 54930 + }, + { + "epoch": 15.45, + "learning_rate": 7.678817980195547e-05, + "loss": 0.0926, + "step": 54960 + }, + { + "epoch": 15.46, + "learning_rate": 7.676943741604973e-05, + "loss": 0.068, + "step": 54990 + }, + { + "epoch": 15.47, + "learning_rate": 7.6750695030144e-05, + "loss": 0.0866, + "step": 55020 + }, + { + "epoch": 15.48, + "learning_rate": 7.673195264423828e-05, + "loss": 0.0796, + "step": 55050 + }, + { + "epoch": 15.48, + "learning_rate": 7.671321025833256e-05, + "loss": 0.0793, + "step": 55080 + }, + { + "epoch": 15.49, + "learning_rate": 7.669446787242683e-05, + "loss": 0.0862, + "step": 55110 + }, + { + "epoch": 15.5, + "learning_rate": 7.66757254865211e-05, + "loss": 0.0715, + "step": 55140 + }, + { + "epoch": 15.51, + "learning_rate": 7.665698310061538e-05, + "loss": 0.0907, + "step": 55170 + }, + { + "epoch": 15.52, + "learning_rate": 7.663824071470965e-05, + "loss": 0.0794, + "step": 55200 + }, + { + "epoch": 15.53, + "learning_rate": 7.661949832880393e-05, + "loss": 0.0794, + "step": 55230 + }, + { + "epoch": 15.54, + "learning_rate": 7.660075594289821e-05, + "loss": 0.0878, + "step": 55260 + }, + { + "epoch": 15.54, + "learning_rate": 7.658201355699248e-05, + "loss": 0.0693, + "step": 55290 + }, + { + "epoch": 15.55, + "learning_rate": 7.656327117108674e-05, + "loss": 0.0834, + "step": 55320 + }, + { + "epoch": 15.56, + "learning_rate": 7.654452878518102e-05, + "loss": 0.0798, + "step": 55350 + }, + { + "epoch": 15.57, + "learning_rate": 7.65257863992753e-05, + "loss": 0.0784, + "step": 55380 + }, + { + "epoch": 15.58, + "learning_rate": 7.650704401336957e-05, + "loss": 0.0943, + "step": 55410 + }, + { + "epoch": 15.59, + "learning_rate": 7.648830162746384e-05, + "loss": 0.079, + "step": 55440 + }, + { + "epoch": 15.59, + "learning_rate": 7.646955924155812e-05, + "loss": 0.0829, + "step": 55470 + }, + { + "epoch": 15.6, + "learning_rate": 7.64508168556524e-05, + "loss": 0.0832, + "step": 55500 + }, + { + "epoch": 15.61, + "learning_rate": 7.643207446974667e-05, + "loss": 0.0839, + "step": 55530 + }, + { + "epoch": 15.62, + "learning_rate": 7.641333208384094e-05, + "loss": 0.0917, + "step": 55560 + }, + { + "epoch": 15.63, + "learning_rate": 7.639458969793522e-05, + "loss": 0.0779, + "step": 55590 + }, + { + "epoch": 15.64, + "learning_rate": 7.637584731202949e-05, + "loss": 0.0846, + "step": 55620 + }, + { + "epoch": 15.65, + "learning_rate": 7.635710492612377e-05, + "loss": 0.079, + "step": 55650 + }, + { + "epoch": 15.65, + "learning_rate": 7.633836254021805e-05, + "loss": 0.0813, + "step": 55680 + }, + { + "epoch": 15.66, + "learning_rate": 7.631962015431231e-05, + "loss": 0.0871, + "step": 55710 + }, + { + "epoch": 15.67, + "learning_rate": 7.630087776840658e-05, + "loss": 0.0716, + "step": 55740 + }, + { + "epoch": 15.68, + "learning_rate": 7.628213538250086e-05, + "loss": 0.0888, + "step": 55770 + }, + { + "epoch": 15.69, + "learning_rate": 7.626339299659514e-05, + "loss": 0.0843, + "step": 55800 + }, + { + "epoch": 15.7, + "learning_rate": 7.624465061068941e-05, + "loss": 0.0837, + "step": 55830 + }, + { + "epoch": 15.7, + "learning_rate": 7.622590822478368e-05, + "loss": 0.0913, + "step": 55860 + }, + { + "epoch": 15.71, + "learning_rate": 7.620716583887796e-05, + "loss": 0.0767, + "step": 55890 + }, + { + "epoch": 15.72, + "learning_rate": 7.618842345297224e-05, + "loss": 0.0822, + "step": 55920 + }, + { + "epoch": 15.73, + "learning_rate": 7.616968106706651e-05, + "loss": 0.0824, + "step": 55950 + }, + { + "epoch": 15.74, + "learning_rate": 7.615093868116078e-05, + "loss": 0.0802, + "step": 55980 + }, + { + "epoch": 15.75, + "learning_rate": 7.613219629525506e-05, + "loss": 0.0896, + "step": 56010 + }, + { + "epoch": 15.75, + "learning_rate": 7.611345390934932e-05, + "loss": 0.0744, + "step": 56040 + }, + { + "epoch": 15.76, + "learning_rate": 7.60947115234436e-05, + "loss": 0.0874, + "step": 56070 + }, + { + "epoch": 15.77, + "learning_rate": 7.607596913753789e-05, + "loss": 0.0843, + "step": 56100 + }, + { + "epoch": 15.78, + "learning_rate": 7.605722675163215e-05, + "loss": 0.0824, + "step": 56130 + }, + { + "epoch": 15.79, + "learning_rate": 7.603848436572642e-05, + "loss": 0.0829, + "step": 56160 + }, + { + "epoch": 15.8, + "learning_rate": 7.60197419798207e-05, + "loss": 0.0741, + "step": 56190 + }, + { + "epoch": 15.81, + "learning_rate": 7.600099959391498e-05, + "loss": 0.0848, + "step": 56220 + }, + { + "epoch": 15.81, + "learning_rate": 7.598225720800925e-05, + "loss": 0.0778, + "step": 56250 + }, + { + "epoch": 15.82, + "learning_rate": 7.596351482210352e-05, + "loss": 0.0817, + "step": 56280 + }, + { + "epoch": 15.83, + "learning_rate": 7.59447724361978e-05, + "loss": 0.0897, + "step": 56310 + }, + { + "epoch": 15.84, + "learning_rate": 7.592603005029208e-05, + "loss": 0.0732, + "step": 56340 + }, + { + "epoch": 15.85, + "learning_rate": 7.590728766438635e-05, + "loss": 0.0873, + "step": 56370 + }, + { + "epoch": 15.86, + "learning_rate": 7.588854527848061e-05, + "loss": 0.0847, + "step": 56400 + }, + { + "epoch": 15.86, + "learning_rate": 7.58698028925749e-05, + "loss": 0.0816, + "step": 56430 + }, + { + "epoch": 15.87, + "learning_rate": 7.585168525286602e-05, + "loss": 0.093, + "step": 56460 + }, + { + "epoch": 15.88, + "learning_rate": 7.58329428669603e-05, + "loss": 0.0765, + "step": 56490 + }, + { + "epoch": 15.89, + "learning_rate": 7.581420048105457e-05, + "loss": 0.0946, + "step": 56520 + }, + { + "epoch": 15.9, + "learning_rate": 7.579545809514885e-05, + "loss": 0.0853, + "step": 56550 + }, + { + "epoch": 15.91, + "learning_rate": 7.577671570924313e-05, + "loss": 0.0813, + "step": 56580 + }, + { + "epoch": 15.91, + "learning_rate": 7.57579733233374e-05, + "loss": 0.0905, + "step": 56610 + }, + { + "epoch": 15.92, + "learning_rate": 7.573923093743167e-05, + "loss": 0.075, + "step": 56640 + }, + { + "epoch": 15.93, + "learning_rate": 7.572048855152595e-05, + "loss": 0.0863, + "step": 56670 + }, + { + "epoch": 15.94, + "learning_rate": 7.570174616562023e-05, + "loss": 0.0818, + "step": 56700 + }, + { + "epoch": 15.95, + "learning_rate": 7.568300377971448e-05, + "loss": 0.0797, + "step": 56730 + }, + { + "epoch": 15.96, + "learning_rate": 7.566426139380876e-05, + "loss": 0.0891, + "step": 56760 + }, + { + "epoch": 15.97, + "learning_rate": 7.564551900790305e-05, + "loss": 0.0777, + "step": 56790 + }, + { + "epoch": 15.97, + "learning_rate": 7.562677662199731e-05, + "loss": 0.0888, + "step": 56820 + }, + { + "epoch": 15.98, + "learning_rate": 7.56080342360916e-05, + "loss": 0.084, + "step": 56850 + }, + { + "epoch": 15.99, + "learning_rate": 7.558929185018586e-05, + "loss": 0.0817, + "step": 56880 + }, + { + "epoch": 16.0, + "learning_rate": 7.557054946428014e-05, + "loss": 0.0865, + "step": 56910 + }, + { + "epoch": 16.0, + "eval_loss": 0.11335010826587677, + "eval_runtime": 631.0736, + "eval_samples_per_second": 25.406, + "eval_steps_per_second": 0.795, + "eval_wer": 0.10965840077518321, + "step": 56912 + }, + { + "epoch": 16.01, + "learning_rate": 7.555180707837441e-05, + "loss": 0.0725, + "step": 56940 + }, + { + "epoch": 16.02, + "learning_rate": 7.553306469246869e-05, + "loss": 0.0876, + "step": 56970 + }, + { + "epoch": 16.02, + "learning_rate": 7.551432230656297e-05, + "loss": 0.0761, + "step": 57000 + }, + { + "epoch": 16.03, + "learning_rate": 7.549557992065724e-05, + "loss": 0.0835, + "step": 57030 + }, + { + "epoch": 16.04, + "learning_rate": 7.54768375347515e-05, + "loss": 0.0822, + "step": 57060 + }, + { + "epoch": 16.05, + "learning_rate": 7.545809514884579e-05, + "loss": 0.0788, + "step": 57090 + }, + { + "epoch": 16.06, + "learning_rate": 7.543935276294007e-05, + "loss": 0.0917, + "step": 57120 + }, + { + "epoch": 16.07, + "learning_rate": 7.542061037703432e-05, + "loss": 0.0746, + "step": 57150 + }, + { + "epoch": 16.08, + "learning_rate": 7.54018679911286e-05, + "loss": 0.0875, + "step": 57180 + }, + { + "epoch": 16.08, + "learning_rate": 7.538312560522288e-05, + "loss": 0.0808, + "step": 57210 + }, + { + "epoch": 16.09, + "learning_rate": 7.536438321931715e-05, + "loss": 0.0729, + "step": 57240 + }, + { + "epoch": 16.1, + "learning_rate": 7.534564083341143e-05, + "loss": 0.0799, + "step": 57270 + }, + { + "epoch": 16.11, + "learning_rate": 7.53268984475057e-05, + "loss": 0.0743, + "step": 57300 + }, + { + "epoch": 16.12, + "learning_rate": 7.530815606159998e-05, + "loss": 0.0852, + "step": 57330 + }, + { + "epoch": 16.13, + "learning_rate": 7.528941367569425e-05, + "loss": 0.0868, + "step": 57360 + }, + { + "epoch": 16.13, + "learning_rate": 7.527067128978853e-05, + "loss": 0.0761, + "step": 57390 + }, + { + "epoch": 16.14, + "learning_rate": 7.52519289038828e-05, + "loss": 0.0889, + "step": 57420 + }, + { + "epoch": 16.15, + "learning_rate": 7.523318651797708e-05, + "loss": 0.0749, + "step": 57450 + }, + { + "epoch": 16.16, + "learning_rate": 7.521444413207135e-05, + "loss": 0.0825, + "step": 57480 + }, + { + "epoch": 16.17, + "learning_rate": 7.519570174616563e-05, + "loss": 0.0816, + "step": 57510 + }, + { + "epoch": 16.18, + "learning_rate": 7.517695936025991e-05, + "loss": 0.0757, + "step": 57540 + }, + { + "epoch": 16.18, + "learning_rate": 7.515821697435416e-05, + "loss": 0.0887, + "step": 57570 + }, + { + "epoch": 16.19, + "learning_rate": 7.513947458844844e-05, + "loss": 0.0732, + "step": 57600 + }, + { + "epoch": 16.2, + "learning_rate": 7.512073220254272e-05, + "loss": 0.0765, + "step": 57630 + }, + { + "epoch": 16.21, + "learning_rate": 7.510198981663699e-05, + "loss": 0.0843, + "step": 57660 + }, + { + "epoch": 16.22, + "learning_rate": 7.508324743073127e-05, + "loss": 0.0758, + "step": 57690 + }, + { + "epoch": 16.23, + "learning_rate": 7.506450504482554e-05, + "loss": 0.0916, + "step": 57720 + }, + { + "epoch": 16.24, + "learning_rate": 7.504576265891982e-05, + "loss": 0.0736, + "step": 57750 + }, + { + "epoch": 16.24, + "learning_rate": 7.502702027301409e-05, + "loss": 0.0851, + "step": 57780 + }, + { + "epoch": 16.25, + "learning_rate": 7.500827788710837e-05, + "loss": 0.0807, + "step": 57810 + }, + { + "epoch": 16.26, + "learning_rate": 7.498953550120264e-05, + "loss": 0.0731, + "step": 57840 + }, + { + "epoch": 16.27, + "learning_rate": 7.497079311529692e-05, + "loss": 0.0856, + "step": 57870 + }, + { + "epoch": 16.28, + "learning_rate": 7.495205072939118e-05, + "loss": 0.0746, + "step": 57900 + }, + { + "epoch": 16.29, + "learning_rate": 7.493330834348547e-05, + "loss": 0.0786, + "step": 57930 + }, + { + "epoch": 16.29, + "learning_rate": 7.491456595757975e-05, + "loss": 0.0825, + "step": 57960 + }, + { + "epoch": 16.3, + "learning_rate": 7.4895823571674e-05, + "loss": 0.0801, + "step": 57990 + }, + { + "epoch": 16.31, + "learning_rate": 7.487708118576828e-05, + "loss": 0.0861, + "step": 58020 + }, + { + "epoch": 16.32, + "learning_rate": 7.485833879986256e-05, + "loss": 0.073, + "step": 58050 + }, + { + "epoch": 16.33, + "learning_rate": 7.483959641395684e-05, + "loss": 0.0867, + "step": 58080 + }, + { + "epoch": 16.34, + "learning_rate": 7.482085402805111e-05, + "loss": 0.0837, + "step": 58110 + }, + { + "epoch": 16.35, + "learning_rate": 7.480211164214538e-05, + "loss": 0.0742, + "step": 58140 + }, + { + "epoch": 16.35, + "learning_rate": 7.478336925623966e-05, + "loss": 0.0841, + "step": 58170 + }, + { + "epoch": 16.36, + "learning_rate": 7.476462687033393e-05, + "loss": 0.076, + "step": 58200 + }, + { + "epoch": 16.37, + "learning_rate": 7.474588448442821e-05, + "loss": 0.0824, + "step": 58230 + }, + { + "epoch": 16.38, + "learning_rate": 7.472714209852247e-05, + "loss": 0.0785, + "step": 58260 + }, + { + "epoch": 16.39, + "learning_rate": 7.470839971261676e-05, + "loss": 0.0758, + "step": 58290 + }, + { + "epoch": 16.4, + "learning_rate": 7.468965732671102e-05, + "loss": 0.0863, + "step": 58320 + }, + { + "epoch": 16.4, + "learning_rate": 7.46709149408053e-05, + "loss": 0.0778, + "step": 58350 + }, + { + "epoch": 16.41, + "learning_rate": 7.465217255489958e-05, + "loss": 0.0795, + "step": 58380 + }, + { + "epoch": 16.42, + "learning_rate": 7.463343016899385e-05, + "loss": 0.0839, + "step": 58410 + }, + { + "epoch": 16.43, + "learning_rate": 7.461468778308812e-05, + "loss": 0.0761, + "step": 58440 + }, + { + "epoch": 16.44, + "learning_rate": 7.45959453971824e-05, + "loss": 0.0846, + "step": 58470 + }, + { + "epoch": 16.45, + "learning_rate": 7.457720301127668e-05, + "loss": 0.0739, + "step": 58500 + }, + { + "epoch": 16.45, + "learning_rate": 7.455846062537095e-05, + "loss": 0.088, + "step": 58530 + }, + { + "epoch": 16.46, + "learning_rate": 7.454034298566208e-05, + "loss": 0.0839, + "step": 58560 + }, + { + "epoch": 16.47, + "learning_rate": 7.452160059975634e-05, + "loss": 0.0762, + "step": 58590 + }, + { + "epoch": 16.48, + "learning_rate": 7.450285821385062e-05, + "loss": 0.0822, + "step": 58620 + }, + { + "epoch": 16.49, + "learning_rate": 7.44841158279449e-05, + "loss": 0.0745, + "step": 58650 + }, + { + "epoch": 16.5, + "learning_rate": 7.446537344203917e-05, + "loss": 0.0805, + "step": 58680 + }, + { + "epoch": 16.51, + "learning_rate": 7.444663105613345e-05, + "loss": 0.0806, + "step": 58710 + }, + { + "epoch": 16.51, + "learning_rate": 7.442788867022772e-05, + "loss": 0.0756, + "step": 58740 + }, + { + "epoch": 16.52, + "learning_rate": 7.440914628432199e-05, + "loss": 0.0866, + "step": 58770 + }, + { + "epoch": 16.53, + "learning_rate": 7.439040389841627e-05, + "loss": 0.0762, + "step": 58800 + }, + { + "epoch": 16.54, + "learning_rate": 7.437166151251055e-05, + "loss": 0.0832, + "step": 58830 + }, + { + "epoch": 16.55, + "learning_rate": 7.435291912660483e-05, + "loss": 0.0779, + "step": 58860 + }, + { + "epoch": 16.56, + "learning_rate": 7.433417674069909e-05, + "loss": 0.0738, + "step": 58890 + }, + { + "epoch": 16.56, + "learning_rate": 7.431543435479337e-05, + "loss": 0.0825, + "step": 58920 + }, + { + "epoch": 16.57, + "learning_rate": 7.429669196888765e-05, + "loss": 0.0772, + "step": 58950 + }, + { + "epoch": 16.58, + "learning_rate": 7.427794958298191e-05, + "loss": 0.0841, + "step": 58980 + }, + { + "epoch": 16.59, + "learning_rate": 7.425920719707618e-05, + "loss": 0.084, + "step": 59010 + }, + { + "epoch": 16.6, + "learning_rate": 7.424046481117046e-05, + "loss": 0.0756, + "step": 59040 + }, + { + "epoch": 16.61, + "learning_rate": 7.422172242526474e-05, + "loss": 0.0815, + "step": 59070 + }, + { + "epoch": 16.62, + "learning_rate": 7.420298003935901e-05, + "loss": 0.0771, + "step": 59100 + }, + { + "epoch": 16.62, + "learning_rate": 7.418423765345329e-05, + "loss": 0.0805, + "step": 59130 + }, + { + "epoch": 16.63, + "learning_rate": 7.416549526754756e-05, + "loss": 0.083, + "step": 59160 + }, + { + "epoch": 16.64, + "learning_rate": 7.414675288164184e-05, + "loss": 0.0782, + "step": 59190 + }, + { + "epoch": 16.65, + "learning_rate": 7.412801049573611e-05, + "loss": 0.0888, + "step": 59220 + }, + { + "epoch": 16.66, + "learning_rate": 7.410926810983039e-05, + "loss": 0.0732, + "step": 59250 + }, + { + "epoch": 16.67, + "learning_rate": 7.409052572392467e-05, + "loss": 0.081, + "step": 59280 + }, + { + "epoch": 16.67, + "learning_rate": 7.407178333801892e-05, + "loss": 0.0761, + "step": 59310 + }, + { + "epoch": 16.68, + "learning_rate": 7.40530409521132e-05, + "loss": 0.0746, + "step": 59340 + }, + { + "epoch": 16.69, + "learning_rate": 7.403429856620749e-05, + "loss": 0.0844, + "step": 59370 + }, + { + "epoch": 16.7, + "learning_rate": 7.401555618030175e-05, + "loss": 0.0739, + "step": 59400 + }, + { + "epoch": 16.71, + "learning_rate": 7.399681379439602e-05, + "loss": 0.0863, + "step": 59430 + }, + { + "epoch": 16.72, + "learning_rate": 7.39780714084903e-05, + "loss": 0.0837, + "step": 59460 + }, + { + "epoch": 16.72, + "learning_rate": 7.395932902258458e-05, + "loss": 0.0738, + "step": 59490 + }, + { + "epoch": 16.73, + "learning_rate": 7.394058663667885e-05, + "loss": 0.085, + "step": 59520 + }, + { + "epoch": 16.74, + "learning_rate": 7.392184425077313e-05, + "loss": 0.0736, + "step": 59550 + }, + { + "epoch": 16.75, + "learning_rate": 7.39031018648674e-05, + "loss": 0.0792, + "step": 59580 + }, + { + "epoch": 16.76, + "learning_rate": 7.388435947896168e-05, + "loss": 0.0807, + "step": 59610 + }, + { + "epoch": 16.77, + "learning_rate": 7.386561709305595e-05, + "loss": 0.0703, + "step": 59640 + }, + { + "epoch": 16.78, + "learning_rate": 7.384687470715023e-05, + "loss": 0.0869, + "step": 59670 + }, + { + "epoch": 16.78, + "learning_rate": 7.382813232124451e-05, + "loss": 0.0718, + "step": 59700 + }, + { + "epoch": 16.79, + "learning_rate": 7.380938993533876e-05, + "loss": 0.0829, + "step": 59730 + }, + { + "epoch": 16.8, + "learning_rate": 7.379064754943304e-05, + "loss": 0.0795, + "step": 59760 + }, + { + "epoch": 16.81, + "learning_rate": 7.377190516352732e-05, + "loss": 0.0728, + "step": 59790 + }, + { + "epoch": 16.82, + "learning_rate": 7.375316277762159e-05, + "loss": 0.0846, + "step": 59820 + }, + { + "epoch": 16.83, + "learning_rate": 7.373442039171586e-05, + "loss": 0.0729, + "step": 59850 + }, + { + "epoch": 16.83, + "learning_rate": 7.371567800581014e-05, + "loss": 0.0789, + "step": 59880 + }, + { + "epoch": 16.84, + "learning_rate": 7.369693561990442e-05, + "loss": 0.0832, + "step": 59910 + }, + { + "epoch": 16.85, + "learning_rate": 7.367819323399869e-05, + "loss": 0.0723, + "step": 59940 + }, + { + "epoch": 16.86, + "learning_rate": 7.365945084809297e-05, + "loss": 0.0783, + "step": 59970 + }, + { + "epoch": 16.87, + "learning_rate": 7.364070846218724e-05, + "loss": 0.0742, + "step": 60000 + }, + { + "epoch": 16.88, + "learning_rate": 7.362196607628152e-05, + "loss": 0.0792, + "step": 60030 + }, + { + "epoch": 16.88, + "learning_rate": 7.360322369037579e-05, + "loss": 0.0826, + "step": 60060 + }, + { + "epoch": 16.89, + "learning_rate": 7.358448130447007e-05, + "loss": 0.0771, + "step": 60090 + }, + { + "epoch": 16.9, + "learning_rate": 7.356573891856435e-05, + "loss": 0.0814, + "step": 60120 + }, + { + "epoch": 16.91, + "learning_rate": 7.35469965326586e-05, + "loss": 0.0756, + "step": 60150 + }, + { + "epoch": 16.92, + "learning_rate": 7.352825414675288e-05, + "loss": 0.0816, + "step": 60180 + }, + { + "epoch": 16.93, + "learning_rate": 7.350951176084716e-05, + "loss": 0.0811, + "step": 60210 + }, + { + "epoch": 16.94, + "learning_rate": 7.349076937494143e-05, + "loss": 0.0722, + "step": 60240 + }, + { + "epoch": 16.94, + "learning_rate": 7.34720269890357e-05, + "loss": 0.0808, + "step": 60270 + }, + { + "epoch": 16.95, + "learning_rate": 7.345328460312998e-05, + "loss": 0.0714, + "step": 60300 + }, + { + "epoch": 16.96, + "learning_rate": 7.343454221722426e-05, + "loss": 0.0755, + "step": 60330 + }, + { + "epoch": 16.97, + "learning_rate": 7.341579983131853e-05, + "loss": 0.0794, + "step": 60360 + }, + { + "epoch": 16.98, + "learning_rate": 7.339705744541281e-05, + "loss": 0.0736, + "step": 60390 + }, + { + "epoch": 16.99, + "learning_rate": 7.337831505950708e-05, + "loss": 0.0825, + "step": 60420 + }, + { + "epoch": 16.99, + "learning_rate": 7.335957267360136e-05, + "loss": 0.0701, + "step": 60450 + }, + { + "epoch": 17.0, + "eval_loss": 0.1095786765217781, + "eval_runtime": 631.7392, + "eval_samples_per_second": 25.379, + "eval_steps_per_second": 0.795, + "eval_wer": 0.1054412948835178, + "step": 60469 + }, + { + "epoch": 17.0, + "learning_rate": 7.334083028769562e-05, + "loss": 0.0849, + "step": 60480 + }, + { + "epoch": 17.01, + "learning_rate": 7.33220879017899e-05, + "loss": 0.073, + "step": 60510 + }, + { + "epoch": 17.02, + "learning_rate": 7.330334551588419e-05, + "loss": 0.0751, + "step": 60540 + }, + { + "epoch": 17.03, + "learning_rate": 7.328522787617531e-05, + "loss": 0.0886, + "step": 60570 + }, + { + "epoch": 17.04, + "learning_rate": 7.326648549026958e-05, + "loss": 0.0696, + "step": 60600 + }, + { + "epoch": 17.05, + "learning_rate": 7.324774310436385e-05, + "loss": 0.0775, + "step": 60630 + }, + { + "epoch": 17.05, + "learning_rate": 7.322900071845813e-05, + "loss": 0.075, + "step": 60660 + }, + { + "epoch": 17.06, + "learning_rate": 7.321025833255241e-05, + "loss": 0.0763, + "step": 60690 + }, + { + "epoch": 17.07, + "learning_rate": 7.319151594664668e-05, + "loss": 0.0847, + "step": 60720 + }, + { + "epoch": 17.08, + "learning_rate": 7.317277356074095e-05, + "loss": 0.0705, + "step": 60750 + }, + { + "epoch": 17.09, + "learning_rate": 7.315403117483523e-05, + "loss": 0.0852, + "step": 60780 + }, + { + "epoch": 17.1, + "learning_rate": 7.313528878892951e-05, + "loss": 0.0728, + "step": 60810 + }, + { + "epoch": 17.1, + "learning_rate": 7.311654640302377e-05, + "loss": 0.0773, + "step": 60840 + }, + { + "epoch": 17.11, + "learning_rate": 7.309780401711806e-05, + "loss": 0.0868, + "step": 60870 + }, + { + "epoch": 17.12, + "learning_rate": 7.307906163121232e-05, + "loss": 0.0669, + "step": 60900 + }, + { + "epoch": 17.13, + "learning_rate": 7.306031924530659e-05, + "loss": 0.0827, + "step": 60930 + }, + { + "epoch": 17.14, + "learning_rate": 7.304157685940087e-05, + "loss": 0.0748, + "step": 60960 + }, + { + "epoch": 17.15, + "learning_rate": 7.302283447349515e-05, + "loss": 0.0782, + "step": 60990 + }, + { + "epoch": 17.15, + "learning_rate": 7.300409208758942e-05, + "loss": 0.0853, + "step": 61020 + }, + { + "epoch": 17.16, + "learning_rate": 7.298534970168369e-05, + "loss": 0.0705, + "step": 61050 + }, + { + "epoch": 17.17, + "learning_rate": 7.296660731577797e-05, + "loss": 0.0813, + "step": 61080 + }, + { + "epoch": 17.18, + "learning_rate": 7.294786492987225e-05, + "loss": 0.0703, + "step": 61110 + }, + { + "epoch": 17.19, + "learning_rate": 7.292912254396652e-05, + "loss": 0.0765, + "step": 61140 + }, + { + "epoch": 17.2, + "learning_rate": 7.291038015806078e-05, + "loss": 0.0864, + "step": 61170 + }, + { + "epoch": 17.21, + "learning_rate": 7.289163777215507e-05, + "loss": 0.0637, + "step": 61200 + }, + { + "epoch": 17.21, + "learning_rate": 7.287289538624935e-05, + "loss": 0.0846, + "step": 61230 + }, + { + "epoch": 17.22, + "learning_rate": 7.285415300034361e-05, + "loss": 0.0713, + "step": 61260 + }, + { + "epoch": 17.23, + "learning_rate": 7.28354106144379e-05, + "loss": 0.0796, + "step": 61290 + }, + { + "epoch": 17.24, + "learning_rate": 7.281666822853216e-05, + "loss": 0.0836, + "step": 61320 + }, + { + "epoch": 17.25, + "learning_rate": 7.279792584262643e-05, + "loss": 0.071, + "step": 61350 + }, + { + "epoch": 17.26, + "learning_rate": 7.277918345672071e-05, + "loss": 0.0842, + "step": 61380 + }, + { + "epoch": 17.26, + "learning_rate": 7.276044107081499e-05, + "loss": 0.0715, + "step": 61410 + }, + { + "epoch": 17.27, + "learning_rate": 7.274169868490926e-05, + "loss": 0.0776, + "step": 61440 + }, + { + "epoch": 17.28, + "learning_rate": 7.272295629900353e-05, + "loss": 0.0912, + "step": 61470 + }, + { + "epoch": 17.29, + "learning_rate": 7.270421391309781e-05, + "loss": 0.0693, + "step": 61500 + }, + { + "epoch": 17.3, + "learning_rate": 7.268547152719209e-05, + "loss": 0.0826, + "step": 61530 + }, + { + "epoch": 17.31, + "learning_rate": 7.266672914128636e-05, + "loss": 0.071, + "step": 61560 + }, + { + "epoch": 17.32, + "learning_rate": 7.264798675538062e-05, + "loss": 0.0761, + "step": 61590 + }, + { + "epoch": 17.32, + "learning_rate": 7.26292443694749e-05, + "loss": 0.0866, + "step": 61620 + }, + { + "epoch": 17.33, + "learning_rate": 7.261050198356918e-05, + "loss": 0.0686, + "step": 61650 + }, + { + "epoch": 17.34, + "learning_rate": 7.259175959766345e-05, + "loss": 0.0813, + "step": 61680 + }, + { + "epoch": 17.35, + "learning_rate": 7.257301721175773e-05, + "loss": 0.0735, + "step": 61710 + }, + { + "epoch": 17.36, + "learning_rate": 7.2554274825852e-05, + "loss": 0.0763, + "step": 61740 + }, + { + "epoch": 17.37, + "learning_rate": 7.253553243994627e-05, + "loss": 0.0875, + "step": 61770 + }, + { + "epoch": 17.37, + "learning_rate": 7.251679005404055e-05, + "loss": 0.0685, + "step": 61800 + }, + { + "epoch": 17.38, + "learning_rate": 7.249804766813483e-05, + "loss": 0.083, + "step": 61830 + }, + { + "epoch": 17.39, + "learning_rate": 7.24793052822291e-05, + "loss": 0.0742, + "step": 61860 + }, + { + "epoch": 17.4, + "learning_rate": 7.246056289632336e-05, + "loss": 0.0777, + "step": 61890 + }, + { + "epoch": 17.41, + "learning_rate": 7.244182051041765e-05, + "loss": 0.0847, + "step": 61920 + }, + { + "epoch": 17.42, + "learning_rate": 7.242307812451193e-05, + "loss": 0.0699, + "step": 61950 + }, + { + "epoch": 17.42, + "learning_rate": 7.24043357386062e-05, + "loss": 0.0814, + "step": 61980 + }, + { + "epoch": 17.43, + "learning_rate": 7.238559335270046e-05, + "loss": 0.0703, + "step": 62010 + }, + { + "epoch": 17.44, + "learning_rate": 7.236685096679474e-05, + "loss": 0.0774, + "step": 62040 + }, + { + "epoch": 17.45, + "learning_rate": 7.234810858088902e-05, + "loss": 0.0904, + "step": 62070 + }, + { + "epoch": 17.46, + "learning_rate": 7.232936619498329e-05, + "loss": 0.0735, + "step": 62100 + }, + { + "epoch": 17.47, + "learning_rate": 7.231062380907757e-05, + "loss": 0.0807, + "step": 62130 + }, + { + "epoch": 17.48, + "learning_rate": 7.229188142317184e-05, + "loss": 0.0728, + "step": 62160 + }, + { + "epoch": 17.48, + "learning_rate": 7.22731390372661e-05, + "loss": 0.0834, + "step": 62190 + }, + { + "epoch": 17.49, + "learning_rate": 7.225439665136039e-05, + "loss": 0.0892, + "step": 62220 + }, + { + "epoch": 17.5, + "learning_rate": 7.223565426545467e-05, + "loss": 0.0714, + "step": 62250 + }, + { + "epoch": 17.51, + "learning_rate": 7.221691187954894e-05, + "loss": 0.0876, + "step": 62280 + }, + { + "epoch": 17.52, + "learning_rate": 7.21981694936432e-05, + "loss": 0.0767, + "step": 62310 + }, + { + "epoch": 17.53, + "learning_rate": 7.217942710773748e-05, + "loss": 0.0747, + "step": 62340 + }, + { + "epoch": 17.53, + "learning_rate": 7.216068472183177e-05, + "loss": 0.0803, + "step": 62370 + }, + { + "epoch": 17.54, + "learning_rate": 7.214194233592603e-05, + "loss": 0.069, + "step": 62400 + }, + { + "epoch": 17.55, + "learning_rate": 7.21231999500203e-05, + "loss": 0.0822, + "step": 62430 + }, + { + "epoch": 17.56, + "learning_rate": 7.210445756411458e-05, + "loss": 0.0727, + "step": 62460 + }, + { + "epoch": 17.57, + "learning_rate": 7.208571517820886e-05, + "loss": 0.075, + "step": 62490 + }, + { + "epoch": 17.58, + "learning_rate": 7.206697279230313e-05, + "loss": 0.0832, + "step": 62520 + }, + { + "epoch": 17.58, + "learning_rate": 7.20482304063974e-05, + "loss": 0.0697, + "step": 62550 + }, + { + "epoch": 17.59, + "learning_rate": 7.202948802049168e-05, + "loss": 0.0852, + "step": 62580 + }, + { + "epoch": 17.6, + "learning_rate": 7.201074563458596e-05, + "loss": 0.0754, + "step": 62610 + }, + { + "epoch": 17.61, + "learning_rate": 7.199200324868023e-05, + "loss": 0.0752, + "step": 62640 + }, + { + "epoch": 17.62, + "learning_rate": 7.197326086277451e-05, + "loss": 0.0795, + "step": 62670 + }, + { + "epoch": 17.63, + "learning_rate": 7.195514322306563e-05, + "loss": 0.071, + "step": 62700 + }, + { + "epoch": 17.64, + "learning_rate": 7.193640083715992e-05, + "loss": 0.0865, + "step": 62730 + }, + { + "epoch": 17.64, + "learning_rate": 7.191765845125418e-05, + "loss": 0.0715, + "step": 62760 + }, + { + "epoch": 17.65, + "learning_rate": 7.189891606534845e-05, + "loss": 0.0827, + "step": 62790 + }, + { + "epoch": 17.66, + "learning_rate": 7.188017367944273e-05, + "loss": 0.0856, + "step": 62820 + }, + { + "epoch": 17.67, + "learning_rate": 7.186143129353701e-05, + "loss": 0.0703, + "step": 62850 + }, + { + "epoch": 17.68, + "learning_rate": 7.184331365382814e-05, + "loss": 0.083, + "step": 62880 + }, + { + "epoch": 17.69, + "learning_rate": 7.182457126792241e-05, + "loss": 0.0741, + "step": 62910 + }, + { + "epoch": 17.69, + "learning_rate": 7.180582888201667e-05, + "loss": 0.0774, + "step": 62940 + }, + { + "epoch": 17.7, + "learning_rate": 7.178708649611096e-05, + "loss": 0.085, + "step": 62970 + }, + { + "epoch": 17.71, + "learning_rate": 7.176834411020524e-05, + "loss": 0.0715, + "step": 63000 + }, + { + "epoch": 17.72, + "learning_rate": 7.17496017242995e-05, + "loss": 0.0827, + "step": 63030 + }, + { + "epoch": 17.73, + "learning_rate": 7.173085933839378e-05, + "loss": 0.0761, + "step": 63060 + }, + { + "epoch": 17.74, + "learning_rate": 7.171211695248805e-05, + "loss": 0.0745, + "step": 63090 + }, + { + "epoch": 17.75, + "learning_rate": 7.169337456658233e-05, + "loss": 0.0882, + "step": 63120 + }, + { + "epoch": 17.75, + "learning_rate": 7.16746321806766e-05, + "loss": 0.0695, + "step": 63150 + }, + { + "epoch": 17.76, + "learning_rate": 7.165588979477088e-05, + "loss": 0.0864, + "step": 63180 + }, + { + "epoch": 17.77, + "learning_rate": 7.163714740886516e-05, + "loss": 0.0712, + "step": 63210 + }, + { + "epoch": 17.78, + "learning_rate": 7.161840502295942e-05, + "loss": 0.0758, + "step": 63240 + }, + { + "epoch": 17.79, + "learning_rate": 7.15996626370537e-05, + "loss": 0.0815, + "step": 63270 + }, + { + "epoch": 17.8, + "learning_rate": 7.158092025114798e-05, + "loss": 0.0707, + "step": 63300 + }, + { + "epoch": 17.8, + "learning_rate": 7.156217786524225e-05, + "loss": 0.0863, + "step": 63330 + }, + { + "epoch": 17.81, + "learning_rate": 7.154343547933651e-05, + "loss": 0.0762, + "step": 63360 + }, + { + "epoch": 17.82, + "learning_rate": 7.15246930934308e-05, + "loss": 0.0778, + "step": 63390 + }, + { + "epoch": 17.83, + "learning_rate": 7.150595070752508e-05, + "loss": 0.0935, + "step": 63420 + }, + { + "epoch": 17.84, + "learning_rate": 7.148720832161934e-05, + "loss": 0.0699, + "step": 63450 + }, + { + "epoch": 17.85, + "learning_rate": 7.146846593571362e-05, + "loss": 0.0895, + "step": 63480 + }, + { + "epoch": 17.85, + "learning_rate": 7.144972354980789e-05, + "loss": 0.0716, + "step": 63510 + }, + { + "epoch": 17.86, + "learning_rate": 7.143098116390217e-05, + "loss": 0.078, + "step": 63540 + }, + { + "epoch": 17.87, + "learning_rate": 7.141223877799644e-05, + "loss": 0.086, + "step": 63570 + }, + { + "epoch": 17.88, + "learning_rate": 7.139349639209072e-05, + "loss": 0.0707, + "step": 63600 + }, + { + "epoch": 17.89, + "learning_rate": 7.1374754006185e-05, + "loss": 0.0843, + "step": 63630 + }, + { + "epoch": 17.9, + "learning_rate": 7.135601162027926e-05, + "loss": 0.0736, + "step": 63660 + }, + { + "epoch": 17.91, + "learning_rate": 7.133726923437354e-05, + "loss": 0.0799, + "step": 63690 + }, + { + "epoch": 17.91, + "learning_rate": 7.131852684846782e-05, + "loss": 0.0843, + "step": 63720 + }, + { + "epoch": 17.92, + "learning_rate": 7.12997844625621e-05, + "loss": 0.0764, + "step": 63750 + }, + { + "epoch": 17.93, + "learning_rate": 7.128104207665635e-05, + "loss": 0.0853, + "step": 63780 + }, + { + "epoch": 17.94, + "learning_rate": 7.126229969075063e-05, + "loss": 0.0718, + "step": 63810 + }, + { + "epoch": 17.95, + "learning_rate": 7.124355730484491e-05, + "loss": 0.0764, + "step": 63840 + }, + { + "epoch": 17.96, + "learning_rate": 7.122481491893918e-05, + "loss": 0.0894, + "step": 63870 + }, + { + "epoch": 17.96, + "learning_rate": 7.120607253303346e-05, + "loss": 0.0675, + "step": 63900 + }, + { + "epoch": 17.97, + "learning_rate": 7.118733014712773e-05, + "loss": 0.0774, + "step": 63930 + }, + { + "epoch": 17.98, + "learning_rate": 7.116858776122201e-05, + "loss": 0.0727, + "step": 63960 + }, + { + "epoch": 17.99, + "learning_rate": 7.114984537531628e-05, + "loss": 0.0752, + "step": 63990 + }, + { + "epoch": 18.0, + "learning_rate": 7.113110298941056e-05, + "loss": 0.0891, + "step": 64020 + }, + { + "epoch": 18.0, + "eval_loss": 0.11096266657114029, + "eval_runtime": 631.8647, + "eval_samples_per_second": 25.374, + "eval_steps_per_second": 0.794, + "eval_wer": 0.10757714301311534, + "step": 64026 + }, + { + "epoch": 18.01, + "learning_rate": 7.111236060350484e-05, + "loss": 0.0713, + "step": 64050 + }, + { + "epoch": 18.02, + "learning_rate": 7.10936182175991e-05, + "loss": 0.0849, + "step": 64080 + }, + { + "epoch": 18.02, + "learning_rate": 7.107487583169337e-05, + "loss": 0.0712, + "step": 64110 + }, + { + "epoch": 18.03, + "learning_rate": 7.105613344578766e-05, + "loss": 0.084, + "step": 64140 + }, + { + "epoch": 18.04, + "learning_rate": 7.103739105988194e-05, + "loss": 0.0746, + "step": 64170 + }, + { + "epoch": 18.05, + "learning_rate": 7.101864867397619e-05, + "loss": 0.072, + "step": 64200 + }, + { + "epoch": 18.06, + "learning_rate": 7.099990628807047e-05, + "loss": 0.0888, + "step": 64230 + }, + { + "epoch": 18.07, + "learning_rate": 7.098116390216475e-05, + "loss": 0.0688, + "step": 64260 + }, + { + "epoch": 18.07, + "learning_rate": 7.096242151625902e-05, + "loss": 0.0824, + "step": 64290 + }, + { + "epoch": 18.08, + "learning_rate": 7.09436791303533e-05, + "loss": 0.0756, + "step": 64320 + }, + { + "epoch": 18.09, + "learning_rate": 7.092493674444757e-05, + "loss": 0.0737, + "step": 64350 + }, + { + "epoch": 18.1, + "learning_rate": 7.090619435854185e-05, + "loss": 0.0816, + "step": 64380 + }, + { + "epoch": 18.11, + "learning_rate": 7.088745197263612e-05, + "loss": 0.07, + "step": 64410 + }, + { + "epoch": 18.12, + "learning_rate": 7.08687095867304e-05, + "loss": 0.0768, + "step": 64440 + }, + { + "epoch": 18.12, + "learning_rate": 7.084996720082467e-05, + "loss": 0.074, + "step": 64470 + }, + { + "epoch": 18.13, + "learning_rate": 7.083122481491895e-05, + "loss": 0.0739, + "step": 64500 + }, + { + "epoch": 18.14, + "learning_rate": 7.081248242901321e-05, + "loss": 0.0799, + "step": 64530 + }, + { + "epoch": 18.15, + "learning_rate": 7.07937400431075e-05, + "loss": 0.069, + "step": 64560 + }, + { + "epoch": 18.16, + "learning_rate": 7.077499765720178e-05, + "loss": 0.0774, + "step": 64590 + }, + { + "epoch": 18.17, + "learning_rate": 7.075625527129603e-05, + "loss": 0.0779, + "step": 64620 + }, + { + "epoch": 18.18, + "learning_rate": 7.073751288539031e-05, + "loss": 0.0785, + "step": 64650 + }, + { + "epoch": 18.18, + "learning_rate": 7.071877049948459e-05, + "loss": 0.0852, + "step": 64680 + }, + { + "epoch": 18.19, + "learning_rate": 7.070002811357886e-05, + "loss": 0.0702, + "step": 64710 + }, + { + "epoch": 18.2, + "learning_rate": 7.068128572767314e-05, + "loss": 0.0814, + "step": 64740 + }, + { + "epoch": 18.21, + "learning_rate": 7.066254334176741e-05, + "loss": 0.0741, + "step": 64770 + }, + { + "epoch": 18.22, + "learning_rate": 7.064380095586169e-05, + "loss": 0.0806, + "step": 64800 + }, + { + "epoch": 18.23, + "learning_rate": 7.062505856995596e-05, + "loss": 0.0827, + "step": 64830 + }, + { + "epoch": 18.23, + "learning_rate": 7.060631618405024e-05, + "loss": 0.0712, + "step": 64860 + }, + { + "epoch": 18.24, + "learning_rate": 7.05875737981445e-05, + "loss": 0.0786, + "step": 64890 + }, + { + "epoch": 18.25, + "learning_rate": 7.056883141223878e-05, + "loss": 0.0775, + "step": 64920 + }, + { + "epoch": 18.26, + "learning_rate": 7.055008902633305e-05, + "loss": 0.0702, + "step": 64950 + }, + { + "epoch": 18.27, + "learning_rate": 7.053134664042733e-05, + "loss": 0.0864, + "step": 64980 + }, + { + "epoch": 18.28, + "learning_rate": 7.051322900071846e-05, + "loss": 0.0695, + "step": 65010 + }, + { + "epoch": 18.29, + "learning_rate": 7.049448661481274e-05, + "loss": 0.0781, + "step": 65040 + }, + { + "epoch": 18.29, + "learning_rate": 7.047574422890701e-05, + "loss": 0.0763, + "step": 65070 + }, + { + "epoch": 18.3, + "learning_rate": 7.045700184300128e-05, + "loss": 0.0721, + "step": 65100 + }, + { + "epoch": 18.31, + "learning_rate": 7.043825945709556e-05, + "loss": 0.0787, + "step": 65130 + }, + { + "epoch": 18.32, + "learning_rate": 7.041951707118984e-05, + "loss": 0.0721, + "step": 65160 + }, + { + "epoch": 18.33, + "learning_rate": 7.04007746852841e-05, + "loss": 0.0787, + "step": 65190 + }, + { + "epoch": 18.34, + "learning_rate": 7.038203229937837e-05, + "loss": 0.0802, + "step": 65220 + }, + { + "epoch": 18.34, + "learning_rate": 7.036328991347265e-05, + "loss": 0.0771, + "step": 65250 + }, + { + "epoch": 18.35, + "learning_rate": 7.034454752756694e-05, + "loss": 0.0839, + "step": 65280 + }, + { + "epoch": 18.36, + "learning_rate": 7.03258051416612e-05, + "loss": 0.0652, + "step": 65310 + }, + { + "epoch": 18.37, + "learning_rate": 7.030706275575548e-05, + "loss": 0.0793, + "step": 65340 + }, + { + "epoch": 18.38, + "learning_rate": 7.028832036984975e-05, + "loss": 0.0745, + "step": 65370 + }, + { + "epoch": 18.39, + "learning_rate": 7.026957798394402e-05, + "loss": 0.073, + "step": 65400 + }, + { + "epoch": 18.39, + "learning_rate": 7.02508355980383e-05, + "loss": 0.0829, + "step": 65430 + }, + { + "epoch": 18.4, + "learning_rate": 7.023209321213258e-05, + "loss": 0.071, + "step": 65460 + }, + { + "epoch": 18.41, + "learning_rate": 7.021335082622685e-05, + "loss": 0.0768, + "step": 65490 + }, + { + "epoch": 18.42, + "learning_rate": 7.019460844032111e-05, + "loss": 0.0708, + "step": 65520 + }, + { + "epoch": 18.43, + "learning_rate": 7.01758660544154e-05, + "loss": 0.0787, + "step": 65550 + }, + { + "epoch": 18.44, + "learning_rate": 7.015712366850968e-05, + "loss": 0.0843, + "step": 65580 + }, + { + "epoch": 18.45, + "learning_rate": 7.013838128260394e-05, + "loss": 0.0689, + "step": 65610 + }, + { + "epoch": 18.45, + "learning_rate": 7.011963889669821e-05, + "loss": 0.0751, + "step": 65640 + }, + { + "epoch": 18.46, + "learning_rate": 7.010089651079249e-05, + "loss": 0.071, + "step": 65670 + }, + { + "epoch": 18.47, + "learning_rate": 7.008215412488677e-05, + "loss": 0.0748, + "step": 65700 + }, + { + "epoch": 18.48, + "learning_rate": 7.006341173898104e-05, + "loss": 0.0827, + "step": 65730 + }, + { + "epoch": 18.49, + "learning_rate": 7.004466935307532e-05, + "loss": 0.07, + "step": 65760 + }, + { + "epoch": 18.5, + "learning_rate": 7.002592696716959e-05, + "loss": 0.0818, + "step": 65790 + }, + { + "epoch": 18.5, + "learning_rate": 7.000718458126386e-05, + "loss": 0.0764, + "step": 65820 + }, + { + "epoch": 18.51, + "learning_rate": 6.998844219535814e-05, + "loss": 0.0714, + "step": 65850 + }, + { + "epoch": 18.52, + "learning_rate": 6.996969980945242e-05, + "loss": 0.0827, + "step": 65880 + }, + { + "epoch": 18.53, + "learning_rate": 6.995095742354669e-05, + "loss": 0.0721, + "step": 65910 + }, + { + "epoch": 18.54, + "learning_rate": 6.993221503764095e-05, + "loss": 0.0817, + "step": 65940 + }, + { + "epoch": 18.55, + "learning_rate": 6.991347265173523e-05, + "loss": 0.0746, + "step": 65970 + }, + { + "epoch": 18.55, + "learning_rate": 6.989473026582952e-05, + "loss": 0.0753, + "step": 66000 + }, + { + "epoch": 18.56, + "learning_rate": 6.987598787992378e-05, + "loss": 0.0887, + "step": 66030 + }, + { + "epoch": 18.57, + "learning_rate": 6.985724549401805e-05, + "loss": 0.0671, + "step": 66060 + }, + { + "epoch": 18.58, + "learning_rate": 6.983850310811233e-05, + "loss": 0.0833, + "step": 66090 + }, + { + "epoch": 18.59, + "learning_rate": 6.981976072220661e-05, + "loss": 0.0769, + "step": 66120 + }, + { + "epoch": 18.6, + "learning_rate": 6.980101833630088e-05, + "loss": 0.0754, + "step": 66150 + }, + { + "epoch": 18.61, + "learning_rate": 6.978227595039516e-05, + "loss": 0.0855, + "step": 66180 + }, + { + "epoch": 18.61, + "learning_rate": 6.976353356448943e-05, + "loss": 0.0675, + "step": 66210 + }, + { + "epoch": 18.62, + "learning_rate": 6.97447911785837e-05, + "loss": 0.0819, + "step": 66240 + }, + { + "epoch": 18.63, + "learning_rate": 6.972604879267798e-05, + "loss": 0.0741, + "step": 66270 + }, + { + "epoch": 18.64, + "learning_rate": 6.970730640677226e-05, + "loss": 0.075, + "step": 66300 + }, + { + "epoch": 18.65, + "learning_rate": 6.968856402086652e-05, + "loss": 0.0836, + "step": 66330 + }, + { + "epoch": 18.66, + "learning_rate": 6.966982163496079e-05, + "loss": 0.0685, + "step": 66360 + }, + { + "epoch": 18.66, + "learning_rate": 6.965107924905507e-05, + "loss": 0.0776, + "step": 66390 + }, + { + "epoch": 18.67, + "learning_rate": 6.963233686314935e-05, + "loss": 0.0784, + "step": 66420 + }, + { + "epoch": 18.68, + "learning_rate": 6.961359447724362e-05, + "loss": 0.076, + "step": 66450 + }, + { + "epoch": 18.69, + "learning_rate": 6.959485209133789e-05, + "loss": 0.0871, + "step": 66480 + }, + { + "epoch": 18.7, + "learning_rate": 6.957610970543217e-05, + "loss": 0.0686, + "step": 66510 + }, + { + "epoch": 18.71, + "learning_rate": 6.955736731952645e-05, + "loss": 0.0764, + "step": 66540 + }, + { + "epoch": 18.72, + "learning_rate": 6.953862493362072e-05, + "loss": 0.0749, + "step": 66570 + }, + { + "epoch": 18.72, + "learning_rate": 6.9519882547715e-05, + "loss": 0.0771, + "step": 66600 + }, + { + "epoch": 18.73, + "learning_rate": 6.950114016180927e-05, + "loss": 0.0862, + "step": 66630 + }, + { + "epoch": 18.74, + "learning_rate": 6.948239777590353e-05, + "loss": 0.0667, + "step": 66660 + }, + { + "epoch": 18.75, + "learning_rate": 6.946365538999782e-05, + "loss": 0.0809, + "step": 66690 + }, + { + "epoch": 18.76, + "learning_rate": 6.94449130040921e-05, + "loss": 0.0769, + "step": 66720 + }, + { + "epoch": 18.77, + "learning_rate": 6.942617061818636e-05, + "loss": 0.0756, + "step": 66750 + }, + { + "epoch": 18.77, + "learning_rate": 6.940742823228063e-05, + "loss": 0.0835, + "step": 66780 + }, + { + "epoch": 18.78, + "learning_rate": 6.938868584637491e-05, + "loss": 0.072, + "step": 66810 + }, + { + "epoch": 18.79, + "learning_rate": 6.936994346046919e-05, + "loss": 0.0859, + "step": 66840 + }, + { + "epoch": 18.8, + "learning_rate": 6.935120107456346e-05, + "loss": 0.0747, + "step": 66870 + }, + { + "epoch": 18.81, + "learning_rate": 6.933245868865773e-05, + "loss": 0.0723, + "step": 66900 + }, + { + "epoch": 18.82, + "learning_rate": 6.931371630275201e-05, + "loss": 0.079, + "step": 66930 + }, + { + "epoch": 18.82, + "learning_rate": 6.929497391684629e-05, + "loss": 0.0697, + "step": 66960 + }, + { + "epoch": 18.83, + "learning_rate": 6.927623153094056e-05, + "loss": 0.0786, + "step": 66990 + }, + { + "epoch": 18.84, + "learning_rate": 6.925748914503484e-05, + "loss": 0.0785, + "step": 67020 + }, + { + "epoch": 18.85, + "learning_rate": 6.92387467591291e-05, + "loss": 0.0776, + "step": 67050 + }, + { + "epoch": 18.86, + "learning_rate": 6.922000437322337e-05, + "loss": 0.0874, + "step": 67080 + }, + { + "epoch": 18.87, + "learning_rate": 6.920126198731765e-05, + "loss": 0.0705, + "step": 67110 + }, + { + "epoch": 18.88, + "learning_rate": 6.918251960141193e-05, + "loss": 0.0799, + "step": 67140 + }, + { + "epoch": 18.88, + "learning_rate": 6.916377721550622e-05, + "loss": 0.0753, + "step": 67170 + }, + { + "epoch": 18.89, + "learning_rate": 6.914503482960047e-05, + "loss": 0.0758, + "step": 67200 + }, + { + "epoch": 18.9, + "learning_rate": 6.912629244369475e-05, + "loss": 0.0837, + "step": 67230 + }, + { + "epoch": 18.91, + "learning_rate": 6.910755005778903e-05, + "loss": 0.0687, + "step": 67260 + }, + { + "epoch": 18.92, + "learning_rate": 6.90888076718833e-05, + "loss": 0.0788, + "step": 67290 + }, + { + "epoch": 18.93, + "learning_rate": 6.907006528597757e-05, + "loss": 0.0696, + "step": 67320 + }, + { + "epoch": 18.93, + "learning_rate": 6.905132290007185e-05, + "loss": 0.074, + "step": 67350 + }, + { + "epoch": 18.94, + "learning_rate": 6.903258051416613e-05, + "loss": 0.078, + "step": 67380 + }, + { + "epoch": 18.95, + "learning_rate": 6.90138381282604e-05, + "loss": 0.0681, + "step": 67410 + }, + { + "epoch": 18.96, + "learning_rate": 6.899509574235468e-05, + "loss": 0.0798, + "step": 67440 + }, + { + "epoch": 18.97, + "learning_rate": 6.897635335644894e-05, + "loss": 0.0725, + "step": 67470 + }, + { + "epoch": 18.98, + "learning_rate": 6.895823571674009e-05, + "loss": 0.0733, + "step": 67500 + }, + { + "epoch": 18.98, + "learning_rate": 6.893949333083435e-05, + "loss": 0.0848, + "step": 67530 + }, + { + "epoch": 18.99, + "learning_rate": 6.892075094492862e-05, + "loss": 0.071, + "step": 67560 + }, + { + "epoch": 19.0, + "eval_loss": 0.11411216855049133, + "eval_runtime": 631.0775, + "eval_samples_per_second": 25.406, + "eval_steps_per_second": 0.795, + "eval_wer": 0.10739290052270277, + "step": 67583 + }, + { + "epoch": 19.0, + "learning_rate": 6.89020085590229e-05, + "loss": 0.0792, + "step": 67590 + }, + { + "epoch": 19.01, + "learning_rate": 6.888326617311718e-05, + "loss": 0.0661, + "step": 67620 + }, + { + "epoch": 19.02, + "learning_rate": 6.886452378721145e-05, + "loss": 0.0769, + "step": 67650 + }, + { + "epoch": 19.03, + "learning_rate": 6.884578140130572e-05, + "loss": 0.0759, + "step": 67680 + }, + { + "epoch": 19.04, + "learning_rate": 6.88270390154e-05, + "loss": 0.069, + "step": 67710 + }, + { + "epoch": 19.04, + "learning_rate": 6.880829662949428e-05, + "loss": 0.0822, + "step": 67740 + }, + { + "epoch": 19.05, + "learning_rate": 6.878955424358855e-05, + "loss": 0.0713, + "step": 67770 + }, + { + "epoch": 19.06, + "learning_rate": 6.877081185768281e-05, + "loss": 0.0794, + "step": 67800 + }, + { + "epoch": 19.07, + "learning_rate": 6.87520694717771e-05, + "loss": 0.0757, + "step": 67830 + }, + { + "epoch": 19.08, + "learning_rate": 6.873332708587136e-05, + "loss": 0.0695, + "step": 67860 + }, + { + "epoch": 19.09, + "learning_rate": 6.871458469996564e-05, + "loss": 0.077, + "step": 67890 + }, + { + "epoch": 19.09, + "learning_rate": 6.869584231405992e-05, + "loss": 0.072, + "step": 67920 + }, + { + "epoch": 19.1, + "learning_rate": 6.867709992815419e-05, + "loss": 0.0781, + "step": 67950 + }, + { + "epoch": 19.11, + "learning_rate": 6.865835754224846e-05, + "loss": 0.075, + "step": 67980 + }, + { + "epoch": 19.12, + "learning_rate": 6.863961515634274e-05, + "loss": 0.0725, + "step": 68010 + }, + { + "epoch": 19.13, + "learning_rate": 6.862087277043702e-05, + "loss": 0.0776, + "step": 68040 + }, + { + "epoch": 19.14, + "learning_rate": 6.860213038453129e-05, + "loss": 0.069, + "step": 68070 + }, + { + "epoch": 19.15, + "learning_rate": 6.858338799862556e-05, + "loss": 0.0821, + "step": 68100 + }, + { + "epoch": 19.15, + "learning_rate": 6.856464561271984e-05, + "loss": 0.0748, + "step": 68130 + }, + { + "epoch": 19.16, + "learning_rate": 6.854590322681412e-05, + "loss": 0.0672, + "step": 68160 + }, + { + "epoch": 19.17, + "learning_rate": 6.852716084090838e-05, + "loss": 0.0828, + "step": 68190 + }, + { + "epoch": 19.18, + "learning_rate": 6.850841845500265e-05, + "loss": 0.0701, + "step": 68220 + }, + { + "epoch": 19.19, + "learning_rate": 6.848967606909693e-05, + "loss": 0.0745, + "step": 68250 + }, + { + "epoch": 19.2, + "learning_rate": 6.847093368319121e-05, + "loss": 0.0738, + "step": 68280 + }, + { + "epoch": 19.2, + "learning_rate": 6.845219129728548e-05, + "loss": 0.0706, + "step": 68310 + }, + { + "epoch": 19.21, + "learning_rate": 6.843344891137976e-05, + "loss": 0.0788, + "step": 68340 + }, + { + "epoch": 19.22, + "learning_rate": 6.841470652547403e-05, + "loss": 0.0682, + "step": 68370 + }, + { + "epoch": 19.23, + "learning_rate": 6.83959641395683e-05, + "loss": 0.077, + "step": 68400 + }, + { + "epoch": 19.24, + "learning_rate": 6.837722175366258e-05, + "loss": 0.0796, + "step": 68430 + }, + { + "epoch": 19.25, + "learning_rate": 6.835847936775686e-05, + "loss": 0.071, + "step": 68460 + }, + { + "epoch": 19.25, + "learning_rate": 6.833973698185113e-05, + "loss": 0.0796, + "step": 68490 + }, + { + "epoch": 19.26, + "learning_rate": 6.83209945959454e-05, + "loss": 0.0697, + "step": 68520 + }, + { + "epoch": 19.27, + "learning_rate": 6.830225221003968e-05, + "loss": 0.0737, + "step": 68550 + }, + { + "epoch": 19.28, + "learning_rate": 6.828350982413396e-05, + "loss": 0.0736, + "step": 68580 + }, + { + "epoch": 19.29, + "learning_rate": 6.826476743822822e-05, + "loss": 0.0753, + "step": 68610 + }, + { + "epoch": 19.3, + "learning_rate": 6.824602505232249e-05, + "loss": 0.0804, + "step": 68640 + }, + { + "epoch": 19.31, + "learning_rate": 6.822728266641677e-05, + "loss": 0.0669, + "step": 68670 + }, + { + "epoch": 19.31, + "learning_rate": 6.820854028051105e-05, + "loss": 0.0748, + "step": 68700 + }, + { + "epoch": 19.32, + "learning_rate": 6.818979789460532e-05, + "loss": 0.0714, + "step": 68730 + }, + { + "epoch": 19.33, + "learning_rate": 6.81710555086996e-05, + "loss": 0.0694, + "step": 68760 + }, + { + "epoch": 19.34, + "learning_rate": 6.815231312279387e-05, + "loss": 0.0826, + "step": 68790 + }, + { + "epoch": 19.35, + "learning_rate": 6.813357073688814e-05, + "loss": 0.0699, + "step": 68820 + }, + { + "epoch": 19.36, + "learning_rate": 6.811482835098242e-05, + "loss": 0.0767, + "step": 68850 + }, + { + "epoch": 19.36, + "learning_rate": 6.80960859650767e-05, + "loss": 0.0759, + "step": 68880 + }, + { + "epoch": 19.37, + "learning_rate": 6.807734357917097e-05, + "loss": 0.0722, + "step": 68910 + }, + { + "epoch": 19.38, + "learning_rate": 6.805860119326523e-05, + "loss": 0.0778, + "step": 68940 + }, + { + "epoch": 19.39, + "learning_rate": 6.803985880735951e-05, + "loss": 0.0665, + "step": 68970 + }, + { + "epoch": 19.4, + "learning_rate": 6.80211164214538e-05, + "loss": 0.0742, + "step": 69000 + }, + { + "epoch": 19.41, + "learning_rate": 6.800237403554806e-05, + "loss": 0.076, + "step": 69030 + }, + { + "epoch": 19.42, + "learning_rate": 6.798363164964233e-05, + "loss": 0.0732, + "step": 69060 + }, + { + "epoch": 19.42, + "learning_rate": 6.796488926373661e-05, + "loss": 0.0808, + "step": 69090 + }, + { + "epoch": 19.43, + "learning_rate": 6.794614687783089e-05, + "loss": 0.0655, + "step": 69120 + }, + { + "epoch": 19.44, + "learning_rate": 6.792740449192516e-05, + "loss": 0.0749, + "step": 69150 + }, + { + "epoch": 19.45, + "learning_rate": 6.790866210601944e-05, + "loss": 0.0761, + "step": 69180 + }, + { + "epoch": 19.46, + "learning_rate": 6.788991972011371e-05, + "loss": 0.0735, + "step": 69210 + }, + { + "epoch": 19.47, + "learning_rate": 6.787117733420797e-05, + "loss": 0.0796, + "step": 69240 + }, + { + "epoch": 19.47, + "learning_rate": 6.785243494830226e-05, + "loss": 0.0688, + "step": 69270 + }, + { + "epoch": 19.48, + "learning_rate": 6.783369256239654e-05, + "loss": 0.071, + "step": 69300 + }, + { + "epoch": 19.49, + "learning_rate": 6.78149501764908e-05, + "loss": 0.0748, + "step": 69330 + }, + { + "epoch": 19.5, + "learning_rate": 6.779620779058507e-05, + "loss": 0.0683, + "step": 69360 + }, + { + "epoch": 19.51, + "learning_rate": 6.777746540467935e-05, + "loss": 0.0797, + "step": 69390 + }, + { + "epoch": 19.52, + "learning_rate": 6.775872301877363e-05, + "loss": 0.0685, + "step": 69420 + }, + { + "epoch": 19.52, + "learning_rate": 6.77399806328679e-05, + "loss": 0.0806, + "step": 69450 + }, + { + "epoch": 19.53, + "learning_rate": 6.772123824696217e-05, + "loss": 0.0753, + "step": 69480 + }, + { + "epoch": 19.54, + "learning_rate": 6.770249586105645e-05, + "loss": 0.0716, + "step": 69510 + }, + { + "epoch": 19.55, + "learning_rate": 6.768375347515073e-05, + "loss": 0.0764, + "step": 69540 + }, + { + "epoch": 19.56, + "learning_rate": 6.7665011089245e-05, + "loss": 0.0662, + "step": 69570 + }, + { + "epoch": 19.57, + "learning_rate": 6.764626870333926e-05, + "loss": 0.0742, + "step": 69600 + }, + { + "epoch": 19.58, + "learning_rate": 6.762752631743355e-05, + "loss": 0.0755, + "step": 69630 + }, + { + "epoch": 19.58, + "learning_rate": 6.760878393152781e-05, + "loss": 0.0695, + "step": 69660 + }, + { + "epoch": 19.59, + "learning_rate": 6.75900415456221e-05, + "loss": 0.0789, + "step": 69690 + }, + { + "epoch": 19.6, + "learning_rate": 6.757129915971638e-05, + "loss": 0.0675, + "step": 69720 + }, + { + "epoch": 19.61, + "learning_rate": 6.755255677381064e-05, + "loss": 0.0775, + "step": 69750 + }, + { + "epoch": 19.62, + "learning_rate": 6.753381438790491e-05, + "loss": 0.0748, + "step": 69780 + }, + { + "epoch": 19.63, + "learning_rate": 6.751507200199919e-05, + "loss": 0.0748, + "step": 69810 + }, + { + "epoch": 19.63, + "learning_rate": 6.749632961609347e-05, + "loss": 0.0823, + "step": 69840 + }, + { + "epoch": 19.64, + "learning_rate": 6.747758723018774e-05, + "loss": 0.067, + "step": 69870 + }, + { + "epoch": 19.65, + "learning_rate": 6.745884484428201e-05, + "loss": 0.0791, + "step": 69900 + }, + { + "epoch": 19.66, + "learning_rate": 6.744010245837629e-05, + "loss": 0.0775, + "step": 69930 + }, + { + "epoch": 19.67, + "learning_rate": 6.742136007247057e-05, + "loss": 0.0684, + "step": 69960 + }, + { + "epoch": 19.68, + "learning_rate": 6.740261768656484e-05, + "loss": 0.082, + "step": 69990 + }, + { + "epoch": 19.69, + "learning_rate": 6.73838753006591e-05, + "loss": 0.068, + "step": 70020 + }, + { + "epoch": 19.69, + "learning_rate": 6.736513291475338e-05, + "loss": 0.076, + "step": 70050 + }, + { + "epoch": 19.7, + "learning_rate": 6.734639052884765e-05, + "loss": 0.0774, + "step": 70080 + }, + { + "epoch": 19.71, + "learning_rate": 6.732764814294193e-05, + "loss": 0.0734, + "step": 70110 + }, + { + "epoch": 19.72, + "learning_rate": 6.730890575703621e-05, + "loss": 0.0791, + "step": 70140 + }, + { + "epoch": 19.73, + "learning_rate": 6.729016337113048e-05, + "loss": 0.0675, + "step": 70170 + }, + { + "epoch": 19.74, + "learning_rate": 6.727142098522475e-05, + "loss": 0.0778, + "step": 70200 + }, + { + "epoch": 19.74, + "learning_rate": 6.725267859931903e-05, + "loss": 0.0786, + "step": 70230 + }, + { + "epoch": 19.75, + "learning_rate": 6.723393621341331e-05, + "loss": 0.0687, + "step": 70260 + }, + { + "epoch": 19.76, + "learning_rate": 6.721519382750758e-05, + "loss": 0.0832, + "step": 70290 + }, + { + "epoch": 19.77, + "learning_rate": 6.719645144160185e-05, + "loss": 0.0673, + "step": 70320 + }, + { + "epoch": 19.78, + "learning_rate": 6.717770905569613e-05, + "loss": 0.0807, + "step": 70350 + }, + { + "epoch": 19.79, + "learning_rate": 6.715896666979041e-05, + "loss": 0.0735, + "step": 70380 + }, + { + "epoch": 19.79, + "learning_rate": 6.714022428388467e-05, + "loss": 0.0684, + "step": 70410 + }, + { + "epoch": 19.8, + "learning_rate": 6.712148189797894e-05, + "loss": 0.0847, + "step": 70440 + }, + { + "epoch": 19.81, + "learning_rate": 6.710273951207322e-05, + "loss": 0.0683, + "step": 70470 + }, + { + "epoch": 19.82, + "learning_rate": 6.708399712616749e-05, + "loss": 0.0744, + "step": 70500 + }, + { + "epoch": 19.83, + "learning_rate": 6.706525474026177e-05, + "loss": 0.0729, + "step": 70530 + }, + { + "epoch": 19.84, + "learning_rate": 6.704651235435605e-05, + "loss": 0.0745, + "step": 70560 + }, + { + "epoch": 19.85, + "learning_rate": 6.702776996845032e-05, + "loss": 0.0777, + "step": 70590 + }, + { + "epoch": 19.85, + "learning_rate": 6.700902758254459e-05, + "loss": 0.0661, + "step": 70620 + }, + { + "epoch": 19.86, + "learning_rate": 6.699028519663887e-05, + "loss": 0.0773, + "step": 70650 + }, + { + "epoch": 19.87, + "learning_rate": 6.697154281073315e-05, + "loss": 0.0748, + "step": 70680 + }, + { + "epoch": 19.88, + "learning_rate": 6.695280042482742e-05, + "loss": 0.0717, + "step": 70710 + }, + { + "epoch": 19.89, + "learning_rate": 6.693405803892168e-05, + "loss": 0.081, + "step": 70740 + }, + { + "epoch": 19.9, + "learning_rate": 6.691531565301597e-05, + "loss": 0.0682, + "step": 70770 + }, + { + "epoch": 19.9, + "learning_rate": 6.689657326711025e-05, + "loss": 0.0766, + "step": 70800 + }, + { + "epoch": 19.91, + "learning_rate": 6.687783088120451e-05, + "loss": 0.0731, + "step": 70830 + }, + { + "epoch": 19.92, + "learning_rate": 6.685908849529878e-05, + "loss": 0.07, + "step": 70860 + }, + { + "epoch": 19.93, + "learning_rate": 6.684034610939306e-05, + "loss": 0.0782, + "step": 70890 + }, + { + "epoch": 19.94, + "learning_rate": 6.682160372348733e-05, + "loss": 0.0678, + "step": 70920 + }, + { + "epoch": 19.95, + "learning_rate": 6.680286133758161e-05, + "loss": 0.0755, + "step": 70950 + }, + { + "epoch": 19.95, + "learning_rate": 6.678411895167589e-05, + "loss": 0.0763, + "step": 70980 + }, + { + "epoch": 19.96, + "learning_rate": 6.676537656577016e-05, + "loss": 0.0731, + "step": 71010 + }, + { + "epoch": 19.97, + "learning_rate": 6.674663417986443e-05, + "loss": 0.0806, + "step": 71040 + }, + { + "epoch": 19.98, + "learning_rate": 6.672789179395871e-05, + "loss": 0.0644, + "step": 71070 + }, + { + "epoch": 19.99, + "learning_rate": 6.670914940805299e-05, + "loss": 0.0751, + "step": 71100 + }, + { + "epoch": 20.0, + "learning_rate": 6.669103176834412e-05, + "loss": 0.0726, + "step": 71130 + }, + { + "epoch": 20.0, + "eval_loss": 0.10938318818807602, + "eval_runtime": 632.7086, + "eval_samples_per_second": 25.34, + "eval_steps_per_second": 0.793, + "eval_wer": 0.10929673959029929, + "step": 71140 + }, + { + "epoch": 20.01, + "learning_rate": 6.66722893824384e-05, + "loss": 0.0718, + "step": 71160 + }, + { + "epoch": 20.01, + "learning_rate": 6.665354699653265e-05, + "loss": 0.0843, + "step": 71190 + }, + { + "epoch": 20.02, + "learning_rate": 6.663480461062693e-05, + "loss": 0.0637, + "step": 71220 + }, + { + "epoch": 20.03, + "learning_rate": 6.661606222472121e-05, + "loss": 0.0759, + "step": 71250 + }, + { + "epoch": 20.04, + "learning_rate": 6.659731983881548e-05, + "loss": 0.068, + "step": 71280 + }, + { + "epoch": 20.05, + "learning_rate": 6.657857745290976e-05, + "loss": 0.0724, + "step": 71310 + }, + { + "epoch": 20.06, + "learning_rate": 6.655983506700403e-05, + "loss": 0.0815, + "step": 71340 + }, + { + "epoch": 20.06, + "learning_rate": 6.654109268109831e-05, + "loss": 0.0639, + "step": 71370 + }, + { + "epoch": 20.07, + "learning_rate": 6.652235029519258e-05, + "loss": 0.0768, + "step": 71400 + }, + { + "epoch": 20.08, + "learning_rate": 6.650360790928686e-05, + "loss": 0.0674, + "step": 71430 + }, + { + "epoch": 20.09, + "learning_rate": 6.648486552338114e-05, + "loss": 0.0714, + "step": 71460 + }, + { + "epoch": 20.1, + "learning_rate": 6.64661231374754e-05, + "loss": 0.0785, + "step": 71490 + }, + { + "epoch": 20.11, + "learning_rate": 6.644738075156967e-05, + "loss": 0.0628, + "step": 71520 + }, + { + "epoch": 20.12, + "learning_rate": 6.642863836566395e-05, + "loss": 0.0787, + "step": 71550 + }, + { + "epoch": 20.12, + "learning_rate": 6.640989597975824e-05, + "loss": 0.0656, + "step": 71580 + }, + { + "epoch": 20.13, + "learning_rate": 6.639115359385249e-05, + "loss": 0.0701, + "step": 71610 + }, + { + "epoch": 20.14, + "learning_rate": 6.637241120794677e-05, + "loss": 0.0743, + "step": 71640 + }, + { + "epoch": 20.15, + "learning_rate": 6.635366882204105e-05, + "loss": 0.0632, + "step": 71670 + }, + { + "epoch": 20.16, + "learning_rate": 6.633492643613533e-05, + "loss": 0.0758, + "step": 71700 + }, + { + "epoch": 20.17, + "learning_rate": 6.63161840502296e-05, + "loss": 0.0652, + "step": 71730 + }, + { + "epoch": 20.17, + "learning_rate": 6.629744166432387e-05, + "loss": 0.0769, + "step": 71760 + }, + { + "epoch": 20.18, + "learning_rate": 6.627869927841815e-05, + "loss": 0.0761, + "step": 71790 + }, + { + "epoch": 20.19, + "learning_rate": 6.625995689251242e-05, + "loss": 0.0657, + "step": 71820 + }, + { + "epoch": 20.2, + "learning_rate": 6.62412145066067e-05, + "loss": 0.0763, + "step": 71850 + }, + { + "epoch": 20.21, + "learning_rate": 6.622247212070098e-05, + "loss": 0.0649, + "step": 71880 + }, + { + "epoch": 20.22, + "learning_rate": 6.620372973479524e-05, + "loss": 0.0711, + "step": 71910 + }, + { + "epoch": 20.22, + "learning_rate": 6.618498734888951e-05, + "loss": 0.0837, + "step": 71940 + }, + { + "epoch": 20.23, + "learning_rate": 6.616624496298379e-05, + "loss": 0.0623, + "step": 71970 + }, + { + "epoch": 20.24, + "learning_rate": 6.614750257707807e-05, + "loss": 0.0737, + "step": 72000 + }, + { + "epoch": 20.25, + "learning_rate": 6.612876019117233e-05, + "loss": 0.0678, + "step": 72030 + }, + { + "epoch": 20.26, + "learning_rate": 6.611001780526661e-05, + "loss": 0.0704, + "step": 72060 + }, + { + "epoch": 20.27, + "learning_rate": 6.609127541936089e-05, + "loss": 0.0771, + "step": 72090 + }, + { + "epoch": 20.28, + "learning_rate": 6.607253303345517e-05, + "loss": 0.0639, + "step": 72120 + }, + { + "epoch": 20.28, + "learning_rate": 6.605379064754944e-05, + "loss": 0.0759, + "step": 72150 + }, + { + "epoch": 20.29, + "learning_rate": 6.60350482616437e-05, + "loss": 0.0701, + "step": 72180 + }, + { + "epoch": 20.3, + "learning_rate": 6.601630587573799e-05, + "loss": 0.07, + "step": 72210 + }, + { + "epoch": 20.31, + "learning_rate": 6.599756348983225e-05, + "loss": 0.0784, + "step": 72240 + }, + { + "epoch": 20.32, + "learning_rate": 6.597882110392653e-05, + "loss": 0.0676, + "step": 72270 + }, + { + "epoch": 20.33, + "learning_rate": 6.596007871802082e-05, + "loss": 0.0814, + "step": 72300 + }, + { + "epoch": 20.33, + "learning_rate": 6.594133633211508e-05, + "loss": 0.0678, + "step": 72330 + }, + { + "epoch": 20.34, + "learning_rate": 6.592259394620935e-05, + "loss": 0.0718, + "step": 72360 + }, + { + "epoch": 20.35, + "learning_rate": 6.590385156030363e-05, + "loss": 0.0836, + "step": 72390 + }, + { + "epoch": 20.36, + "learning_rate": 6.588510917439791e-05, + "loss": 0.0626, + "step": 72420 + }, + { + "epoch": 20.37, + "learning_rate": 6.586636678849218e-05, + "loss": 0.0782, + "step": 72450 + }, + { + "epoch": 20.38, + "learning_rate": 6.584762440258645e-05, + "loss": 0.0696, + "step": 72480 + }, + { + "epoch": 20.39, + "learning_rate": 6.582888201668073e-05, + "loss": 0.069, + "step": 72510 + }, + { + "epoch": 20.39, + "learning_rate": 6.581013963077501e-05, + "loss": 0.0799, + "step": 72540 + }, + { + "epoch": 20.4, + "learning_rate": 6.579139724486928e-05, + "loss": 0.0639, + "step": 72570 + }, + { + "epoch": 20.41, + "learning_rate": 6.577265485896354e-05, + "loss": 0.0775, + "step": 72600 + }, + { + "epoch": 20.42, + "learning_rate": 6.575391247305782e-05, + "loss": 0.0689, + "step": 72630 + }, + { + "epoch": 20.43, + "learning_rate": 6.573517008715209e-05, + "loss": 0.0757, + "step": 72660 + }, + { + "epoch": 20.44, + "learning_rate": 6.571642770124637e-05, + "loss": 0.0819, + "step": 72690 + }, + { + "epoch": 20.44, + "learning_rate": 6.569768531534065e-05, + "loss": 0.0691, + "step": 72720 + }, + { + "epoch": 20.45, + "learning_rate": 6.567894292943492e-05, + "loss": 0.08, + "step": 72750 + }, + { + "epoch": 20.46, + "learning_rate": 6.566020054352919e-05, + "loss": 0.0654, + "step": 72780 + }, + { + "epoch": 20.47, + "learning_rate": 6.564145815762347e-05, + "loss": 0.0697, + "step": 72810 + }, + { + "epoch": 20.48, + "learning_rate": 6.562271577171775e-05, + "loss": 0.0783, + "step": 72840 + }, + { + "epoch": 20.49, + "learning_rate": 6.560397338581202e-05, + "loss": 0.0692, + "step": 72870 + }, + { + "epoch": 20.49, + "learning_rate": 6.558523099990629e-05, + "loss": 0.0761, + "step": 72900 + }, + { + "epoch": 20.5, + "learning_rate": 6.556648861400057e-05, + "loss": 0.0662, + "step": 72930 + }, + { + "epoch": 20.51, + "learning_rate": 6.554774622809485e-05, + "loss": 0.0752, + "step": 72960 + }, + { + "epoch": 20.52, + "learning_rate": 6.552900384218912e-05, + "loss": 0.0795, + "step": 72990 + }, + { + "epoch": 20.53, + "learning_rate": 6.551026145628338e-05, + "loss": 0.0593, + "step": 73020 + }, + { + "epoch": 20.54, + "learning_rate": 6.549151907037766e-05, + "loss": 0.0788, + "step": 73050 + }, + { + "epoch": 20.55, + "learning_rate": 6.547277668447193e-05, + "loss": 0.0711, + "step": 73080 + }, + { + "epoch": 20.55, + "learning_rate": 6.545403429856621e-05, + "loss": 0.072, + "step": 73110 + }, + { + "epoch": 20.56, + "learning_rate": 6.543529191266049e-05, + "loss": 0.0816, + "step": 73140 + }, + { + "epoch": 20.57, + "learning_rate": 6.541654952675476e-05, + "loss": 0.0643, + "step": 73170 + }, + { + "epoch": 20.58, + "learning_rate": 6.539780714084903e-05, + "loss": 0.0759, + "step": 73200 + }, + { + "epoch": 20.59, + "learning_rate": 6.537906475494331e-05, + "loss": 0.07, + "step": 73230 + }, + { + "epoch": 20.6, + "learning_rate": 6.536094711523444e-05, + "loss": 0.0754, + "step": 73260 + }, + { + "epoch": 20.6, + "learning_rate": 6.534220472932872e-05, + "loss": 0.0787, + "step": 73290 + }, + { + "epoch": 20.61, + "learning_rate": 6.5323462343423e-05, + "loss": 0.0665, + "step": 73320 + }, + { + "epoch": 20.62, + "learning_rate": 6.530471995751725e-05, + "loss": 0.0778, + "step": 73350 + }, + { + "epoch": 20.63, + "learning_rate": 6.528597757161153e-05, + "loss": 0.0681, + "step": 73380 + }, + { + "epoch": 20.64, + "learning_rate": 6.526723518570581e-05, + "loss": 0.0757, + "step": 73410 + }, + { + "epoch": 20.65, + "learning_rate": 6.524849279980008e-05, + "loss": 0.0797, + "step": 73440 + }, + { + "epoch": 20.65, + "learning_rate": 6.522975041389436e-05, + "loss": 0.0645, + "step": 73470 + }, + { + "epoch": 20.66, + "learning_rate": 6.521100802798863e-05, + "loss": 0.0796, + "step": 73500 + }, + { + "epoch": 20.67, + "learning_rate": 6.519226564208291e-05, + "loss": 0.0662, + "step": 73530 + }, + { + "epoch": 20.68, + "learning_rate": 6.517352325617718e-05, + "loss": 0.0715, + "step": 73560 + }, + { + "epoch": 20.69, + "learning_rate": 6.515478087027146e-05, + "loss": 0.0764, + "step": 73590 + }, + { + "epoch": 20.7, + "learning_rate": 6.513603848436573e-05, + "loss": 0.0633, + "step": 73620 + }, + { + "epoch": 20.71, + "learning_rate": 6.511729609846001e-05, + "loss": 0.0814, + "step": 73650 + }, + { + "epoch": 20.71, + "learning_rate": 6.509855371255427e-05, + "loss": 0.0667, + "step": 73680 + }, + { + "epoch": 20.72, + "learning_rate": 6.507981132664856e-05, + "loss": 0.0737, + "step": 73710 + }, + { + "epoch": 20.73, + "learning_rate": 6.506106894074284e-05, + "loss": 0.0809, + "step": 73740 + }, + { + "epoch": 20.74, + "learning_rate": 6.504232655483709e-05, + "loss": 0.0629, + "step": 73770 + }, + { + "epoch": 20.75, + "learning_rate": 6.502358416893137e-05, + "loss": 0.0815, + "step": 73800 + }, + { + "epoch": 20.76, + "learning_rate": 6.500484178302565e-05, + "loss": 0.0656, + "step": 73830 + }, + { + "epoch": 20.76, + "learning_rate": 6.498609939711992e-05, + "loss": 0.0706, + "step": 73860 + }, + { + "epoch": 20.77, + "learning_rate": 6.49673570112142e-05, + "loss": 0.077, + "step": 73890 + }, + { + "epoch": 20.78, + "learning_rate": 6.494861462530847e-05, + "loss": 0.0618, + "step": 73920 + }, + { + "epoch": 20.79, + "learning_rate": 6.492987223940275e-05, + "loss": 0.0761, + "step": 73950 + }, + { + "epoch": 20.8, + "learning_rate": 6.491112985349702e-05, + "loss": 0.0671, + "step": 73980 + }, + { + "epoch": 20.81, + "learning_rate": 6.48923874675913e-05, + "loss": 0.0702, + "step": 74010 + }, + { + "epoch": 20.82, + "learning_rate": 6.487364508168557e-05, + "loss": 0.0794, + "step": 74040 + }, + { + "epoch": 20.82, + "learning_rate": 6.485490269577985e-05, + "loss": 0.0656, + "step": 74070 + }, + { + "epoch": 20.83, + "learning_rate": 6.483616030987411e-05, + "loss": 0.0802, + "step": 74100 + }, + { + "epoch": 20.84, + "learning_rate": 6.48174179239684e-05, + "loss": 0.067, + "step": 74130 + }, + { + "epoch": 20.85, + "learning_rate": 6.479867553806268e-05, + "loss": 0.0695, + "step": 74160 + }, + { + "epoch": 20.86, + "learning_rate": 6.477993315215693e-05, + "loss": 0.0764, + "step": 74190 + }, + { + "epoch": 20.87, + "learning_rate": 6.476119076625121e-05, + "loss": 0.0639, + "step": 74220 + }, + { + "epoch": 20.87, + "learning_rate": 6.474244838034549e-05, + "loss": 0.0817, + "step": 74250 + }, + { + "epoch": 20.88, + "learning_rate": 6.472370599443976e-05, + "loss": 0.0686, + "step": 74280 + }, + { + "epoch": 20.89, + "learning_rate": 6.470496360853404e-05, + "loss": 0.0747, + "step": 74310 + }, + { + "epoch": 20.9, + "learning_rate": 6.468622122262831e-05, + "loss": 0.0826, + "step": 74340 + }, + { + "epoch": 20.91, + "learning_rate": 6.466747883672259e-05, + "loss": 0.0697, + "step": 74370 + }, + { + "epoch": 20.92, + "learning_rate": 6.464873645081686e-05, + "loss": 0.08, + "step": 74400 + }, + { + "epoch": 20.92, + "learning_rate": 6.462999406491114e-05, + "loss": 0.0681, + "step": 74430 + }, + { + "epoch": 20.93, + "learning_rate": 6.46112516790054e-05, + "loss": 0.0737, + "step": 74460 + }, + { + "epoch": 20.94, + "learning_rate": 6.459250929309968e-05, + "loss": 0.0777, + "step": 74490 + }, + { + "epoch": 20.95, + "learning_rate": 6.457376690719395e-05, + "loss": 0.0633, + "step": 74520 + }, + { + "epoch": 20.96, + "learning_rate": 6.455502452128823e-05, + "loss": 0.0784, + "step": 74550 + }, + { + "epoch": 20.97, + "learning_rate": 6.453628213538251e-05, + "loss": 0.0677, + "step": 74580 + }, + { + "epoch": 20.98, + "learning_rate": 6.451753974947677e-05, + "loss": 0.0742, + "step": 74610 + }, + { + "epoch": 20.98, + "learning_rate": 6.449879736357105e-05, + "loss": 0.0751, + "step": 74640 + }, + { + "epoch": 20.99, + "learning_rate": 6.448005497766533e-05, + "loss": 0.0647, + "step": 74670 + }, + { + "epoch": 21.0, + "eval_loss": 0.10879692435264587, + "eval_runtime": 632.1305, + "eval_samples_per_second": 25.363, + "eval_steps_per_second": 0.794, + "eval_wer": 0.10948780587665306, + "step": 74697 + }, + { + "epoch": 21.0, + "learning_rate": 6.44613125917596e-05, + "loss": 0.0789, + "step": 74700 + }, + { + "epoch": 21.01, + "learning_rate": 6.444257020585388e-05, + "loss": 0.0664, + "step": 74730 + }, + { + "epoch": 21.02, + "learning_rate": 6.442382781994815e-05, + "loss": 0.0746, + "step": 74760 + }, + { + "epoch": 21.03, + "learning_rate": 6.440508543404243e-05, + "loss": 0.067, + "step": 74790 + }, + { + "epoch": 21.03, + "learning_rate": 6.43863430481367e-05, + "loss": 0.0695, + "step": 74820 + }, + { + "epoch": 21.04, + "learning_rate": 6.436760066223098e-05, + "loss": 0.076, + "step": 74850 + }, + { + "epoch": 21.05, + "learning_rate": 6.434885827632524e-05, + "loss": 0.063, + "step": 74880 + }, + { + "epoch": 21.06, + "learning_rate": 6.433011589041952e-05, + "loss": 0.074, + "step": 74910 + }, + { + "epoch": 21.07, + "learning_rate": 6.431137350451379e-05, + "loss": 0.0667, + "step": 74940 + }, + { + "epoch": 21.08, + "learning_rate": 6.429263111860807e-05, + "loss": 0.0668, + "step": 74970 + }, + { + "epoch": 21.09, + "learning_rate": 6.427388873270235e-05, + "loss": 0.0764, + "step": 75000 + }, + { + "epoch": 21.09, + "learning_rate": 6.42551463467966e-05, + "loss": 0.0628, + "step": 75030 + }, + { + "epoch": 21.1, + "learning_rate": 6.423640396089089e-05, + "loss": 0.0738, + "step": 75060 + }, + { + "epoch": 21.11, + "learning_rate": 6.421766157498517e-05, + "loss": 0.0686, + "step": 75090 + }, + { + "epoch": 21.12, + "learning_rate": 6.419891918907944e-05, + "loss": 0.0706, + "step": 75120 + }, + { + "epoch": 21.13, + "learning_rate": 6.41801768031737e-05, + "loss": 0.076, + "step": 75150 + }, + { + "epoch": 21.14, + "learning_rate": 6.416143441726798e-05, + "loss": 0.0645, + "step": 75180 + }, + { + "epoch": 21.14, + "learning_rate": 6.414269203136227e-05, + "loss": 0.0768, + "step": 75210 + }, + { + "epoch": 21.15, + "learning_rate": 6.412394964545653e-05, + "loss": 0.0682, + "step": 75240 + }, + { + "epoch": 21.16, + "learning_rate": 6.410520725955081e-05, + "loss": 0.0743, + "step": 75270 + }, + { + "epoch": 21.17, + "learning_rate": 6.408646487364508e-05, + "loss": 0.0767, + "step": 75300 + }, + { + "epoch": 21.18, + "learning_rate": 6.406772248773936e-05, + "loss": 0.0631, + "step": 75330 + }, + { + "epoch": 21.19, + "learning_rate": 6.404898010183363e-05, + "loss": 0.071, + "step": 75360 + }, + { + "epoch": 21.19, + "learning_rate": 6.403023771592791e-05, + "loss": 0.0711, + "step": 75390 + }, + { + "epoch": 21.2, + "learning_rate": 6.401149533002219e-05, + "loss": 0.0755, + "step": 75420 + }, + { + "epoch": 21.21, + "learning_rate": 6.399275294411645e-05, + "loss": 0.0772, + "step": 75450 + }, + { + "epoch": 21.22, + "learning_rate": 6.397401055821073e-05, + "loss": 0.065, + "step": 75480 + }, + { + "epoch": 21.23, + "learning_rate": 6.395526817230501e-05, + "loss": 0.0749, + "step": 75510 + }, + { + "epoch": 21.24, + "learning_rate": 6.393652578639929e-05, + "loss": 0.0694, + "step": 75540 + }, + { + "epoch": 21.25, + "learning_rate": 6.391778340049354e-05, + "loss": 0.0693, + "step": 75570 + }, + { + "epoch": 21.25, + "learning_rate": 6.389904101458782e-05, + "loss": 0.0739, + "step": 75600 + }, + { + "epoch": 21.26, + "learning_rate": 6.38802986286821e-05, + "loss": 0.0633, + "step": 75630 + }, + { + "epoch": 21.27, + "learning_rate": 6.386155624277637e-05, + "loss": 0.0772, + "step": 75660 + }, + { + "epoch": 21.28, + "learning_rate": 6.384281385687065e-05, + "loss": 0.0679, + "step": 75690 + }, + { + "epoch": 21.29, + "learning_rate": 6.382407147096492e-05, + "loss": 0.0731, + "step": 75720 + }, + { + "epoch": 21.3, + "learning_rate": 6.38053290850592e-05, + "loss": 0.0798, + "step": 75750 + }, + { + "epoch": 21.3, + "learning_rate": 6.378658669915347e-05, + "loss": 0.0637, + "step": 75780 + }, + { + "epoch": 21.31, + "learning_rate": 6.376784431324775e-05, + "loss": 0.0739, + "step": 75810 + }, + { + "epoch": 21.32, + "learning_rate": 6.374910192734203e-05, + "loss": 0.0673, + "step": 75840 + }, + { + "epoch": 21.33, + "learning_rate": 6.37303595414363e-05, + "loss": 0.0685, + "step": 75870 + }, + { + "epoch": 21.34, + "learning_rate": 6.371161715553057e-05, + "loss": 0.0788, + "step": 75900 + }, + { + "epoch": 21.35, + "learning_rate": 6.369287476962485e-05, + "loss": 0.0629, + "step": 75930 + }, + { + "epoch": 21.36, + "learning_rate": 6.367413238371913e-05, + "loss": 0.0732, + "step": 75960 + }, + { + "epoch": 21.36, + "learning_rate": 6.365538999781338e-05, + "loss": 0.0739, + "step": 75990 + }, + { + "epoch": 21.37, + "learning_rate": 6.363664761190766e-05, + "loss": 0.0702, + "step": 76020 + }, + { + "epoch": 21.38, + "learning_rate": 6.361790522600194e-05, + "loss": 0.0759, + "step": 76050 + }, + { + "epoch": 21.39, + "learning_rate": 6.359916284009621e-05, + "loss": 0.062, + "step": 76080 + }, + { + "epoch": 21.4, + "learning_rate": 6.358042045419049e-05, + "loss": 0.0747, + "step": 76110 + }, + { + "epoch": 21.41, + "learning_rate": 6.356167806828476e-05, + "loss": 0.0691, + "step": 76140 + }, + { + "epoch": 21.41, + "learning_rate": 6.354293568237904e-05, + "loss": 0.0705, + "step": 76170 + }, + { + "epoch": 21.42, + "learning_rate": 6.352419329647331e-05, + "loss": 0.076, + "step": 76200 + }, + { + "epoch": 21.43, + "learning_rate": 6.350545091056759e-05, + "loss": 0.0653, + "step": 76230 + }, + { + "epoch": 21.44, + "learning_rate": 6.348670852466187e-05, + "loss": 0.0774, + "step": 76260 + }, + { + "epoch": 21.45, + "learning_rate": 6.346796613875614e-05, + "loss": 0.0697, + "step": 76290 + }, + { + "epoch": 21.46, + "learning_rate": 6.34492237528504e-05, + "loss": 0.0719, + "step": 76320 + }, + { + "epoch": 21.46, + "learning_rate": 6.343048136694468e-05, + "loss": 0.0762, + "step": 76350 + }, + { + "epoch": 21.47, + "learning_rate": 6.341173898103897e-05, + "loss": 0.06, + "step": 76380 + }, + { + "epoch": 21.48, + "learning_rate": 6.339299659513322e-05, + "loss": 0.0742, + "step": 76410 + }, + { + "epoch": 21.49, + "learning_rate": 6.33742542092275e-05, + "loss": 0.0687, + "step": 76440 + }, + { + "epoch": 21.5, + "learning_rate": 6.335551182332178e-05, + "loss": 0.0717, + "step": 76470 + }, + { + "epoch": 21.51, + "learning_rate": 6.333739418361291e-05, + "loss": 0.0793, + "step": 76500 + }, + { + "epoch": 21.52, + "learning_rate": 6.331865179770719e-05, + "loss": 0.0649, + "step": 76530 + }, + { + "epoch": 21.52, + "learning_rate": 6.329990941180146e-05, + "loss": 0.0725, + "step": 76560 + }, + { + "epoch": 21.53, + "learning_rate": 6.328116702589574e-05, + "loss": 0.0679, + "step": 76590 + }, + { + "epoch": 21.54, + "learning_rate": 6.326242463999e-05, + "loss": 0.0641, + "step": 76620 + }, + { + "epoch": 21.55, + "learning_rate": 6.324368225408429e-05, + "loss": 0.074, + "step": 76650 + }, + { + "epoch": 21.56, + "learning_rate": 6.322493986817855e-05, + "loss": 0.0634, + "step": 76680 + }, + { + "epoch": 21.57, + "learning_rate": 6.320619748227283e-05, + "loss": 0.0753, + "step": 76710 + }, + { + "epoch": 21.57, + "learning_rate": 6.31874550963671e-05, + "loss": 0.0683, + "step": 76740 + }, + { + "epoch": 21.58, + "learning_rate": 6.316871271046137e-05, + "loss": 0.0706, + "step": 76770 + }, + { + "epoch": 21.59, + "learning_rate": 6.314997032455565e-05, + "loss": 0.075, + "step": 76800 + }, + { + "epoch": 21.6, + "learning_rate": 6.313122793864993e-05, + "loss": 0.064, + "step": 76830 + }, + { + "epoch": 21.61, + "learning_rate": 6.31124855527442e-05, + "loss": 0.0723, + "step": 76860 + }, + { + "epoch": 21.62, + "learning_rate": 6.309374316683847e-05, + "loss": 0.0713, + "step": 76890 + }, + { + "epoch": 21.62, + "learning_rate": 6.307500078093275e-05, + "loss": 0.0669, + "step": 76920 + }, + { + "epoch": 21.63, + "learning_rate": 6.305625839502703e-05, + "loss": 0.079, + "step": 76950 + }, + { + "epoch": 21.64, + "learning_rate": 6.30375160091213e-05, + "loss": 0.0626, + "step": 76980 + }, + { + "epoch": 21.65, + "learning_rate": 6.301877362321558e-05, + "loss": 0.074, + "step": 77010 + }, + { + "epoch": 21.66, + "learning_rate": 6.300003123730984e-05, + "loss": 0.0726, + "step": 77040 + }, + { + "epoch": 21.67, + "learning_rate": 6.298128885140413e-05, + "loss": 0.0727, + "step": 77070 + }, + { + "epoch": 21.68, + "learning_rate": 6.296254646549839e-05, + "loss": 0.0774, + "step": 77100 + }, + { + "epoch": 21.68, + "learning_rate": 6.294380407959267e-05, + "loss": 0.0654, + "step": 77130 + }, + { + "epoch": 21.69, + "learning_rate": 6.292506169368694e-05, + "loss": 0.0763, + "step": 77160 + }, + { + "epoch": 21.7, + "learning_rate": 6.290631930778121e-05, + "loss": 0.0702, + "step": 77190 + }, + { + "epoch": 21.71, + "learning_rate": 6.288757692187549e-05, + "loss": 0.0735, + "step": 77220 + }, + { + "epoch": 21.72, + "learning_rate": 6.286883453596977e-05, + "loss": 0.0718, + "step": 77250 + }, + { + "epoch": 21.73, + "learning_rate": 6.285009215006404e-05, + "loss": 0.0632, + "step": 77280 + }, + { + "epoch": 21.73, + "learning_rate": 6.28313497641583e-05, + "loss": 0.0814, + "step": 77310 + }, + { + "epoch": 21.74, + "learning_rate": 6.281260737825259e-05, + "loss": 0.068, + "step": 77340 + }, + { + "epoch": 21.75, + "learning_rate": 6.279386499234687e-05, + "loss": 0.0704, + "step": 77370 + }, + { + "epoch": 21.76, + "learning_rate": 6.277512260644113e-05, + "loss": 0.0803, + "step": 77400 + }, + { + "epoch": 21.77, + "learning_rate": 6.275638022053542e-05, + "loss": 0.0651, + "step": 77430 + }, + { + "epoch": 21.78, + "learning_rate": 6.273763783462968e-05, + "loss": 0.074, + "step": 77460 + }, + { + "epoch": 21.79, + "learning_rate": 6.271889544872396e-05, + "loss": 0.0719, + "step": 77490 + }, + { + "epoch": 21.79, + "learning_rate": 6.270015306281823e-05, + "loss": 0.0734, + "step": 77520 + }, + { + "epoch": 21.8, + "learning_rate": 6.268141067691251e-05, + "loss": 0.0751, + "step": 77550 + }, + { + "epoch": 21.81, + "learning_rate": 6.266266829100678e-05, + "loss": 0.0611, + "step": 77580 + }, + { + "epoch": 21.82, + "learning_rate": 6.264392590510105e-05, + "loss": 0.0735, + "step": 77610 + }, + { + "epoch": 21.83, + "learning_rate": 6.262518351919533e-05, + "loss": 0.0671, + "step": 77640 + }, + { + "epoch": 21.84, + "learning_rate": 6.260644113328961e-05, + "loss": 0.0709, + "step": 77670 + }, + { + "epoch": 21.84, + "learning_rate": 6.258769874738388e-05, + "loss": 0.0753, + "step": 77700 + }, + { + "epoch": 21.85, + "learning_rate": 6.256895636147814e-05, + "loss": 0.0609, + "step": 77730 + }, + { + "epoch": 21.86, + "learning_rate": 6.255021397557242e-05, + "loss": 0.0752, + "step": 77760 + }, + { + "epoch": 21.87, + "learning_rate": 6.253209633586355e-05, + "loss": 0.0645, + "step": 77790 + }, + { + "epoch": 21.88, + "learning_rate": 6.251335394995783e-05, + "loss": 0.0729, + "step": 77820 + }, + { + "epoch": 21.89, + "learning_rate": 6.249461156405211e-05, + "loss": 0.076, + "step": 77850 + }, + { + "epoch": 21.89, + "learning_rate": 6.247586917814638e-05, + "loss": 0.0614, + "step": 77880 + }, + { + "epoch": 21.9, + "learning_rate": 6.245712679224065e-05, + "loss": 0.0782, + "step": 77910 + }, + { + "epoch": 21.91, + "learning_rate": 6.243838440633493e-05, + "loss": 0.0683, + "step": 77940 + }, + { + "epoch": 21.92, + "learning_rate": 6.24196420204292e-05, + "loss": 0.0712, + "step": 77970 + }, + { + "epoch": 21.93, + "learning_rate": 6.240089963452348e-05, + "loss": 0.0798, + "step": 78000 + }, + { + "epoch": 21.94, + "learning_rate": 6.238215724861776e-05, + "loss": 0.0626, + "step": 78030 + }, + { + "epoch": 21.95, + "learning_rate": 6.236341486271203e-05, + "loss": 0.0763, + "step": 78060 + }, + { + "epoch": 21.95, + "learning_rate": 6.23446724768063e-05, + "loss": 0.0675, + "step": 78090 + }, + { + "epoch": 21.96, + "learning_rate": 6.232593009090058e-05, + "loss": 0.0664, + "step": 78120 + }, + { + "epoch": 21.97, + "learning_rate": 6.230718770499486e-05, + "loss": 0.0785, + "step": 78150 + }, + { + "epoch": 21.98, + "learning_rate": 6.228844531908912e-05, + "loss": 0.0613, + "step": 78180 + }, + { + "epoch": 21.99, + "learning_rate": 6.226970293318339e-05, + "loss": 0.0739, + "step": 78210 + }, + { + "epoch": 22.0, + "learning_rate": 6.225096054727767e-05, + "loss": 0.0643, + "step": 78240 + }, + { + "epoch": 22.0, + "eval_loss": 0.11053762584924698, + "eval_runtime": 632.3359, + "eval_samples_per_second": 25.355, + "eval_steps_per_second": 0.794, + "eval_wer": 0.10436995892074843, + "step": 78254 + }, + { + "epoch": 22.0, + "learning_rate": 6.223221816137195e-05, + "loss": 0.0775, + "step": 78270 + }, + { + "epoch": 22.01, + "learning_rate": 6.221347577546622e-05, + "loss": 0.067, + "step": 78300 + }, + { + "epoch": 22.02, + "learning_rate": 6.219473338956049e-05, + "loss": 0.0672, + "step": 78330 + }, + { + "epoch": 22.03, + "learning_rate": 6.217599100365477e-05, + "loss": 0.0742, + "step": 78360 + }, + { + "epoch": 22.04, + "learning_rate": 6.215724861774904e-05, + "loss": 0.066, + "step": 78390 + }, + { + "epoch": 22.05, + "learning_rate": 6.213850623184332e-05, + "loss": 0.0683, + "step": 78420 + }, + { + "epoch": 22.06, + "learning_rate": 6.21197638459376e-05, + "loss": 0.0729, + "step": 78450 + }, + { + "epoch": 22.06, + "learning_rate": 6.210102146003187e-05, + "loss": 0.0682, + "step": 78480 + }, + { + "epoch": 22.07, + "learning_rate": 6.208227907412613e-05, + "loss": 0.0785, + "step": 78510 + }, + { + "epoch": 22.08, + "learning_rate": 6.206353668822041e-05, + "loss": 0.0648, + "step": 78540 + }, + { + "epoch": 22.09, + "learning_rate": 6.20447943023147e-05, + "loss": 0.07, + "step": 78570 + }, + { + "epoch": 22.1, + "learning_rate": 6.202605191640896e-05, + "loss": 0.0733, + "step": 78600 + }, + { + "epoch": 22.11, + "learning_rate": 6.200730953050323e-05, + "loss": 0.0656, + "step": 78630 + }, + { + "epoch": 22.11, + "learning_rate": 6.198856714459751e-05, + "loss": 0.0732, + "step": 78660 + }, + { + "epoch": 22.12, + "learning_rate": 6.196982475869179e-05, + "loss": 0.0634, + "step": 78690 + }, + { + "epoch": 22.13, + "learning_rate": 6.195108237278606e-05, + "loss": 0.0733, + "step": 78720 + }, + { + "epoch": 22.14, + "learning_rate": 6.193233998688033e-05, + "loss": 0.0651, + "step": 78750 + }, + { + "epoch": 22.15, + "learning_rate": 6.191359760097461e-05, + "loss": 0.068, + "step": 78780 + }, + { + "epoch": 22.16, + "learning_rate": 6.189485521506887e-05, + "loss": 0.0718, + "step": 78810 + }, + { + "epoch": 22.16, + "learning_rate": 6.187611282916316e-05, + "loss": 0.0614, + "step": 78840 + }, + { + "epoch": 22.17, + "learning_rate": 6.185737044325744e-05, + "loss": 0.0751, + "step": 78870 + }, + { + "epoch": 22.18, + "learning_rate": 6.183925280354856e-05, + "loss": 0.0744, + "step": 78900 + }, + { + "epoch": 22.19, + "learning_rate": 6.182051041764285e-05, + "loss": 0.0678, + "step": 78930 + }, + { + "epoch": 22.2, + "learning_rate": 6.180176803173711e-05, + "loss": 0.0754, + "step": 78960 + }, + { + "epoch": 22.21, + "learning_rate": 6.178302564583138e-05, + "loss": 0.0606, + "step": 78990 + }, + { + "epoch": 22.22, + "learning_rate": 6.176428325992566e-05, + "loss": 0.0704, + "step": 79020 + }, + { + "epoch": 22.22, + "learning_rate": 6.174554087401994e-05, + "loss": 0.0677, + "step": 79050 + }, + { + "epoch": 22.23, + "learning_rate": 6.17267984881142e-05, + "loss": 0.0684, + "step": 79080 + }, + { + "epoch": 22.24, + "learning_rate": 6.170805610220848e-05, + "loss": 0.0728, + "step": 79110 + }, + { + "epoch": 22.25, + "learning_rate": 6.168931371630276e-05, + "loss": 0.0615, + "step": 79140 + }, + { + "epoch": 22.26, + "learning_rate": 6.167057133039703e-05, + "loss": 0.0699, + "step": 79170 + }, + { + "epoch": 22.27, + "learning_rate": 6.16518289444913e-05, + "loss": 0.0734, + "step": 79200 + }, + { + "epoch": 22.27, + "learning_rate": 6.163308655858557e-05, + "loss": 0.0702, + "step": 79230 + }, + { + "epoch": 22.28, + "learning_rate": 6.161434417267985e-05, + "loss": 0.0776, + "step": 79260 + }, + { + "epoch": 22.29, + "learning_rate": 6.159560178677412e-05, + "loss": 0.0604, + "step": 79290 + }, + { + "epoch": 22.3, + "learning_rate": 6.15768594008684e-05, + "loss": 0.0685, + "step": 79320 + }, + { + "epoch": 22.31, + "learning_rate": 6.155811701496268e-05, + "loss": 0.0684, + "step": 79350 + }, + { + "epoch": 22.32, + "learning_rate": 6.153937462905695e-05, + "loss": 0.0694, + "step": 79380 + }, + { + "epoch": 22.32, + "learning_rate": 6.152063224315122e-05, + "loss": 0.0777, + "step": 79410 + }, + { + "epoch": 22.33, + "learning_rate": 6.15018898572455e-05, + "loss": 0.0644, + "step": 79440 + }, + { + "epoch": 22.34, + "learning_rate": 6.148314747133978e-05, + "loss": 0.0739, + "step": 79470 + }, + { + "epoch": 22.35, + "learning_rate": 6.146440508543403e-05, + "loss": 0.0732, + "step": 79500 + }, + { + "epoch": 22.36, + "learning_rate": 6.144566269952832e-05, + "loss": 0.0716, + "step": 79530 + }, + { + "epoch": 22.37, + "learning_rate": 6.14269203136226e-05, + "loss": 0.0746, + "step": 79560 + }, + { + "epoch": 22.38, + "learning_rate": 6.140817792771686e-05, + "loss": 0.0616, + "step": 79590 + }, + { + "epoch": 22.38, + "learning_rate": 6.138943554181114e-05, + "loss": 0.0698, + "step": 79620 + }, + { + "epoch": 22.39, + "learning_rate": 6.137069315590541e-05, + "loss": 0.0703, + "step": 79650 + }, + { + "epoch": 22.4, + "learning_rate": 6.135195076999969e-05, + "loss": 0.0673, + "step": 79680 + }, + { + "epoch": 22.41, + "learning_rate": 6.133320838409396e-05, + "loss": 0.0764, + "step": 79710 + }, + { + "epoch": 22.42, + "learning_rate": 6.131446599818824e-05, + "loss": 0.0598, + "step": 79740 + }, + { + "epoch": 22.43, + "learning_rate": 6.129572361228252e-05, + "loss": 0.066, + "step": 79770 + }, + { + "epoch": 22.43, + "learning_rate": 6.127698122637679e-05, + "loss": 0.07, + "step": 79800 + }, + { + "epoch": 22.44, + "learning_rate": 6.125823884047106e-05, + "loss": 0.0671, + "step": 79830 + }, + { + "epoch": 22.45, + "learning_rate": 6.123949645456534e-05, + "loss": 0.0717, + "step": 79860 + }, + { + "epoch": 22.46, + "learning_rate": 6.122075406865962e-05, + "loss": 0.0608, + "step": 79890 + }, + { + "epoch": 22.47, + "learning_rate": 6.120201168275387e-05, + "loss": 0.0703, + "step": 79920 + }, + { + "epoch": 22.48, + "learning_rate": 6.118326929684815e-05, + "loss": 0.0671, + "step": 79950 + }, + { + "epoch": 22.49, + "learning_rate": 6.116452691094243e-05, + "loss": 0.0684, + "step": 79980 + }, + { + "epoch": 22.49, + "learning_rate": 6.11457845250367e-05, + "loss": 0.0739, + "step": 80010 + }, + { + "epoch": 22.5, + "learning_rate": 6.112704213913098e-05, + "loss": 0.0601, + "step": 80040 + }, + { + "epoch": 22.51, + "learning_rate": 6.110829975322525e-05, + "loss": 0.0709, + "step": 80070 + }, + { + "epoch": 22.52, + "learning_rate": 6.108955736731953e-05, + "loss": 0.0708, + "step": 80100 + }, + { + "epoch": 22.53, + "learning_rate": 6.10708149814138e-05, + "loss": 0.067, + "step": 80130 + }, + { + "epoch": 22.54, + "learning_rate": 6.105207259550808e-05, + "loss": 0.0721, + "step": 80160 + }, + { + "epoch": 22.54, + "learning_rate": 6.1033330209602354e-05, + "loss": 0.0629, + "step": 80190 + }, + { + "epoch": 22.55, + "learning_rate": 6.101458782369662e-05, + "loss": 0.073, + "step": 80220 + }, + { + "epoch": 22.56, + "learning_rate": 6.09958454377909e-05, + "loss": 0.0669, + "step": 80250 + }, + { + "epoch": 22.57, + "learning_rate": 6.097710305188518e-05, + "loss": 0.0667, + "step": 80280 + }, + { + "epoch": 22.58, + "learning_rate": 6.095836066597945e-05, + "loss": 0.0723, + "step": 80310 + }, + { + "epoch": 22.59, + "learning_rate": 6.093961828007372e-05, + "loss": 0.0626, + "step": 80340 + }, + { + "epoch": 22.59, + "learning_rate": 6.092087589416799e-05, + "loss": 0.0693, + "step": 80370 + }, + { + "epoch": 22.6, + "learning_rate": 6.0902133508262274e-05, + "loss": 0.0697, + "step": 80400 + }, + { + "epoch": 22.61, + "learning_rate": 6.088339112235655e-05, + "loss": 0.063, + "step": 80430 + }, + { + "epoch": 22.62, + "learning_rate": 6.086464873645082e-05, + "loss": 0.0771, + "step": 80460 + }, + { + "epoch": 22.63, + "learning_rate": 6.084590635054509e-05, + "loss": 0.0635, + "step": 80490 + }, + { + "epoch": 22.64, + "learning_rate": 6.0827163964639364e-05, + "loss": 0.0707, + "step": 80520 + }, + { + "epoch": 22.65, + "learning_rate": 6.0808421578733645e-05, + "loss": 0.0681, + "step": 80550 + }, + { + "epoch": 22.65, + "learning_rate": 6.078967919282792e-05, + "loss": 0.0636, + "step": 80580 + }, + { + "epoch": 22.66, + "learning_rate": 6.077093680692219e-05, + "loss": 0.0723, + "step": 80610 + }, + { + "epoch": 22.67, + "learning_rate": 6.075219442101646e-05, + "loss": 0.059, + "step": 80640 + }, + { + "epoch": 22.68, + "learning_rate": 6.073345203511074e-05, + "loss": 0.0718, + "step": 80670 + }, + { + "epoch": 22.69, + "learning_rate": 6.0714709649205016e-05, + "loss": 0.0687, + "step": 80700 + }, + { + "epoch": 22.7, + "learning_rate": 6.069596726329929e-05, + "loss": 0.064, + "step": 80730 + }, + { + "epoch": 22.7, + "learning_rate": 6.067722487739356e-05, + "loss": 0.0753, + "step": 80760 + }, + { + "epoch": 22.71, + "learning_rate": 6.065848249148783e-05, + "loss": 0.067, + "step": 80790 + }, + { + "epoch": 22.72, + "learning_rate": 6.063974010558211e-05, + "loss": 0.072, + "step": 80820 + }, + { + "epoch": 22.73, + "learning_rate": 6.0620997719676386e-05, + "loss": 0.0687, + "step": 80850 + }, + { + "epoch": 22.74, + "learning_rate": 6.060225533377066e-05, + "loss": 0.0664, + "step": 80880 + }, + { + "epoch": 22.75, + "learning_rate": 6.058351294786493e-05, + "loss": 0.0791, + "step": 80910 + }, + { + "epoch": 22.76, + "learning_rate": 6.05647705619592e-05, + "loss": 0.0604, + "step": 80940 + }, + { + "epoch": 22.76, + "learning_rate": 6.054602817605348e-05, + "loss": 0.0726, + "step": 80970 + }, + { + "epoch": 22.77, + "learning_rate": 6.052728579014776e-05, + "loss": 0.068, + "step": 81000 + }, + { + "epoch": 22.78, + "learning_rate": 6.0508543404242025e-05, + "loss": 0.0691, + "step": 81030 + }, + { + "epoch": 22.79, + "learning_rate": 6.04898010183363e-05, + "loss": 0.0768, + "step": 81060 + }, + { + "epoch": 22.8, + "learning_rate": 6.047105863243058e-05, + "loss": 0.0681, + "step": 81090 + }, + { + "epoch": 22.81, + "learning_rate": 6.0452316246524854e-05, + "loss": 0.0712, + "step": 81120 + }, + { + "epoch": 22.81, + "learning_rate": 6.043357386061913e-05, + "loss": 0.0706, + "step": 81150 + }, + { + "epoch": 22.82, + "learning_rate": 6.0414831474713396e-05, + "loss": 0.0649, + "step": 81180 + }, + { + "epoch": 22.83, + "learning_rate": 6.039608908880767e-05, + "loss": 0.0739, + "step": 81210 + }, + { + "epoch": 22.84, + "learning_rate": 6.037734670290195e-05, + "loss": 0.0649, + "step": 81240 + }, + { + "epoch": 22.85, + "learning_rate": 6.0358604316996225e-05, + "loss": 0.0732, + "step": 81270 + }, + { + "epoch": 22.86, + "learning_rate": 6.03398619310905e-05, + "loss": 0.0731, + "step": 81300 + }, + { + "epoch": 22.86, + "learning_rate": 6.032111954518477e-05, + "loss": 0.0668, + "step": 81330 + }, + { + "epoch": 22.87, + "learning_rate": 6.030237715927904e-05, + "loss": 0.0761, + "step": 81360 + }, + { + "epoch": 22.88, + "learning_rate": 6.028363477337332e-05, + "loss": 0.0663, + "step": 81390 + }, + { + "epoch": 22.89, + "learning_rate": 6.0264892387467596e-05, + "loss": 0.0739, + "step": 81420 + }, + { + "epoch": 22.9, + "learning_rate": 6.0246150001561864e-05, + "loss": 0.0685, + "step": 81450 + }, + { + "epoch": 22.91, + "learning_rate": 6.022740761565614e-05, + "loss": 0.0705, + "step": 81480 + }, + { + "epoch": 22.92, + "learning_rate": 6.020866522975042e-05, + "loss": 0.0717, + "step": 81510 + }, + { + "epoch": 22.92, + "learning_rate": 6.018992284384469e-05, + "loss": 0.0645, + "step": 81540 + }, + { + "epoch": 22.93, + "learning_rate": 6.017118045793897e-05, + "loss": 0.0729, + "step": 81570 + }, + { + "epoch": 22.94, + "learning_rate": 6.0152438072033234e-05, + "loss": 0.0691, + "step": 81600 + }, + { + "epoch": 22.95, + "learning_rate": 6.013369568612751e-05, + "loss": 0.0706, + "step": 81630 + }, + { + "epoch": 22.96, + "learning_rate": 6.011495330022179e-05, + "loss": 0.0751, + "step": 81660 + }, + { + "epoch": 22.97, + "learning_rate": 6.0096210914316064e-05, + "loss": 0.0633, + "step": 81690 + }, + { + "epoch": 22.97, + "learning_rate": 6.007746852841034e-05, + "loss": 0.0755, + "step": 81720 + }, + { + "epoch": 22.98, + "learning_rate": 6.0058726142504605e-05, + "loss": 0.0714, + "step": 81750 + }, + { + "epoch": 22.99, + "learning_rate": 6.0039983756598886e-05, + "loss": 0.0712, + "step": 81780 + }, + { + "epoch": 23.0, + "learning_rate": 6.002124137069316e-05, + "loss": 0.0764, + "step": 81810 + }, + { + "epoch": 23.0, + "eval_loss": 0.10718846321105957, + "eval_runtime": 629.1357, + "eval_samples_per_second": 25.484, + "eval_steps_per_second": 0.798, + "eval_wer": 0.10416524504251225, + "step": 81811 + }, + { + "epoch": 23.01, + "learning_rate": 6.0002498984787435e-05, + "loss": 0.0609, + "step": 81840 + }, + { + "epoch": 23.02, + "learning_rate": 5.99837565988817e-05, + "loss": 0.0743, + "step": 81870 + }, + { + "epoch": 23.03, + "learning_rate": 5.9965014212975976e-05, + "loss": 0.0652, + "step": 81900 + }, + { + "epoch": 23.03, + "learning_rate": 5.994627182707026e-05, + "loss": 0.0694, + "step": 81930 + }, + { + "epoch": 23.04, + "learning_rate": 5.992752944116453e-05, + "loss": 0.0686, + "step": 81960 + }, + { + "epoch": 23.05, + "learning_rate": 5.9908787055258806e-05, + "loss": 0.0652, + "step": 81990 + }, + { + "epoch": 23.06, + "learning_rate": 5.989004466935307e-05, + "loss": 0.0692, + "step": 82020 + }, + { + "epoch": 23.07, + "learning_rate": 5.987130228344735e-05, + "loss": 0.0626, + "step": 82050 + }, + { + "epoch": 23.08, + "learning_rate": 5.985255989754163e-05, + "loss": 0.0718, + "step": 82080 + }, + { + "epoch": 23.08, + "learning_rate": 5.98338175116359e-05, + "loss": 0.0717, + "step": 82110 + }, + { + "epoch": 23.09, + "learning_rate": 5.981507512573018e-05, + "loss": 0.0649, + "step": 82140 + }, + { + "epoch": 23.1, + "learning_rate": 5.9796332739824444e-05, + "loss": 0.0733, + "step": 82170 + }, + { + "epoch": 23.11, + "learning_rate": 5.9777590353918725e-05, + "loss": 0.0636, + "step": 82200 + }, + { + "epoch": 23.12, + "learning_rate": 5.9758847968013e-05, + "loss": 0.0661, + "step": 82230 + }, + { + "epoch": 23.13, + "learning_rate": 5.9740105582107273e-05, + "loss": 0.0759, + "step": 82260 + }, + { + "epoch": 23.13, + "learning_rate": 5.972136319620154e-05, + "loss": 0.0637, + "step": 82290 + }, + { + "epoch": 23.14, + "learning_rate": 5.9702620810295815e-05, + "loss": 0.0702, + "step": 82320 + }, + { + "epoch": 23.15, + "learning_rate": 5.9683878424390096e-05, + "loss": 0.0607, + "step": 82350 + }, + { + "epoch": 23.16, + "learning_rate": 5.966513603848437e-05, + "loss": 0.0675, + "step": 82380 + }, + { + "epoch": 23.17, + "learning_rate": 5.9646393652578644e-05, + "loss": 0.0678, + "step": 82410 + }, + { + "epoch": 23.18, + "learning_rate": 5.962765126667291e-05, + "loss": 0.0628, + "step": 82440 + }, + { + "epoch": 23.19, + "learning_rate": 5.9608908880767186e-05, + "loss": 0.0696, + "step": 82470 + }, + { + "epoch": 23.19, + "learning_rate": 5.959016649486147e-05, + "loss": 0.06, + "step": 82500 + }, + { + "epoch": 23.2, + "learning_rate": 5.957142410895574e-05, + "loss": 0.0669, + "step": 82530 + }, + { + "epoch": 23.21, + "learning_rate": 5.955268172305002e-05, + "loss": 0.0763, + "step": 82560 + }, + { + "epoch": 23.22, + "learning_rate": 5.953393933714428e-05, + "loss": 0.0613, + "step": 82590 + }, + { + "epoch": 23.23, + "learning_rate": 5.9515196951238564e-05, + "loss": 0.0752, + "step": 82620 + }, + { + "epoch": 23.24, + "learning_rate": 5.949645456533284e-05, + "loss": 0.0613, + "step": 82650 + }, + { + "epoch": 23.24, + "learning_rate": 5.947771217942711e-05, + "loss": 0.0709, + "step": 82680 + }, + { + "epoch": 23.25, + "learning_rate": 5.945896979352138e-05, + "loss": 0.0708, + "step": 82710 + }, + { + "epoch": 23.26, + "learning_rate": 5.9440227407615654e-05, + "loss": 0.0616, + "step": 82740 + }, + { + "epoch": 23.27, + "learning_rate": 5.9421485021709935e-05, + "loss": 0.0695, + "step": 82770 + }, + { + "epoch": 23.28, + "learning_rate": 5.940274263580421e-05, + "loss": 0.0621, + "step": 82800 + }, + { + "epoch": 23.29, + "learning_rate": 5.938400024989848e-05, + "loss": 0.0664, + "step": 82830 + }, + { + "epoch": 23.29, + "learning_rate": 5.936525786399275e-05, + "loss": 0.0682, + "step": 82860 + }, + { + "epoch": 23.3, + "learning_rate": 5.9346515478087025e-05, + "loss": 0.0601, + "step": 82890 + }, + { + "epoch": 23.31, + "learning_rate": 5.9327773092181306e-05, + "loss": 0.0691, + "step": 82920 + }, + { + "epoch": 23.32, + "learning_rate": 5.930903070627558e-05, + "loss": 0.062, + "step": 82950 + }, + { + "epoch": 23.33, + "learning_rate": 5.929028832036986e-05, + "loss": 0.067, + "step": 82980 + }, + { + "epoch": 23.34, + "learning_rate": 5.927154593446412e-05, + "loss": 0.07, + "step": 83010 + }, + { + "epoch": 23.35, + "learning_rate": 5.92528035485584e-05, + "loss": 0.0639, + "step": 83040 + }, + { + "epoch": 23.35, + "learning_rate": 5.9234061162652677e-05, + "loss": 0.0749, + "step": 83070 + }, + { + "epoch": 23.36, + "learning_rate": 5.921531877674695e-05, + "loss": 0.0656, + "step": 83100 + }, + { + "epoch": 23.37, + "learning_rate": 5.919657639084122e-05, + "loss": 0.075, + "step": 83130 + }, + { + "epoch": 23.38, + "learning_rate": 5.917783400493549e-05, + "loss": 0.0749, + "step": 83160 + }, + { + "epoch": 23.39, + "learning_rate": 5.915909161902977e-05, + "loss": 0.0669, + "step": 83190 + }, + { + "epoch": 23.4, + "learning_rate": 5.914034923312405e-05, + "loss": 0.0713, + "step": 83220 + }, + { + "epoch": 23.4, + "learning_rate": 5.912160684721832e-05, + "loss": 0.0618, + "step": 83250 + }, + { + "epoch": 23.41, + "learning_rate": 5.910286446131259e-05, + "loss": 0.0689, + "step": 83280 + }, + { + "epoch": 23.42, + "learning_rate": 5.908412207540687e-05, + "loss": 0.0702, + "step": 83310 + }, + { + "epoch": 23.43, + "learning_rate": 5.9065379689501144e-05, + "loss": 0.0641, + "step": 83340 + }, + { + "epoch": 23.44, + "learning_rate": 5.904663730359542e-05, + "loss": 0.0687, + "step": 83370 + }, + { + "epoch": 23.45, + "learning_rate": 5.90278949176897e-05, + "loss": 0.0619, + "step": 83400 + }, + { + "epoch": 23.46, + "learning_rate": 5.900915253178396e-05, + "loss": 0.0723, + "step": 83430 + }, + { + "epoch": 23.46, + "learning_rate": 5.899041014587824e-05, + "loss": 0.0712, + "step": 83460 + }, + { + "epoch": 23.47, + "learning_rate": 5.8971667759972515e-05, + "loss": 0.0631, + "step": 83490 + }, + { + "epoch": 23.48, + "learning_rate": 5.895292537406679e-05, + "loss": 0.0713, + "step": 83520 + }, + { + "epoch": 23.49, + "learning_rate": 5.893418298816106e-05, + "loss": 0.0622, + "step": 83550 + }, + { + "epoch": 23.5, + "learning_rate": 5.891544060225533e-05, + "loss": 0.0719, + "step": 83580 + }, + { + "epoch": 23.51, + "learning_rate": 5.889669821634961e-05, + "loss": 0.0734, + "step": 83610 + }, + { + "epoch": 23.51, + "learning_rate": 5.8877955830443886e-05, + "loss": 0.0612, + "step": 83640 + }, + { + "epoch": 23.52, + "learning_rate": 5.885921344453816e-05, + "loss": 0.0734, + "step": 83670 + }, + { + "epoch": 23.53, + "learning_rate": 5.884047105863243e-05, + "loss": 0.0608, + "step": 83700 + }, + { + "epoch": 23.54, + "learning_rate": 5.882172867272671e-05, + "loss": 0.0667, + "step": 83730 + }, + { + "epoch": 23.55, + "learning_rate": 5.880298628682098e-05, + "loss": 0.071, + "step": 83760 + }, + { + "epoch": 23.56, + "learning_rate": 5.878424390091526e-05, + "loss": 0.0616, + "step": 83790 + }, + { + "epoch": 23.56, + "learning_rate": 5.876550151500954e-05, + "loss": 0.0768, + "step": 83820 + }, + { + "epoch": 23.57, + "learning_rate": 5.87467591291038e-05, + "loss": 0.0648, + "step": 83850 + }, + { + "epoch": 23.58, + "learning_rate": 5.872801674319808e-05, + "loss": 0.0689, + "step": 83880 + }, + { + "epoch": 23.59, + "learning_rate": 5.8709274357292354e-05, + "loss": 0.0712, + "step": 83910 + }, + { + "epoch": 23.6, + "learning_rate": 5.869053197138663e-05, + "loss": 0.0642, + "step": 83940 + }, + { + "epoch": 23.61, + "learning_rate": 5.8671789585480896e-05, + "loss": 0.0776, + "step": 83970 + }, + { + "epoch": 23.62, + "learning_rate": 5.865304719957517e-05, + "loss": 0.0607, + "step": 84000 + }, + { + "epoch": 23.62, + "learning_rate": 5.863430481366945e-05, + "loss": 0.0679, + "step": 84030 + }, + { + "epoch": 23.63, + "learning_rate": 5.8615562427763725e-05, + "loss": 0.07, + "step": 84060 + }, + { + "epoch": 23.64, + "learning_rate": 5.8596820041858006e-05, + "loss": 0.0656, + "step": 84090 + }, + { + "epoch": 23.65, + "learning_rate": 5.8578077655952267e-05, + "loss": 0.0717, + "step": 84120 + }, + { + "epoch": 23.66, + "learning_rate": 5.855933527004655e-05, + "loss": 0.0632, + "step": 84150 + }, + { + "epoch": 23.67, + "learning_rate": 5.854059288414082e-05, + "loss": 0.0705, + "step": 84180 + }, + { + "epoch": 23.67, + "learning_rate": 5.8521850498235096e-05, + "loss": 0.0703, + "step": 84210 + }, + { + "epoch": 23.68, + "learning_rate": 5.850310811232938e-05, + "loss": 0.0623, + "step": 84240 + }, + { + "epoch": 23.69, + "learning_rate": 5.848436572642364e-05, + "loss": 0.0747, + "step": 84270 + }, + { + "epoch": 23.7, + "learning_rate": 5.846562334051792e-05, + "loss": 0.063, + "step": 84300 + }, + { + "epoch": 23.71, + "learning_rate": 5.844688095461219e-05, + "loss": 0.0739, + "step": 84330 + }, + { + "epoch": 23.72, + "learning_rate": 5.842813856870647e-05, + "loss": 0.0656, + "step": 84360 + }, + { + "epoch": 23.72, + "learning_rate": 5.8409396182800734e-05, + "loss": 0.0604, + "step": 84390 + }, + { + "epoch": 23.73, + "learning_rate": 5.8390653796895015e-05, + "loss": 0.0721, + "step": 84420 + }, + { + "epoch": 23.74, + "learning_rate": 5.837191141098929e-05, + "loss": 0.0658, + "step": 84450 + }, + { + "epoch": 23.75, + "learning_rate": 5.8353169025083564e-05, + "loss": 0.065, + "step": 84480 + }, + { + "epoch": 23.76, + "learning_rate": 5.8334426639177845e-05, + "loss": 0.0705, + "step": 84510 + }, + { + "epoch": 23.77, + "learning_rate": 5.8315684253272105e-05, + "loss": 0.0614, + "step": 84540 + }, + { + "epoch": 23.78, + "learning_rate": 5.8296941867366386e-05, + "loss": 0.0742, + "step": 84570 + }, + { + "epoch": 23.78, + "learning_rate": 5.827819948146066e-05, + "loss": 0.0656, + "step": 84600 + }, + { + "epoch": 23.79, + "learning_rate": 5.8259457095554935e-05, + "loss": 0.0648, + "step": 84630 + }, + { + "epoch": 23.8, + "learning_rate": 5.82407147096492e-05, + "loss": 0.074, + "step": 84660 + }, + { + "epoch": 23.81, + "learning_rate": 5.8221972323743476e-05, + "loss": 0.0629, + "step": 84690 + }, + { + "epoch": 23.82, + "learning_rate": 5.820322993783776e-05, + "loss": 0.073, + "step": 84720 + }, + { + "epoch": 23.83, + "learning_rate": 5.818448755193203e-05, + "loss": 0.062, + "step": 84750 + }, + { + "epoch": 23.83, + "learning_rate": 5.8165745166026305e-05, + "loss": 0.0652, + "step": 84780 + }, + { + "epoch": 23.84, + "learning_rate": 5.814700278012057e-05, + "loss": 0.0726, + "step": 84810 + }, + { + "epoch": 23.85, + "learning_rate": 5.8128260394214854e-05, + "loss": 0.0597, + "step": 84840 + }, + { + "epoch": 23.86, + "learning_rate": 5.810951800830913e-05, + "loss": 0.0739, + "step": 84870 + }, + { + "epoch": 23.87, + "learning_rate": 5.80907756224034e-05, + "loss": 0.0656, + "step": 84900 + }, + { + "epoch": 23.88, + "learning_rate": 5.807203323649768e-05, + "loss": 0.0699, + "step": 84930 + }, + { + "epoch": 23.89, + "learning_rate": 5.8053290850591944e-05, + "loss": 0.0676, + "step": 84960 + }, + { + "epoch": 23.89, + "learning_rate": 5.8034548464686225e-05, + "loss": 0.0635, + "step": 84990 + }, + { + "epoch": 23.9, + "learning_rate": 5.80158060787805e-05, + "loss": 0.0709, + "step": 85020 + }, + { + "epoch": 23.91, + "learning_rate": 5.799706369287477e-05, + "loss": 0.0632, + "step": 85050 + }, + { + "epoch": 23.92, + "learning_rate": 5.797832130696904e-05, + "loss": 0.0737, + "step": 85080 + }, + { + "epoch": 23.93, + "learning_rate": 5.7959578921063315e-05, + "loss": 0.0754, + "step": 85110 + }, + { + "epoch": 23.94, + "learning_rate": 5.7940836535157596e-05, + "loss": 0.063, + "step": 85140 + }, + { + "epoch": 23.94, + "learning_rate": 5.792209414925187e-05, + "loss": 0.0731, + "step": 85170 + }, + { + "epoch": 23.95, + "learning_rate": 5.7903351763346144e-05, + "loss": 0.0618, + "step": 85200 + }, + { + "epoch": 23.96, + "learning_rate": 5.788460937744041e-05, + "loss": 0.0697, + "step": 85230 + }, + { + "epoch": 23.97, + "learning_rate": 5.786586699153469e-05, + "loss": 0.069, + "step": 85260 + }, + { + "epoch": 23.98, + "learning_rate": 5.784712460562897e-05, + "loss": 0.063, + "step": 85290 + }, + { + "epoch": 23.99, + "learning_rate": 5.782838221972324e-05, + "loss": 0.072, + "step": 85320 + }, + { + "epoch": 23.99, + "learning_rate": 5.780963983381752e-05, + "loss": 0.0605, + "step": 85350 + }, + { + "epoch": 24.0, + "eval_loss": 0.1094522774219513, + "eval_runtime": 630.878, + "eval_samples_per_second": 25.414, + "eval_steps_per_second": 0.796, + "eval_wer": 0.10262989095574086, + "step": 85368 + }, + { + "epoch": 24.0, + "learning_rate": 5.779089744791178e-05, + "loss": 0.0716, + "step": 85380 + }, + { + "epoch": 24.01, + "learning_rate": 5.7772155062006063e-05, + "loss": 0.0651, + "step": 85410 + }, + { + "epoch": 24.02, + "learning_rate": 5.775341267610034e-05, + "loss": 0.064, + "step": 85440 + }, + { + "epoch": 24.03, + "learning_rate": 5.773467029019461e-05, + "loss": 0.0738, + "step": 85470 + }, + { + "epoch": 24.04, + "learning_rate": 5.771592790428888e-05, + "loss": 0.0568, + "step": 85500 + }, + { + "epoch": 24.05, + "learning_rate": 5.7697185518383153e-05, + "loss": 0.0681, + "step": 85530 + }, + { + "epoch": 24.05, + "learning_rate": 5.7678443132477434e-05, + "loss": 0.063, + "step": 85560 + }, + { + "epoch": 24.06, + "learning_rate": 5.765970074657171e-05, + "loss": 0.0678, + "step": 85590 + }, + { + "epoch": 24.07, + "learning_rate": 5.764095836066599e-05, + "loss": 0.0677, + "step": 85620 + }, + { + "epoch": 24.08, + "learning_rate": 5.762221597476025e-05, + "loss": 0.062, + "step": 85650 + }, + { + "epoch": 24.09, + "learning_rate": 5.760347358885453e-05, + "loss": 0.0704, + "step": 85680 + }, + { + "epoch": 24.1, + "learning_rate": 5.7584731202948805e-05, + "loss": 0.0625, + "step": 85710 + }, + { + "epoch": 24.1, + "learning_rate": 5.756598881704308e-05, + "loss": 0.0695, + "step": 85740 + }, + { + "epoch": 24.11, + "learning_rate": 5.754724643113736e-05, + "loss": 0.0734, + "step": 85770 + }, + { + "epoch": 24.12, + "learning_rate": 5.752850404523162e-05, + "loss": 0.0571, + "step": 85800 + }, + { + "epoch": 24.13, + "learning_rate": 5.75097616593259e-05, + "loss": 0.0693, + "step": 85830 + }, + { + "epoch": 24.14, + "learning_rate": 5.7491019273420176e-05, + "loss": 0.06, + "step": 85860 + }, + { + "epoch": 24.15, + "learning_rate": 5.747227688751445e-05, + "loss": 0.0696, + "step": 85890 + }, + { + "epoch": 24.16, + "learning_rate": 5.745353450160872e-05, + "loss": 0.074, + "step": 85920 + }, + { + "epoch": 24.16, + "learning_rate": 5.7434792115703e-05, + "loss": 0.0605, + "step": 85950 + }, + { + "epoch": 24.17, + "learning_rate": 5.741604972979727e-05, + "loss": 0.0721, + "step": 85980 + }, + { + "epoch": 24.18, + "learning_rate": 5.739730734389155e-05, + "loss": 0.0674, + "step": 86010 + }, + { + "epoch": 24.19, + "learning_rate": 5.737856495798583e-05, + "loss": 0.0705, + "step": 86040 + }, + { + "epoch": 24.2, + "learning_rate": 5.735982257208009e-05, + "loss": 0.0727, + "step": 86070 + }, + { + "epoch": 24.21, + "learning_rate": 5.734108018617437e-05, + "loss": 0.0602, + "step": 86100 + }, + { + "epoch": 24.21, + "learning_rate": 5.7322337800268644e-05, + "loss": 0.0741, + "step": 86130 + }, + { + "epoch": 24.22, + "learning_rate": 5.730359541436292e-05, + "loss": 0.0636, + "step": 86160 + }, + { + "epoch": 24.23, + "learning_rate": 5.72848530284572e-05, + "loss": 0.0623, + "step": 86190 + }, + { + "epoch": 24.24, + "learning_rate": 5.726611064255146e-05, + "loss": 0.0734, + "step": 86220 + }, + { + "epoch": 24.25, + "learning_rate": 5.724736825664574e-05, + "loss": 0.0579, + "step": 86250 + }, + { + "epoch": 24.26, + "learning_rate": 5.7228625870740015e-05, + "loss": 0.0707, + "step": 86280 + }, + { + "epoch": 24.26, + "learning_rate": 5.720988348483429e-05, + "loss": 0.0649, + "step": 86310 + }, + { + "epoch": 24.27, + "learning_rate": 5.719114109892856e-05, + "loss": 0.0698, + "step": 86340 + }, + { + "epoch": 24.28, + "learning_rate": 5.717239871302284e-05, + "loss": 0.0752, + "step": 86370 + }, + { + "epoch": 24.29, + "learning_rate": 5.715365632711711e-05, + "loss": 0.0606, + "step": 86400 + }, + { + "epoch": 24.3, + "learning_rate": 5.7134913941211386e-05, + "loss": 0.0729, + "step": 86430 + }, + { + "epoch": 24.31, + "learning_rate": 5.711617155530567e-05, + "loss": 0.0614, + "step": 86460 + }, + { + "epoch": 24.32, + "learning_rate": 5.709742916939993e-05, + "loss": 0.0644, + "step": 86490 + }, + { + "epoch": 24.32, + "learning_rate": 5.707868678349421e-05, + "loss": 0.074, + "step": 86520 + }, + { + "epoch": 24.33, + "learning_rate": 5.705994439758848e-05, + "loss": 0.0584, + "step": 86550 + }, + { + "epoch": 24.34, + "learning_rate": 5.704182675787961e-05, + "loss": 0.0685, + "step": 86580 + }, + { + "epoch": 24.35, + "learning_rate": 5.702308437197389e-05, + "loss": 0.0673, + "step": 86610 + }, + { + "epoch": 24.36, + "learning_rate": 5.7004341986068165e-05, + "loss": 0.0714, + "step": 86640 + }, + { + "epoch": 24.37, + "learning_rate": 5.698559960016243e-05, + "loss": 0.0712, + "step": 86670 + }, + { + "epoch": 24.37, + "learning_rate": 5.696685721425671e-05, + "loss": 0.0583, + "step": 86700 + }, + { + "epoch": 24.38, + "learning_rate": 5.694811482835099e-05, + "loss": 0.0729, + "step": 86730 + }, + { + "epoch": 24.39, + "learning_rate": 5.692937244244526e-05, + "loss": 0.0615, + "step": 86760 + }, + { + "epoch": 24.4, + "learning_rate": 5.6910630056539536e-05, + "loss": 0.0648, + "step": 86790 + }, + { + "epoch": 24.41, + "learning_rate": 5.6891887670633804e-05, + "loss": 0.0729, + "step": 86820 + }, + { + "epoch": 24.42, + "learning_rate": 5.687314528472808e-05, + "loss": 0.0605, + "step": 86850 + }, + { + "epoch": 24.43, + "learning_rate": 5.685440289882236e-05, + "loss": 0.0729, + "step": 86880 + }, + { + "epoch": 24.43, + "learning_rate": 5.683566051291663e-05, + "loss": 0.0623, + "step": 86910 + }, + { + "epoch": 24.44, + "learning_rate": 5.681691812701091e-05, + "loss": 0.0662, + "step": 86940 + }, + { + "epoch": 24.45, + "learning_rate": 5.6798175741105175e-05, + "loss": 0.0737, + "step": 86970 + }, + { + "epoch": 24.46, + "learning_rate": 5.677943335519945e-05, + "loss": 0.0603, + "step": 87000 + }, + { + "epoch": 24.47, + "learning_rate": 5.676069096929373e-05, + "loss": 0.0676, + "step": 87030 + }, + { + "epoch": 24.48, + "learning_rate": 5.6741948583388004e-05, + "loss": 0.0618, + "step": 87060 + }, + { + "epoch": 24.48, + "learning_rate": 5.672320619748227e-05, + "loss": 0.065, + "step": 87090 + }, + { + "epoch": 24.49, + "learning_rate": 5.6704463811576546e-05, + "loss": 0.0732, + "step": 87120 + }, + { + "epoch": 24.5, + "learning_rate": 5.6685721425670827e-05, + "loss": 0.0606, + "step": 87150 + }, + { + "epoch": 24.51, + "learning_rate": 5.66669790397651e-05, + "loss": 0.0741, + "step": 87180 + }, + { + "epoch": 24.52, + "learning_rate": 5.6648236653859375e-05, + "loss": 0.0638, + "step": 87210 + }, + { + "epoch": 24.53, + "learning_rate": 5.662949426795364e-05, + "loss": 0.0631, + "step": 87240 + }, + { + "epoch": 24.53, + "learning_rate": 5.6610751882047917e-05, + "loss": 0.0698, + "step": 87270 + }, + { + "epoch": 24.54, + "learning_rate": 5.65920094961422e-05, + "loss": 0.06, + "step": 87300 + }, + { + "epoch": 24.55, + "learning_rate": 5.657326711023647e-05, + "loss": 0.0706, + "step": 87330 + }, + { + "epoch": 24.56, + "learning_rate": 5.6554524724330746e-05, + "loss": 0.0634, + "step": 87360 + }, + { + "epoch": 24.57, + "learning_rate": 5.653578233842501e-05, + "loss": 0.0666, + "step": 87390 + }, + { + "epoch": 24.58, + "learning_rate": 5.651703995251929e-05, + "loss": 0.0749, + "step": 87420 + }, + { + "epoch": 24.59, + "learning_rate": 5.649829756661357e-05, + "loss": 0.0614, + "step": 87450 + }, + { + "epoch": 24.59, + "learning_rate": 5.647955518070784e-05, + "loss": 0.0708, + "step": 87480 + }, + { + "epoch": 24.6, + "learning_rate": 5.646081279480211e-05, + "loss": 0.0624, + "step": 87510 + }, + { + "epoch": 24.61, + "learning_rate": 5.6442070408896384e-05, + "loss": 0.0672, + "step": 87540 + }, + { + "epoch": 24.62, + "learning_rate": 5.6423328022990665e-05, + "loss": 0.0718, + "step": 87570 + }, + { + "epoch": 24.63, + "learning_rate": 5.640458563708494e-05, + "loss": 0.059, + "step": 87600 + }, + { + "epoch": 24.64, + "learning_rate": 5.6385843251179214e-05, + "loss": 0.0733, + "step": 87630 + }, + { + "epoch": 24.64, + "learning_rate": 5.636710086527348e-05, + "loss": 0.0607, + "step": 87660 + }, + { + "epoch": 24.65, + "learning_rate": 5.634898322556462e-05, + "loss": 0.0657, + "step": 87690 + }, + { + "epoch": 24.66, + "learning_rate": 5.633024083965889e-05, + "loss": 0.0707, + "step": 87720 + }, + { + "epoch": 24.67, + "learning_rate": 5.6311498453753164e-05, + "loss": 0.0602, + "step": 87750 + }, + { + "epoch": 24.68, + "learning_rate": 5.629275606784744e-05, + "loss": 0.0665, + "step": 87780 + }, + { + "epoch": 24.69, + "learning_rate": 5.627401368194172e-05, + "loss": 0.065, + "step": 87810 + }, + { + "epoch": 24.69, + "learning_rate": 5.6255271296035986e-05, + "loss": 0.0652, + "step": 87840 + }, + { + "epoch": 24.7, + "learning_rate": 5.623652891013026e-05, + "loss": 0.0701, + "step": 87870 + }, + { + "epoch": 24.71, + "learning_rate": 5.6217786524224535e-05, + "loss": 0.0571, + "step": 87900 + }, + { + "epoch": 24.72, + "learning_rate": 5.6199044138318816e-05, + "loss": 0.0692, + "step": 87930 + }, + { + "epoch": 24.73, + "learning_rate": 5.618030175241309e-05, + "loss": 0.0617, + "step": 87960 + }, + { + "epoch": 24.74, + "learning_rate": 5.616155936650736e-05, + "loss": 0.0684, + "step": 87990 + }, + { + "epoch": 24.75, + "learning_rate": 5.614281698060163e-05, + "loss": 0.0758, + "step": 88020 + }, + { + "epoch": 24.75, + "learning_rate": 5.6124074594695906e-05, + "loss": 0.0627, + "step": 88050 + }, + { + "epoch": 24.76, + "learning_rate": 5.6105332208790186e-05, + "loss": 0.07, + "step": 88080 + }, + { + "epoch": 24.77, + "learning_rate": 5.608658982288446e-05, + "loss": 0.0656, + "step": 88110 + }, + { + "epoch": 24.78, + "learning_rate": 5.606784743697873e-05, + "loss": 0.0706, + "step": 88140 + }, + { + "epoch": 24.79, + "learning_rate": 5.6049105051073e-05, + "loss": 0.0702, + "step": 88170 + }, + { + "epoch": 24.8, + "learning_rate": 5.6030362665167276e-05, + "loss": 0.0591, + "step": 88200 + }, + { + "epoch": 24.8, + "learning_rate": 5.601162027926156e-05, + "loss": 0.0686, + "step": 88230 + }, + { + "epoch": 24.81, + "learning_rate": 5.5992877893355825e-05, + "loss": 0.0655, + "step": 88260 + }, + { + "epoch": 24.82, + "learning_rate": 5.59741355074501e-05, + "loss": 0.0697, + "step": 88290 + }, + { + "epoch": 24.83, + "learning_rate": 5.595539312154437e-05, + "loss": 0.0739, + "step": 88320 + }, + { + "epoch": 24.84, + "learning_rate": 5.5936650735638654e-05, + "loss": 0.0583, + "step": 88350 + }, + { + "epoch": 24.85, + "learning_rate": 5.591790834973293e-05, + "loss": 0.0707, + "step": 88380 + }, + { + "epoch": 24.86, + "learning_rate": 5.5899165963827196e-05, + "loss": 0.0634, + "step": 88410 + }, + { + "epoch": 24.86, + "learning_rate": 5.588042357792147e-05, + "loss": 0.0661, + "step": 88440 + }, + { + "epoch": 24.87, + "learning_rate": 5.5861681192015744e-05, + "loss": 0.0743, + "step": 88470 + }, + { + "epoch": 24.88, + "learning_rate": 5.5842938806110025e-05, + "loss": 0.0581, + "step": 88500 + }, + { + "epoch": 24.89, + "learning_rate": 5.58241964202043e-05, + "loss": 0.0681, + "step": 88530 + }, + { + "epoch": 24.9, + "learning_rate": 5.580545403429857e-05, + "loss": 0.0646, + "step": 88560 + }, + { + "epoch": 24.91, + "learning_rate": 5.578671164839284e-05, + "loss": 0.0675, + "step": 88590 + }, + { + "epoch": 24.91, + "learning_rate": 5.576796926248712e-05, + "loss": 0.0753, + "step": 88620 + }, + { + "epoch": 24.92, + "learning_rate": 5.5749226876581396e-05, + "loss": 0.0611, + "step": 88650 + }, + { + "epoch": 24.93, + "learning_rate": 5.5730484490675664e-05, + "loss": 0.0717, + "step": 88680 + }, + { + "epoch": 24.94, + "learning_rate": 5.571174210476994e-05, + "loss": 0.0637, + "step": 88710 + }, + { + "epoch": 24.95, + "learning_rate": 5.569299971886421e-05, + "loss": 0.0665, + "step": 88740 + }, + { + "epoch": 24.96, + "learning_rate": 5.567425733295849e-05, + "loss": 0.0753, + "step": 88770 + }, + { + "epoch": 24.96, + "learning_rate": 5.565551494705277e-05, + "loss": 0.0588, + "step": 88800 + }, + { + "epoch": 24.97, + "learning_rate": 5.5636772561147034e-05, + "loss": 0.0679, + "step": 88830 + }, + { + "epoch": 24.98, + "learning_rate": 5.561803017524131e-05, + "loss": 0.0613, + "step": 88860 + }, + { + "epoch": 24.99, + "learning_rate": 5.559928778933558e-05, + "loss": 0.0701, + "step": 88890 + }, + { + "epoch": 25.0, + "learning_rate": 5.5580545403429864e-05, + "loss": 0.0722, + "step": 88920 + }, + { + "epoch": 25.0, + "eval_loss": 0.1143936961889267, + "eval_runtime": 628.7306, + "eval_samples_per_second": 25.501, + "eval_steps_per_second": 0.798, + "eval_wer": 0.10660816398946406, + "step": 88925 + }, + { + "epoch": 25.01, + "learning_rate": 5.556180301752414e-05, + "loss": 0.0631, + "step": 88950 + }, + { + "epoch": 25.02, + "learning_rate": 5.5543060631618405e-05, + "loss": 0.07, + "step": 88980 + }, + { + "epoch": 25.02, + "learning_rate": 5.552431824571268e-05, + "loss": 0.0542, + "step": 89010 + }, + { + "epoch": 25.03, + "learning_rate": 5.550557585980696e-05, + "loss": 0.0706, + "step": 89040 + }, + { + "epoch": 25.04, + "learning_rate": 5.5486833473901235e-05, + "loss": 0.0644, + "step": 89070 + }, + { + "epoch": 25.05, + "learning_rate": 5.54680910879955e-05, + "loss": 0.0628, + "step": 89100 + }, + { + "epoch": 25.06, + "learning_rate": 5.5449348702089776e-05, + "loss": 0.0723, + "step": 89130 + }, + { + "epoch": 25.07, + "learning_rate": 5.543060631618405e-05, + "loss": 0.0625, + "step": 89160 + }, + { + "epoch": 25.07, + "learning_rate": 5.541186393027833e-05, + "loss": 0.0683, + "step": 89190 + }, + { + "epoch": 25.08, + "learning_rate": 5.5393121544372606e-05, + "loss": 0.0675, + "step": 89220 + }, + { + "epoch": 25.09, + "learning_rate": 5.537437915846687e-05, + "loss": 0.0657, + "step": 89250 + }, + { + "epoch": 25.1, + "learning_rate": 5.535563677256115e-05, + "loss": 0.0654, + "step": 89280 + }, + { + "epoch": 25.11, + "learning_rate": 5.533689438665542e-05, + "loss": 0.0587, + "step": 89310 + }, + { + "epoch": 25.12, + "learning_rate": 5.53181520007497e-05, + "loss": 0.0687, + "step": 89340 + }, + { + "epoch": 25.13, + "learning_rate": 5.529940961484398e-05, + "loss": 0.063, + "step": 89370 + }, + { + "epoch": 25.13, + "learning_rate": 5.5280667228938244e-05, + "loss": 0.0588, + "step": 89400 + }, + { + "epoch": 25.14, + "learning_rate": 5.526192484303252e-05, + "loss": 0.0698, + "step": 89430 + }, + { + "epoch": 25.15, + "learning_rate": 5.52431824571268e-05, + "loss": 0.0578, + "step": 89460 + }, + { + "epoch": 25.16, + "learning_rate": 5.522506481741793e-05, + "loss": 0.0683, + "step": 89490 + }, + { + "epoch": 25.17, + "learning_rate": 5.52063224315122e-05, + "loss": 0.0622, + "step": 89520 + }, + { + "epoch": 25.18, + "learning_rate": 5.518758004560648e-05, + "loss": 0.0672, + "step": 89550 + }, + { + "epoch": 25.18, + "learning_rate": 5.516883765970074e-05, + "loss": 0.0685, + "step": 89580 + }, + { + "epoch": 25.19, + "learning_rate": 5.5150095273795023e-05, + "loss": 0.057, + "step": 89610 + }, + { + "epoch": 25.2, + "learning_rate": 5.51313528878893e-05, + "loss": 0.071, + "step": 89640 + }, + { + "epoch": 25.21, + "learning_rate": 5.511261050198357e-05, + "loss": 0.0644, + "step": 89670 + }, + { + "epoch": 25.22, + "learning_rate": 5.509386811607785e-05, + "loss": 0.0595, + "step": 89700 + }, + { + "epoch": 25.23, + "learning_rate": 5.507512573017212e-05, + "loss": 0.0692, + "step": 89730 + }, + { + "epoch": 25.23, + "learning_rate": 5.5056383344266394e-05, + "loss": 0.0561, + "step": 89760 + }, + { + "epoch": 25.24, + "learning_rate": 5.503764095836067e-05, + "loss": 0.0681, + "step": 89790 + }, + { + "epoch": 25.25, + "learning_rate": 5.501889857245495e-05, + "loss": 0.06, + "step": 89820 + }, + { + "epoch": 25.26, + "learning_rate": 5.500015618654921e-05, + "loss": 0.0626, + "step": 89850 + }, + { + "epoch": 25.27, + "learning_rate": 5.498141380064349e-05, + "loss": 0.0717, + "step": 89880 + }, + { + "epoch": 25.28, + "learning_rate": 5.4962671414737765e-05, + "loss": 0.0613, + "step": 89910 + }, + { + "epoch": 25.29, + "learning_rate": 5.494392902883204e-05, + "loss": 0.0667, + "step": 89940 + }, + { + "epoch": 25.29, + "learning_rate": 5.492518664292632e-05, + "loss": 0.0636, + "step": 89970 + }, + { + "epoch": 25.3, + "learning_rate": 5.490644425702058e-05, + "loss": 0.0655, + "step": 90000 + }, + { + "epoch": 25.31, + "learning_rate": 5.488770187111486e-05, + "loss": 0.0711, + "step": 90030 + }, + { + "epoch": 25.32, + "learning_rate": 5.4868959485209136e-05, + "loss": 0.056, + "step": 90060 + }, + { + "epoch": 25.33, + "learning_rate": 5.485021709930341e-05, + "loss": 0.0722, + "step": 90090 + }, + { + "epoch": 25.34, + "learning_rate": 5.483147471339769e-05, + "loss": 0.0665, + "step": 90120 + }, + { + "epoch": 25.34, + "learning_rate": 5.481273232749196e-05, + "loss": 0.0634, + "step": 90150 + }, + { + "epoch": 25.35, + "learning_rate": 5.479398994158623e-05, + "loss": 0.0706, + "step": 90180 + }, + { + "epoch": 25.36, + "learning_rate": 5.477524755568051e-05, + "loss": 0.0586, + "step": 90210 + }, + { + "epoch": 25.37, + "learning_rate": 5.475650516977479e-05, + "loss": 0.0655, + "step": 90240 + }, + { + "epoch": 25.38, + "learning_rate": 5.473776278386905e-05, + "loss": 0.0638, + "step": 90270 + }, + { + "epoch": 25.39, + "learning_rate": 5.471902039796333e-05, + "loss": 0.0637, + "step": 90300 + }, + { + "epoch": 25.39, + "learning_rate": 5.4700278012057604e-05, + "loss": 0.0698, + "step": 90330 + }, + { + "epoch": 25.4, + "learning_rate": 5.468153562615188e-05, + "loss": 0.0572, + "step": 90360 + }, + { + "epoch": 25.41, + "learning_rate": 5.466279324024616e-05, + "loss": 0.0693, + "step": 90390 + }, + { + "epoch": 25.42, + "learning_rate": 5.464405085434042e-05, + "loss": 0.062, + "step": 90420 + }, + { + "epoch": 25.43, + "learning_rate": 5.46253084684347e-05, + "loss": 0.0624, + "step": 90450 + }, + { + "epoch": 25.44, + "learning_rate": 5.4606566082528975e-05, + "loss": 0.0695, + "step": 90480 + }, + { + "epoch": 25.45, + "learning_rate": 5.4587823696623256e-05, + "loss": 0.0575, + "step": 90510 + }, + { + "epoch": 25.45, + "learning_rate": 5.456908131071753e-05, + "loss": 0.0671, + "step": 90540 + }, + { + "epoch": 25.46, + "learning_rate": 5.45503389248118e-05, + "loss": 0.0662, + "step": 90570 + }, + { + "epoch": 25.47, + "learning_rate": 5.453159653890607e-05, + "loss": 0.0626, + "step": 90600 + }, + { + "epoch": 25.48, + "learning_rate": 5.4512854153000346e-05, + "loss": 0.0715, + "step": 90630 + }, + { + "epoch": 25.49, + "learning_rate": 5.449411176709463e-05, + "loss": 0.0581, + "step": 90660 + }, + { + "epoch": 25.5, + "learning_rate": 5.447536938118889e-05, + "loss": 0.0669, + "step": 90690 + }, + { + "epoch": 25.5, + "learning_rate": 5.445662699528317e-05, + "loss": 0.0708, + "step": 90720 + }, + { + "epoch": 25.51, + "learning_rate": 5.443788460937744e-05, + "loss": 0.0649, + "step": 90750 + }, + { + "epoch": 25.52, + "learning_rate": 5.441914222347172e-05, + "loss": 0.0704, + "step": 90780 + }, + { + "epoch": 25.53, + "learning_rate": 5.4400399837566e-05, + "loss": 0.0619, + "step": 90810 + }, + { + "epoch": 25.54, + "learning_rate": 5.438165745166026e-05, + "loss": 0.0708, + "step": 90840 + }, + { + "epoch": 25.55, + "learning_rate": 5.436291506575454e-05, + "loss": 0.0616, + "step": 90870 + }, + { + "epoch": 25.56, + "learning_rate": 5.4344172679848814e-05, + "loss": 0.0651, + "step": 90900 + }, + { + "epoch": 25.56, + "learning_rate": 5.4325430293943095e-05, + "loss": 0.069, + "step": 90930 + }, + { + "epoch": 25.57, + "learning_rate": 5.4306687908037355e-05, + "loss": 0.0606, + "step": 90960 + }, + { + "epoch": 25.58, + "learning_rate": 5.4287945522131636e-05, + "loss": 0.0689, + "step": 90990 + }, + { + "epoch": 25.59, + "learning_rate": 5.426920313622591e-05, + "loss": 0.0645, + "step": 91020 + }, + { + "epoch": 25.6, + "learning_rate": 5.4250460750320185e-05, + "loss": 0.0606, + "step": 91050 + }, + { + "epoch": 25.61, + "learning_rate": 5.4231718364414466e-05, + "loss": 0.0699, + "step": 91080 + }, + { + "epoch": 25.61, + "learning_rate": 5.4212975978508726e-05, + "loss": 0.0595, + "step": 91110 + }, + { + "epoch": 25.62, + "learning_rate": 5.419423359260301e-05, + "loss": 0.0687, + "step": 91140 + }, + { + "epoch": 25.63, + "learning_rate": 5.417549120669728e-05, + "loss": 0.0632, + "step": 91170 + }, + { + "epoch": 25.64, + "learning_rate": 5.4156748820791556e-05, + "loss": 0.0632, + "step": 91200 + }, + { + "epoch": 25.65, + "learning_rate": 5.4138006434885837e-05, + "loss": 0.072, + "step": 91230 + }, + { + "epoch": 25.66, + "learning_rate": 5.4119264048980104e-05, + "loss": 0.0603, + "step": 91260 + }, + { + "epoch": 25.66, + "learning_rate": 5.410052166307438e-05, + "loss": 0.0695, + "step": 91290 + }, + { + "epoch": 25.67, + "learning_rate": 5.408177927716865e-05, + "loss": 0.0663, + "step": 91320 + }, + { + "epoch": 25.68, + "learning_rate": 5.406303689126293e-05, + "loss": 0.0639, + "step": 91350 + }, + { + "epoch": 25.69, + "learning_rate": 5.4044294505357194e-05, + "loss": 0.0713, + "step": 91380 + }, + { + "epoch": 25.7, + "learning_rate": 5.4025552119451475e-05, + "loss": 0.063, + "step": 91410 + }, + { + "epoch": 25.71, + "learning_rate": 5.400680973354575e-05, + "loss": 0.0682, + "step": 91440 + }, + { + "epoch": 25.72, + "learning_rate": 5.398806734764002e-05, + "loss": 0.0637, + "step": 91470 + }, + { + "epoch": 25.72, + "learning_rate": 5.3969324961734304e-05, + "loss": 0.0654, + "step": 91500 + }, + { + "epoch": 25.73, + "learning_rate": 5.3950582575828565e-05, + "loss": 0.0693, + "step": 91530 + }, + { + "epoch": 25.74, + "learning_rate": 5.3931840189922846e-05, + "loss": 0.0592, + "step": 91560 + }, + { + "epoch": 25.75, + "learning_rate": 5.391309780401712e-05, + "loss": 0.0687, + "step": 91590 + }, + { + "epoch": 25.76, + "learning_rate": 5.3894355418111394e-05, + "loss": 0.0625, + "step": 91620 + }, + { + "epoch": 25.77, + "learning_rate": 5.3875613032205675e-05, + "loss": 0.0636, + "step": 91650 + }, + { + "epoch": 25.77, + "learning_rate": 5.385687064629994e-05, + "loss": 0.0687, + "step": 91680 + }, + { + "epoch": 25.78, + "learning_rate": 5.383812826039422e-05, + "loss": 0.0618, + "step": 91710 + }, + { + "epoch": 25.79, + "learning_rate": 5.381938587448849e-05, + "loss": 0.0699, + "step": 91740 + }, + { + "epoch": 25.8, + "learning_rate": 5.380064348858277e-05, + "loss": 0.0626, + "step": 91770 + }, + { + "epoch": 25.81, + "learning_rate": 5.378190110267703e-05, + "loss": 0.0649, + "step": 91800 + }, + { + "epoch": 25.82, + "learning_rate": 5.3763158716771314e-05, + "loss": 0.0729, + "step": 91830 + }, + { + "epoch": 25.83, + "learning_rate": 5.374441633086559e-05, + "loss": 0.0576, + "step": 91860 + }, + { + "epoch": 25.83, + "learning_rate": 5.372567394495986e-05, + "loss": 0.0639, + "step": 91890 + }, + { + "epoch": 25.84, + "learning_rate": 5.370693155905414e-05, + "loss": 0.0648, + "step": 91920 + }, + { + "epoch": 25.85, + "learning_rate": 5.3688189173148404e-05, + "loss": 0.0661, + "step": 91950 + }, + { + "epoch": 25.86, + "learning_rate": 5.3669446787242684e-05, + "loss": 0.07, + "step": 91980 + }, + { + "epoch": 25.87, + "learning_rate": 5.365070440133696e-05, + "loss": 0.0577, + "step": 92010 + }, + { + "epoch": 25.88, + "learning_rate": 5.363196201543124e-05, + "loss": 0.0656, + "step": 92040 + }, + { + "epoch": 25.88, + "learning_rate": 5.3613219629525514e-05, + "loss": 0.0624, + "step": 92070 + }, + { + "epoch": 25.89, + "learning_rate": 5.359447724361978e-05, + "loss": 0.0605, + "step": 92100 + }, + { + "epoch": 25.9, + "learning_rate": 5.3575734857714055e-05, + "loss": 0.0716, + "step": 92130 + }, + { + "epoch": 25.91, + "learning_rate": 5.355699247180833e-05, + "loss": 0.0552, + "step": 92160 + }, + { + "epoch": 25.92, + "learning_rate": 5.353825008590261e-05, + "loss": 0.0679, + "step": 92190 + }, + { + "epoch": 25.93, + "learning_rate": 5.351950769999687e-05, + "loss": 0.065, + "step": 92220 + }, + { + "epoch": 25.93, + "learning_rate": 5.350076531409115e-05, + "loss": 0.0645, + "step": 92250 + }, + { + "epoch": 25.94, + "learning_rate": 5.3482022928185426e-05, + "loss": 0.0723, + "step": 92280 + }, + { + "epoch": 25.95, + "learning_rate": 5.34632805422797e-05, + "loss": 0.0594, + "step": 92310 + }, + { + "epoch": 25.96, + "learning_rate": 5.344453815637398e-05, + "loss": 0.069, + "step": 92340 + }, + { + "epoch": 25.97, + "learning_rate": 5.342579577046824e-05, + "loss": 0.0617, + "step": 92370 + }, + { + "epoch": 25.98, + "learning_rate": 5.340705338456252e-05, + "loss": 0.0655, + "step": 92400 + }, + { + "epoch": 25.99, + "learning_rate": 5.33883109986568e-05, + "loss": 0.0662, + "step": 92430 + }, + { + "epoch": 25.99, + "learning_rate": 5.336956861275108e-05, + "loss": 0.0597, + "step": 92460 + }, + { + "epoch": 26.0, + "eval_loss": 0.10869389772415161, + "eval_runtime": 630.2477, + "eval_samples_per_second": 25.439, + "eval_steps_per_second": 0.797, + "eval_wer": 0.10220681560738608, + "step": 92482 + }, + { + "epoch": 26.0, + "learning_rate": 5.335082622684535e-05, + "loss": 0.0729, + "step": 92490 + }, + { + "epoch": 26.01, + "learning_rate": 5.333208384093962e-05, + "loss": 0.0565, + "step": 92520 + }, + { + "epoch": 26.02, + "learning_rate": 5.3313341455033894e-05, + "loss": 0.0647, + "step": 92550 + }, + { + "epoch": 26.03, + "learning_rate": 5.329459906912817e-05, + "loss": 0.0654, + "step": 92580 + }, + { + "epoch": 26.04, + "learning_rate": 5.327585668322245e-05, + "loss": 0.0605, + "step": 92610 + }, + { + "epoch": 26.04, + "learning_rate": 5.325711429731671e-05, + "loss": 0.068, + "step": 92640 + }, + { + "epoch": 26.05, + "learning_rate": 5.323837191141099e-05, + "loss": 0.062, + "step": 92670 + }, + { + "epoch": 26.06, + "learning_rate": 5.3219629525505265e-05, + "loss": 0.0692, + "step": 92700 + }, + { + "epoch": 26.07, + "learning_rate": 5.320088713959954e-05, + "loss": 0.0614, + "step": 92730 + }, + { + "epoch": 26.08, + "learning_rate": 5.318214475369382e-05, + "loss": 0.0604, + "step": 92760 + }, + { + "epoch": 26.09, + "learning_rate": 5.316340236778809e-05, + "loss": 0.0641, + "step": 92790 + }, + { + "epoch": 26.1, + "learning_rate": 5.314465998188236e-05, + "loss": 0.0565, + "step": 92820 + }, + { + "epoch": 26.1, + "learning_rate": 5.3125917595976636e-05, + "loss": 0.066, + "step": 92850 + }, + { + "epoch": 26.11, + "learning_rate": 5.310717521007092e-05, + "loss": 0.0658, + "step": 92880 + }, + { + "epoch": 26.12, + "learning_rate": 5.308843282416519e-05, + "loss": 0.0601, + "step": 92910 + }, + { + "epoch": 26.13, + "learning_rate": 5.306969043825946e-05, + "loss": 0.0706, + "step": 92940 + }, + { + "epoch": 26.14, + "learning_rate": 5.305094805235373e-05, + "loss": 0.0562, + "step": 92970 + }, + { + "epoch": 26.15, + "learning_rate": 5.303220566644801e-05, + "loss": 0.0639, + "step": 93000 + }, + { + "epoch": 26.15, + "learning_rate": 5.301346328054229e-05, + "loss": 0.0657, + "step": 93030 + }, + { + "epoch": 26.16, + "learning_rate": 5.299472089463655e-05, + "loss": 0.0587, + "step": 93060 + }, + { + "epoch": 26.17, + "learning_rate": 5.297597850873083e-05, + "loss": 0.0669, + "step": 93090 + }, + { + "epoch": 26.18, + "learning_rate": 5.2957236122825104e-05, + "loss": 0.0595, + "step": 93120 + }, + { + "epoch": 26.19, + "learning_rate": 5.293849373691938e-05, + "loss": 0.0666, + "step": 93150 + }, + { + "epoch": 26.2, + "learning_rate": 5.291975135101366e-05, + "loss": 0.0663, + "step": 93180 + }, + { + "epoch": 26.2, + "learning_rate": 5.2901008965107926e-05, + "loss": 0.0608, + "step": 93210 + }, + { + "epoch": 26.21, + "learning_rate": 5.28822665792022e-05, + "loss": 0.0675, + "step": 93240 + }, + { + "epoch": 26.22, + "learning_rate": 5.2863524193296475e-05, + "loss": 0.0614, + "step": 93270 + }, + { + "epoch": 26.23, + "learning_rate": 5.2844781807390756e-05, + "loss": 0.0622, + "step": 93300 + }, + { + "epoch": 26.24, + "learning_rate": 5.282603942148503e-05, + "loss": 0.0633, + "step": 93330 + }, + { + "epoch": 26.25, + "learning_rate": 5.28072970355793e-05, + "loss": 0.0621, + "step": 93360 + }, + { + "epoch": 26.26, + "learning_rate": 5.278855464967357e-05, + "loss": 0.0665, + "step": 93390 + }, + { + "epoch": 26.26, + "learning_rate": 5.2769812263767846e-05, + "loss": 0.0584, + "step": 93420 + }, + { + "epoch": 26.27, + "learning_rate": 5.275106987786213e-05, + "loss": 0.0636, + "step": 93450 + }, + { + "epoch": 26.28, + "learning_rate": 5.273232749195639e-05, + "loss": 0.0667, + "step": 93480 + }, + { + "epoch": 26.29, + "learning_rate": 5.271358510605067e-05, + "loss": 0.0599, + "step": 93510 + }, + { + "epoch": 26.3, + "learning_rate": 5.269484272014494e-05, + "loss": 0.0681, + "step": 93540 + }, + { + "epoch": 26.31, + "learning_rate": 5.267610033423922e-05, + "loss": 0.0574, + "step": 93570 + }, + { + "epoch": 26.31, + "learning_rate": 5.26573579483335e-05, + "loss": 0.0631, + "step": 93600 + }, + { + "epoch": 26.32, + "learning_rate": 5.2638615562427765e-05, + "loss": 0.0651, + "step": 93630 + }, + { + "epoch": 26.33, + "learning_rate": 5.261987317652204e-05, + "loss": 0.0595, + "step": 93660 + }, + { + "epoch": 26.34, + "learning_rate": 5.260113079061631e-05, + "loss": 0.0676, + "step": 93690 + }, + { + "epoch": 26.35, + "learning_rate": 5.2582388404710594e-05, + "loss": 0.0608, + "step": 93720 + }, + { + "epoch": 26.36, + "learning_rate": 5.256364601880487e-05, + "loss": 0.0653, + "step": 93750 + }, + { + "epoch": 26.36, + "learning_rate": 5.2544903632899136e-05, + "loss": 0.0653, + "step": 93780 + }, + { + "epoch": 26.37, + "learning_rate": 5.252616124699341e-05, + "loss": 0.0629, + "step": 93810 + }, + { + "epoch": 26.38, + "learning_rate": 5.2507418861087684e-05, + "loss": 0.0695, + "step": 93840 + }, + { + "epoch": 26.39, + "learning_rate": 5.2488676475181965e-05, + "loss": 0.0593, + "step": 93870 + }, + { + "epoch": 26.4, + "learning_rate": 5.2469934089276226e-05, + "loss": 0.065, + "step": 93900 + }, + { + "epoch": 26.41, + "learning_rate": 5.245119170337051e-05, + "loss": 0.0616, + "step": 93930 + }, + { + "epoch": 26.42, + "learning_rate": 5.243244931746478e-05, + "loss": 0.0582, + "step": 93960 + }, + { + "epoch": 26.42, + "learning_rate": 5.241370693155906e-05, + "loss": 0.0676, + "step": 93990 + }, + { + "epoch": 26.43, + "learning_rate": 5.2394964545653336e-05, + "loss": 0.0589, + "step": 94020 + }, + { + "epoch": 26.44, + "learning_rate": 5.2376222159747604e-05, + "loss": 0.0667, + "step": 94050 + }, + { + "epoch": 26.45, + "learning_rate": 5.235747977384188e-05, + "loss": 0.0653, + "step": 94080 + }, + { + "epoch": 26.46, + "learning_rate": 5.233873738793615e-05, + "loss": 0.0577, + "step": 94110 + }, + { + "epoch": 26.47, + "learning_rate": 5.231999500203043e-05, + "loss": 0.0691, + "step": 94140 + }, + { + "epoch": 26.47, + "learning_rate": 5.230125261612471e-05, + "loss": 0.0584, + "step": 94170 + }, + { + "epoch": 26.48, + "learning_rate": 5.2282510230218975e-05, + "loss": 0.065, + "step": 94200 + }, + { + "epoch": 26.49, + "learning_rate": 5.226376784431325e-05, + "loss": 0.0644, + "step": 94230 + }, + { + "epoch": 26.5, + "learning_rate": 5.224502545840752e-05, + "loss": 0.0591, + "step": 94260 + }, + { + "epoch": 26.51, + "learning_rate": 5.2226283072501804e-05, + "loss": 0.0649, + "step": 94290 + }, + { + "epoch": 26.52, + "learning_rate": 5.220754068659607e-05, + "loss": 0.0591, + "step": 94320 + }, + { + "epoch": 26.53, + "learning_rate": 5.2188798300690346e-05, + "loss": 0.0653, + "step": 94350 + }, + { + "epoch": 26.53, + "learning_rate": 5.217005591478462e-05, + "loss": 0.0668, + "step": 94380 + }, + { + "epoch": 26.54, + "learning_rate": 5.21513135288789e-05, + "loss": 0.0586, + "step": 94410 + }, + { + "epoch": 26.55, + "learning_rate": 5.2132571142973175e-05, + "loss": 0.0694, + "step": 94440 + }, + { + "epoch": 26.56, + "learning_rate": 5.211382875706744e-05, + "loss": 0.0607, + "step": 94470 + }, + { + "epoch": 26.57, + "learning_rate": 5.2095086371161717e-05, + "loss": 0.0662, + "step": 94500 + }, + { + "epoch": 26.58, + "learning_rate": 5.207634398525599e-05, + "loss": 0.0668, + "step": 94530 + }, + { + "epoch": 26.58, + "learning_rate": 5.205760159935027e-05, + "loss": 0.0608, + "step": 94560 + }, + { + "epoch": 26.59, + "learning_rate": 5.203885921344453e-05, + "loss": 0.0673, + "step": 94590 + }, + { + "epoch": 26.6, + "learning_rate": 5.202011682753881e-05, + "loss": 0.0627, + "step": 94620 + }, + { + "epoch": 26.61, + "learning_rate": 5.200137444163309e-05, + "loss": 0.0657, + "step": 94650 + }, + { + "epoch": 26.62, + "learning_rate": 5.198263205572736e-05, + "loss": 0.0628, + "step": 94680 + }, + { + "epoch": 26.63, + "learning_rate": 5.196388966982164e-05, + "loss": 0.0574, + "step": 94710 + }, + { + "epoch": 26.63, + "learning_rate": 5.194514728391591e-05, + "loss": 0.0683, + "step": 94740 + }, + { + "epoch": 26.64, + "learning_rate": 5.1926404898010184e-05, + "loss": 0.0574, + "step": 94770 + }, + { + "epoch": 26.65, + "learning_rate": 5.190766251210446e-05, + "loss": 0.0633, + "step": 94800 + }, + { + "epoch": 26.66, + "learning_rate": 5.188892012619874e-05, + "loss": 0.0629, + "step": 94830 + }, + { + "epoch": 26.67, + "learning_rate": 5.1870177740293014e-05, + "loss": 0.0647, + "step": 94860 + }, + { + "epoch": 26.68, + "learning_rate": 5.185143535438728e-05, + "loss": 0.0656, + "step": 94890 + }, + { + "epoch": 26.69, + "learning_rate": 5.1832692968481555e-05, + "loss": 0.0545, + "step": 94920 + }, + { + "epoch": 26.69, + "learning_rate": 5.181395058257583e-05, + "loss": 0.0653, + "step": 94950 + }, + { + "epoch": 26.7, + "learning_rate": 5.179520819667011e-05, + "loss": 0.0662, + "step": 94980 + }, + { + "epoch": 26.71, + "learning_rate": 5.177646581076437e-05, + "loss": 0.0585, + "step": 95010 + }, + { + "epoch": 26.72, + "learning_rate": 5.175772342485865e-05, + "loss": 0.0705, + "step": 95040 + }, + { + "epoch": 26.73, + "learning_rate": 5.1738981038952926e-05, + "loss": 0.0596, + "step": 95070 + }, + { + "epoch": 26.74, + "learning_rate": 5.172023865304721e-05, + "loss": 0.0637, + "step": 95100 + }, + { + "epoch": 26.74, + "learning_rate": 5.170149626714148e-05, + "loss": 0.0634, + "step": 95130 + }, + { + "epoch": 26.75, + "learning_rate": 5.168275388123575e-05, + "loss": 0.0633, + "step": 95160 + }, + { + "epoch": 26.76, + "learning_rate": 5.166401149533002e-05, + "loss": 0.0679, + "step": 95190 + }, + { + "epoch": 26.77, + "learning_rate": 5.16452691094243e-05, + "loss": 0.058, + "step": 95220 + }, + { + "epoch": 26.78, + "learning_rate": 5.162652672351858e-05, + "loss": 0.0693, + "step": 95250 + }, + { + "epoch": 26.79, + "learning_rate": 5.160778433761285e-05, + "loss": 0.0654, + "step": 95280 + }, + { + "epoch": 26.79, + "learning_rate": 5.158904195170712e-05, + "loss": 0.0623, + "step": 95310 + }, + { + "epoch": 26.8, + "learning_rate": 5.1570299565801394e-05, + "loss": 0.0671, + "step": 95340 + }, + { + "epoch": 26.81, + "learning_rate": 5.155155717989567e-05, + "loss": 0.0601, + "step": 95370 + }, + { + "epoch": 26.82, + "learning_rate": 5.153281479398995e-05, + "loss": 0.0634, + "step": 95400 + }, + { + "epoch": 26.83, + "learning_rate": 5.151407240808421e-05, + "loss": 0.0642, + "step": 95430 + }, + { + "epoch": 26.84, + "learning_rate": 5.149533002217849e-05, + "loss": 0.0602, + "step": 95460 + }, + { + "epoch": 26.85, + "learning_rate": 5.1476587636272765e-05, + "loss": 0.0716, + "step": 95490 + }, + { + "epoch": 26.85, + "learning_rate": 5.1457845250367046e-05, + "loss": 0.0635, + "step": 95520 + }, + { + "epoch": 26.86, + "learning_rate": 5.143972761065817e-05, + "loss": 0.0642, + "step": 95550 + }, + { + "epoch": 26.87, + "learning_rate": 5.142098522475245e-05, + "loss": 0.0648, + "step": 95580 + }, + { + "epoch": 26.88, + "learning_rate": 5.140224283884673e-05, + "loss": 0.0621, + "step": 95610 + }, + { + "epoch": 26.89, + "learning_rate": 5.138350045294099e-05, + "loss": 0.0653, + "step": 95640 + }, + { + "epoch": 26.9, + "learning_rate": 5.136475806703527e-05, + "loss": 0.0552, + "step": 95670 + }, + { + "epoch": 26.9, + "learning_rate": 5.1346015681129544e-05, + "loss": 0.0671, + "step": 95700 + }, + { + "epoch": 26.91, + "learning_rate": 5.132727329522382e-05, + "loss": 0.0613, + "step": 95730 + }, + { + "epoch": 26.92, + "learning_rate": 5.1308530909318086e-05, + "loss": 0.0615, + "step": 95760 + }, + { + "epoch": 26.93, + "learning_rate": 5.128978852341236e-05, + "loss": 0.0678, + "step": 95790 + }, + { + "epoch": 26.94, + "learning_rate": 5.127104613750664e-05, + "loss": 0.0587, + "step": 95820 + }, + { + "epoch": 26.95, + "learning_rate": 5.1252303751600915e-05, + "loss": 0.0637, + "step": 95850 + }, + { + "epoch": 26.96, + "learning_rate": 5.1233561365695196e-05, + "loss": 0.0616, + "step": 95880 + }, + { + "epoch": 26.96, + "learning_rate": 5.121481897978946e-05, + "loss": 0.0634, + "step": 95910 + }, + { + "epoch": 26.97, + "learning_rate": 5.119607659388374e-05, + "loss": 0.0672, + "step": 95940 + }, + { + "epoch": 26.98, + "learning_rate": 5.117733420797801e-05, + "loss": 0.0604, + "step": 95970 + }, + { + "epoch": 26.99, + "learning_rate": 5.1158591822072286e-05, + "loss": 0.0658, + "step": 96000 + }, + { + "epoch": 27.0, + "learning_rate": 5.113984943616657e-05, + "loss": 0.062, + "step": 96030 + }, + { + "epoch": 27.0, + "eval_loss": 0.10732191056013107, + "eval_runtime": 630.3808, + "eval_samples_per_second": 25.434, + "eval_steps_per_second": 0.796, + "eval_wer": 0.10270495271109413, + "step": 96039 + }, + { + "epoch": 27.01, + "learning_rate": 5.112110705026083e-05, + "loss": 0.0595, + "step": 96060 + }, + { + "epoch": 27.01, + "learning_rate": 5.110236466435511e-05, + "loss": 0.0678, + "step": 96090 + }, + { + "epoch": 27.02, + "learning_rate": 5.108362227844938e-05, + "loss": 0.0525, + "step": 96120 + }, + { + "epoch": 27.03, + "learning_rate": 5.106487989254366e-05, + "loss": 0.0699, + "step": 96150 + }, + { + "epoch": 27.04, + "learning_rate": 5.1046137506637924e-05, + "loss": 0.0593, + "step": 96180 + }, + { + "epoch": 27.05, + "learning_rate": 5.1027395120732205e-05, + "loss": 0.0636, + "step": 96210 + }, + { + "epoch": 27.06, + "learning_rate": 5.100865273482648e-05, + "loss": 0.0704, + "step": 96240 + }, + { + "epoch": 27.06, + "learning_rate": 5.0989910348920754e-05, + "loss": 0.0575, + "step": 96270 + }, + { + "epoch": 27.07, + "learning_rate": 5.0971167963015035e-05, + "loss": 0.0617, + "step": 96300 + }, + { + "epoch": 27.08, + "learning_rate": 5.0952425577109295e-05, + "loss": 0.0576, + "step": 96330 + }, + { + "epoch": 27.09, + "learning_rate": 5.0933683191203576e-05, + "loss": 0.0571, + "step": 96360 + }, + { + "epoch": 27.1, + "learning_rate": 5.091494080529785e-05, + "loss": 0.0673, + "step": 96390 + }, + { + "epoch": 27.11, + "learning_rate": 5.0896198419392125e-05, + "loss": 0.0561, + "step": 96420 + }, + { + "epoch": 27.12, + "learning_rate": 5.0877456033486406e-05, + "loss": 0.0685, + "step": 96450 + }, + { + "epoch": 27.12, + "learning_rate": 5.0858713647580666e-05, + "loss": 0.0611, + "step": 96480 + }, + { + "epoch": 27.13, + "learning_rate": 5.083997126167495e-05, + "loss": 0.0629, + "step": 96510 + }, + { + "epoch": 27.14, + "learning_rate": 5.082122887576922e-05, + "loss": 0.0714, + "step": 96540 + }, + { + "epoch": 27.15, + "learning_rate": 5.0802486489863496e-05, + "loss": 0.0578, + "step": 96570 + }, + { + "epoch": 27.16, + "learning_rate": 5.078374410395776e-05, + "loss": 0.0619, + "step": 96600 + }, + { + "epoch": 27.17, + "learning_rate": 5.0765001718052044e-05, + "loss": 0.0582, + "step": 96630 + }, + { + "epoch": 27.17, + "learning_rate": 5.074625933214632e-05, + "loss": 0.0638, + "step": 96660 + }, + { + "epoch": 27.18, + "learning_rate": 5.072751694624059e-05, + "loss": 0.0711, + "step": 96690 + }, + { + "epoch": 27.19, + "learning_rate": 5.0708774560334873e-05, + "loss": 0.0598, + "step": 96720 + }, + { + "epoch": 27.2, + "learning_rate": 5.0690032174429134e-05, + "loss": 0.0692, + "step": 96750 + }, + { + "epoch": 27.21, + "learning_rate": 5.0671289788523415e-05, + "loss": 0.0596, + "step": 96780 + }, + { + "epoch": 27.22, + "learning_rate": 5.065254740261769e-05, + "loss": 0.0656, + "step": 96810 + }, + { + "epoch": 27.23, + "learning_rate": 5.0633805016711963e-05, + "loss": 0.0685, + "step": 96840 + }, + { + "epoch": 27.23, + "learning_rate": 5.0615062630806244e-05, + "loss": 0.0562, + "step": 96870 + }, + { + "epoch": 27.24, + "learning_rate": 5.0596320244900505e-05, + "loss": 0.065, + "step": 96900 + }, + { + "epoch": 27.25, + "learning_rate": 5.0577577858994786e-05, + "loss": 0.057, + "step": 96930 + }, + { + "epoch": 27.26, + "learning_rate": 5.055883547308906e-05, + "loss": 0.0637, + "step": 96960 + }, + { + "epoch": 27.27, + "learning_rate": 5.054009308718334e-05, + "loss": 0.0718, + "step": 96990 + }, + { + "epoch": 27.28, + "learning_rate": 5.05213507012776e-05, + "loss": 0.0564, + "step": 97020 + }, + { + "epoch": 27.28, + "learning_rate": 5.050260831537188e-05, + "loss": 0.0638, + "step": 97050 + }, + { + "epoch": 27.29, + "learning_rate": 5.048386592946616e-05, + "loss": 0.0578, + "step": 97080 + }, + { + "epoch": 27.3, + "learning_rate": 5.046512354356043e-05, + "loss": 0.064, + "step": 97110 + }, + { + "epoch": 27.31, + "learning_rate": 5.044638115765471e-05, + "loss": 0.066, + "step": 97140 + }, + { + "epoch": 27.32, + "learning_rate": 5.042763877174897e-05, + "loss": 0.0562, + "step": 97170 + }, + { + "epoch": 27.33, + "learning_rate": 5.0408896385843254e-05, + "loss": 0.0623, + "step": 97200 + }, + { + "epoch": 27.33, + "learning_rate": 5.039015399993753e-05, + "loss": 0.0625, + "step": 97230 + }, + { + "epoch": 27.34, + "learning_rate": 5.03714116140318e-05, + "loss": 0.0596, + "step": 97260 + }, + { + "epoch": 27.35, + "learning_rate": 5.035266922812608e-05, + "loss": 0.0703, + "step": 97290 + }, + { + "epoch": 27.36, + "learning_rate": 5.0333926842220344e-05, + "loss": 0.056, + "step": 97320 + }, + { + "epoch": 27.37, + "learning_rate": 5.0315184456314625e-05, + "loss": 0.0707, + "step": 97350 + }, + { + "epoch": 27.38, + "learning_rate": 5.02964420704089e-05, + "loss": 0.0571, + "step": 97380 + }, + { + "epoch": 27.39, + "learning_rate": 5.027769968450318e-05, + "loss": 0.0614, + "step": 97410 + }, + { + "epoch": 27.39, + "learning_rate": 5.025895729859744e-05, + "loss": 0.0656, + "step": 97440 + }, + { + "epoch": 27.4, + "learning_rate": 5.024021491269172e-05, + "loss": 0.0571, + "step": 97470 + }, + { + "epoch": 27.41, + "learning_rate": 5.0221472526785996e-05, + "loss": 0.0646, + "step": 97500 + }, + { + "epoch": 27.42, + "learning_rate": 5.020273014088027e-05, + "loss": 0.0554, + "step": 97530 + }, + { + "epoch": 27.43, + "learning_rate": 5.018398775497455e-05, + "loss": 0.0613, + "step": 97560 + }, + { + "epoch": 27.44, + "learning_rate": 5.016524536906881e-05, + "loss": 0.0668, + "step": 97590 + }, + { + "epoch": 27.44, + "learning_rate": 5.014650298316309e-05, + "loss": 0.0542, + "step": 97620 + }, + { + "epoch": 27.45, + "learning_rate": 5.0127760597257367e-05, + "loss": 0.0692, + "step": 97650 + }, + { + "epoch": 27.46, + "learning_rate": 5.010901821135164e-05, + "loss": 0.0579, + "step": 97680 + }, + { + "epoch": 27.47, + "learning_rate": 5.009027582544592e-05, + "loss": 0.0613, + "step": 97710 + }, + { + "epoch": 27.48, + "learning_rate": 5.007153343954019e-05, + "loss": 0.0703, + "step": 97740 + }, + { + "epoch": 27.49, + "learning_rate": 5.005279105363446e-05, + "loss": 0.0545, + "step": 97770 + }, + { + "epoch": 27.5, + "learning_rate": 5.003404866772874e-05, + "loss": 0.0627, + "step": 97800 + }, + { + "epoch": 27.5, + "learning_rate": 5.001530628182302e-05, + "loss": 0.0578, + "step": 97830 + }, + { + "epoch": 27.51, + "learning_rate": 4.9997188642114146e-05, + "loss": 0.0654, + "step": 97860 + }, + { + "epoch": 27.52, + "learning_rate": 4.997844625620841e-05, + "loss": 0.0674, + "step": 97890 + }, + { + "epoch": 27.53, + "learning_rate": 4.9959703870302694e-05, + "loss": 0.0545, + "step": 97920 + }, + { + "epoch": 27.54, + "learning_rate": 4.994096148439696e-05, + "loss": 0.0683, + "step": 97950 + }, + { + "epoch": 27.55, + "learning_rate": 4.992221909849124e-05, + "loss": 0.0593, + "step": 97980 + }, + { + "epoch": 27.55, + "learning_rate": 4.990347671258551e-05, + "loss": 0.0622, + "step": 98010 + }, + { + "epoch": 27.56, + "learning_rate": 4.988473432667979e-05, + "loss": 0.0662, + "step": 98040 + }, + { + "epoch": 27.57, + "learning_rate": 4.9865991940774065e-05, + "loss": 0.0581, + "step": 98070 + }, + { + "epoch": 27.58, + "learning_rate": 4.984724955486833e-05, + "loss": 0.0689, + "step": 98100 + }, + { + "epoch": 27.59, + "learning_rate": 4.9828507168962614e-05, + "loss": 0.0598, + "step": 98130 + }, + { + "epoch": 27.6, + "learning_rate": 4.980976478305688e-05, + "loss": 0.0653, + "step": 98160 + }, + { + "epoch": 27.6, + "learning_rate": 4.979102239715116e-05, + "loss": 0.0679, + "step": 98190 + }, + { + "epoch": 27.61, + "learning_rate": 4.977228001124543e-05, + "loss": 0.0583, + "step": 98220 + }, + { + "epoch": 27.62, + "learning_rate": 4.975353762533971e-05, + "loss": 0.0665, + "step": 98250 + }, + { + "epoch": 27.63, + "learning_rate": 4.9734795239433985e-05, + "loss": 0.0567, + "step": 98280 + }, + { + "epoch": 27.64, + "learning_rate": 4.971605285352826e-05, + "loss": 0.0628, + "step": 98310 + }, + { + "epoch": 27.65, + "learning_rate": 4.969731046762253e-05, + "loss": 0.0661, + "step": 98340 + }, + { + "epoch": 27.66, + "learning_rate": 4.96785680817168e-05, + "loss": 0.0534, + "step": 98370 + }, + { + "epoch": 27.66, + "learning_rate": 4.965982569581108e-05, + "loss": 0.0601, + "step": 98400 + }, + { + "epoch": 27.67, + "learning_rate": 4.964108330990535e-05, + "loss": 0.0605, + "step": 98430 + }, + { + "epoch": 27.68, + "learning_rate": 4.962234092399963e-05, + "loss": 0.0637, + "step": 98460 + }, + { + "epoch": 27.69, + "learning_rate": 4.9603598538093904e-05, + "loss": 0.0658, + "step": 98490 + }, + { + "epoch": 27.7, + "learning_rate": 4.958485615218818e-05, + "loss": 0.0579, + "step": 98520 + }, + { + "epoch": 27.71, + "learning_rate": 4.956611376628245e-05, + "loss": 0.0702, + "step": 98550 + }, + { + "epoch": 27.71, + "learning_rate": 4.954737138037672e-05, + "loss": 0.0553, + "step": 98580 + }, + { + "epoch": 27.72, + "learning_rate": 4.9528628994471e-05, + "loss": 0.0621, + "step": 98610 + }, + { + "epoch": 27.73, + "learning_rate": 4.950988660856527e-05, + "loss": 0.0653, + "step": 98640 + }, + { + "epoch": 27.74, + "learning_rate": 4.949114422265955e-05, + "loss": 0.0531, + "step": 98670 + }, + { + "epoch": 27.75, + "learning_rate": 4.947240183675382e-05, + "loss": 0.0667, + "step": 98700 + }, + { + "epoch": 27.76, + "learning_rate": 4.94536594508481e-05, + "loss": 0.0586, + "step": 98730 + }, + { + "epoch": 27.76, + "learning_rate": 4.943491706494237e-05, + "loss": 0.0685, + "step": 98760 + }, + { + "epoch": 27.77, + "learning_rate": 4.941617467903664e-05, + "loss": 0.0677, + "step": 98790 + }, + { + "epoch": 27.78, + "learning_rate": 4.939743229313092e-05, + "loss": 0.0566, + "step": 98820 + }, + { + "epoch": 27.79, + "learning_rate": 4.937868990722519e-05, + "loss": 0.0662, + "step": 98850 + }, + { + "epoch": 27.8, + "learning_rate": 4.935994752131947e-05, + "loss": 0.0593, + "step": 98880 + }, + { + "epoch": 27.81, + "learning_rate": 4.934120513541374e-05, + "loss": 0.0601, + "step": 98910 + }, + { + "epoch": 27.82, + "learning_rate": 4.932246274950802e-05, + "loss": 0.0646, + "step": 98940 + }, + { + "epoch": 27.82, + "learning_rate": 4.930372036360229e-05, + "loss": 0.0543, + "step": 98970 + }, + { + "epoch": 27.83, + "learning_rate": 4.928497797769656e-05, + "loss": 0.0674, + "step": 99000 + }, + { + "epoch": 27.84, + "learning_rate": 4.926623559179084e-05, + "loss": 0.0553, + "step": 99030 + }, + { + "epoch": 27.85, + "learning_rate": 4.924749320588511e-05, + "loss": 0.0593, + "step": 99060 + }, + { + "epoch": 27.86, + "learning_rate": 4.922875081997939e-05, + "loss": 0.0636, + "step": 99090 + }, + { + "epoch": 27.87, + "learning_rate": 4.921000843407366e-05, + "loss": 0.0572, + "step": 99120 + }, + { + "epoch": 27.87, + "learning_rate": 4.9191266048167936e-05, + "loss": 0.0644, + "step": 99150 + }, + { + "epoch": 27.88, + "learning_rate": 4.917252366226221e-05, + "loss": 0.0599, + "step": 99180 + }, + { + "epoch": 27.89, + "learning_rate": 4.915378127635648e-05, + "loss": 0.0647, + "step": 99210 + }, + { + "epoch": 27.9, + "learning_rate": 4.913503889045076e-05, + "loss": 0.0717, + "step": 99240 + }, + { + "epoch": 27.91, + "learning_rate": 4.9116296504545026e-05, + "loss": 0.0548, + "step": 99270 + }, + { + "epoch": 27.92, + "learning_rate": 4.909755411863931e-05, + "loss": 0.0657, + "step": 99300 + }, + { + "epoch": 27.93, + "learning_rate": 4.907881173273358e-05, + "loss": 0.0594, + "step": 99330 + }, + { + "epoch": 27.93, + "learning_rate": 4.9060069346827855e-05, + "loss": 0.0558, + "step": 99360 + }, + { + "epoch": 27.94, + "learning_rate": 4.904132696092213e-05, + "loss": 0.0672, + "step": 99390 + }, + { + "epoch": 27.95, + "learning_rate": 4.90225845750164e-05, + "loss": 0.0531, + "step": 99420 + }, + { + "epoch": 27.96, + "learning_rate": 4.900384218911068e-05, + "loss": 0.0662, + "step": 99450 + }, + { + "epoch": 27.97, + "learning_rate": 4.8985099803204945e-05, + "loss": 0.0613, + "step": 99480 + }, + { + "epoch": 27.98, + "learning_rate": 4.8966357417299226e-05, + "loss": 0.0614, + "step": 99510 + }, + { + "epoch": 27.98, + "learning_rate": 4.89476150313935e-05, + "loss": 0.0703, + "step": 99540 + }, + { + "epoch": 27.99, + "learning_rate": 4.8928872645487775e-05, + "loss": 0.0536, + "step": 99570 + }, + { + "epoch": 28.0, + "eval_loss": 0.10675393790006638, + "eval_runtime": 629.0591, + "eval_samples_per_second": 25.487, + "eval_steps_per_second": 0.798, + "eval_wer": 0.10265036234356448, + "step": 99596 + }, + { + "epoch": 28.0, + "learning_rate": 4.891013025958205e-05, + "loss": 0.0698, + "step": 99600 + }, + { + "epoch": 28.01, + "learning_rate": 4.889138787367632e-05, + "loss": 0.0523, + "step": 99630 + }, + { + "epoch": 28.02, + "learning_rate": 4.887327023396746e-05, + "loss": 0.0634, + "step": 99660 + }, + { + "epoch": 28.03, + "learning_rate": 4.8854527848061725e-05, + "loss": 0.0593, + "step": 99690 + }, + { + "epoch": 28.03, + "learning_rate": 4.8835785462156006e-05, + "loss": 0.0598, + "step": 99720 + }, + { + "epoch": 28.04, + "learning_rate": 4.881704307625027e-05, + "loss": 0.0633, + "step": 99750 + }, + { + "epoch": 28.05, + "learning_rate": 4.879830069034455e-05, + "loss": 0.0548, + "step": 99780 + }, + { + "epoch": 28.06, + "learning_rate": 4.877955830443882e-05, + "loss": 0.0629, + "step": 99810 + }, + { + "epoch": 28.07, + "learning_rate": 4.8760815918533096e-05, + "loss": 0.0599, + "step": 99840 + }, + { + "epoch": 28.08, + "learning_rate": 4.874207353262738e-05, + "loss": 0.0584, + "step": 99870 + }, + { + "epoch": 28.09, + "learning_rate": 4.8723331146721644e-05, + "loss": 0.0631, + "step": 99900 + }, + { + "epoch": 28.09, + "learning_rate": 4.8704588760815925e-05, + "loss": 0.0546, + "step": 99930 + }, + { + "epoch": 28.1, + "learning_rate": 4.868584637491019e-05, + "loss": 0.0645, + "step": 99960 + }, + { + "epoch": 28.11, + "learning_rate": 4.866710398900447e-05, + "loss": 0.062, + "step": 99990 + }, + { + "epoch": 28.12, + "learning_rate": 4.864836160309874e-05, + "loss": 0.0613, + "step": 100020 + }, + { + "epoch": 28.13, + "learning_rate": 4.8629619217193015e-05, + "loss": 0.0665, + "step": 100050 + }, + { + "epoch": 28.14, + "learning_rate": 4.8610876831287296e-05, + "loss": 0.0534, + "step": 100080 + }, + { + "epoch": 28.14, + "learning_rate": 4.8592134445381563e-05, + "loss": 0.0639, + "step": 100110 + }, + { + "epoch": 28.15, + "learning_rate": 4.8573392059475844e-05, + "loss": 0.0589, + "step": 100140 + }, + { + "epoch": 28.16, + "learning_rate": 4.855464967357011e-05, + "loss": 0.0624, + "step": 100170 + }, + { + "epoch": 28.17, + "learning_rate": 4.853590728766439e-05, + "loss": 0.0657, + "step": 100200 + }, + { + "epoch": 28.18, + "learning_rate": 4.851716490175866e-05, + "loss": 0.0509, + "step": 100230 + }, + { + "epoch": 28.19, + "learning_rate": 4.8498422515852934e-05, + "loss": 0.0644, + "step": 100260 + }, + { + "epoch": 28.2, + "learning_rate": 4.8479680129947215e-05, + "loss": 0.06, + "step": 100290 + }, + { + "epoch": 28.2, + "learning_rate": 4.846093774404148e-05, + "loss": 0.0591, + "step": 100320 + }, + { + "epoch": 28.21, + "learning_rate": 4.8442195358135764e-05, + "loss": 0.0675, + "step": 100350 + }, + { + "epoch": 28.22, + "learning_rate": 4.842345297223003e-05, + "loss": 0.0525, + "step": 100380 + }, + { + "epoch": 28.23, + "learning_rate": 4.840471058632431e-05, + "loss": 0.0644, + "step": 100410 + }, + { + "epoch": 28.24, + "learning_rate": 4.838596820041858e-05, + "loss": 0.0593, + "step": 100440 + }, + { + "epoch": 28.25, + "learning_rate": 4.8367225814512854e-05, + "loss": 0.058, + "step": 100470 + }, + { + "epoch": 28.25, + "learning_rate": 4.8348483428607135e-05, + "loss": 0.0663, + "step": 100500 + }, + { + "epoch": 28.26, + "learning_rate": 4.83297410427014e-05, + "loss": 0.0543, + "step": 100530 + }, + { + "epoch": 28.27, + "learning_rate": 4.831099865679568e-05, + "loss": 0.0633, + "step": 100560 + }, + { + "epoch": 28.28, + "learning_rate": 4.829225627088995e-05, + "loss": 0.0585, + "step": 100590 + }, + { + "epoch": 28.29, + "learning_rate": 4.827351388498423e-05, + "loss": 0.0588, + "step": 100620 + }, + { + "epoch": 28.3, + "learning_rate": 4.82547714990785e-05, + "loss": 0.0684, + "step": 100650 + }, + { + "epoch": 28.3, + "learning_rate": 4.823602911317277e-05, + "loss": 0.0536, + "step": 100680 + }, + { + "epoch": 28.31, + "learning_rate": 4.8217286727267054e-05, + "loss": 0.0623, + "step": 100710 + }, + { + "epoch": 28.32, + "learning_rate": 4.819854434136132e-05, + "loss": 0.0586, + "step": 100740 + }, + { + "epoch": 28.33, + "learning_rate": 4.81798019554556e-05, + "loss": 0.0595, + "step": 100770 + }, + { + "epoch": 28.34, + "learning_rate": 4.816105956954987e-05, + "loss": 0.0641, + "step": 100800 + }, + { + "epoch": 28.35, + "learning_rate": 4.814231718364415e-05, + "loss": 0.0561, + "step": 100830 + }, + { + "epoch": 28.36, + "learning_rate": 4.812357479773842e-05, + "loss": 0.0643, + "step": 100860 + }, + { + "epoch": 28.36, + "learning_rate": 4.810483241183269e-05, + "loss": 0.0583, + "step": 100890 + }, + { + "epoch": 28.37, + "learning_rate": 4.808609002592697e-05, + "loss": 0.0575, + "step": 100920 + }, + { + "epoch": 28.38, + "learning_rate": 4.806734764002124e-05, + "loss": 0.0683, + "step": 100950 + }, + { + "epoch": 28.39, + "learning_rate": 4.804860525411552e-05, + "loss": 0.055, + "step": 100980 + }, + { + "epoch": 28.4, + "learning_rate": 4.802986286820979e-05, + "loss": 0.0626, + "step": 101010 + }, + { + "epoch": 28.41, + "learning_rate": 4.801112048230407e-05, + "loss": 0.0627, + "step": 101040 + }, + { + "epoch": 28.41, + "learning_rate": 4.799237809639834e-05, + "loss": 0.0636, + "step": 101070 + }, + { + "epoch": 28.42, + "learning_rate": 4.797363571049261e-05, + "loss": 0.0699, + "step": 101100 + }, + { + "epoch": 28.43, + "learning_rate": 4.795489332458689e-05, + "loss": 0.0535, + "step": 101130 + }, + { + "epoch": 28.44, + "learning_rate": 4.793615093868116e-05, + "loss": 0.0668, + "step": 101160 + }, + { + "epoch": 28.45, + "learning_rate": 4.791740855277544e-05, + "loss": 0.0601, + "step": 101190 + }, + { + "epoch": 28.46, + "learning_rate": 4.789866616686971e-05, + "loss": 0.0602, + "step": 101220 + }, + { + "epoch": 28.46, + "learning_rate": 4.787992378096399e-05, + "loss": 0.0672, + "step": 101250 + }, + { + "epoch": 28.47, + "learning_rate": 4.786118139505826e-05, + "loss": 0.0522, + "step": 101280 + }, + { + "epoch": 28.48, + "learning_rate": 4.784243900915253e-05, + "loss": 0.0665, + "step": 101310 + }, + { + "epoch": 28.49, + "learning_rate": 4.782369662324681e-05, + "loss": 0.0615, + "step": 101340 + }, + { + "epoch": 28.5, + "learning_rate": 4.780495423734108e-05, + "loss": 0.0564, + "step": 101370 + }, + { + "epoch": 28.51, + "learning_rate": 4.778621185143536e-05, + "loss": 0.0673, + "step": 101400 + }, + { + "epoch": 28.52, + "learning_rate": 4.776746946552963e-05, + "loss": 0.0568, + "step": 101430 + }, + { + "epoch": 28.52, + "learning_rate": 4.774872707962391e-05, + "loss": 0.0644, + "step": 101460 + }, + { + "epoch": 28.53, + "learning_rate": 4.7729984693718176e-05, + "loss": 0.0634, + "step": 101490 + }, + { + "epoch": 28.54, + "learning_rate": 4.771124230781245e-05, + "loss": 0.0609, + "step": 101520 + }, + { + "epoch": 28.55, + "learning_rate": 4.769249992190673e-05, + "loss": 0.0657, + "step": 101550 + }, + { + "epoch": 28.56, + "learning_rate": 4.7673757536001e-05, + "loss": 0.0544, + "step": 101580 + }, + { + "epoch": 28.57, + "learning_rate": 4.765501515009528e-05, + "loss": 0.0652, + "step": 101610 + }, + { + "epoch": 28.57, + "learning_rate": 4.763627276418955e-05, + "loss": 0.0578, + "step": 101640 + }, + { + "epoch": 28.58, + "learning_rate": 4.761753037828383e-05, + "loss": 0.0578, + "step": 101670 + }, + { + "epoch": 28.59, + "learning_rate": 4.7598787992378096e-05, + "loss": 0.0694, + "step": 101700 + }, + { + "epoch": 28.6, + "learning_rate": 4.7580045606472377e-05, + "loss": 0.055, + "step": 101730 + }, + { + "epoch": 28.61, + "learning_rate": 4.756130322056665e-05, + "loss": 0.0609, + "step": 101760 + }, + { + "epoch": 28.62, + "learning_rate": 4.754256083466092e-05, + "loss": 0.0563, + "step": 101790 + }, + { + "epoch": 28.63, + "learning_rate": 4.75238184487552e-05, + "loss": 0.0589, + "step": 101820 + }, + { + "epoch": 28.63, + "learning_rate": 4.7505076062849466e-05, + "loss": 0.0667, + "step": 101850 + }, + { + "epoch": 28.64, + "learning_rate": 4.748633367694375e-05, + "loss": 0.0564, + "step": 101880 + }, + { + "epoch": 28.65, + "learning_rate": 4.7467591291038015e-05, + "loss": 0.0707, + "step": 101910 + }, + { + "epoch": 28.66, + "learning_rate": 4.7448848905132296e-05, + "loss": 0.0598, + "step": 101940 + }, + { + "epoch": 28.67, + "learning_rate": 4.743010651922657e-05, + "loss": 0.0608, + "step": 101970 + }, + { + "epoch": 28.68, + "learning_rate": 4.741136413332084e-05, + "loss": 0.0687, + "step": 102000 + }, + { + "epoch": 28.68, + "learning_rate": 4.739262174741512e-05, + "loss": 0.0543, + "step": 102030 + }, + { + "epoch": 28.69, + "learning_rate": 4.7373879361509386e-05, + "loss": 0.0624, + "step": 102060 + }, + { + "epoch": 28.7, + "learning_rate": 4.735513697560367e-05, + "loss": 0.0582, + "step": 102090 + }, + { + "epoch": 28.71, + "learning_rate": 4.7336394589697934e-05, + "loss": 0.0604, + "step": 102120 + }, + { + "epoch": 28.72, + "learning_rate": 4.7317652203792215e-05, + "loss": 0.0683, + "step": 102150 + }, + { + "epoch": 28.73, + "learning_rate": 4.729890981788648e-05, + "loss": 0.0564, + "step": 102180 + }, + { + "epoch": 28.73, + "learning_rate": 4.728016743198076e-05, + "loss": 0.0656, + "step": 102210 + }, + { + "epoch": 28.74, + "learning_rate": 4.726142504607504e-05, + "loss": 0.0597, + "step": 102240 + }, + { + "epoch": 28.75, + "learning_rate": 4.7242682660169305e-05, + "loss": 0.0596, + "step": 102270 + }, + { + "epoch": 28.76, + "learning_rate": 4.7223940274263586e-05, + "loss": 0.0658, + "step": 102300 + }, + { + "epoch": 28.77, + "learning_rate": 4.7205197888357854e-05, + "loss": 0.0557, + "step": 102330 + }, + { + "epoch": 28.78, + "learning_rate": 4.7186455502452135e-05, + "loss": 0.0663, + "step": 102360 + }, + { + "epoch": 28.79, + "learning_rate": 4.71677131165464e-05, + "loss": 0.061, + "step": 102390 + }, + { + "epoch": 28.79, + "learning_rate": 4.7148970730640676e-05, + "loss": 0.0598, + "step": 102420 + }, + { + "epoch": 28.8, + "learning_rate": 4.713022834473496e-05, + "loss": 0.0665, + "step": 102450 + }, + { + "epoch": 28.81, + "learning_rate": 4.7111485958829224e-05, + "loss": 0.0547, + "step": 102480 + }, + { + "epoch": 28.82, + "learning_rate": 4.7092743572923505e-05, + "loss": 0.0642, + "step": 102510 + }, + { + "epoch": 28.83, + "learning_rate": 4.707400118701777e-05, + "loss": 0.0581, + "step": 102540 + }, + { + "epoch": 28.84, + "learning_rate": 4.7055258801112054e-05, + "loss": 0.06, + "step": 102570 + }, + { + "epoch": 28.84, + "learning_rate": 4.703651641520632e-05, + "loss": 0.0661, + "step": 102600 + }, + { + "epoch": 28.85, + "learning_rate": 4.7017774029300595e-05, + "loss": 0.0549, + "step": 102630 + }, + { + "epoch": 28.86, + "learning_rate": 4.6999031643394876e-05, + "loss": 0.0674, + "step": 102660 + }, + { + "epoch": 28.87, + "learning_rate": 4.6980289257489144e-05, + "loss": 0.0559, + "step": 102690 + }, + { + "epoch": 28.88, + "learning_rate": 4.6961546871583425e-05, + "loss": 0.0606, + "step": 102720 + }, + { + "epoch": 28.89, + "learning_rate": 4.694280448567769e-05, + "loss": 0.0657, + "step": 102750 + }, + { + "epoch": 28.9, + "learning_rate": 4.692406209977197e-05, + "loss": 0.0546, + "step": 102780 + }, + { + "epoch": 28.9, + "learning_rate": 4.690531971386624e-05, + "loss": 0.0619, + "step": 102810 + }, + { + "epoch": 28.91, + "learning_rate": 4.6886577327960515e-05, + "loss": 0.0607, + "step": 102840 + }, + { + "epoch": 28.92, + "learning_rate": 4.6867834942054796e-05, + "loss": 0.0588, + "step": 102870 + }, + { + "epoch": 28.93, + "learning_rate": 4.684909255614906e-05, + "loss": 0.067, + "step": 102900 + }, + { + "epoch": 28.94, + "learning_rate": 4.6830350170243344e-05, + "loss": 0.0537, + "step": 102930 + }, + { + "epoch": 28.95, + "learning_rate": 4.681160778433761e-05, + "loss": 0.0688, + "step": 102960 + }, + { + "epoch": 28.95, + "learning_rate": 4.679286539843189e-05, + "loss": 0.0612, + "step": 102990 + }, + { + "epoch": 28.96, + "learning_rate": 4.677412301252616e-05, + "loss": 0.0559, + "step": 103020 + }, + { + "epoch": 28.97, + "learning_rate": 4.6755380626620434e-05, + "loss": 0.0692, + "step": 103050 + }, + { + "epoch": 28.98, + "learning_rate": 4.6736638240714715e-05, + "loss": 0.0534, + "step": 103080 + }, + { + "epoch": 28.99, + "learning_rate": 4.671789585480898e-05, + "loss": 0.0663, + "step": 103110 + }, + { + "epoch": 29.0, + "learning_rate": 4.6699153468903263e-05, + "loss": 0.0616, + "step": 103140 + }, + { + "epoch": 29.0, + "eval_loss": 0.10966203361749649, + "eval_runtime": 631.5692, + "eval_samples_per_second": 25.386, + "eval_steps_per_second": 0.795, + "eval_wer": 0.10370805071445144, + "step": 103153 + }, + { + "epoch": 29.0, + "learning_rate": 4.668103582919439e-05, + "loss": 0.0653, + "step": 103170 + }, + { + "epoch": 29.01, + "learning_rate": 4.6662293443288665e-05, + "loss": 0.0621, + "step": 103200 + }, + { + "epoch": 29.02, + "learning_rate": 4.664355105738294e-05, + "loss": 0.0575, + "step": 103230 + }, + { + "epoch": 29.03, + "learning_rate": 4.6624808671477213e-05, + "loss": 0.0644, + "step": 103260 + }, + { + "epoch": 29.04, + "learning_rate": 4.660606628557149e-05, + "loss": 0.0525, + "step": 103290 + }, + { + "epoch": 29.05, + "learning_rate": 4.658732389966576e-05, + "loss": 0.059, + "step": 103320 + }, + { + "epoch": 29.06, + "learning_rate": 4.6568581513760036e-05, + "loss": 0.0604, + "step": 103350 + }, + { + "epoch": 29.06, + "learning_rate": 4.654983912785431e-05, + "loss": 0.0559, + "step": 103380 + }, + { + "epoch": 29.07, + "learning_rate": 4.6531096741948584e-05, + "loss": 0.0654, + "step": 103410 + }, + { + "epoch": 29.08, + "learning_rate": 4.651235435604286e-05, + "loss": 0.0553, + "step": 103440 + }, + { + "epoch": 29.09, + "learning_rate": 4.649361197013713e-05, + "loss": 0.0629, + "step": 103470 + }, + { + "epoch": 29.1, + "learning_rate": 4.647486958423141e-05, + "loss": 0.0578, + "step": 103500 + }, + { + "epoch": 29.11, + "learning_rate": 4.645612719832568e-05, + "loss": 0.0536, + "step": 103530 + }, + { + "epoch": 29.11, + "learning_rate": 4.6437384812419955e-05, + "loss": 0.0646, + "step": 103560 + }, + { + "epoch": 29.12, + "learning_rate": 4.641864242651423e-05, + "loss": 0.0535, + "step": 103590 + }, + { + "epoch": 29.13, + "learning_rate": 4.639990004060851e-05, + "loss": 0.0641, + "step": 103620 + }, + { + "epoch": 29.14, + "learning_rate": 4.638115765470278e-05, + "loss": 0.0643, + "step": 103650 + }, + { + "epoch": 29.15, + "learning_rate": 4.636241526879705e-05, + "loss": 0.0572, + "step": 103680 + }, + { + "epoch": 29.16, + "learning_rate": 4.6343672882891326e-05, + "loss": 0.0626, + "step": 103710 + }, + { + "epoch": 29.17, + "learning_rate": 4.63249304969856e-05, + "loss": 0.0576, + "step": 103740 + }, + { + "epoch": 29.17, + "learning_rate": 4.6306188111079875e-05, + "loss": 0.0621, + "step": 103770 + }, + { + "epoch": 29.18, + "learning_rate": 4.628744572517415e-05, + "loss": 0.0613, + "step": 103800 + }, + { + "epoch": 29.19, + "learning_rate": 4.626870333926843e-05, + "loss": 0.0578, + "step": 103830 + }, + { + "epoch": 29.2, + "learning_rate": 4.62499609533627e-05, + "loss": 0.0657, + "step": 103860 + }, + { + "epoch": 29.21, + "learning_rate": 4.623121856745697e-05, + "loss": 0.0561, + "step": 103890 + }, + { + "epoch": 29.22, + "learning_rate": 4.6212476181551246e-05, + "loss": 0.0651, + "step": 103920 + }, + { + "epoch": 29.22, + "learning_rate": 4.619373379564552e-05, + "loss": 0.059, + "step": 103950 + }, + { + "epoch": 29.23, + "learning_rate": 4.6174991409739794e-05, + "loss": 0.0567, + "step": 103980 + }, + { + "epoch": 29.24, + "learning_rate": 4.615624902383407e-05, + "loss": 0.0647, + "step": 104010 + }, + { + "epoch": 29.25, + "learning_rate": 4.613750663792835e-05, + "loss": 0.0572, + "step": 104040 + }, + { + "epoch": 29.26, + "learning_rate": 4.611876425202262e-05, + "loss": 0.0647, + "step": 104070 + }, + { + "epoch": 29.27, + "learning_rate": 4.610002186611689e-05, + "loss": 0.0622, + "step": 104100 + }, + { + "epoch": 29.27, + "learning_rate": 4.6081279480211165e-05, + "loss": 0.0561, + "step": 104130 + }, + { + "epoch": 29.28, + "learning_rate": 4.606253709430544e-05, + "loss": 0.0621, + "step": 104160 + }, + { + "epoch": 29.29, + "learning_rate": 4.604379470839971e-05, + "loss": 0.0559, + "step": 104190 + }, + { + "epoch": 29.3, + "learning_rate": 4.602505232249399e-05, + "loss": 0.0634, + "step": 104220 + }, + { + "epoch": 29.31, + "learning_rate": 4.600630993658827e-05, + "loss": 0.0583, + "step": 104250 + }, + { + "epoch": 29.32, + "learning_rate": 4.5987567550682536e-05, + "loss": 0.0524, + "step": 104280 + }, + { + "epoch": 29.33, + "learning_rate": 4.596882516477681e-05, + "loss": 0.0619, + "step": 104310 + }, + { + "epoch": 29.33, + "learning_rate": 4.5950082778871084e-05, + "loss": 0.0549, + "step": 104340 + }, + { + "epoch": 29.34, + "learning_rate": 4.593134039296536e-05, + "loss": 0.0624, + "step": 104370 + }, + { + "epoch": 29.35, + "learning_rate": 4.591259800705963e-05, + "loss": 0.061, + "step": 104400 + }, + { + "epoch": 29.36, + "learning_rate": 4.589385562115391e-05, + "loss": 0.0562, + "step": 104430 + }, + { + "epoch": 29.37, + "learning_rate": 4.587511323524819e-05, + "loss": 0.0619, + "step": 104460 + }, + { + "epoch": 29.38, + "learning_rate": 4.5856370849342455e-05, + "loss": 0.0508, + "step": 104490 + }, + { + "epoch": 29.38, + "learning_rate": 4.583762846343673e-05, + "loss": 0.0607, + "step": 104520 + }, + { + "epoch": 29.39, + "learning_rate": 4.5818886077531004e-05, + "loss": 0.0599, + "step": 104550 + }, + { + "epoch": 29.4, + "learning_rate": 4.580014369162528e-05, + "loss": 0.0568, + "step": 104580 + }, + { + "epoch": 29.41, + "learning_rate": 4.578140130571955e-05, + "loss": 0.0653, + "step": 104610 + }, + { + "epoch": 29.42, + "learning_rate": 4.5762658919813826e-05, + "loss": 0.0528, + "step": 104640 + }, + { + "epoch": 29.43, + "learning_rate": 4.574391653390811e-05, + "loss": 0.063, + "step": 104670 + }, + { + "epoch": 29.43, + "learning_rate": 4.5725174148002375e-05, + "loss": 0.0613, + "step": 104700 + }, + { + "epoch": 29.44, + "learning_rate": 4.570643176209665e-05, + "loss": 0.0601, + "step": 104730 + }, + { + "epoch": 29.45, + "learning_rate": 4.568768937619092e-05, + "loss": 0.0635, + "step": 104760 + }, + { + "epoch": 29.46, + "learning_rate": 4.56689469902852e-05, + "loss": 0.0555, + "step": 104790 + }, + { + "epoch": 29.47, + "learning_rate": 4.565020460437947e-05, + "loss": 0.0605, + "step": 104820 + }, + { + "epoch": 29.48, + "learning_rate": 4.5631462218473746e-05, + "loss": 0.0655, + "step": 104850 + }, + { + "epoch": 29.49, + "learning_rate": 4.5612719832568027e-05, + "loss": 0.0575, + "step": 104880 + }, + { + "epoch": 29.49, + "learning_rate": 4.5593977446662294e-05, + "loss": 0.0635, + "step": 104910 + }, + { + "epoch": 29.5, + "learning_rate": 4.557523506075657e-05, + "loss": 0.0515, + "step": 104940 + }, + { + "epoch": 29.51, + "learning_rate": 4.555649267485084e-05, + "loss": 0.0598, + "step": 104970 + }, + { + "epoch": 29.52, + "learning_rate": 4.5537750288945117e-05, + "loss": 0.0622, + "step": 105000 + }, + { + "epoch": 29.53, + "learning_rate": 4.551900790303939e-05, + "loss": 0.0523, + "step": 105030 + }, + { + "epoch": 29.54, + "learning_rate": 4.5500265517133665e-05, + "loss": 0.0659, + "step": 105060 + }, + { + "epoch": 29.54, + "learning_rate": 4.5481523131227946e-05, + "loss": 0.0532, + "step": 105090 + }, + { + "epoch": 29.55, + "learning_rate": 4.546278074532221e-05, + "loss": 0.0613, + "step": 105120 + }, + { + "epoch": 29.56, + "learning_rate": 4.5444038359416494e-05, + "loss": 0.058, + "step": 105150 + }, + { + "epoch": 29.57, + "learning_rate": 4.542529597351076e-05, + "loss": 0.0591, + "step": 105180 + }, + { + "epoch": 29.58, + "learning_rate": 4.5406553587605036e-05, + "loss": 0.0648, + "step": 105210 + }, + { + "epoch": 29.59, + "learning_rate": 4.538781120169931e-05, + "loss": 0.0531, + "step": 105240 + }, + { + "epoch": 29.6, + "learning_rate": 4.5369068815793584e-05, + "loss": 0.0633, + "step": 105270 + }, + { + "epoch": 29.6, + "learning_rate": 4.5350326429887865e-05, + "loss": 0.0593, + "step": 105300 + }, + { + "epoch": 29.61, + "learning_rate": 4.533158404398213e-05, + "loss": 0.0569, + "step": 105330 + }, + { + "epoch": 29.62, + "learning_rate": 4.5312841658076414e-05, + "loss": 0.0636, + "step": 105360 + }, + { + "epoch": 29.63, + "learning_rate": 4.529409927217068e-05, + "loss": 0.0574, + "step": 105390 + }, + { + "epoch": 29.64, + "learning_rate": 4.5275356886264955e-05, + "loss": 0.0657, + "step": 105420 + }, + { + "epoch": 29.65, + "learning_rate": 4.525661450035923e-05, + "loss": 0.0593, + "step": 105450 + }, + { + "epoch": 29.65, + "learning_rate": 4.5237872114453504e-05, + "loss": 0.0597, + "step": 105480 + }, + { + "epoch": 29.66, + "learning_rate": 4.5219129728547785e-05, + "loss": 0.0639, + "step": 105510 + }, + { + "epoch": 29.67, + "learning_rate": 4.520038734264205e-05, + "loss": 0.0552, + "step": 105540 + }, + { + "epoch": 29.68, + "learning_rate": 4.518164495673633e-05, + "loss": 0.0602, + "step": 105570 + }, + { + "epoch": 29.69, + "learning_rate": 4.51629025708306e-05, + "loss": 0.0595, + "step": 105600 + }, + { + "epoch": 29.7, + "learning_rate": 4.5144160184924875e-05, + "loss": 0.0563, + "step": 105630 + }, + { + "epoch": 29.7, + "learning_rate": 4.512541779901915e-05, + "loss": 0.0638, + "step": 105660 + }, + { + "epoch": 29.71, + "learning_rate": 4.510667541311342e-05, + "loss": 0.056, + "step": 105690 + }, + { + "epoch": 29.72, + "learning_rate": 4.5087933027207704e-05, + "loss": 0.0606, + "step": 105720 + }, + { + "epoch": 29.73, + "learning_rate": 4.506919064130197e-05, + "loss": 0.0598, + "step": 105750 + }, + { + "epoch": 29.74, + "learning_rate": 4.505044825539625e-05, + "loss": 0.0564, + "step": 105780 + }, + { + "epoch": 29.75, + "learning_rate": 4.503170586949052e-05, + "loss": 0.0631, + "step": 105810 + }, + { + "epoch": 29.76, + "learning_rate": 4.5012963483584794e-05, + "loss": 0.0554, + "step": 105840 + }, + { + "epoch": 29.76, + "learning_rate": 4.499422109767907e-05, + "loss": 0.063, + "step": 105870 + }, + { + "epoch": 29.77, + "learning_rate": 4.497547871177334e-05, + "loss": 0.0598, + "step": 105900 + }, + { + "epoch": 29.78, + "learning_rate": 4.495673632586762e-05, + "loss": 0.0588, + "step": 105930 + }, + { + "epoch": 29.79, + "learning_rate": 4.493799393996189e-05, + "loss": 0.0649, + "step": 105960 + }, + { + "epoch": 29.8, + "learning_rate": 4.491925155405617e-05, + "loss": 0.0536, + "step": 105990 + }, + { + "epoch": 29.81, + "learning_rate": 4.490050916815044e-05, + "loss": 0.0595, + "step": 106020 + }, + { + "epoch": 29.81, + "learning_rate": 4.488176678224471e-05, + "loss": 0.0591, + "step": 106050 + }, + { + "epoch": 29.82, + "learning_rate": 4.486302439633899e-05, + "loss": 0.0582, + "step": 106080 + }, + { + "epoch": 29.83, + "learning_rate": 4.484428201043326e-05, + "loss": 0.066, + "step": 106110 + }, + { + "epoch": 29.84, + "learning_rate": 4.482553962452754e-05, + "loss": 0.0534, + "step": 106140 + }, + { + "epoch": 29.85, + "learning_rate": 4.480679723862181e-05, + "loss": 0.0644, + "step": 106170 + }, + { + "epoch": 29.86, + "learning_rate": 4.478805485271609e-05, + "loss": 0.0613, + "step": 106200 + }, + { + "epoch": 29.86, + "learning_rate": 4.476931246681036e-05, + "loss": 0.058, + "step": 106230 + }, + { + "epoch": 29.87, + "learning_rate": 4.475057008090463e-05, + "loss": 0.0638, + "step": 106260 + }, + { + "epoch": 29.88, + "learning_rate": 4.473182769499891e-05, + "loss": 0.0548, + "step": 106290 + }, + { + "epoch": 29.89, + "learning_rate": 4.471308530909318e-05, + "loss": 0.0614, + "step": 106320 + }, + { + "epoch": 29.9, + "learning_rate": 4.469434292318746e-05, + "loss": 0.0605, + "step": 106350 + }, + { + "epoch": 29.91, + "learning_rate": 4.467560053728173e-05, + "loss": 0.0577, + "step": 106380 + }, + { + "epoch": 29.92, + "learning_rate": 4.465685815137601e-05, + "loss": 0.0665, + "step": 106410 + }, + { + "epoch": 29.92, + "learning_rate": 4.463811576547028e-05, + "loss": 0.0554, + "step": 106440 + }, + { + "epoch": 29.93, + "learning_rate": 4.461937337956455e-05, + "loss": 0.0607, + "step": 106470 + }, + { + "epoch": 29.94, + "learning_rate": 4.4600630993658826e-05, + "loss": 0.0595, + "step": 106500 + }, + { + "epoch": 29.95, + "learning_rate": 4.45818886077531e-05, + "loss": 0.0545, + "step": 106530 + }, + { + "epoch": 29.96, + "learning_rate": 4.4563146221847374e-05, + "loss": 0.0625, + "step": 106560 + }, + { + "epoch": 29.97, + "learning_rate": 4.454440383594165e-05, + "loss": 0.0519, + "step": 106590 + }, + { + "epoch": 29.97, + "learning_rate": 4.452566145003593e-05, + "loss": 0.0671, + "step": 106620 + }, + { + "epoch": 29.98, + "learning_rate": 4.45069190641302e-05, + "loss": 0.0617, + "step": 106650 + }, + { + "epoch": 29.99, + "learning_rate": 4.448817667822448e-05, + "loss": 0.0578, + "step": 106680 + }, + { + "epoch": 30.0, + "learning_rate": 4.4469434292318745e-05, + "loss": 0.0642, + "step": 106710 + }, + { + "epoch": 30.0, + "eval_loss": 0.11168166995048523, + "eval_runtime": 629.3759, + "eval_samples_per_second": 25.474, + "eval_steps_per_second": 0.798, + "eval_wer": 0.1020089255250911, + "step": 106710 + }, + { + "epoch": 30.01, + "learning_rate": 4.445069190641302e-05, + "loss": 0.0513, + "step": 106740 + }, + { + "epoch": 30.02, + "learning_rate": 4.4431949520507294e-05, + "loss": 0.0647, + "step": 106770 + }, + { + "epoch": 30.03, + "learning_rate": 4.441320713460157e-05, + "loss": 0.0548, + "step": 106800 + }, + { + "epoch": 30.03, + "learning_rate": 4.439446474869585e-05, + "loss": 0.0575, + "step": 106830 + }, + { + "epoch": 30.04, + "learning_rate": 4.4375722362790116e-05, + "loss": 0.0621, + "step": 106860 + }, + { + "epoch": 30.05, + "learning_rate": 4.43569799768844e-05, + "loss": 0.0499, + "step": 106890 + }, + { + "epoch": 30.06, + "learning_rate": 4.4338237590978665e-05, + "loss": 0.063, + "step": 106920 + }, + { + "epoch": 30.07, + "learning_rate": 4.431949520507294e-05, + "loss": 0.0558, + "step": 106950 + }, + { + "epoch": 30.08, + "learning_rate": 4.430075281916721e-05, + "loss": 0.0579, + "step": 106980 + }, + { + "epoch": 30.08, + "learning_rate": 4.428201043326149e-05, + "loss": 0.0643, + "step": 107010 + }, + { + "epoch": 30.09, + "learning_rate": 4.426326804735577e-05, + "loss": 0.0532, + "step": 107040 + }, + { + "epoch": 30.1, + "learning_rate": 4.4244525661450036e-05, + "loss": 0.0659, + "step": 107070 + }, + { + "epoch": 30.11, + "learning_rate": 4.422578327554432e-05, + "loss": 0.0552, + "step": 107100 + }, + { + "epoch": 30.12, + "learning_rate": 4.4207040889638584e-05, + "loss": 0.0597, + "step": 107130 + }, + { + "epoch": 30.13, + "learning_rate": 4.418892324992972e-05, + "loss": 0.0622, + "step": 107160 + }, + { + "epoch": 30.13, + "learning_rate": 4.417018086402399e-05, + "loss": 0.0526, + "step": 107190 + }, + { + "epoch": 30.14, + "learning_rate": 4.415143847811827e-05, + "loss": 0.0628, + "step": 107220 + }, + { + "epoch": 30.15, + "learning_rate": 4.413269609221254e-05, + "loss": 0.0547, + "step": 107250 + }, + { + "epoch": 30.16, + "learning_rate": 4.4113953706306815e-05, + "loss": 0.0574, + "step": 107280 + }, + { + "epoch": 30.17, + "learning_rate": 4.409521132040109e-05, + "loss": 0.0626, + "step": 107310 + }, + { + "epoch": 30.18, + "learning_rate": 4.4076468934495363e-05, + "loss": 0.0507, + "step": 107340 + }, + { + "epoch": 30.19, + "learning_rate": 4.405772654858964e-05, + "loss": 0.0583, + "step": 107370 + }, + { + "epoch": 30.19, + "learning_rate": 4.403898416268391e-05, + "loss": 0.0527, + "step": 107400 + }, + { + "epoch": 30.2, + "learning_rate": 4.4020241776778186e-05, + "loss": 0.0566, + "step": 107430 + }, + { + "epoch": 30.21, + "learning_rate": 4.400149939087246e-05, + "loss": 0.0619, + "step": 107460 + }, + { + "epoch": 30.22, + "learning_rate": 4.3982757004966734e-05, + "loss": 0.0497, + "step": 107490 + }, + { + "epoch": 30.23, + "learning_rate": 4.396401461906101e-05, + "loss": 0.065, + "step": 107520 + }, + { + "epoch": 30.24, + "learning_rate": 4.394527223315528e-05, + "loss": 0.0545, + "step": 107550 + }, + { + "epoch": 30.24, + "learning_rate": 4.392652984724956e-05, + "loss": 0.0627, + "step": 107580 + }, + { + "epoch": 30.25, + "learning_rate": 4.390778746134383e-05, + "loss": 0.0619, + "step": 107610 + }, + { + "epoch": 30.26, + "learning_rate": 4.3889045075438105e-05, + "loss": 0.0507, + "step": 107640 + }, + { + "epoch": 30.27, + "learning_rate": 4.387030268953238e-05, + "loss": 0.065, + "step": 107670 + }, + { + "epoch": 30.28, + "learning_rate": 4.3851560303626654e-05, + "loss": 0.0539, + "step": 107700 + }, + { + "epoch": 30.29, + "learning_rate": 4.383281791772093e-05, + "loss": 0.0633, + "step": 107730 + }, + { + "epoch": 30.3, + "learning_rate": 4.38140755318152e-05, + "loss": 0.0643, + "step": 107760 + }, + { + "epoch": 30.3, + "learning_rate": 4.3795333145909476e-05, + "loss": 0.0504, + "step": 107790 + }, + { + "epoch": 30.31, + "learning_rate": 4.377659076000375e-05, + "loss": 0.067, + "step": 107820 + }, + { + "epoch": 30.32, + "learning_rate": 4.3757848374098025e-05, + "loss": 0.0535, + "step": 107850 + }, + { + "epoch": 30.33, + "learning_rate": 4.37391059881923e-05, + "loss": 0.0572, + "step": 107880 + }, + { + "epoch": 30.34, + "learning_rate": 4.372036360228657e-05, + "loss": 0.0637, + "step": 107910 + }, + { + "epoch": 30.35, + "learning_rate": 4.370162121638085e-05, + "loss": 0.0524, + "step": 107940 + }, + { + "epoch": 30.35, + "learning_rate": 4.368287883047512e-05, + "loss": 0.0625, + "step": 107970 + }, + { + "epoch": 30.36, + "learning_rate": 4.3664136444569396e-05, + "loss": 0.0557, + "step": 108000 + }, + { + "epoch": 30.37, + "learning_rate": 4.364539405866367e-05, + "loss": 0.0586, + "step": 108030 + }, + { + "epoch": 30.38, + "learning_rate": 4.3626651672757944e-05, + "loss": 0.0632, + "step": 108060 + }, + { + "epoch": 30.39, + "learning_rate": 4.360790928685222e-05, + "loss": 0.0544, + "step": 108090 + }, + { + "epoch": 30.4, + "learning_rate": 4.358916690094649e-05, + "loss": 0.0607, + "step": 108120 + }, + { + "epoch": 30.4, + "learning_rate": 4.3570424515040767e-05, + "loss": 0.0562, + "step": 108150 + }, + { + "epoch": 30.41, + "learning_rate": 4.355168212913504e-05, + "loss": 0.0607, + "step": 108180 + }, + { + "epoch": 30.42, + "learning_rate": 4.3532939743229315e-05, + "loss": 0.0623, + "step": 108210 + }, + { + "epoch": 30.43, + "learning_rate": 4.351419735732359e-05, + "loss": 0.0517, + "step": 108240 + }, + { + "epoch": 30.44, + "learning_rate": 4.349545497141786e-05, + "loss": 0.0678, + "step": 108270 + }, + { + "epoch": 30.45, + "learning_rate": 4.347671258551214e-05, + "loss": 0.0573, + "step": 108300 + }, + { + "epoch": 30.46, + "learning_rate": 4.345797019960641e-05, + "loss": 0.0569, + "step": 108330 + }, + { + "epoch": 30.46, + "learning_rate": 4.3439227813700686e-05, + "loss": 0.0641, + "step": 108360 + }, + { + "epoch": 30.47, + "learning_rate": 4.342048542779496e-05, + "loss": 0.0539, + "step": 108390 + }, + { + "epoch": 30.48, + "learning_rate": 4.3401743041889234e-05, + "loss": 0.0618, + "step": 108420 + }, + { + "epoch": 30.49, + "learning_rate": 4.338300065598351e-05, + "loss": 0.0507, + "step": 108450 + }, + { + "epoch": 30.5, + "learning_rate": 4.336425827007778e-05, + "loss": 0.0559, + "step": 108480 + }, + { + "epoch": 30.51, + "learning_rate": 4.334551588417206e-05, + "loss": 0.061, + "step": 108510 + }, + { + "epoch": 30.51, + "learning_rate": 4.332677349826633e-05, + "loss": 0.055, + "step": 108540 + }, + { + "epoch": 30.52, + "learning_rate": 4.3308031112360605e-05, + "loss": 0.062, + "step": 108570 + }, + { + "epoch": 30.53, + "learning_rate": 4.328928872645488e-05, + "loss": 0.0527, + "step": 108600 + }, + { + "epoch": 30.54, + "learning_rate": 4.3270546340549154e-05, + "loss": 0.0614, + "step": 108630 + }, + { + "epoch": 30.55, + "learning_rate": 4.325180395464343e-05, + "loss": 0.0638, + "step": 108660 + }, + { + "epoch": 30.56, + "learning_rate": 4.32330615687377e-05, + "loss": 0.0509, + "step": 108690 + }, + { + "epoch": 30.57, + "learning_rate": 4.3214319182831976e-05, + "loss": 0.0633, + "step": 108720 + }, + { + "epoch": 30.57, + "learning_rate": 4.319557679692625e-05, + "loss": 0.0517, + "step": 108750 + }, + { + "epoch": 30.58, + "learning_rate": 4.3176834411020525e-05, + "loss": 0.0611, + "step": 108780 + }, + { + "epoch": 30.59, + "learning_rate": 4.31580920251148e-05, + "loss": 0.0646, + "step": 108810 + }, + { + "epoch": 30.6, + "learning_rate": 4.313934963920907e-05, + "loss": 0.0532, + "step": 108840 + }, + { + "epoch": 30.61, + "learning_rate": 4.312060725330335e-05, + "loss": 0.0609, + "step": 108870 + }, + { + "epoch": 30.62, + "learning_rate": 4.310186486739762e-05, + "loss": 0.0505, + "step": 108900 + }, + { + "epoch": 30.62, + "learning_rate": 4.3083122481491896e-05, + "loss": 0.0562, + "step": 108930 + }, + { + "epoch": 30.63, + "learning_rate": 4.306438009558617e-05, + "loss": 0.0602, + "step": 108960 + }, + { + "epoch": 30.64, + "learning_rate": 4.3045637709680444e-05, + "loss": 0.0536, + "step": 108990 + }, + { + "epoch": 30.65, + "learning_rate": 4.302689532377472e-05, + "loss": 0.0654, + "step": 109020 + }, + { + "epoch": 30.66, + "learning_rate": 4.300815293786899e-05, + "loss": 0.0553, + "step": 109050 + }, + { + "epoch": 30.67, + "learning_rate": 4.2989410551963266e-05, + "loss": 0.0605, + "step": 109080 + }, + { + "epoch": 30.67, + "learning_rate": 4.297066816605754e-05, + "loss": 0.0613, + "step": 109110 + }, + { + "epoch": 30.68, + "learning_rate": 4.2951925780151815e-05, + "loss": 0.0518, + "step": 109140 + }, + { + "epoch": 30.69, + "learning_rate": 4.293318339424609e-05, + "loss": 0.0615, + "step": 109170 + }, + { + "epoch": 30.7, + "learning_rate": 4.291444100834036e-05, + "loss": 0.0538, + "step": 109200 + }, + { + "epoch": 30.71, + "learning_rate": 4.289569862243464e-05, + "loss": 0.0599, + "step": 109230 + }, + { + "epoch": 30.72, + "learning_rate": 4.287695623652891e-05, + "loss": 0.0649, + "step": 109260 + }, + { + "epoch": 30.73, + "learning_rate": 4.2858838596820046e-05, + "loss": 0.0548, + "step": 109290 + }, + { + "epoch": 30.73, + "learning_rate": 4.284009621091431e-05, + "loss": 0.0622, + "step": 109320 + }, + { + "epoch": 30.74, + "learning_rate": 4.2821353825008594e-05, + "loss": 0.0531, + "step": 109350 + }, + { + "epoch": 30.75, + "learning_rate": 4.280261143910287e-05, + "loss": 0.0582, + "step": 109380 + }, + { + "epoch": 30.76, + "learning_rate": 4.278386905319714e-05, + "loss": 0.0657, + "step": 109410 + }, + { + "epoch": 30.77, + "learning_rate": 4.276512666729142e-05, + "loss": 0.0511, + "step": 109440 + }, + { + "epoch": 30.78, + "learning_rate": 4.2746384281385684e-05, + "loss": 0.0618, + "step": 109470 + }, + { + "epoch": 30.78, + "learning_rate": 4.2727641895479965e-05, + "loss": 0.0524, + "step": 109500 + }, + { + "epoch": 30.79, + "learning_rate": 4.270889950957423e-05, + "loss": 0.0595, + "step": 109530 + }, + { + "epoch": 30.8, + "learning_rate": 4.2690157123668514e-05, + "loss": 0.062, + "step": 109560 + }, + { + "epoch": 30.81, + "learning_rate": 4.267141473776279e-05, + "loss": 0.0522, + "step": 109590 + }, + { + "epoch": 30.82, + "learning_rate": 4.265267235185706e-05, + "loss": 0.0611, + "step": 109620 + }, + { + "epoch": 30.83, + "learning_rate": 4.2633929965951336e-05, + "loss": 0.0543, + "step": 109650 + }, + { + "epoch": 30.83, + "learning_rate": 4.2615187580045604e-05, + "loss": 0.0619, + "step": 109680 + }, + { + "epoch": 30.84, + "learning_rate": 4.2596445194139884e-05, + "loss": 0.064, + "step": 109710 + }, + { + "epoch": 30.85, + "learning_rate": 4.257770280823415e-05, + "loss": 0.0533, + "step": 109740 + }, + { + "epoch": 30.86, + "learning_rate": 4.255896042232843e-05, + "loss": 0.0599, + "step": 109770 + }, + { + "epoch": 30.87, + "learning_rate": 4.254021803642271e-05, + "loss": 0.0586, + "step": 109800 + }, + { + "epoch": 30.88, + "learning_rate": 4.252147565051698e-05, + "loss": 0.063, + "step": 109830 + }, + { + "epoch": 30.89, + "learning_rate": 4.2502733264611255e-05, + "loss": 0.0623, + "step": 109860 + }, + { + "epoch": 30.89, + "learning_rate": 4.248399087870553e-05, + "loss": 0.0551, + "step": 109890 + }, + { + "epoch": 30.9, + "learning_rate": 4.2465248492799804e-05, + "loss": 0.062, + "step": 109920 + }, + { + "epoch": 30.91, + "learning_rate": 4.244650610689407e-05, + "loss": 0.055, + "step": 109950 + }, + { + "epoch": 30.92, + "learning_rate": 4.242776372098835e-05, + "loss": 0.0566, + "step": 109980 + }, + { + "epoch": 30.93, + "learning_rate": 4.2409021335082626e-05, + "loss": 0.0622, + "step": 110010 + }, + { + "epoch": 30.94, + "learning_rate": 4.23902789491769e-05, + "loss": 0.0494, + "step": 110040 + }, + { + "epoch": 30.94, + "learning_rate": 4.2371536563271175e-05, + "loss": 0.0608, + "step": 110070 + }, + { + "epoch": 30.95, + "learning_rate": 4.235279417736545e-05, + "loss": 0.0536, + "step": 110100 + }, + { + "epoch": 30.96, + "learning_rate": 4.233405179145972e-05, + "loss": 0.059, + "step": 110130 + }, + { + "epoch": 30.97, + "learning_rate": 4.231530940555399e-05, + "loss": 0.0642, + "step": 110160 + }, + { + "epoch": 30.98, + "learning_rate": 4.229656701964827e-05, + "loss": 0.0514, + "step": 110190 + }, + { + "epoch": 30.99, + "learning_rate": 4.2277824633742546e-05, + "loss": 0.0651, + "step": 110220 + }, + { + "epoch": 31.0, + "learning_rate": 4.225908224783682e-05, + "loss": 0.0555, + "step": 110250 + }, + { + "epoch": 31.0, + "eval_loss": 0.11092609167098999, + "eval_runtime": 629.5598, + "eval_samples_per_second": 25.467, + "eval_steps_per_second": 0.797, + "eval_wer": 0.09900645531096038, + "step": 110267 + }, + { + "epoch": 31.0, + "learning_rate": 4.2240339861931094e-05, + "loss": 0.0594, + "step": 110280 + }, + { + "epoch": 31.01, + "learning_rate": 4.222159747602537e-05, + "loss": 0.0534, + "step": 110310 + }, + { + "epoch": 31.02, + "learning_rate": 4.220285509011964e-05, + "loss": 0.0538, + "step": 110340 + }, + { + "epoch": 31.03, + "learning_rate": 4.218411270421391e-05, + "loss": 0.0627, + "step": 110370 + }, + { + "epoch": 31.04, + "learning_rate": 4.216537031830819e-05, + "loss": 0.0524, + "step": 110400 + }, + { + "epoch": 31.05, + "learning_rate": 4.2146627932402465e-05, + "loss": 0.0592, + "step": 110430 + }, + { + "epoch": 31.05, + "learning_rate": 4.212788554649674e-05, + "loss": 0.0546, + "step": 110460 + }, + { + "epoch": 31.06, + "learning_rate": 4.2109143160591013e-05, + "loss": 0.0599, + "step": 110490 + }, + { + "epoch": 31.07, + "learning_rate": 4.209040077468529e-05, + "loss": 0.0606, + "step": 110520 + }, + { + "epoch": 31.08, + "learning_rate": 4.207165838877956e-05, + "loss": 0.0518, + "step": 110550 + }, + { + "epoch": 31.09, + "learning_rate": 4.205291600287383e-05, + "loss": 0.0596, + "step": 110580 + }, + { + "epoch": 31.1, + "learning_rate": 4.203417361696811e-05, + "loss": 0.0544, + "step": 110610 + }, + { + "epoch": 31.1, + "learning_rate": 4.2015431231062384e-05, + "loss": 0.057, + "step": 110640 + }, + { + "epoch": 31.11, + "learning_rate": 4.199668884515666e-05, + "loss": 0.0612, + "step": 110670 + }, + { + "epoch": 31.12, + "learning_rate": 4.197794645925093e-05, + "loss": 0.0543, + "step": 110700 + }, + { + "epoch": 31.13, + "learning_rate": 4.195920407334521e-05, + "loss": 0.0575, + "step": 110730 + }, + { + "epoch": 31.14, + "learning_rate": 4.194046168743948e-05, + "loss": 0.0601, + "step": 110760 + }, + { + "epoch": 31.15, + "learning_rate": 4.192171930153375e-05, + "loss": 0.0552, + "step": 110790 + }, + { + "epoch": 31.16, + "learning_rate": 4.190297691562803e-05, + "loss": 0.0655, + "step": 110820 + }, + { + "epoch": 31.16, + "learning_rate": 4.1884234529722304e-05, + "loss": 0.0502, + "step": 110850 + }, + { + "epoch": 31.17, + "learning_rate": 4.186549214381658e-05, + "loss": 0.0594, + "step": 110880 + }, + { + "epoch": 31.18, + "learning_rate": 4.184674975791085e-05, + "loss": 0.0557, + "step": 110910 + }, + { + "epoch": 31.19, + "learning_rate": 4.1828007372005126e-05, + "loss": 0.0574, + "step": 110940 + }, + { + "epoch": 31.2, + "learning_rate": 4.18092649860994e-05, + "loss": 0.0623, + "step": 110970 + }, + { + "epoch": 31.21, + "learning_rate": 4.179052260019367e-05, + "loss": 0.0511, + "step": 111000 + }, + { + "epoch": 31.21, + "learning_rate": 4.177178021428795e-05, + "loss": 0.0575, + "step": 111030 + }, + { + "epoch": 31.22, + "learning_rate": 4.175303782838222e-05, + "loss": 0.0584, + "step": 111060 + }, + { + "epoch": 31.23, + "learning_rate": 4.17342954424765e-05, + "loss": 0.0609, + "step": 111090 + }, + { + "epoch": 31.24, + "learning_rate": 4.171555305657077e-05, + "loss": 0.0667, + "step": 111120 + }, + { + "epoch": 31.25, + "learning_rate": 4.1696810670665046e-05, + "loss": 0.054, + "step": 111150 + }, + { + "epoch": 31.26, + "learning_rate": 4.167806828475932e-05, + "loss": 0.0587, + "step": 111180 + }, + { + "epoch": 31.27, + "learning_rate": 4.165932589885359e-05, + "loss": 0.0544, + "step": 111210 + }, + { + "epoch": 31.27, + "learning_rate": 4.164058351294787e-05, + "loss": 0.0553, + "step": 111240 + }, + { + "epoch": 31.28, + "learning_rate": 4.162184112704214e-05, + "loss": 0.0634, + "step": 111270 + }, + { + "epoch": 31.29, + "learning_rate": 4.1603098741136417e-05, + "loss": 0.0524, + "step": 111300 + }, + { + "epoch": 31.3, + "learning_rate": 4.1584981101427544e-05, + "loss": 0.0599, + "step": 111330 + }, + { + "epoch": 31.31, + "learning_rate": 4.156623871552182e-05, + "loss": 0.0543, + "step": 111360 + }, + { + "epoch": 31.32, + "learning_rate": 4.15474963296161e-05, + "loss": 0.0556, + "step": 111390 + }, + { + "epoch": 31.32, + "learning_rate": 4.1528753943710367e-05, + "loss": 0.0608, + "step": 111420 + }, + { + "epoch": 31.33, + "learning_rate": 4.151001155780465e-05, + "loss": 0.0509, + "step": 111450 + }, + { + "epoch": 31.34, + "learning_rate": 4.1491269171898915e-05, + "loss": 0.0619, + "step": 111480 + }, + { + "epoch": 31.35, + "learning_rate": 4.1472526785993196e-05, + "loss": 0.0556, + "step": 111510 + }, + { + "epoch": 31.36, + "learning_rate": 4.145378440008746e-05, + "loss": 0.0605, + "step": 111540 + }, + { + "epoch": 31.37, + "learning_rate": 4.143504201418174e-05, + "loss": 0.0625, + "step": 111570 + }, + { + "epoch": 31.37, + "learning_rate": 4.141629962827602e-05, + "loss": 0.0461, + "step": 111600 + }, + { + "epoch": 31.38, + "learning_rate": 4.1397557242370286e-05, + "loss": 0.0624, + "step": 111630 + }, + { + "epoch": 31.39, + "learning_rate": 4.137881485646457e-05, + "loss": 0.0548, + "step": 111660 + }, + { + "epoch": 31.4, + "learning_rate": 4.1360072470558834e-05, + "loss": 0.0564, + "step": 111690 + }, + { + "epoch": 31.41, + "learning_rate": 4.1341330084653115e-05, + "loss": 0.0626, + "step": 111720 + }, + { + "epoch": 31.42, + "learning_rate": 4.132258769874738e-05, + "loss": 0.0492, + "step": 111750 + }, + { + "epoch": 31.43, + "learning_rate": 4.130384531284166e-05, + "loss": 0.0601, + "step": 111780 + }, + { + "epoch": 31.43, + "learning_rate": 4.128510292693594e-05, + "loss": 0.0549, + "step": 111810 + }, + { + "epoch": 31.44, + "learning_rate": 4.1266360541030205e-05, + "loss": 0.057, + "step": 111840 + }, + { + "epoch": 31.45, + "learning_rate": 4.1247618155124486e-05, + "loss": 0.0615, + "step": 111870 + }, + { + "epoch": 31.46, + "learning_rate": 4.1228875769218754e-05, + "loss": 0.0492, + "step": 111900 + }, + { + "epoch": 31.47, + "learning_rate": 4.1210133383313035e-05, + "loss": 0.0618, + "step": 111930 + }, + { + "epoch": 31.48, + "learning_rate": 4.11913909974073e-05, + "loss": 0.058, + "step": 111960 + }, + { + "epoch": 31.48, + "learning_rate": 4.117264861150158e-05, + "loss": 0.0602, + "step": 111990 + }, + { + "epoch": 31.49, + "learning_rate": 4.115390622559586e-05, + "loss": 0.0634, + "step": 112020 + }, + { + "epoch": 31.5, + "learning_rate": 4.1135163839690125e-05, + "loss": 0.0531, + "step": 112050 + }, + { + "epoch": 31.51, + "learning_rate": 4.1116421453784406e-05, + "loss": 0.0623, + "step": 112080 + }, + { + "epoch": 31.52, + "learning_rate": 4.109767906787867e-05, + "loss": 0.0517, + "step": 112110 + }, + { + "epoch": 31.53, + "learning_rate": 4.1078936681972954e-05, + "loss": 0.0595, + "step": 112140 + }, + { + "epoch": 31.53, + "learning_rate": 4.106019429606722e-05, + "loss": 0.0601, + "step": 112170 + }, + { + "epoch": 31.54, + "learning_rate": 4.10414519101615e-05, + "loss": 0.0529, + "step": 112200 + }, + { + "epoch": 31.55, + "learning_rate": 4.1022709524255777e-05, + "loss": 0.0597, + "step": 112230 + }, + { + "epoch": 31.56, + "learning_rate": 4.1003967138350044e-05, + "loss": 0.0574, + "step": 112260 + }, + { + "epoch": 31.57, + "learning_rate": 4.0985224752444325e-05, + "loss": 0.0561, + "step": 112290 + }, + { + "epoch": 31.58, + "learning_rate": 4.096648236653859e-05, + "loss": 0.06, + "step": 112320 + }, + { + "epoch": 31.59, + "learning_rate": 4.094773998063287e-05, + "loss": 0.0509, + "step": 112350 + }, + { + "epoch": 31.59, + "learning_rate": 4.092899759472714e-05, + "loss": 0.0608, + "step": 112380 + }, + { + "epoch": 31.6, + "learning_rate": 4.091025520882142e-05, + "loss": 0.0557, + "step": 112410 + }, + { + "epoch": 31.61, + "learning_rate": 4.0891512822915696e-05, + "loss": 0.0584, + "step": 112440 + }, + { + "epoch": 31.62, + "learning_rate": 4.087277043700996e-05, + "loss": 0.0645, + "step": 112470 + }, + { + "epoch": 31.63, + "learning_rate": 4.0854028051104244e-05, + "loss": 0.0511, + "step": 112500 + }, + { + "epoch": 31.64, + "learning_rate": 4.083528566519851e-05, + "loss": 0.0581, + "step": 112530 + }, + { + "epoch": 31.64, + "learning_rate": 4.081654327929279e-05, + "loss": 0.057, + "step": 112560 + }, + { + "epoch": 31.65, + "learning_rate": 4.079780089338706e-05, + "loss": 0.0572, + "step": 112590 + }, + { + "epoch": 31.66, + "learning_rate": 4.077905850748134e-05, + "loss": 0.0644, + "step": 112620 + }, + { + "epoch": 31.67, + "learning_rate": 4.0760316121575615e-05, + "loss": 0.0508, + "step": 112650 + }, + { + "epoch": 31.68, + "learning_rate": 4.074157373566988e-05, + "loss": 0.0602, + "step": 112680 + }, + { + "epoch": 31.69, + "learning_rate": 4.0722831349764164e-05, + "loss": 0.0519, + "step": 112710 + }, + { + "epoch": 31.7, + "learning_rate": 4.070408896385843e-05, + "loss": 0.0558, + "step": 112740 + }, + { + "epoch": 31.7, + "learning_rate": 4.068534657795271e-05, + "loss": 0.0621, + "step": 112770 + }, + { + "epoch": 31.71, + "learning_rate": 4.066660419204698e-05, + "loss": 0.0505, + "step": 112800 + }, + { + "epoch": 31.72, + "learning_rate": 4.064786180614126e-05, + "loss": 0.0608, + "step": 112830 + }, + { + "epoch": 31.73, + "learning_rate": 4.062911942023553e-05, + "loss": 0.0554, + "step": 112860 + }, + { + "epoch": 31.74, + "learning_rate": 4.06103770343298e-05, + "loss": 0.0563, + "step": 112890 + }, + { + "epoch": 31.75, + "learning_rate": 4.059163464842408e-05, + "loss": 0.0666, + "step": 112920 + }, + { + "epoch": 31.75, + "learning_rate": 4.057289226251835e-05, + "loss": 0.0532, + "step": 112950 + }, + { + "epoch": 31.76, + "learning_rate": 4.055414987661263e-05, + "loss": 0.0572, + "step": 112980 + }, + { + "epoch": 31.77, + "learning_rate": 4.05354074907069e-05, + "loss": 0.0549, + "step": 113010 + }, + { + "epoch": 31.78, + "learning_rate": 4.051666510480118e-05, + "loss": 0.0577, + "step": 113040 + }, + { + "epoch": 31.79, + "learning_rate": 4.049792271889545e-05, + "loss": 0.0664, + "step": 113070 + }, + { + "epoch": 31.8, + "learning_rate": 4.047918033298972e-05, + "loss": 0.0488, + "step": 113100 + }, + { + "epoch": 31.8, + "learning_rate": 4.0460437947084e-05, + "loss": 0.0587, + "step": 113130 + }, + { + "epoch": 31.81, + "learning_rate": 4.044169556117827e-05, + "loss": 0.0551, + "step": 113160 + }, + { + "epoch": 31.82, + "learning_rate": 4.042295317527255e-05, + "loss": 0.0531, + "step": 113190 + }, + { + "epoch": 31.83, + "learning_rate": 4.040421078936682e-05, + "loss": 0.0628, + "step": 113220 + }, + { + "epoch": 31.84, + "learning_rate": 4.03854684034611e-05, + "loss": 0.052, + "step": 113250 + }, + { + "epoch": 31.85, + "learning_rate": 4.0366726017555366e-05, + "loss": 0.0608, + "step": 113280 + }, + { + "epoch": 31.86, + "learning_rate": 4.034798363164965e-05, + "loss": 0.0536, + "step": 113310 + }, + { + "epoch": 31.86, + "learning_rate": 4.032924124574392e-05, + "loss": 0.0582, + "step": 113340 + }, + { + "epoch": 31.87, + "learning_rate": 4.031049885983819e-05, + "loss": 0.0613, + "step": 113370 + }, + { + "epoch": 31.88, + "learning_rate": 4.029175647393247e-05, + "loss": 0.0509, + "step": 113400 + }, + { + "epoch": 31.89, + "learning_rate": 4.027301408802674e-05, + "loss": 0.0626, + "step": 113430 + }, + { + "epoch": 31.9, + "learning_rate": 4.025427170212102e-05, + "loss": 0.053, + "step": 113460 + }, + { + "epoch": 31.91, + "learning_rate": 4.0235529316215286e-05, + "loss": 0.054, + "step": 113490 + }, + { + "epoch": 31.91, + "learning_rate": 4.021678693030957e-05, + "loss": 0.0595, + "step": 113520 + }, + { + "epoch": 31.92, + "learning_rate": 4.019804454440384e-05, + "loss": 0.051, + "step": 113550 + }, + { + "epoch": 31.93, + "learning_rate": 4.017930215849811e-05, + "loss": 0.0603, + "step": 113580 + }, + { + "epoch": 31.94, + "learning_rate": 4.016055977259239e-05, + "loss": 0.055, + "step": 113610 + }, + { + "epoch": 31.95, + "learning_rate": 4.014181738668666e-05, + "loss": 0.0546, + "step": 113640 + }, + { + "epoch": 31.96, + "learning_rate": 4.012307500078094e-05, + "loss": 0.0595, + "step": 113670 + }, + { + "epoch": 31.97, + "learning_rate": 4.0104332614875205e-05, + "loss": 0.0509, + "step": 113700 + }, + { + "epoch": 31.97, + "learning_rate": 4.0085590228969486e-05, + "loss": 0.0595, + "step": 113730 + }, + { + "epoch": 31.98, + "learning_rate": 4.006684784306376e-05, + "loss": 0.0563, + "step": 113760 + }, + { + "epoch": 31.99, + "learning_rate": 4.004810545715803e-05, + "loss": 0.0582, + "step": 113790 + }, + { + "epoch": 32.0, + "learning_rate": 4.002936307125231e-05, + "loss": 0.0632, + "step": 113820 + }, + { + "epoch": 32.0, + "eval_loss": 0.11038082838058472, + "eval_runtime": 633.2401, + "eval_samples_per_second": 25.319, + "eval_steps_per_second": 0.793, + "eval_wer": 0.09773722926589604, + "step": 113824 + }, + { + "epoch": 32.01, + "learning_rate": 4.0010620685346576e-05, + "loss": 0.0504, + "step": 113850 + }, + { + "epoch": 32.02, + "learning_rate": 3.999187829944086e-05, + "loss": 0.0617, + "step": 113880 + }, + { + "epoch": 32.02, + "learning_rate": 3.9973135913535124e-05, + "loss": 0.0508, + "step": 113910 + }, + { + "epoch": 32.03, + "learning_rate": 3.9954393527629405e-05, + "loss": 0.0602, + "step": 113940 + }, + { + "epoch": 32.04, + "learning_rate": 3.993627588792053e-05, + "loss": 0.0588, + "step": 113970 + }, + { + "epoch": 32.05, + "learning_rate": 3.991753350201481e-05, + "loss": 0.0533, + "step": 114000 + }, + { + "epoch": 32.06, + "learning_rate": 3.989879111610908e-05, + "loss": 0.0574, + "step": 114030 + }, + { + "epoch": 32.07, + "learning_rate": 3.9880048730203355e-05, + "loss": 0.0511, + "step": 114060 + }, + { + "epoch": 32.07, + "learning_rate": 3.9861306344297636e-05, + "loss": 0.0627, + "step": 114090 + }, + { + "epoch": 32.08, + "learning_rate": 3.9842563958391904e-05, + "loss": 0.0528, + "step": 114120 + }, + { + "epoch": 32.09, + "learning_rate": 3.982382157248618e-05, + "loss": 0.0575, + "step": 114150 + }, + { + "epoch": 32.1, + "learning_rate": 3.980507918658045e-05, + "loss": 0.0627, + "step": 114180 + }, + { + "epoch": 32.11, + "learning_rate": 3.9786336800674726e-05, + "loss": 0.0525, + "step": 114210 + }, + { + "epoch": 32.12, + "learning_rate": 3.9767594414769e-05, + "loss": 0.0617, + "step": 114240 + }, + { + "epoch": 32.13, + "learning_rate": 3.9748852028863275e-05, + "loss": 0.0543, + "step": 114270 + }, + { + "epoch": 32.13, + "learning_rate": 3.9730109642957556e-05, + "loss": 0.052, + "step": 114300 + }, + { + "epoch": 32.14, + "learning_rate": 3.971199200324868e-05, + "loss": 0.0661, + "step": 114330 + }, + { + "epoch": 32.15, + "learning_rate": 3.969324961734295e-05, + "loss": 0.0487, + "step": 114360 + }, + { + "epoch": 32.16, + "learning_rate": 3.967450723143723e-05, + "loss": 0.0601, + "step": 114390 + }, + { + "epoch": 32.17, + "learning_rate": 3.9655764845531506e-05, + "loss": 0.0603, + "step": 114420 + }, + { + "epoch": 32.18, + "learning_rate": 3.963702245962578e-05, + "loss": 0.0572, + "step": 114450 + }, + { + "epoch": 32.18, + "learning_rate": 3.9618280073720054e-05, + "loss": 0.0645, + "step": 114480 + }, + { + "epoch": 32.19, + "learning_rate": 3.959953768781433e-05, + "loss": 0.0547, + "step": 114510 + }, + { + "epoch": 32.2, + "learning_rate": 3.95807953019086e-05, + "loss": 0.0625, + "step": 114540 + }, + { + "epoch": 32.21, + "learning_rate": 3.956205291600287e-05, + "loss": 0.0578, + "step": 114570 + }, + { + "epoch": 32.22, + "learning_rate": 3.954331053009715e-05, + "loss": 0.0556, + "step": 114600 + }, + { + "epoch": 32.23, + "learning_rate": 3.9524568144191425e-05, + "loss": 0.0583, + "step": 114630 + }, + { + "epoch": 32.23, + "learning_rate": 3.95058257582857e-05, + "loss": 0.0506, + "step": 114660 + }, + { + "epoch": 32.24, + "learning_rate": 3.9487083372379973e-05, + "loss": 0.0577, + "step": 114690 + }, + { + "epoch": 32.25, + "learning_rate": 3.946834098647425e-05, + "loss": 0.053, + "step": 114720 + }, + { + "epoch": 32.26, + "learning_rate": 3.944959860056852e-05, + "loss": 0.0532, + "step": 114750 + }, + { + "epoch": 32.27, + "learning_rate": 3.943085621466279e-05, + "loss": 0.0612, + "step": 114780 + }, + { + "epoch": 32.28, + "learning_rate": 3.941211382875707e-05, + "loss": 0.0496, + "step": 114810 + }, + { + "epoch": 32.29, + "learning_rate": 3.9393371442851344e-05, + "loss": 0.0563, + "step": 114840 + }, + { + "epoch": 32.29, + "learning_rate": 3.937462905694562e-05, + "loss": 0.0581, + "step": 114870 + }, + { + "epoch": 32.3, + "learning_rate": 3.935588667103989e-05, + "loss": 0.0554, + "step": 114900 + }, + { + "epoch": 32.31, + "learning_rate": 3.933714428513417e-05, + "loss": 0.06, + "step": 114930 + }, + { + "epoch": 32.32, + "learning_rate": 3.931840189922844e-05, + "loss": 0.0559, + "step": 114960 + }, + { + "epoch": 32.33, + "learning_rate": 3.929965951332271e-05, + "loss": 0.0615, + "step": 114990 + }, + { + "epoch": 32.34, + "learning_rate": 3.928091712741699e-05, + "loss": 0.0545, + "step": 115020 + }, + { + "epoch": 32.34, + "learning_rate": 3.9262174741511264e-05, + "loss": 0.0539, + "step": 115050 + }, + { + "epoch": 32.35, + "learning_rate": 3.924343235560554e-05, + "loss": 0.0599, + "step": 115080 + }, + { + "epoch": 32.36, + "learning_rate": 3.922468996969981e-05, + "loss": 0.0564, + "step": 115110 + }, + { + "epoch": 32.37, + "learning_rate": 3.9205947583794086e-05, + "loss": 0.0606, + "step": 115140 + }, + { + "epoch": 32.38, + "learning_rate": 3.918720519788836e-05, + "loss": 0.0537, + "step": 115170 + }, + { + "epoch": 32.39, + "learning_rate": 3.9168462811982635e-05, + "loss": 0.0543, + "step": 115200 + }, + { + "epoch": 32.4, + "learning_rate": 3.914972042607691e-05, + "loss": 0.0571, + "step": 115230 + }, + { + "epoch": 32.4, + "learning_rate": 3.913097804017118e-05, + "loss": 0.0523, + "step": 115260 + }, + { + "epoch": 32.41, + "learning_rate": 3.911223565426546e-05, + "loss": 0.0582, + "step": 115290 + }, + { + "epoch": 32.42, + "learning_rate": 3.909349326835973e-05, + "loss": 0.0581, + "step": 115320 + }, + { + "epoch": 32.43, + "learning_rate": 3.9074750882454006e-05, + "loss": 0.0543, + "step": 115350 + }, + { + "epoch": 32.44, + "learning_rate": 3.905600849654828e-05, + "loss": 0.0595, + "step": 115380 + }, + { + "epoch": 32.45, + "learning_rate": 3.9037266110642554e-05, + "loss": 0.0531, + "step": 115410 + }, + { + "epoch": 32.45, + "learning_rate": 3.901852372473683e-05, + "loss": 0.0582, + "step": 115440 + }, + { + "epoch": 32.46, + "learning_rate": 3.89997813388311e-05, + "loss": 0.0541, + "step": 115470 + }, + { + "epoch": 32.47, + "learning_rate": 3.8981038952925377e-05, + "loss": 0.0542, + "step": 115500 + }, + { + "epoch": 32.48, + "learning_rate": 3.896229656701965e-05, + "loss": 0.0615, + "step": 115530 + }, + { + "epoch": 32.49, + "learning_rate": 3.8943554181113925e-05, + "loss": 0.049, + "step": 115560 + }, + { + "epoch": 32.5, + "learning_rate": 3.89248117952082e-05, + "loss": 0.0594, + "step": 115590 + }, + { + "epoch": 32.5, + "learning_rate": 3.890606940930247e-05, + "loss": 0.0563, + "step": 115620 + }, + { + "epoch": 32.51, + "learning_rate": 3.888732702339675e-05, + "loss": 0.0565, + "step": 115650 + }, + { + "epoch": 32.52, + "learning_rate": 3.886858463749102e-05, + "loss": 0.0573, + "step": 115680 + }, + { + "epoch": 32.53, + "learning_rate": 3.8849842251585296e-05, + "loss": 0.0513, + "step": 115710 + }, + { + "epoch": 32.54, + "learning_rate": 3.883109986567957e-05, + "loss": 0.0586, + "step": 115740 + }, + { + "epoch": 32.55, + "learning_rate": 3.8812357479773844e-05, + "loss": 0.054, + "step": 115770 + }, + { + "epoch": 32.56, + "learning_rate": 3.879361509386812e-05, + "loss": 0.0551, + "step": 115800 + }, + { + "epoch": 32.56, + "learning_rate": 3.877487270796239e-05, + "loss": 0.055, + "step": 115830 + }, + { + "epoch": 32.57, + "learning_rate": 3.875613032205667e-05, + "loss": 0.0527, + "step": 115860 + }, + { + "epoch": 32.58, + "learning_rate": 3.873738793615094e-05, + "loss": 0.0583, + "step": 115890 + }, + { + "epoch": 32.59, + "learning_rate": 3.8718645550245215e-05, + "loss": 0.0554, + "step": 115920 + }, + { + "epoch": 32.6, + "learning_rate": 3.869990316433949e-05, + "loss": 0.0517, + "step": 115950 + }, + { + "epoch": 32.61, + "learning_rate": 3.8681160778433764e-05, + "loss": 0.0564, + "step": 115980 + }, + { + "epoch": 32.61, + "learning_rate": 3.866241839252804e-05, + "loss": 0.0497, + "step": 116010 + }, + { + "epoch": 32.62, + "learning_rate": 3.864367600662231e-05, + "loss": 0.0574, + "step": 116040 + }, + { + "epoch": 32.63, + "learning_rate": 3.8624933620716586e-05, + "loss": 0.0567, + "step": 116070 + }, + { + "epoch": 32.64, + "learning_rate": 3.860619123481086e-05, + "loss": 0.0532, + "step": 116100 + }, + { + "epoch": 32.65, + "learning_rate": 3.8587448848905135e-05, + "loss": 0.0578, + "step": 116130 + }, + { + "epoch": 32.66, + "learning_rate": 3.856870646299941e-05, + "loss": 0.0517, + "step": 116160 + }, + { + "epoch": 32.67, + "learning_rate": 3.854996407709368e-05, + "loss": 0.0601, + "step": 116190 + }, + { + "epoch": 32.67, + "learning_rate": 3.853122169118796e-05, + "loss": 0.0559, + "step": 116220 + }, + { + "epoch": 32.68, + "learning_rate": 3.851247930528223e-05, + "loss": 0.0551, + "step": 116250 + }, + { + "epoch": 32.69, + "learning_rate": 3.8493736919376506e-05, + "loss": 0.0584, + "step": 116280 + }, + { + "epoch": 32.7, + "learning_rate": 3.847499453347078e-05, + "loss": 0.0491, + "step": 116310 + }, + { + "epoch": 32.71, + "learning_rate": 3.8456252147565054e-05, + "loss": 0.0582, + "step": 116340 + }, + { + "epoch": 32.72, + "learning_rate": 3.843750976165933e-05, + "loss": 0.0589, + "step": 116370 + }, + { + "epoch": 32.72, + "learning_rate": 3.84187673757536e-05, + "loss": 0.051, + "step": 116400 + }, + { + "epoch": 32.73, + "learning_rate": 3.8400024989847876e-05, + "loss": 0.0578, + "step": 116430 + }, + { + "epoch": 32.74, + "learning_rate": 3.838128260394215e-05, + "loss": 0.0514, + "step": 116460 + }, + { + "epoch": 32.75, + "learning_rate": 3.8362540218036425e-05, + "loss": 0.0612, + "step": 116490 + }, + { + "epoch": 32.76, + "learning_rate": 3.83437978321307e-05, + "loss": 0.0564, + "step": 116520 + }, + { + "epoch": 32.77, + "learning_rate": 3.832505544622497e-05, + "loss": 0.0524, + "step": 116550 + }, + { + "epoch": 32.77, + "learning_rate": 3.830631306031925e-05, + "loss": 0.057, + "step": 116580 + }, + { + "epoch": 32.78, + "learning_rate": 3.828757067441352e-05, + "loss": 0.0519, + "step": 116610 + }, + { + "epoch": 32.79, + "learning_rate": 3.8268828288507796e-05, + "loss": 0.0581, + "step": 116640 + }, + { + "epoch": 32.8, + "learning_rate": 3.825008590260207e-05, + "loss": 0.0558, + "step": 116670 + }, + { + "epoch": 32.81, + "learning_rate": 3.8231343516696344e-05, + "loss": 0.051, + "step": 116700 + }, + { + "epoch": 32.82, + "learning_rate": 3.821260113079062e-05, + "loss": 0.0598, + "step": 116730 + }, + { + "epoch": 32.83, + "learning_rate": 3.819385874488489e-05, + "loss": 0.0492, + "step": 116760 + }, + { + "epoch": 32.83, + "learning_rate": 3.817511635897917e-05, + "loss": 0.0579, + "step": 116790 + }, + { + "epoch": 32.84, + "learning_rate": 3.815637397307344e-05, + "loss": 0.0546, + "step": 116820 + }, + { + "epoch": 32.85, + "learning_rate": 3.8137631587167715e-05, + "loss": 0.0526, + "step": 116850 + }, + { + "epoch": 32.86, + "learning_rate": 3.811888920126199e-05, + "loss": 0.0613, + "step": 116880 + }, + { + "epoch": 32.87, + "learning_rate": 3.8100146815356264e-05, + "loss": 0.0539, + "step": 116910 + }, + { + "epoch": 32.88, + "learning_rate": 3.808140442945054e-05, + "loss": 0.0537, + "step": 116940 + }, + { + "epoch": 32.88, + "learning_rate": 3.806266204354481e-05, + "loss": 0.0543, + "step": 116970 + }, + { + "epoch": 32.89, + "learning_rate": 3.8043919657639086e-05, + "loss": 0.0539, + "step": 117000 + }, + { + "epoch": 32.9, + "learning_rate": 3.802517727173336e-05, + "loss": 0.0607, + "step": 117030 + }, + { + "epoch": 32.91, + "learning_rate": 3.8006434885827634e-05, + "loss": 0.0501, + "step": 117060 + }, + { + "epoch": 32.92, + "learning_rate": 3.798831724611877e-05, + "loss": 0.0597, + "step": 117090 + }, + { + "epoch": 32.93, + "learning_rate": 3.796957486021304e-05, + "loss": 0.0578, + "step": 117120 + }, + { + "epoch": 32.93, + "learning_rate": 3.795083247430731e-05, + "loss": 0.0534, + "step": 117150 + }, + { + "epoch": 32.94, + "learning_rate": 3.793209008840159e-05, + "loss": 0.063, + "step": 117180 + }, + { + "epoch": 32.95, + "learning_rate": 3.791334770249586e-05, + "loss": 0.0546, + "step": 117210 + }, + { + "epoch": 32.96, + "learning_rate": 3.789460531659014e-05, + "loss": 0.0554, + "step": 117240 + }, + { + "epoch": 32.97, + "learning_rate": 3.7875862930684414e-05, + "loss": 0.0541, + "step": 117270 + }, + { + "epoch": 32.98, + "learning_rate": 3.785712054477869e-05, + "loss": 0.0536, + "step": 117300 + }, + { + "epoch": 32.99, + "learning_rate": 3.783837815887296e-05, + "loss": 0.0595, + "step": 117330 + }, + { + "epoch": 32.99, + "learning_rate": 3.781963577296723e-05, + "loss": 0.0482, + "step": 117360 + }, + { + "epoch": 33.0, + "eval_loss": 0.1107897162437439, + "eval_runtime": 635.0944, + "eval_samples_per_second": 25.245, + "eval_steps_per_second": 0.79, + "eval_wer": 0.09579244742265228, + "step": 117381 + } + ], + "max_steps": 177850, + "num_train_epochs": 50, + "total_flos": 2.5993382597195276e+21, + "trial_name": null, + "trial_params": null +}