voidful's picture
update model train librispeech 960h
00841b1
raw
history blame contribute delete
No virus
31 kB
{
"best_metric": 0.15721334517002106,
"best_model_checkpoint": "voidful/wav2vec2-xlsr-53-espeak-librispeech-ft-all/checkpoint-2400",
"epoch": 0.35046728971962615,
"global_step": 2400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 2.34e-05,
"loss": 0.2473,
"step": 10
},
{
"epoch": 0.0,
"learning_rate": 4.68e-05,
"loss": 0.2506,
"step": 20
},
{
"epoch": 0.0,
"learning_rate": 7.02e-05,
"loss": 0.2243,
"step": 30
},
{
"epoch": 0.01,
"learning_rate": 9.36e-05,
"loss": 0.2569,
"step": 40
},
{
"epoch": 0.01,
"learning_rate": 0.000117,
"loss": 0.429,
"step": 50
},
{
"epoch": 0.01,
"learning_rate": 0.0001404,
"loss": 0.2216,
"step": 60
},
{
"epoch": 0.01,
"learning_rate": 0.0001638,
"loss": 0.2044,
"step": 70
},
{
"epoch": 0.01,
"learning_rate": 0.0001872,
"loss": 0.2037,
"step": 80
},
{
"epoch": 0.01,
"learning_rate": 0.0002106,
"loss": 0.2444,
"step": 90
},
{
"epoch": 0.01,
"learning_rate": 0.000234,
"loss": 0.4259,
"step": 100
},
{
"epoch": 0.02,
"learning_rate": 0.00023399430352013243,
"loss": 0.2284,
"step": 110
},
{
"epoch": 0.02,
"learning_rate": 0.00023398860704026487,
"loss": 0.2131,
"step": 120
},
{
"epoch": 0.02,
"learning_rate": 0.00023398291056039728,
"loss": 0.2125,
"step": 130
},
{
"epoch": 0.02,
"learning_rate": 0.0002339772140805297,
"loss": 0.2449,
"step": 140
},
{
"epoch": 0.02,
"learning_rate": 0.00023397151760066215,
"loss": 0.3585,
"step": 150
},
{
"epoch": 0.02,
"learning_rate": 0.00023396582112079458,
"loss": 0.2464,
"step": 160
},
{
"epoch": 0.02,
"learning_rate": 0.00023396012464092702,
"loss": 0.2342,
"step": 170
},
{
"epoch": 0.03,
"learning_rate": 0.00023395442816105943,
"loss": 0.2261,
"step": 180
},
{
"epoch": 0.03,
"learning_rate": 0.00023394873168119186,
"loss": 0.2682,
"step": 190
},
{
"epoch": 0.03,
"learning_rate": 0.0002339430352013243,
"loss": 0.3853,
"step": 200
},
{
"epoch": 0.03,
"learning_rate": 0.00023393733872145673,
"loss": 0.2098,
"step": 210
},
{
"epoch": 0.03,
"learning_rate": 0.00023393164224158917,
"loss": 0.2502,
"step": 220
},
{
"epoch": 0.03,
"learning_rate": 0.00023392594576172158,
"loss": 0.2289,
"step": 230
},
{
"epoch": 0.04,
"learning_rate": 0.000233920249281854,
"loss": 0.2539,
"step": 240
},
{
"epoch": 0.04,
"learning_rate": 0.00023391455280198645,
"loss": 0.3958,
"step": 250
},
{
"epoch": 0.04,
"learning_rate": 0.00023390885632211888,
"loss": 0.2165,
"step": 260
},
{
"epoch": 0.04,
"learning_rate": 0.00023390315984225135,
"loss": 0.215,
"step": 270
},
{
"epoch": 0.04,
"learning_rate": 0.00023389746336238375,
"loss": 0.2255,
"step": 280
},
{
"epoch": 0.04,
"learning_rate": 0.0002338917668825162,
"loss": 0.2072,
"step": 290
},
{
"epoch": 0.04,
"learning_rate": 0.00023388607040264863,
"loss": 0.3403,
"step": 300
},
{
"epoch": 0.05,
"learning_rate": 0.00023388037392278106,
"loss": 0.2147,
"step": 310
},
{
"epoch": 0.05,
"learning_rate": 0.0002338746774429135,
"loss": 0.1936,
"step": 320
},
{
"epoch": 0.05,
"learning_rate": 0.0002338689809630459,
"loss": 0.2352,
"step": 330
},
{
"epoch": 0.05,
"learning_rate": 0.00023386328448317834,
"loss": 0.2696,
"step": 340
},
{
"epoch": 0.05,
"learning_rate": 0.00023385758800331078,
"loss": 0.3343,
"step": 350
},
{
"epoch": 0.05,
"learning_rate": 0.0002338518915234432,
"loss": 0.202,
"step": 360
},
{
"epoch": 0.05,
"learning_rate": 0.00023384619504357565,
"loss": 0.2138,
"step": 370
},
{
"epoch": 0.06,
"learning_rate": 0.00023384049856370806,
"loss": 0.2142,
"step": 380
},
{
"epoch": 0.06,
"learning_rate": 0.0002338348020838405,
"loss": 0.2535,
"step": 390
},
{
"epoch": 0.06,
"learning_rate": 0.00023382910560397293,
"loss": 0.392,
"step": 400
},
{
"epoch": 0.06,
"eval_cer": 0.13186392030593033,
"eval_loss": 0.17454230785369873,
"eval_runtime": 360.3554,
"eval_samples_per_second": 14.516,
"eval_steps_per_second": 0.486,
"eval_wer": 0.9709424584209521,
"step": 400
},
{
"epoch": 0.06,
"learning_rate": 0.00023382340912410536,
"loss": 0.225,
"step": 410
},
{
"epoch": 0.06,
"learning_rate": 0.0002338177126442378,
"loss": 0.2077,
"step": 420
},
{
"epoch": 0.06,
"learning_rate": 0.0002338120161643702,
"loss": 0.2306,
"step": 430
},
{
"epoch": 0.06,
"learning_rate": 0.00023380631968450264,
"loss": 0.2642,
"step": 440
},
{
"epoch": 0.07,
"learning_rate": 0.00023380119285262182,
"loss": 0.3968,
"step": 450
},
{
"epoch": 0.07,
"learning_rate": 0.00023379549637275425,
"loss": 0.1817,
"step": 460
},
{
"epoch": 0.07,
"learning_rate": 0.0002337897998928867,
"loss": 0.2048,
"step": 470
},
{
"epoch": 0.07,
"learning_rate": 0.00023378410341301912,
"loss": 0.211,
"step": 480
},
{
"epoch": 0.07,
"learning_rate": 0.00023377840693315156,
"loss": 0.2555,
"step": 490
},
{
"epoch": 0.07,
"learning_rate": 0.000233772710453284,
"loss": 0.3959,
"step": 500
},
{
"epoch": 0.07,
"learning_rate": 0.00023376701397341643,
"loss": 0.2082,
"step": 510
},
{
"epoch": 0.08,
"learning_rate": 0.00023376131749354887,
"loss": 0.1888,
"step": 520
},
{
"epoch": 0.08,
"learning_rate": 0.0002337556210136813,
"loss": 0.2242,
"step": 530
},
{
"epoch": 0.08,
"learning_rate": 0.0002337499245338137,
"loss": 0.2365,
"step": 540
},
{
"epoch": 0.08,
"learning_rate": 0.00023374422805394615,
"loss": 0.3182,
"step": 550
},
{
"epoch": 0.08,
"learning_rate": 0.00023373853157407858,
"loss": 0.2074,
"step": 560
},
{
"epoch": 0.08,
"learning_rate": 0.00023373283509421102,
"loss": 0.2005,
"step": 570
},
{
"epoch": 0.08,
"learning_rate": 0.00023372713861434345,
"loss": 0.2163,
"step": 580
},
{
"epoch": 0.09,
"learning_rate": 0.0002337214421344759,
"loss": 0.2461,
"step": 590
},
{
"epoch": 0.09,
"learning_rate": 0.0002337157456546083,
"loss": 0.3741,
"step": 600
},
{
"epoch": 0.09,
"learning_rate": 0.00023371061882272747,
"loss": 0.21,
"step": 610
},
{
"epoch": 0.09,
"learning_rate": 0.0002337049223428599,
"loss": 0.2095,
"step": 620
},
{
"epoch": 0.09,
"learning_rate": 0.00023369922586299234,
"loss": 0.1971,
"step": 630
},
{
"epoch": 0.09,
"learning_rate": 0.00023369352938312478,
"loss": 0.2462,
"step": 640
},
{
"epoch": 0.09,
"learning_rate": 0.00023368783290325722,
"loss": 0.3378,
"step": 650
},
{
"epoch": 0.1,
"learning_rate": 0.00023368213642338962,
"loss": 0.2211,
"step": 660
},
{
"epoch": 0.1,
"learning_rate": 0.00023367643994352206,
"loss": 0.1843,
"step": 670
},
{
"epoch": 0.1,
"learning_rate": 0.0002336707434636545,
"loss": 0.198,
"step": 680
},
{
"epoch": 0.1,
"learning_rate": 0.00023366504698378693,
"loss": 0.2688,
"step": 690
},
{
"epoch": 0.1,
"learning_rate": 0.00023365935050391937,
"loss": 0.3775,
"step": 700
},
{
"epoch": 0.1,
"learning_rate": 0.00023365365402405177,
"loss": 0.1945,
"step": 710
},
{
"epoch": 0.11,
"learning_rate": 0.00023364795754418424,
"loss": 0.2172,
"step": 720
},
{
"epoch": 0.11,
"learning_rate": 0.00023364226106431667,
"loss": 0.2145,
"step": 730
},
{
"epoch": 0.11,
"learning_rate": 0.0002336365645844491,
"loss": 0.2712,
"step": 740
},
{
"epoch": 0.11,
"learning_rate": 0.00023363086810458154,
"loss": 0.3371,
"step": 750
},
{
"epoch": 0.11,
"learning_rate": 0.00023362517162471395,
"loss": 0.2176,
"step": 760
},
{
"epoch": 0.11,
"learning_rate": 0.0002336194751448464,
"loss": 0.1926,
"step": 770
},
{
"epoch": 0.11,
"learning_rate": 0.00023361377866497882,
"loss": 0.2002,
"step": 780
},
{
"epoch": 0.12,
"learning_rate": 0.00023360808218511126,
"loss": 0.2345,
"step": 790
},
{
"epoch": 0.12,
"learning_rate": 0.0002336023857052437,
"loss": 0.3921,
"step": 800
},
{
"epoch": 0.12,
"eval_cer": 0.10110303888191077,
"eval_loss": 0.17119961977005005,
"eval_runtime": 359.8523,
"eval_samples_per_second": 14.537,
"eval_steps_per_second": 0.486,
"eval_wer": 0.941884916841904,
"step": 800
},
{
"epoch": 0.12,
"learning_rate": 0.0002335966892253761,
"loss": 0.2154,
"step": 810
},
{
"epoch": 0.12,
"learning_rate": 0.00023359099274550854,
"loss": 0.213,
"step": 820
},
{
"epoch": 0.12,
"learning_rate": 0.00023358529626564097,
"loss": 0.1914,
"step": 830
},
{
"epoch": 0.12,
"learning_rate": 0.0002335795997857734,
"loss": 0.2188,
"step": 840
},
{
"epoch": 0.12,
"learning_rate": 0.00023357390330590585,
"loss": 0.344,
"step": 850
},
{
"epoch": 0.13,
"learning_rate": 0.00023356820682603825,
"loss": 0.1963,
"step": 860
},
{
"epoch": 0.13,
"learning_rate": 0.0002335625103461707,
"loss": 0.198,
"step": 870
},
{
"epoch": 0.13,
"learning_rate": 0.00023355681386630312,
"loss": 0.2368,
"step": 880
},
{
"epoch": 0.13,
"learning_rate": 0.00023355111738643556,
"loss": 0.2333,
"step": 890
},
{
"epoch": 0.13,
"learning_rate": 0.000233545420906568,
"loss": 0.3454,
"step": 900
},
{
"epoch": 0.13,
"learning_rate": 0.0002335397244267004,
"loss": 0.21,
"step": 910
},
{
"epoch": 0.13,
"learning_rate": 0.00023353402794683284,
"loss": 0.1849,
"step": 920
},
{
"epoch": 0.14,
"learning_rate": 0.00023352833146696528,
"loss": 0.1982,
"step": 930
},
{
"epoch": 0.14,
"learning_rate": 0.0002335226349870977,
"loss": 0.2371,
"step": 940
},
{
"epoch": 0.14,
"learning_rate": 0.00023351750815521691,
"loss": 0.346,
"step": 950
},
{
"epoch": 0.14,
"learning_rate": 0.00023351181167534935,
"loss": 0.2024,
"step": 960
},
{
"epoch": 0.14,
"learning_rate": 0.00023350611519548179,
"loss": 0.1852,
"step": 970
},
{
"epoch": 0.14,
"learning_rate": 0.0002335004187156142,
"loss": 0.2196,
"step": 980
},
{
"epoch": 0.14,
"learning_rate": 0.00023349472223574663,
"loss": 0.2333,
"step": 990
},
{
"epoch": 0.15,
"learning_rate": 0.00023348902575587906,
"loss": 0.3275,
"step": 1000
},
{
"epoch": 0.15,
"learning_rate": 0.0002334833292760115,
"loss": 0.1848,
"step": 1010
},
{
"epoch": 0.15,
"learning_rate": 0.00023347763279614394,
"loss": 0.1784,
"step": 1020
},
{
"epoch": 0.15,
"learning_rate": 0.00023347193631627634,
"loss": 0.1954,
"step": 1030
},
{
"epoch": 0.15,
"learning_rate": 0.00023346623983640878,
"loss": 0.211,
"step": 1040
},
{
"epoch": 0.15,
"learning_rate": 0.00023346054335654122,
"loss": 0.3037,
"step": 1050
},
{
"epoch": 0.15,
"learning_rate": 0.00023345484687667365,
"loss": 0.2249,
"step": 1060
},
{
"epoch": 0.16,
"learning_rate": 0.0002334491503968061,
"loss": 0.1877,
"step": 1070
},
{
"epoch": 0.16,
"learning_rate": 0.0002334434539169385,
"loss": 0.1877,
"step": 1080
},
{
"epoch": 0.16,
"learning_rate": 0.00023343775743707093,
"loss": 0.2514,
"step": 1090
},
{
"epoch": 0.16,
"learning_rate": 0.00023343206095720337,
"loss": 0.3478,
"step": 1100
},
{
"epoch": 0.16,
"learning_rate": 0.0002334263644773358,
"loss": 0.2016,
"step": 1110
},
{
"epoch": 0.16,
"learning_rate": 0.00023342066799746824,
"loss": 0.1919,
"step": 1120
},
{
"epoch": 0.17,
"learning_rate": 0.00023341497151760065,
"loss": 0.2027,
"step": 1130
},
{
"epoch": 0.17,
"learning_rate": 0.00023340927503773308,
"loss": 0.2362,
"step": 1140
},
{
"epoch": 0.17,
"learning_rate": 0.00023340357855786552,
"loss": 0.3776,
"step": 1150
},
{
"epoch": 0.17,
"learning_rate": 0.00023339788207799795,
"loss": 0.2072,
"step": 1160
},
{
"epoch": 0.17,
"learning_rate": 0.0002333921855981304,
"loss": 0.21,
"step": 1170
},
{
"epoch": 0.17,
"learning_rate": 0.0002333864891182628,
"loss": 0.2136,
"step": 1180
},
{
"epoch": 0.17,
"learning_rate": 0.00023338079263839523,
"loss": 0.2236,
"step": 1190
},
{
"epoch": 0.18,
"learning_rate": 0.00023337509615852767,
"loss": 0.3523,
"step": 1200
},
{
"epoch": 0.18,
"eval_cer": 0.10916811901518182,
"eval_loss": 0.16797101497650146,
"eval_runtime": 357.2006,
"eval_samples_per_second": 14.644,
"eval_steps_per_second": 0.49,
"eval_wer": 0.9625310648059644,
"step": 1200
},
{
"epoch": 0.18,
"learning_rate": 0.0002333693996786601,
"loss": 0.1918,
"step": 1210
},
{
"epoch": 0.18,
"learning_rate": 0.00023336370319879254,
"loss": 0.2046,
"step": 1220
},
{
"epoch": 0.18,
"learning_rate": 0.00023335800671892495,
"loss": 0.2033,
"step": 1230
},
{
"epoch": 0.18,
"learning_rate": 0.00023335231023905738,
"loss": 0.2217,
"step": 1240
},
{
"epoch": 0.18,
"learning_rate": 0.00023334661375918982,
"loss": 0.332,
"step": 1250
},
{
"epoch": 0.18,
"learning_rate": 0.00023334091727932228,
"loss": 0.2168,
"step": 1260
},
{
"epoch": 0.19,
"learning_rate": 0.00023333522079945472,
"loss": 0.1957,
"step": 1270
},
{
"epoch": 0.19,
"learning_rate": 0.00023332952431958713,
"loss": 0.1912,
"step": 1280
},
{
"epoch": 0.19,
"learning_rate": 0.00023332382783971956,
"loss": 0.2479,
"step": 1290
},
{
"epoch": 0.19,
"learning_rate": 0.000233318131359852,
"loss": 0.3616,
"step": 1300
},
{
"epoch": 0.19,
"learning_rate": 0.00023331243487998443,
"loss": 0.2171,
"step": 1310
},
{
"epoch": 0.19,
"learning_rate": 0.00023330673840011687,
"loss": 0.1931,
"step": 1320
},
{
"epoch": 0.19,
"learning_rate": 0.00023330104192024928,
"loss": 0.2406,
"step": 1330
},
{
"epoch": 0.2,
"learning_rate": 0.0002332953454403817,
"loss": 0.2337,
"step": 1340
},
{
"epoch": 0.2,
"learning_rate": 0.00023328964896051415,
"loss": 0.3704,
"step": 1350
},
{
"epoch": 0.2,
"learning_rate": 0.00023328395248064658,
"loss": 0.2246,
"step": 1360
},
{
"epoch": 0.2,
"learning_rate": 0.00023327825600077902,
"loss": 0.2027,
"step": 1370
},
{
"epoch": 0.2,
"learning_rate": 0.00023327255952091143,
"loss": 0.2162,
"step": 1380
},
{
"epoch": 0.2,
"learning_rate": 0.00023326686304104386,
"loss": 0.238,
"step": 1390
},
{
"epoch": 0.2,
"learning_rate": 0.0002332611665611763,
"loss": 0.3327,
"step": 1400
},
{
"epoch": 0.21,
"learning_rate": 0.00023325547008130873,
"loss": 0.2206,
"step": 1410
},
{
"epoch": 0.21,
"learning_rate": 0.00023324977360144117,
"loss": 0.2087,
"step": 1420
},
{
"epoch": 0.21,
"learning_rate": 0.00023324407712157358,
"loss": 0.2095,
"step": 1430
},
{
"epoch": 0.21,
"learning_rate": 0.000233238380641706,
"loss": 0.2335,
"step": 1440
},
{
"epoch": 0.21,
"learning_rate": 0.00023323268416183845,
"loss": 0.3777,
"step": 1450
},
{
"epoch": 0.21,
"learning_rate": 0.00023322698768197088,
"loss": 0.1873,
"step": 1460
},
{
"epoch": 0.21,
"learning_rate": 0.00023322129120210332,
"loss": 0.1953,
"step": 1470
},
{
"epoch": 0.22,
"learning_rate": 0.00023321559472223573,
"loss": 0.2137,
"step": 1480
},
{
"epoch": 0.22,
"learning_rate": 0.00023320989824236816,
"loss": 0.2647,
"step": 1490
},
{
"epoch": 0.22,
"learning_rate": 0.0002332042017625006,
"loss": 0.3354,
"step": 1500
},
{
"epoch": 0.22,
"learning_rate": 0.00023319850528263303,
"loss": 0.2053,
"step": 1510
},
{
"epoch": 0.22,
"learning_rate": 0.00023319280880276547,
"loss": 0.2,
"step": 1520
},
{
"epoch": 0.22,
"learning_rate": 0.00023318711232289788,
"loss": 0.2223,
"step": 1530
},
{
"epoch": 0.22,
"learning_rate": 0.00023318141584303031,
"loss": 0.2289,
"step": 1540
},
{
"epoch": 0.23,
"learning_rate": 0.00023317571936316275,
"loss": 0.3805,
"step": 1550
},
{
"epoch": 0.23,
"learning_rate": 0.00023317002288329519,
"loss": 0.2144,
"step": 1560
},
{
"epoch": 0.23,
"learning_rate": 0.00023316432640342762,
"loss": 0.1852,
"step": 1570
},
{
"epoch": 0.23,
"learning_rate": 0.00023315862992356006,
"loss": 0.1926,
"step": 1580
},
{
"epoch": 0.23,
"learning_rate": 0.0002331529334436925,
"loss": 0.2233,
"step": 1590
},
{
"epoch": 0.23,
"learning_rate": 0.00023314723696382493,
"loss": 0.3165,
"step": 1600
},
{
"epoch": 0.23,
"eval_cer": 0.10628673416007632,
"eval_loss": 0.16792798042297363,
"eval_runtime": 368.4708,
"eval_samples_per_second": 14.197,
"eval_steps_per_second": 0.475,
"eval_wer": 0.9545020072643854,
"step": 1600
},
{
"epoch": 0.24,
"learning_rate": 0.00023314154048395736,
"loss": 0.2055,
"step": 1610
},
{
"epoch": 0.24,
"learning_rate": 0.0002331358440040898,
"loss": 0.1796,
"step": 1620
},
{
"epoch": 0.24,
"learning_rate": 0.0002331301475242222,
"loss": 0.2126,
"step": 1630
},
{
"epoch": 0.24,
"learning_rate": 0.00023312445104435464,
"loss": 0.2269,
"step": 1640
},
{
"epoch": 0.24,
"learning_rate": 0.00023311875456448708,
"loss": 0.3827,
"step": 1650
},
{
"epoch": 0.24,
"learning_rate": 0.00023311305808461951,
"loss": 0.2356,
"step": 1660
},
{
"epoch": 0.24,
"learning_rate": 0.00023310736160475195,
"loss": 0.2162,
"step": 1670
},
{
"epoch": 0.25,
"learning_rate": 0.00023310166512488436,
"loss": 0.2021,
"step": 1680
},
{
"epoch": 0.25,
"learning_rate": 0.0002330959686450168,
"loss": 0.2629,
"step": 1690
},
{
"epoch": 0.25,
"learning_rate": 0.00023309027216514923,
"loss": 0.3539,
"step": 1700
},
{
"epoch": 0.25,
"learning_rate": 0.00023308457568528166,
"loss": 0.1938,
"step": 1710
},
{
"epoch": 0.25,
"learning_rate": 0.0002330788792054141,
"loss": 0.2117,
"step": 1720
},
{
"epoch": 0.25,
"learning_rate": 0.0002330731827255465,
"loss": 0.2037,
"step": 1730
},
{
"epoch": 0.25,
"learning_rate": 0.00023306748624567894,
"loss": 0.2314,
"step": 1740
},
{
"epoch": 0.26,
"learning_rate": 0.00023306178976581138,
"loss": 0.3471,
"step": 1750
},
{
"epoch": 0.26,
"learning_rate": 0.00023305609328594382,
"loss": 0.206,
"step": 1760
},
{
"epoch": 0.26,
"learning_rate": 0.00023305039680607625,
"loss": 0.1968,
"step": 1770
},
{
"epoch": 0.26,
"learning_rate": 0.00023304470032620866,
"loss": 0.2046,
"step": 1780
},
{
"epoch": 0.26,
"learning_rate": 0.0002330390038463411,
"loss": 0.2072,
"step": 1790
},
{
"epoch": 0.26,
"learning_rate": 0.00023303330736647353,
"loss": 0.3442,
"step": 1800
},
{
"epoch": 0.26,
"learning_rate": 0.00023302761088660597,
"loss": 0.2232,
"step": 1810
},
{
"epoch": 0.27,
"learning_rate": 0.0002330219144067384,
"loss": 0.1899,
"step": 1820
},
{
"epoch": 0.27,
"learning_rate": 0.0002330162179268708,
"loss": 0.2074,
"step": 1830
},
{
"epoch": 0.27,
"learning_rate": 0.00023301052144700325,
"loss": 0.2778,
"step": 1840
},
{
"epoch": 0.27,
"learning_rate": 0.00023300482496713568,
"loss": 0.367,
"step": 1850
},
{
"epoch": 0.27,
"learning_rate": 0.00023299912848726812,
"loss": 0.2327,
"step": 1860
},
{
"epoch": 0.27,
"learning_rate": 0.00023299343200740055,
"loss": 0.1955,
"step": 1870
},
{
"epoch": 0.27,
"learning_rate": 0.00023298773552753296,
"loss": 0.2023,
"step": 1880
},
{
"epoch": 0.28,
"learning_rate": 0.0002329820390476654,
"loss": 0.2603,
"step": 1890
},
{
"epoch": 0.28,
"learning_rate": 0.00023297634256779786,
"loss": 0.3668,
"step": 1900
},
{
"epoch": 0.28,
"learning_rate": 0.0002329706460879303,
"loss": 0.1981,
"step": 1910
},
{
"epoch": 0.28,
"learning_rate": 0.00023296494960806273,
"loss": 0.2515,
"step": 1920
},
{
"epoch": 0.28,
"learning_rate": 0.00023295925312819514,
"loss": 0.1854,
"step": 1930
},
{
"epoch": 0.28,
"learning_rate": 0.00023295355664832757,
"loss": 0.2656,
"step": 1940
},
{
"epoch": 0.28,
"learning_rate": 0.00023294786016846,
"loss": 0.3529,
"step": 1950
},
{
"epoch": 0.29,
"learning_rate": 0.00023294216368859245,
"loss": 0.2059,
"step": 1960
},
{
"epoch": 0.29,
"learning_rate": 0.00023293646720872488,
"loss": 0.1898,
"step": 1970
},
{
"epoch": 0.29,
"learning_rate": 0.0002329307707288573,
"loss": 0.2393,
"step": 1980
},
{
"epoch": 0.29,
"learning_rate": 0.00023292507424898973,
"loss": 0.2417,
"step": 1990
},
{
"epoch": 0.29,
"learning_rate": 0.00023291937776912216,
"loss": 0.3633,
"step": 2000
},
{
"epoch": 0.29,
"eval_cer": 0.09183784796918316,
"eval_loss": 0.1622667759656906,
"eval_runtime": 378.6594,
"eval_samples_per_second": 13.815,
"eval_steps_per_second": 0.462,
"eval_wer": 0.9124450391894475,
"step": 2000
},
{
"epoch": 0.29,
"learning_rate": 0.0002329136812892546,
"loss": 0.2131,
"step": 2010
},
{
"epoch": 0.29,
"learning_rate": 0.00023290798480938703,
"loss": 0.2096,
"step": 2020
},
{
"epoch": 0.3,
"learning_rate": 0.00023290228832951944,
"loss": 0.2113,
"step": 2030
},
{
"epoch": 0.3,
"learning_rate": 0.00023289659184965188,
"loss": 0.2428,
"step": 2040
},
{
"epoch": 0.3,
"learning_rate": 0.0002328908953697843,
"loss": 0.364,
"step": 2050
},
{
"epoch": 0.3,
"learning_rate": 0.00023288519888991675,
"loss": 0.1823,
"step": 2060
},
{
"epoch": 0.3,
"learning_rate": 0.00023287950241004918,
"loss": 0.1999,
"step": 2070
},
{
"epoch": 0.3,
"learning_rate": 0.0002328738059301816,
"loss": 0.1921,
"step": 2080
},
{
"epoch": 0.31,
"learning_rate": 0.00023286810945031403,
"loss": 0.2185,
"step": 2090
},
{
"epoch": 0.31,
"learning_rate": 0.00023286241297044646,
"loss": 0.3339,
"step": 2100
},
{
"epoch": 0.31,
"learning_rate": 0.0002328567164905789,
"loss": 0.1856,
"step": 2110
},
{
"epoch": 0.31,
"learning_rate": 0.00023285102001071133,
"loss": 0.1971,
"step": 2120
},
{
"epoch": 0.31,
"learning_rate": 0.00023284532353084374,
"loss": 0.1749,
"step": 2130
},
{
"epoch": 0.31,
"learning_rate": 0.00023283962705097618,
"loss": 0.202,
"step": 2140
},
{
"epoch": 0.31,
"learning_rate": 0.0002328339305711086,
"loss": 0.3775,
"step": 2150
},
{
"epoch": 0.32,
"learning_rate": 0.00023282823409124105,
"loss": 0.2029,
"step": 2160
},
{
"epoch": 0.32,
"learning_rate": 0.00023282253761137348,
"loss": 0.2078,
"step": 2170
},
{
"epoch": 0.32,
"learning_rate": 0.0002328168411315059,
"loss": 0.2169,
"step": 2180
},
{
"epoch": 0.32,
"learning_rate": 0.00023281114465163833,
"loss": 0.2519,
"step": 2190
},
{
"epoch": 0.32,
"learning_rate": 0.00023280544817177076,
"loss": 0.3249,
"step": 2200
},
{
"epoch": 0.32,
"learning_rate": 0.0002327997516919032,
"loss": 0.1929,
"step": 2210
},
{
"epoch": 0.32,
"learning_rate": 0.00023279405521203563,
"loss": 0.192,
"step": 2220
},
{
"epoch": 0.33,
"learning_rate": 0.00023278835873216807,
"loss": 0.1953,
"step": 2230
},
{
"epoch": 0.33,
"learning_rate": 0.0002327826622523005,
"loss": 0.2662,
"step": 2240
},
{
"epoch": 0.33,
"learning_rate": 0.00023277696577243294,
"loss": 0.3353,
"step": 2250
},
{
"epoch": 0.33,
"learning_rate": 0.00023277126929256538,
"loss": 0.2348,
"step": 2260
},
{
"epoch": 0.33,
"learning_rate": 0.0002327655728126978,
"loss": 0.207,
"step": 2270
},
{
"epoch": 0.33,
"learning_rate": 0.00023275987633283022,
"loss": 0.221,
"step": 2280
},
{
"epoch": 0.33,
"learning_rate": 0.00023275417985296266,
"loss": 0.2328,
"step": 2290
},
{
"epoch": 0.34,
"learning_rate": 0.0002327484833730951,
"loss": 0.3737,
"step": 2300
},
{
"epoch": 0.34,
"learning_rate": 0.00023274278689322753,
"loss": 0.2214,
"step": 2310
},
{
"epoch": 0.34,
"learning_rate": 0.00023273709041335996,
"loss": 0.2035,
"step": 2320
},
{
"epoch": 0.34,
"learning_rate": 0.00023273139393349237,
"loss": 0.2373,
"step": 2330
},
{
"epoch": 0.34,
"learning_rate": 0.0002327256974536248,
"loss": 0.2607,
"step": 2340
},
{
"epoch": 0.34,
"learning_rate": 0.00023272000097375724,
"loss": 0.3317,
"step": 2350
},
{
"epoch": 0.34,
"learning_rate": 0.00023271430449388968,
"loss": 0.1983,
"step": 2360
},
{
"epoch": 0.35,
"learning_rate": 0.00023270860801402211,
"loss": 0.2118,
"step": 2370
},
{
"epoch": 0.35,
"learning_rate": 0.00023270291153415452,
"loss": 0.2143,
"step": 2380
},
{
"epoch": 0.35,
"learning_rate": 0.00023269721505428696,
"loss": 0.2277,
"step": 2390
},
{
"epoch": 0.35,
"learning_rate": 0.0002326915185744194,
"loss": 0.3574,
"step": 2400
},
{
"epoch": 0.35,
"eval_cer": 0.0956312051182347,
"eval_loss": 0.15721334517002106,
"eval_runtime": 363.9845,
"eval_samples_per_second": 14.371,
"eval_steps_per_second": 0.481,
"eval_wer": 0.9361498757407761,
"step": 2400
}
],
"max_steps": 410880,
"num_train_epochs": 60,
"total_flos": 2.442475321551867e+19,
"trial_name": null,
"trial_params": null
}