{ "best_metric": 0.294111043214798, "best_model_checkpoint": "wav2vec2-large-xlsr-mecita-coraa-portuguese-random-all-02/checkpoint-1978", "epoch": 43.0, "global_step": 3698, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.01, "learning_rate": 3e-05, "loss": 26.6237, "step": 1 }, { "epoch": 1.0, "eval_cer": 0.7321738336528805, "eval_loss": 2.7489612102508545, "eval_runtime": 8.9523, "eval_samples_per_second": 38.091, "eval_steps_per_second": 4.803, "eval_wer": 0.9341623994147769, "step": 86 }, { "epoch": 1.16, "learning_rate": 2.966511627906977e-05, "loss": 5.3366, "step": 100 }, { "epoch": 2.0, "eval_cer": 0.4202045101798594, "eval_loss": 1.6393556594848633, "eval_runtime": 8.8583, "eval_samples_per_second": 38.495, "eval_steps_per_second": 4.854, "eval_wer": 0.7008046817849305, "step": 172 }, { "epoch": 2.33, "learning_rate": 2.9316279069767443e-05, "loss": 3.393, "step": 200 }, { "epoch": 3.0, "eval_cer": 0.2307586962476034, "eval_loss": 1.015175700187683, "eval_runtime": 8.7977, "eval_samples_per_second": 38.76, "eval_steps_per_second": 4.888, "eval_wer": 0.49280663252865153, "step": 258 }, { "epoch": 3.49, "learning_rate": 2.8967441860465116e-05, "loss": 2.1045, "step": 300 }, { "epoch": 4.0, "eval_cer": 0.15105450561490003, "eval_loss": 0.6938430070877075, "eval_runtime": 8.4884, "eval_samples_per_second": 40.173, "eval_steps_per_second": 5.066, "eval_wer": 0.3511338697878566, "step": 344 }, { "epoch": 4.65, "learning_rate": 2.861860465116279e-05, "loss": 1.8687, "step": 400 }, { "epoch": 5.0, "eval_cer": 0.11325664201588606, "eval_loss": 0.5804391503334045, "eval_runtime": 8.8411, "eval_samples_per_second": 38.57, "eval_steps_per_second": 4.864, "eval_wer": 0.29748841745915633, "step": 430 }, { "epoch": 5.81, "learning_rate": 2.8269767441860464e-05, "loss": 1.0808, "step": 500 }, { "epoch": 6.0, "eval_cer": 0.09864877202592896, "eval_loss": 0.4938930869102478, "eval_runtime": 8.7485, "eval_samples_per_second": 38.978, "eval_steps_per_second": 4.915, "eval_wer": 0.2553035844915874, "step": 516 }, { "epoch": 6.98, "learning_rate": 2.7920930232558138e-05, "loss": 0.9453, "step": 600 }, { "epoch": 7.0, "eval_cer": 0.08577558659727928, "eval_loss": 0.45988404750823975, "eval_runtime": 8.5437, "eval_samples_per_second": 39.912, "eval_steps_per_second": 5.033, "eval_wer": 0.23165081687393319, "step": 602 }, { "epoch": 8.0, "eval_cer": 0.07390669223043915, "eval_loss": 0.4172210097312927, "eval_runtime": 8.6637, "eval_samples_per_second": 39.359, "eval_steps_per_second": 4.963, "eval_wer": 0.2138502804194099, "step": 688 }, { "epoch": 8.14, "learning_rate": 2.7572093023255812e-05, "loss": 0.7718, "step": 700 }, { "epoch": 9.0, "eval_cer": 0.062174746644754864, "eval_loss": 0.37932026386260986, "eval_runtime": 8.5731, "eval_samples_per_second": 39.775, "eval_steps_per_second": 5.016, "eval_wer": 0.18068763716166789, "step": 774 }, { "epoch": 9.3, "learning_rate": 2.722325581395349e-05, "loss": 0.72, "step": 800 }, { "epoch": 10.0, "eval_cer": 0.06358988405003195, "eval_loss": 0.4070007801055908, "eval_runtime": 8.5357, "eval_samples_per_second": 39.95, "eval_steps_per_second": 5.038, "eval_wer": 0.18141916605705927, "step": 860 }, { "epoch": 10.47, "learning_rate": 2.6874418604651163e-05, "loss": 0.4718, "step": 900 }, { "epoch": 11.0, "eval_cer": 0.056970692960832646, "eval_loss": 0.4255421757698059, "eval_runtime": 9.3648, "eval_samples_per_second": 36.413, "eval_steps_per_second": 4.592, "eval_wer": 0.16435015849792733, "step": 946 }, { "epoch": 11.63, "learning_rate": 2.6525581395348837e-05, "loss": 0.5514, "step": 1000 }, { "epoch": 12.0, "eval_cer": 0.0510818953711312, "eval_loss": 0.3528519868850708, "eval_runtime": 8.4978, "eval_samples_per_second": 40.128, "eval_steps_per_second": 5.06, "eval_wer": 0.15264569617166546, "step": 1032 }, { "epoch": 12.79, "learning_rate": 2.617674418604651e-05, "loss": 0.3473, "step": 1100 }, { "epoch": 13.0, "eval_cer": 0.05048845065278919, "eval_loss": 0.34577953815460205, "eval_runtime": 8.4874, "eval_samples_per_second": 40.177, "eval_steps_per_second": 5.066, "eval_wer": 0.1528895391367959, "step": 1118 }, { "epoch": 13.95, "learning_rate": 2.5827906976744185e-05, "loss": 0.4885, "step": 1200 }, { "epoch": 14.0, "eval_cer": 0.049575458778416875, "eval_loss": 0.3216852843761444, "eval_runtime": 8.6413, "eval_samples_per_second": 39.462, "eval_steps_per_second": 4.976, "eval_wer": 0.14435503535722993, "step": 1204 }, { "epoch": 15.0, "eval_cer": 0.04802337259198393, "eval_loss": 0.31070542335510254, "eval_runtime": 8.5878, "eval_samples_per_second": 39.708, "eval_steps_per_second": 5.007, "eval_wer": 0.14484272128749084, "step": 1290 }, { "epoch": 15.12, "learning_rate": 2.5479069767441862e-05, "loss": 0.3774, "step": 1300 }, { "epoch": 16.0, "eval_cer": 0.0487994156852004, "eval_loss": 0.4008086621761322, "eval_runtime": 8.7031, "eval_samples_per_second": 39.181, "eval_steps_per_second": 4.941, "eval_wer": 0.14606193611314314, "step": 1376 }, { "epoch": 16.28, "learning_rate": 2.5130232558139536e-05, "loss": 0.3974, "step": 1400 }, { "epoch": 17.0, "eval_cer": 0.05012325390304026, "eval_loss": 0.38569143414497375, "eval_runtime": 8.6577, "eval_samples_per_second": 39.387, "eval_steps_per_second": 4.967, "eval_wer": 0.15191416727627408, "step": 1462 }, { "epoch": 17.44, "learning_rate": 2.478139534883721e-05, "loss": 0.3398, "step": 1500 }, { "epoch": 18.0, "eval_cer": 0.04222587418971971, "eval_loss": 0.3497083783149719, "eval_runtime": 8.7914, "eval_samples_per_second": 38.788, "eval_steps_per_second": 4.891, "eval_wer": 0.13094367227505485, "step": 1548 }, { "epoch": 18.6, "learning_rate": 2.4432558139534884e-05, "loss": 0.2741, "step": 1600 }, { "epoch": 19.0, "eval_cer": 0.042636720533187254, "eval_loss": 0.31500518321990967, "eval_runtime": 8.7036, "eval_samples_per_second": 39.179, "eval_steps_per_second": 4.94, "eval_wer": 0.13118751524018532, "step": 1634 }, { "epoch": 19.77, "learning_rate": 2.4083720930232558e-05, "loss": 0.2805, "step": 1700 }, { "epoch": 20.0, "eval_cer": 0.040491189628412305, "eval_loss": 0.3533484637737274, "eval_runtime": 8.6203, "eval_samples_per_second": 39.558, "eval_steps_per_second": 4.988, "eval_wer": 0.12362838332114119, "step": 1720 }, { "epoch": 20.93, "learning_rate": 2.373488372093023e-05, "loss": 0.3292, "step": 1800 }, { "epoch": 21.0, "eval_cer": 0.04240847256459417, "eval_loss": 0.32265007495880127, "eval_runtime": 8.657, "eval_samples_per_second": 39.39, "eval_steps_per_second": 4.967, "eval_wer": 0.12777371372835894, "step": 1806 }, { "epoch": 22.0, "eval_cer": 0.04158677987765909, "eval_loss": 0.2969246506690979, "eval_runtime": 8.6619, "eval_samples_per_second": 39.368, "eval_steps_per_second": 4.964, "eval_wer": 0.12948061448427212, "step": 1892 }, { "epoch": 22.09, "learning_rate": 2.338604651162791e-05, "loss": 0.2255, "step": 1900 }, { "epoch": 23.0, "eval_cer": 0.03848260750479321, "eval_loss": 0.294111043214798, "eval_runtime": 8.643, "eval_samples_per_second": 39.454, "eval_steps_per_second": 4.975, "eval_wer": 0.11923920994879297, "step": 1978 }, { "epoch": 23.26, "learning_rate": 2.3037209302325583e-05, "loss": 0.2107, "step": 2000 }, { "epoch": 24.0, "eval_cer": 0.04213457500228248, "eval_loss": 0.3290224075317383, "eval_runtime": 8.3985, "eval_samples_per_second": 40.603, "eval_steps_per_second": 5.12, "eval_wer": 0.12606681297244574, "step": 2064 }, { "epoch": 24.42, "learning_rate": 2.2688372093023257e-05, "loss": 0.1922, "step": 2100 }, { "epoch": 25.0, "eval_cer": 0.039943394503788913, "eval_loss": 0.34917840361595154, "eval_runtime": 8.2683, "eval_samples_per_second": 41.242, "eval_steps_per_second": 5.201, "eval_wer": 0.12216532553035844, "step": 2150 }, { "epoch": 25.58, "learning_rate": 2.233953488372093e-05, "loss": 0.1829, "step": 2200 }, { "epoch": 26.0, "eval_cer": 0.03825435953620013, "eval_loss": 0.3639993667602539, "eval_runtime": 8.5021, "eval_samples_per_second": 40.108, "eval_steps_per_second": 5.058, "eval_wer": 0.11728846622774933, "step": 2236 }, { "epoch": 26.74, "learning_rate": 2.1990697674418605e-05, "loss": 0.1911, "step": 2300 }, { "epoch": 27.0, "eval_cer": 0.039578197754039986, "eval_loss": 0.3595152497291565, "eval_runtime": 8.5431, "eval_samples_per_second": 39.915, "eval_steps_per_second": 5.033, "eval_wer": 0.1224091684954889, "step": 2322 }, { "epoch": 27.91, "learning_rate": 2.1641860465116282e-05, "loss": 0.1712, "step": 2400 }, { "epoch": 28.0, "eval_cer": 0.03898475303569798, "eval_loss": 0.352108359336853, "eval_runtime": 8.4845, "eval_samples_per_second": 40.191, "eval_steps_per_second": 5.068, "eval_wer": 0.12192148256522799, "step": 2408 }, { "epoch": 29.0, "eval_cer": 0.037432666849265044, "eval_loss": 0.3313020169734955, "eval_runtime": 8.6842, "eval_samples_per_second": 39.267, "eval_steps_per_second": 4.952, "eval_wer": 0.11363082175079249, "step": 2494 }, { "epoch": 29.07, "learning_rate": 2.1293023255813956e-05, "loss": 0.1708, "step": 2500 }, { "epoch": 30.0, "eval_cer": 0.03811741075504428, "eval_loss": 0.3219456076622009, "eval_runtime": 8.383, "eval_samples_per_second": 40.677, "eval_steps_per_second": 5.129, "eval_wer": 0.12070226773957571, "step": 2580 }, { "epoch": 30.23, "learning_rate": 2.094418604651163e-05, "loss": 0.1389, "step": 2600 }, { "epoch": 31.0, "eval_cer": 0.03610882863142518, "eval_loss": 0.3261343240737915, "eval_runtime": 8.5295, "eval_samples_per_second": 39.979, "eval_steps_per_second": 5.041, "eval_wer": 0.11143623506461839, "step": 2666 }, { "epoch": 31.4, "learning_rate": 2.0595348837209304e-05, "loss": 0.1516, "step": 2700 }, { "epoch": 32.0, "eval_cer": 0.035926230256550715, "eval_loss": 0.3445923328399658, "eval_runtime": 8.7722, "eval_samples_per_second": 38.873, "eval_steps_per_second": 4.902, "eval_wer": 0.11021702023896611, "step": 2752 }, { "epoch": 32.56, "learning_rate": 2.025e-05, "loss": 0.2601, "step": 2800 }, { "epoch": 33.0, "eval_cer": 0.03670227334976719, "eval_loss": 0.35051313042640686, "eval_runtime": 8.461, "eval_samples_per_second": 40.303, "eval_steps_per_second": 5.082, "eval_wer": 0.11509387954157523, "step": 2838 }, { "epoch": 33.72, "learning_rate": 1.9901162790697675e-05, "loss": 0.1392, "step": 2900 }, { "epoch": 34.0, "eval_cer": 0.03670227334976719, "eval_loss": 0.3281579315662384, "eval_runtime": 8.5326, "eval_samples_per_second": 39.964, "eval_steps_per_second": 5.039, "eval_wer": 0.11314313582053158, "step": 2924 }, { "epoch": 34.88, "learning_rate": 1.955232558139535e-05, "loss": 0.1286, "step": 3000 }, { "epoch": 35.0, "eval_cer": 0.035926230256550715, "eval_loss": 0.3351230025291443, "eval_runtime": 9.1156, "eval_samples_per_second": 37.408, "eval_steps_per_second": 4.717, "eval_wer": 0.11289929285540112, "step": 3010 }, { "epoch": 36.0, "eval_cer": 0.03565233269423902, "eval_loss": 0.348171591758728, "eval_runtime": 8.8289, "eval_samples_per_second": 38.623, "eval_steps_per_second": 4.87, "eval_wer": 0.1119239209948793, "step": 3096 }, { "epoch": 36.05, "learning_rate": 1.9203488372093023e-05, "loss": 0.1497, "step": 3100 }, { "epoch": 37.0, "eval_cer": 0.03734136766182781, "eval_loss": 0.37620189785957336, "eval_runtime": 8.8804, "eval_samples_per_second": 38.399, "eval_steps_per_second": 4.842, "eval_wer": 0.11558156547183614, "step": 3182 }, { "epoch": 37.21, "learning_rate": 1.8854651162790697e-05, "loss": 0.1319, "step": 3200 }, { "epoch": 38.0, "eval_cer": 0.03725006847439058, "eval_loss": 0.3732824921607971, "eval_runtime": 8.3326, "eval_samples_per_second": 40.924, "eval_steps_per_second": 5.16, "eval_wer": 0.11485003657644477, "step": 3268 }, { "epoch": 38.37, "learning_rate": 1.8505813953488374e-05, "loss": 0.1294, "step": 3300 }, { "epoch": 39.0, "eval_cer": 0.037158769286953344, "eval_loss": 0.3463388681411743, "eval_runtime": 8.7462, "eval_samples_per_second": 38.988, "eval_steps_per_second": 4.916, "eval_wer": 0.11777615215801024, "step": 3354 }, { "epoch": 39.53, "learning_rate": 1.8156976744186048e-05, "loss": 0.1459, "step": 3400 }, { "epoch": 40.0, "eval_cer": 0.03784351319273258, "eval_loss": 0.34395572543144226, "eval_runtime": 8.9131, "eval_samples_per_second": 38.258, "eval_steps_per_second": 4.824, "eval_wer": 0.11460619361131431, "step": 3440 }, { "epoch": 40.7, "learning_rate": 1.780813953488372e-05, "loss": 0.0998, "step": 3500 }, { "epoch": 41.0, "eval_cer": 0.03656532456861134, "eval_loss": 0.34668025374412537, "eval_runtime": 8.643, "eval_samples_per_second": 39.454, "eval_steps_per_second": 4.975, "eval_wer": 0.11314313582053158, "step": 3526 }, { "epoch": 41.86, "learning_rate": 1.7459302325581396e-05, "loss": 0.1036, "step": 3600 }, { "epoch": 42.0, "eval_cer": 0.036200127818862414, "eval_loss": 0.32251447439193726, "eval_runtime": 8.672, "eval_samples_per_second": 39.322, "eval_steps_per_second": 4.959, "eval_wer": 0.11265544989027067, "step": 3612 }, { "epoch": 43.0, "eval_cer": 0.03505888797589701, "eval_loss": 0.3630313277244568, "eval_runtime": 8.7676, "eval_samples_per_second": 38.893, "eval_steps_per_second": 4.904, "eval_wer": 0.11046086320409657, "step": 3698 }, { "epoch": 43.0, "step": 3698, "total_flos": 9.439881750406878e+19, "train_loss": 0.6348635904075908, "train_runtime": 13996.2801, "train_samples_per_second": 19.598, "train_steps_per_second": 0.614 } ], "max_steps": 8600, "num_train_epochs": 100, "total_flos": 9.439881750406878e+19, "trial_name": null, "trial_params": null }