|
{ |
|
"best_metric": 0.9442970822281167, |
|
"best_model_checkpoint": "wav2vec2-large/checkpoint-11500", |
|
"epoch": 31.998484082870135, |
|
"global_step": 15808, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 9.487666034155598e-06, |
|
"loss": 4.6314, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_accuracy": 0.02046229632436529, |
|
"eval_f1": 0.004873418863566646, |
|
"eval_loss": 4.916522026062012, |
|
"eval_precision": 0.0027763277100147127, |
|
"eval_runtime": 123.5513, |
|
"eval_samples_per_second": 21.36, |
|
"eval_steps_per_second": 1.781, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"learning_rate": 1.8975332068311197e-05, |
|
"loss": 3.7739, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"eval_accuracy": 0.03561955286093217, |
|
"eval_f1": 0.02524670069279936, |
|
"eval_loss": 4.449059009552002, |
|
"eval_precision": 0.0750288473053048, |
|
"eval_runtime": 121.7021, |
|
"eval_samples_per_second": 21.684, |
|
"eval_steps_per_second": 1.808, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"learning_rate": 2.846299810246679e-05, |
|
"loss": 2.5035, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"eval_accuracy": 0.11292156119742326, |
|
"eval_f1": 0.11144842685774854, |
|
"eval_loss": 4.142854690551758, |
|
"eval_precision": 0.2671650922898445, |
|
"eval_runtime": 120.9962, |
|
"eval_samples_per_second": 21.811, |
|
"eval_steps_per_second": 1.818, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.05, |
|
"learning_rate": 2.9116468686300697e-05, |
|
"loss": 1.5633, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 4.05, |
|
"eval_accuracy": 0.36756347101174686, |
|
"eval_f1": 0.3830364851222239, |
|
"eval_loss": 3.1973092555999756, |
|
"eval_precision": 0.6598356853987439, |
|
"eval_runtime": 122.0663, |
|
"eval_samples_per_second": 21.619, |
|
"eval_steps_per_second": 1.802, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.06, |
|
"learning_rate": 2.8062135376396992e-05, |
|
"loss": 1.0538, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 5.06, |
|
"eval_accuracy": 0.5888594164456233, |
|
"eval_f1": 0.6556643570555963, |
|
"eval_loss": 2.5479371547698975, |
|
"eval_precision": 0.8416636658887603, |
|
"eval_runtime": 121.3195, |
|
"eval_samples_per_second": 21.752, |
|
"eval_steps_per_second": 1.813, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.07, |
|
"learning_rate": 2.700780206649329e-05, |
|
"loss": 0.7422, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 6.07, |
|
"eval_accuracy": 0.7824933687002652, |
|
"eval_f1": 0.8194352733059617, |
|
"eval_loss": 1.4494293928146362, |
|
"eval_precision": 0.8920845853165854, |
|
"eval_runtime": 120.4455, |
|
"eval_samples_per_second": 21.91, |
|
"eval_steps_per_second": 1.827, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.08, |
|
"learning_rate": 2.5953468756589585e-05, |
|
"loss": 0.5762, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 7.08, |
|
"eval_accuracy": 0.7726411519514967, |
|
"eval_f1": 0.8267111468977018, |
|
"eval_loss": 1.316819190979004, |
|
"eval_precision": 0.9277444722087854, |
|
"eval_runtime": 122.3892, |
|
"eval_samples_per_second": 21.562, |
|
"eval_steps_per_second": 1.798, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.1, |
|
"learning_rate": 2.489913544668588e-05, |
|
"loss": 0.46, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 8.1, |
|
"eval_accuracy": 0.8563849943160288, |
|
"eval_f1": 0.898213371629901, |
|
"eval_loss": 0.8782555460929871, |
|
"eval_precision": 0.9531998814815654, |
|
"eval_runtime": 120.9059, |
|
"eval_samples_per_second": 21.827, |
|
"eval_steps_per_second": 1.82, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"learning_rate": 2.3844802136782175e-05, |
|
"loss": 0.4007, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 9.11, |
|
"eval_accuracy": 0.8738158393330807, |
|
"eval_f1": 0.913683470937564, |
|
"eval_loss": 0.752358615398407, |
|
"eval_precision": 0.9636991964706034, |
|
"eval_runtime": 120.9904, |
|
"eval_samples_per_second": 21.812, |
|
"eval_steps_per_second": 1.818, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 10.12, |
|
"learning_rate": 2.279046882687847e-05, |
|
"loss": 0.3374, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 10.12, |
|
"eval_accuracy": 0.8851837817355058, |
|
"eval_f1": 0.9220598204792498, |
|
"eval_loss": 0.6385864615440369, |
|
"eval_precision": 0.9677694535212527, |
|
"eval_runtime": 120.467, |
|
"eval_samples_per_second": 21.906, |
|
"eval_steps_per_second": 1.826, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 11.13, |
|
"learning_rate": 2.1736135516974768e-05, |
|
"loss": 0.3108, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 11.13, |
|
"eval_accuracy": 0.9105721864342554, |
|
"eval_f1": 0.9372909559856852, |
|
"eval_loss": 0.5049420595169067, |
|
"eval_precision": 0.9680582892579286, |
|
"eval_runtime": 121.8653, |
|
"eval_samples_per_second": 21.655, |
|
"eval_steps_per_second": 1.805, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 12.15, |
|
"learning_rate": 2.0681802207071063e-05, |
|
"loss": 0.2735, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 12.15, |
|
"eval_accuracy": 0.8904888215233043, |
|
"eval_f1": 0.9225848099506897, |
|
"eval_loss": 0.6096966862678528, |
|
"eval_precision": 0.9623634379449385, |
|
"eval_runtime": 121.4949, |
|
"eval_samples_per_second": 21.721, |
|
"eval_steps_per_second": 1.811, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"learning_rate": 1.9627468897167357e-05, |
|
"loss": 0.2716, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"eval_accuracy": 0.8999621068586586, |
|
"eval_f1": 0.9206365230401724, |
|
"eval_loss": 0.4542546570301056, |
|
"eval_precision": 0.9569343688614892, |
|
"eval_runtime": 120.692, |
|
"eval_samples_per_second": 21.866, |
|
"eval_steps_per_second": 1.823, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 14.17, |
|
"learning_rate": 1.8573135587263652e-05, |
|
"loss": 0.2484, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 14.17, |
|
"eval_accuracy": 0.9272451686244789, |
|
"eval_f1": 0.9489393378254958, |
|
"eval_loss": 0.3964819610118866, |
|
"eval_precision": 0.9742030978909282, |
|
"eval_runtime": 121.4363, |
|
"eval_samples_per_second": 21.732, |
|
"eval_steps_per_second": 1.812, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 15.18, |
|
"learning_rate": 1.751880227735995e-05, |
|
"loss": 0.228, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 15.18, |
|
"eval_accuracy": 0.8855627131489201, |
|
"eval_f1": 0.9256828810141209, |
|
"eval_loss": 0.6806507110595703, |
|
"eval_precision": 0.9777330671722411, |
|
"eval_runtime": 122.0415, |
|
"eval_samples_per_second": 21.624, |
|
"eval_steps_per_second": 1.803, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 16.19, |
|
"learning_rate": 1.6464468967456245e-05, |
|
"loss": 0.2307, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 16.19, |
|
"eval_accuracy": 0.9173929518757105, |
|
"eval_f1": 0.946436431649072, |
|
"eval_loss": 0.5219454765319824, |
|
"eval_precision": 0.9801938448683835, |
|
"eval_runtime": 120.3841, |
|
"eval_samples_per_second": 21.921, |
|
"eval_steps_per_second": 1.827, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 17.21, |
|
"learning_rate": 1.541013565755254e-05, |
|
"loss": 0.2169, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 17.21, |
|
"eval_accuracy": 0.9120879120879121, |
|
"eval_f1": 0.9337616922587397, |
|
"eval_loss": 0.4630146920681, |
|
"eval_precision": 0.9677088927055834, |
|
"eval_runtime": 121.7745, |
|
"eval_samples_per_second": 21.671, |
|
"eval_steps_per_second": 1.807, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 18.22, |
|
"learning_rate": 1.4355802347648837e-05, |
|
"loss": 0.1997, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 18.22, |
|
"eval_accuracy": 0.9128457749147404, |
|
"eval_f1": 0.9397548887949031, |
|
"eval_loss": 0.5151729583740234, |
|
"eval_precision": 0.9740319117972248, |
|
"eval_runtime": 121.0656, |
|
"eval_samples_per_second": 21.798, |
|
"eval_steps_per_second": 1.817, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 19.23, |
|
"learning_rate": 1.3301469037745133e-05, |
|
"loss": 0.1921, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 19.23, |
|
"eval_accuracy": 0.9143615005683972, |
|
"eval_f1": 0.9475938884984938, |
|
"eval_loss": 0.510482668876648, |
|
"eval_precision": 0.9867250624910348, |
|
"eval_runtime": 122.1644, |
|
"eval_samples_per_second": 21.602, |
|
"eval_steps_per_second": 1.801, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 20.24, |
|
"learning_rate": 1.2247135727841428e-05, |
|
"loss": 0.1825, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 20.24, |
|
"eval_accuracy": 0.905267146646457, |
|
"eval_f1": 0.9406773355537659, |
|
"eval_loss": 0.6302403807640076, |
|
"eval_precision": 0.9831536512710705, |
|
"eval_runtime": 121.7536, |
|
"eval_samples_per_second": 21.675, |
|
"eval_steps_per_second": 1.807, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 21.25, |
|
"learning_rate": 1.1192802417937724e-05, |
|
"loss": 0.1786, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 21.25, |
|
"eval_accuracy": 0.9272451686244789, |
|
"eval_f1": 0.952370485075943, |
|
"eval_loss": 0.460215300321579, |
|
"eval_precision": 0.9813011833529409, |
|
"eval_runtime": 124.2398, |
|
"eval_samples_per_second": 21.241, |
|
"eval_steps_per_second": 1.771, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 22.27, |
|
"learning_rate": 1.013846910803402e-05, |
|
"loss": 0.1671, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 22.27, |
|
"eval_accuracy": 0.9147404319818113, |
|
"eval_f1": 0.9444178129216141, |
|
"eval_loss": 0.544323205947876, |
|
"eval_precision": 0.9794231668433278, |
|
"eval_runtime": 120.9552, |
|
"eval_samples_per_second": 21.818, |
|
"eval_steps_per_second": 1.819, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 23.28, |
|
"learning_rate": 9.084135798130316e-06, |
|
"loss": 0.1623, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 23.28, |
|
"eval_accuracy": 0.9442970822281167, |
|
"eval_f1": 0.9604353051727885, |
|
"eval_loss": 0.3412924110889435, |
|
"eval_precision": 0.9780145058039889, |
|
"eval_runtime": 122.6656, |
|
"eval_samples_per_second": 21.514, |
|
"eval_steps_per_second": 1.793, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 24.29, |
|
"learning_rate": 8.029802488226612e-06, |
|
"loss": 0.1595, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 24.29, |
|
"eval_accuracy": 0.9287608942781357, |
|
"eval_f1": 0.9531334781334764, |
|
"eval_loss": 0.44775113463401794, |
|
"eval_precision": 0.9812894876888261, |
|
"eval_runtime": 120.6582, |
|
"eval_samples_per_second": 21.872, |
|
"eval_steps_per_second": 1.823, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 25.3, |
|
"learning_rate": 6.975469178322908e-06, |
|
"loss": 0.151, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 25.3, |
|
"eval_accuracy": 0.9359605911330049, |
|
"eval_f1": 0.9571224982425287, |
|
"eval_loss": 0.41782599687576294, |
|
"eval_precision": 0.9818213438674759, |
|
"eval_runtime": 121.5443, |
|
"eval_samples_per_second": 21.712, |
|
"eval_steps_per_second": 1.81, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 26.32, |
|
"learning_rate": 5.9211358684192026e-06, |
|
"loss": 0.1472, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 26.32, |
|
"eval_accuracy": 0.9355816597195907, |
|
"eval_f1": 0.9577691906088884, |
|
"eval_loss": 0.41541919112205505, |
|
"eval_precision": 0.9832631333451843, |
|
"eval_runtime": 122.2041, |
|
"eval_samples_per_second": 21.595, |
|
"eval_steps_per_second": 1.8, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 27.33, |
|
"learning_rate": 4.866802558515498e-06, |
|
"loss": 0.1473, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 27.33, |
|
"eval_accuracy": 0.931792345585449, |
|
"eval_f1": 0.9560631584126075, |
|
"eval_loss": 0.4548525810241699, |
|
"eval_precision": 0.9837464944410116, |
|
"eval_runtime": 121.1061, |
|
"eval_samples_per_second": 21.791, |
|
"eval_steps_per_second": 1.817, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 28.34, |
|
"learning_rate": 3.8124692486117947e-06, |
|
"loss": 0.131, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 28.34, |
|
"eval_accuracy": 0.9424024251610459, |
|
"eval_f1": 0.9620998995027674, |
|
"eval_loss": 0.3574429154396057, |
|
"eval_precision": 0.984478231442749, |
|
"eval_runtime": 120.0382, |
|
"eval_samples_per_second": 21.985, |
|
"eval_steps_per_second": 1.833, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 29.35, |
|
"learning_rate": 2.7581359387080904e-06, |
|
"loss": 0.134, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 29.35, |
|
"eval_accuracy": 0.9333080712391058, |
|
"eval_f1": 0.9568214460159893, |
|
"eval_loss": 0.4474771022796631, |
|
"eval_precision": 0.9840495545740223, |
|
"eval_runtime": 123.1013, |
|
"eval_samples_per_second": 21.438, |
|
"eval_steps_per_second": 1.787, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 30.36, |
|
"learning_rate": 1.7038026288043862e-06, |
|
"loss": 0.1282, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 30.36, |
|
"eval_accuracy": 0.93823417961349, |
|
"eval_f1": 0.959091295015073, |
|
"eval_loss": 0.401244193315506, |
|
"eval_precision": 0.9836786405574566, |
|
"eval_runtime": 121.7667, |
|
"eval_samples_per_second": 21.673, |
|
"eval_steps_per_second": 1.807, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 31.38, |
|
"learning_rate": 6.494693189006819e-07, |
|
"loss": 0.1307, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 31.38, |
|
"eval_accuracy": 0.94278135657446, |
|
"eval_f1": 0.9623515495402261, |
|
"eval_loss": 0.35516688227653503, |
|
"eval_precision": 0.9847235247308098, |
|
"eval_runtime": 121.4163, |
|
"eval_samples_per_second": 21.735, |
|
"eval_steps_per_second": 1.812, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"step": 15808, |
|
"total_flos": 1.2696466131100762e+20, |
|
"train_loss": 0.6361874522950485, |
|
"train_runtime": 48273.5986, |
|
"train_samples_per_second": 15.742, |
|
"train_steps_per_second": 0.327 |
|
} |
|
], |
|
"max_steps": 15808, |
|
"num_train_epochs": 32, |
|
"total_flos": 1.2696466131100762e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|