|
{ |
|
"best_metric": 0.8632057597574839, |
|
"best_model_checkpoint": "wav2vec2-base/checkpoint-5500", |
|
"epoch": 32.0, |
|
"global_step": 6336, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 2.53, |
|
"learning_rate": 2.3659305993690853e-05, |
|
"loss": 4.3647, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.53, |
|
"eval_accuracy": 0.011746873815839333, |
|
"eval_f1": 0.0031732207431106035, |
|
"eval_loss": 4.820202350616455, |
|
"eval_precision": 0.013376466669245454, |
|
"eval_runtime": 109.2278, |
|
"eval_samples_per_second": 24.161, |
|
"eval_steps_per_second": 0.806, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 5.05, |
|
"learning_rate": 2.8074359873728517e-05, |
|
"loss": 2.6202, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.05, |
|
"eval_accuracy": 0.06252368321333839, |
|
"eval_f1": 0.035540285078168796, |
|
"eval_loss": 4.223803520202637, |
|
"eval_precision": 0.07806791077535753, |
|
"eval_runtime": 106.4124, |
|
"eval_samples_per_second": 24.8, |
|
"eval_steps_per_second": 0.827, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 7.58, |
|
"learning_rate": 2.5443703963521573e-05, |
|
"loss": 1.38, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 7.58, |
|
"eval_accuracy": 0.2940507768093975, |
|
"eval_f1": 0.31740258677108446, |
|
"eval_loss": 3.6391522884368896, |
|
"eval_precision": 0.5210640247794917, |
|
"eval_runtime": 107.4509, |
|
"eval_samples_per_second": 24.56, |
|
"eval_steps_per_second": 0.819, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 10.1, |
|
"learning_rate": 2.2813048053314627e-05, |
|
"loss": 0.8601, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 10.1, |
|
"eval_accuracy": 0.4907161803713528, |
|
"eval_f1": 0.5656528274556744, |
|
"eval_loss": 2.7952940464019775, |
|
"eval_precision": 0.7446099073666071, |
|
"eval_runtime": 108.5624, |
|
"eval_samples_per_second": 24.309, |
|
"eval_steps_per_second": 0.811, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 12.63, |
|
"learning_rate": 2.0182392143107683e-05, |
|
"loss": 0.5645, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 12.63, |
|
"eval_accuracy": 0.6862447896930656, |
|
"eval_f1": 0.7421301241460049, |
|
"eval_loss": 1.9828652143478394, |
|
"eval_precision": 0.836316121433408, |
|
"eval_runtime": 101.2702, |
|
"eval_samples_per_second": 26.059, |
|
"eval_steps_per_second": 0.869, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 15.15, |
|
"learning_rate": 1.7551736232900737e-05, |
|
"loss": 0.4009, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 15.15, |
|
"eval_accuracy": 0.7635467980295566, |
|
"eval_f1": 0.8174024577222706, |
|
"eval_loss": 1.453549861907959, |
|
"eval_precision": 0.9000157931943787, |
|
"eval_runtime": 107.7592, |
|
"eval_samples_per_second": 24.49, |
|
"eval_steps_per_second": 0.817, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 17.68, |
|
"learning_rate": 1.4921080322693792e-05, |
|
"loss": 0.3054, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 17.68, |
|
"eval_accuracy": 0.7881773399014779, |
|
"eval_f1": 0.8297806830083403, |
|
"eval_loss": 1.1425673961639404, |
|
"eval_precision": 0.905752007054303, |
|
"eval_runtime": 106.3252, |
|
"eval_samples_per_second": 24.82, |
|
"eval_steps_per_second": 0.828, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 20.2, |
|
"learning_rate": 1.2290424412486847e-05, |
|
"loss": 0.2448, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 20.2, |
|
"eval_accuracy": 0.8188707843880257, |
|
"eval_f1": 0.8593023386044745, |
|
"eval_loss": 0.9859854578971863, |
|
"eval_precision": 0.9206175798530246, |
|
"eval_runtime": 107.5476, |
|
"eval_samples_per_second": 24.538, |
|
"eval_steps_per_second": 0.818, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 22.73, |
|
"learning_rate": 9.659768502279902e-06, |
|
"loss": 0.2116, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 22.73, |
|
"eval_accuracy": 0.8325123152709359, |
|
"eval_f1": 0.8711410752519451, |
|
"eval_loss": 0.8820037841796875, |
|
"eval_precision": 0.9261488248866633, |
|
"eval_runtime": 107.1712, |
|
"eval_samples_per_second": 24.624, |
|
"eval_steps_per_second": 0.821, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 25.25, |
|
"learning_rate": 7.029112592072957e-06, |
|
"loss": 0.1863, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 25.25, |
|
"eval_accuracy": 0.8465327775672603, |
|
"eval_f1": 0.8848136570821419, |
|
"eval_loss": 0.8190948367118835, |
|
"eval_precision": 0.9366165612791744, |
|
"eval_runtime": 101.4217, |
|
"eval_samples_per_second": 26.02, |
|
"eval_steps_per_second": 0.868, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 27.78, |
|
"learning_rate": 4.398456681866012e-06, |
|
"loss": 0.1701, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 27.78, |
|
"eval_accuracy": 0.8632057597574839, |
|
"eval_f1": 0.8953598709937869, |
|
"eval_loss": 0.7504324913024902, |
|
"eval_precision": 0.9379743242290526, |
|
"eval_runtime": 106.5347, |
|
"eval_samples_per_second": 24.771, |
|
"eval_steps_per_second": 0.826, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 30.3, |
|
"learning_rate": 1.767800771659067e-06, |
|
"loss": 0.1558, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 30.3, |
|
"eval_accuracy": 0.8609321712769988, |
|
"eval_f1": 0.8955970854963186, |
|
"eval_loss": 0.7665356993675232, |
|
"eval_precision": 0.9398430168070748, |
|
"eval_runtime": 106.7434, |
|
"eval_samples_per_second": 24.723, |
|
"eval_steps_per_second": 0.824, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"step": 6336, |
|
"total_flos": 3.804433776973221e+19, |
|
"train_loss": 0.9127645113251426, |
|
"train_runtime": 39385.6266, |
|
"train_samples_per_second": 19.295, |
|
"train_steps_per_second": 0.161 |
|
} |
|
], |
|
"max_steps": 6336, |
|
"num_train_epochs": 32, |
|
"total_flos": 3.804433776973221e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|