|
{ |
|
"best_metric": 0.06379657983779907, |
|
"best_model_checkpoint": "/home/cloudwalker/ASVmodel/wavlm-base_4/checkpoint-200", |
|
"epoch": 9.98109640831758, |
|
"eval_steps": 100, |
|
"global_step": 3960, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.25, |
|
"learning_rate": 7.575757575757576e-05, |
|
"loss": 0.3784, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_f1": 0.9905683736634776, |
|
"eval_loss": 0.07838701456785202, |
|
"eval_runtime": 494.4493, |
|
"eval_samples_per_second": 50.246, |
|
"eval_steps_per_second": 25.123, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 0.00015151515151515152, |
|
"loss": 0.1125, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_f1": 0.9925361354770335, |
|
"eval_loss": 0.06379657983779907, |
|
"eval_runtime": 495.4697, |
|
"eval_samples_per_second": 50.142, |
|
"eval_steps_per_second": 25.071, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"learning_rate": 0.00022727272727272725, |
|
"loss": 0.1158, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_f1": 0.9773465624725612, |
|
"eval_loss": 0.1715879738330841, |
|
"eval_runtime": 495.6685, |
|
"eval_samples_per_second": 50.122, |
|
"eval_steps_per_second": 25.061, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 0.00029966329966329963, |
|
"loss": 0.327, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3308480978012085, |
|
"eval_runtime": 495.7404, |
|
"eval_samples_per_second": 50.115, |
|
"eval_steps_per_second": 25.057, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"learning_rate": 0.00029124579124579125, |
|
"loss": 0.3346, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.26, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.34493646025657654, |
|
"eval_runtime": 495.7377, |
|
"eval_samples_per_second": 50.115, |
|
"eval_steps_per_second": 25.058, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"learning_rate": 0.0002828282828282828, |
|
"loss": 0.3345, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3316415250301361, |
|
"eval_runtime": 495.8008, |
|
"eval_samples_per_second": 50.109, |
|
"eval_steps_per_second": 25.054, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 0.0002744107744107744, |
|
"loss": 0.3313, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3320470452308655, |
|
"eval_runtime": 495.8537, |
|
"eval_samples_per_second": 50.103, |
|
"eval_steps_per_second": 25.052, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"learning_rate": 0.00026599326599326595, |
|
"loss": 0.3249, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33273717761039734, |
|
"eval_runtime": 496.067, |
|
"eval_samples_per_second": 50.082, |
|
"eval_steps_per_second": 25.041, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"learning_rate": 0.00025757575757575756, |
|
"loss": 0.3403, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.27, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3314824402332306, |
|
"eval_runtime": 496.0647, |
|
"eval_samples_per_second": 50.082, |
|
"eval_steps_per_second": 25.041, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"learning_rate": 0.00024915824915824913, |
|
"loss": 0.3345, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3381609320640564, |
|
"eval_runtime": 496.3675, |
|
"eval_samples_per_second": 50.052, |
|
"eval_steps_per_second": 25.026, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"learning_rate": 0.00024074074074074072, |
|
"loss": 0.3174, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 2.77, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33755871653556824, |
|
"eval_runtime": 496.1396, |
|
"eval_samples_per_second": 50.075, |
|
"eval_steps_per_second": 25.037, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"learning_rate": 0.0002323232323232323, |
|
"loss": 0.3274, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3353538513183594, |
|
"eval_runtime": 496.3912, |
|
"eval_samples_per_second": 50.049, |
|
"eval_steps_per_second": 25.025, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"learning_rate": 0.0002239057239057239, |
|
"loss": 0.3296, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.28, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33069172501564026, |
|
"eval_runtime": 496.1466, |
|
"eval_samples_per_second": 50.074, |
|
"eval_steps_per_second": 25.037, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"learning_rate": 0.00021548821548821544, |
|
"loss": 0.3175, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.53, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3341147303581238, |
|
"eval_runtime": 496.5334, |
|
"eval_samples_per_second": 50.035, |
|
"eval_steps_per_second": 25.017, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"learning_rate": 0.00020707070707070703, |
|
"loss": 0.3416, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.78, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3344402611255646, |
|
"eval_runtime": 496.2158, |
|
"eval_samples_per_second": 50.067, |
|
"eval_steps_per_second": 25.033, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"learning_rate": 0.00019865319865319862, |
|
"loss": 0.3412, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.03, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3307790160179138, |
|
"eval_runtime": 496.5097, |
|
"eval_samples_per_second": 50.037, |
|
"eval_steps_per_second": 25.019, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"learning_rate": 0.00019023569023569022, |
|
"loss": 0.3293, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.28, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3313847482204437, |
|
"eval_runtime": 496.395, |
|
"eval_samples_per_second": 50.049, |
|
"eval_steps_per_second": 25.024, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"learning_rate": 0.0001818181818181818, |
|
"loss": 0.3346, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33080053329467773, |
|
"eval_runtime": 496.4252, |
|
"eval_samples_per_second": 50.046, |
|
"eval_steps_per_second": 25.023, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"learning_rate": 0.0001734006734006734, |
|
"loss": 0.3279, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3317018449306488, |
|
"eval_runtime": 496.5163, |
|
"eval_samples_per_second": 50.037, |
|
"eval_steps_per_second": 25.018, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 5.04, |
|
"learning_rate": 0.000164983164983165, |
|
"loss": 0.3246, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.04, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33184757828712463, |
|
"eval_runtime": 496.5592, |
|
"eval_samples_per_second": 50.032, |
|
"eval_steps_per_second": 25.016, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.29, |
|
"learning_rate": 0.00015656565656565653, |
|
"loss": 0.3373, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.29, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33109256625175476, |
|
"eval_runtime": 496.5149, |
|
"eval_samples_per_second": 50.037, |
|
"eval_steps_per_second": 25.018, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"learning_rate": 0.00014814814814814812, |
|
"loss": 0.3262, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.55, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33351102471351624, |
|
"eval_runtime": 496.6308, |
|
"eval_samples_per_second": 50.025, |
|
"eval_steps_per_second": 25.013, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"learning_rate": 0.0001397306397306397, |
|
"loss": 0.3279, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3326103985309601, |
|
"eval_runtime": 496.8717, |
|
"eval_samples_per_second": 50.001, |
|
"eval_steps_per_second": 25.0, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"learning_rate": 0.0001313131313131313, |
|
"loss": 0.3298, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 6.05, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3322770297527313, |
|
"eval_runtime": 496.7239, |
|
"eval_samples_per_second": 50.016, |
|
"eval_steps_per_second": 25.008, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 6.3, |
|
"learning_rate": 0.0001228956228956229, |
|
"loss": 0.3397, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.3, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3311246633529663, |
|
"eval_runtime": 496.772, |
|
"eval_samples_per_second": 50.011, |
|
"eval_steps_per_second": 25.005, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"learning_rate": 0.00011447811447811446, |
|
"loss": 0.3312, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33860132098197937, |
|
"eval_runtime": 496.8085, |
|
"eval_samples_per_second": 50.007, |
|
"eval_steps_per_second": 25.004, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"learning_rate": 0.00010606060606060605, |
|
"loss": 0.3291, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 6.81, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3316628634929657, |
|
"eval_runtime": 496.6873, |
|
"eval_samples_per_second": 50.019, |
|
"eval_steps_per_second": 25.01, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"learning_rate": 9.764309764309764e-05, |
|
"loss": 0.3146, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 7.06, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33230647444725037, |
|
"eval_runtime": 496.6634, |
|
"eval_samples_per_second": 50.022, |
|
"eval_steps_per_second": 25.011, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 7.31, |
|
"learning_rate": 8.92255892255892e-05, |
|
"loss": 0.3296, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.31, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3313485085964203, |
|
"eval_runtime": 496.6247, |
|
"eval_samples_per_second": 50.026, |
|
"eval_steps_per_second": 25.013, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"learning_rate": 8.08080808080808e-05, |
|
"loss": 0.3367, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.56, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33174964785575867, |
|
"eval_runtime": 496.735, |
|
"eval_samples_per_second": 50.015, |
|
"eval_steps_per_second": 25.007, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"learning_rate": 7.239057239057239e-05, |
|
"loss": 0.3232, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3318324387073517, |
|
"eval_runtime": 496.5843, |
|
"eval_samples_per_second": 50.03, |
|
"eval_steps_per_second": 25.015, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"learning_rate": 6.397306397306397e-05, |
|
"loss": 0.3314, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 8.07, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3325050175189972, |
|
"eval_runtime": 496.7125, |
|
"eval_samples_per_second": 50.017, |
|
"eval_steps_per_second": 25.008, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"learning_rate": 5.5555555555555545e-05, |
|
"loss": 0.3201, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.32, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33225715160369873, |
|
"eval_runtime": 496.6425, |
|
"eval_samples_per_second": 50.024, |
|
"eval_steps_per_second": 25.012, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"learning_rate": 4.7138047138047136e-05, |
|
"loss": 0.3301, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3346656262874603, |
|
"eval_runtime": 496.595, |
|
"eval_samples_per_second": 50.029, |
|
"eval_steps_per_second": 25.014, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 8.82, |
|
"learning_rate": 3.8720538720538714e-05, |
|
"loss": 0.3268, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 8.82, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33254188299179077, |
|
"eval_runtime": 496.5109, |
|
"eval_samples_per_second": 50.037, |
|
"eval_steps_per_second": 25.019, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"learning_rate": 3.03030303030303e-05, |
|
"loss": 0.3361, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 9.07, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.33214762806892395, |
|
"eval_runtime": 496.8406, |
|
"eval_samples_per_second": 50.004, |
|
"eval_steps_per_second": 25.002, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 2.1885521885521884e-05, |
|
"loss": 0.3395, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3312663733959198, |
|
"eval_runtime": 496.7467, |
|
"eval_samples_per_second": 50.013, |
|
"eval_steps_per_second": 25.007, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 9.58, |
|
"learning_rate": 1.3468013468013465e-05, |
|
"loss": 0.3231, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.58, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3319169878959656, |
|
"eval_runtime": 496.7702, |
|
"eval_samples_per_second": 50.011, |
|
"eval_steps_per_second": 25.006, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"learning_rate": 5.05050505050505e-06, |
|
"loss": 0.3197, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.83, |
|
"eval_f1": 0.9459482392872296, |
|
"eval_loss": 0.3325766921043396, |
|
"eval_runtime": 496.6934, |
|
"eval_samples_per_second": 50.019, |
|
"eval_steps_per_second": 25.009, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 9.98, |
|
"step": 3960, |
|
"total_flos": 1.506420070651024e+19, |
|
"train_loss": 0.32019265878080116, |
|
"train_runtime": 22716.823, |
|
"train_samples_per_second": 11.172, |
|
"train_steps_per_second": 0.174 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 3960, |
|
"num_train_epochs": 10, |
|
"save_steps": 100, |
|
"total_flos": 1.506420070651024e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|