{ "best_metric": 0.06379657983779907, "best_model_checkpoint": "/home/cloudwalker/ASVmodel/wavlm-base_4/checkpoint-200", "epoch": 9.98109640831758, "eval_steps": 100, "global_step": 3960, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.25, "learning_rate": 7.575757575757576e-05, "loss": 0.3784, "step": 100 }, { "epoch": 0.25, "eval_f1": 0.9905683736634776, "eval_loss": 0.07838701456785202, "eval_runtime": 494.4493, "eval_samples_per_second": 50.246, "eval_steps_per_second": 25.123, "step": 100 }, { "epoch": 0.5, "learning_rate": 0.00015151515151515152, "loss": 0.1125, "step": 200 }, { "epoch": 0.5, "eval_f1": 0.9925361354770335, "eval_loss": 0.06379657983779907, "eval_runtime": 495.4697, "eval_samples_per_second": 50.142, "eval_steps_per_second": 25.071, "step": 200 }, { "epoch": 0.76, "learning_rate": 0.00022727272727272725, "loss": 0.1158, "step": 300 }, { "epoch": 0.76, "eval_f1": 0.9773465624725612, "eval_loss": 0.1715879738330841, "eval_runtime": 495.6685, "eval_samples_per_second": 50.122, "eval_steps_per_second": 25.061, "step": 300 }, { "epoch": 1.01, "learning_rate": 0.00029966329966329963, "loss": 0.327, "step": 400 }, { "epoch": 1.01, "eval_f1": 0.9459482392872296, "eval_loss": 0.3308480978012085, "eval_runtime": 495.7404, "eval_samples_per_second": 50.115, "eval_steps_per_second": 25.057, "step": 400 }, { "epoch": 1.26, "learning_rate": 0.00029124579124579125, "loss": 0.3346, "step": 500 }, { "epoch": 1.26, "eval_f1": 0.9459482392872296, "eval_loss": 0.34493646025657654, "eval_runtime": 495.7377, "eval_samples_per_second": 50.115, "eval_steps_per_second": 25.058, "step": 500 }, { "epoch": 1.51, "learning_rate": 0.0002828282828282828, "loss": 0.3345, "step": 600 }, { "epoch": 1.51, "eval_f1": 0.9459482392872296, "eval_loss": 0.3316415250301361, "eval_runtime": 495.8008, "eval_samples_per_second": 50.109, "eval_steps_per_second": 25.054, "step": 600 }, { "epoch": 1.76, "learning_rate": 0.0002744107744107744, "loss": 0.3313, "step": 700 }, { "epoch": 1.76, "eval_f1": 0.9459482392872296, "eval_loss": 0.3320470452308655, "eval_runtime": 495.8537, "eval_samples_per_second": 50.103, "eval_steps_per_second": 25.052, "step": 700 }, { "epoch": 2.02, "learning_rate": 0.00026599326599326595, "loss": 0.3249, "step": 800 }, { "epoch": 2.02, "eval_f1": 0.9459482392872296, "eval_loss": 0.33273717761039734, "eval_runtime": 496.067, "eval_samples_per_second": 50.082, "eval_steps_per_second": 25.041, "step": 800 }, { "epoch": 2.27, "learning_rate": 0.00025757575757575756, "loss": 0.3403, "step": 900 }, { "epoch": 2.27, "eval_f1": 0.9459482392872296, "eval_loss": 0.3314824402332306, "eval_runtime": 496.0647, "eval_samples_per_second": 50.082, "eval_steps_per_second": 25.041, "step": 900 }, { "epoch": 2.52, "learning_rate": 0.00024915824915824913, "loss": 0.3345, "step": 1000 }, { "epoch": 2.52, "eval_f1": 0.9459482392872296, "eval_loss": 0.3381609320640564, "eval_runtime": 496.3675, "eval_samples_per_second": 50.052, "eval_steps_per_second": 25.026, "step": 1000 }, { "epoch": 2.77, "learning_rate": 0.00024074074074074072, "loss": 0.3174, "step": 1100 }, { "epoch": 2.77, "eval_f1": 0.9459482392872296, "eval_loss": 0.33755871653556824, "eval_runtime": 496.1396, "eval_samples_per_second": 50.075, "eval_steps_per_second": 25.037, "step": 1100 }, { "epoch": 3.02, "learning_rate": 0.0002323232323232323, "loss": 0.3274, "step": 1200 }, { "epoch": 3.02, "eval_f1": 0.9459482392872296, "eval_loss": 0.3353538513183594, "eval_runtime": 496.3912, "eval_samples_per_second": 50.049, "eval_steps_per_second": 25.025, "step": 1200 }, { "epoch": 3.28, "learning_rate": 0.0002239057239057239, "loss": 0.3296, "step": 1300 }, { "epoch": 3.28, "eval_f1": 0.9459482392872296, "eval_loss": 0.33069172501564026, "eval_runtime": 496.1466, "eval_samples_per_second": 50.074, "eval_steps_per_second": 25.037, "step": 1300 }, { "epoch": 3.53, "learning_rate": 0.00021548821548821544, "loss": 0.3175, "step": 1400 }, { "epoch": 3.53, "eval_f1": 0.9459482392872296, "eval_loss": 0.3341147303581238, "eval_runtime": 496.5334, "eval_samples_per_second": 50.035, "eval_steps_per_second": 25.017, "step": 1400 }, { "epoch": 3.78, "learning_rate": 0.00020707070707070703, "loss": 0.3416, "step": 1500 }, { "epoch": 3.78, "eval_f1": 0.9459482392872296, "eval_loss": 0.3344402611255646, "eval_runtime": 496.2158, "eval_samples_per_second": 50.067, "eval_steps_per_second": 25.033, "step": 1500 }, { "epoch": 4.03, "learning_rate": 0.00019865319865319862, "loss": 0.3412, "step": 1600 }, { "epoch": 4.03, "eval_f1": 0.9459482392872296, "eval_loss": 0.3307790160179138, "eval_runtime": 496.5097, "eval_samples_per_second": 50.037, "eval_steps_per_second": 25.019, "step": 1600 }, { "epoch": 4.28, "learning_rate": 0.00019023569023569022, "loss": 0.3293, "step": 1700 }, { "epoch": 4.28, "eval_f1": 0.9459482392872296, "eval_loss": 0.3313847482204437, "eval_runtime": 496.395, "eval_samples_per_second": 50.049, "eval_steps_per_second": 25.024, "step": 1700 }, { "epoch": 4.54, "learning_rate": 0.0001818181818181818, "loss": 0.3346, "step": 1800 }, { "epoch": 4.54, "eval_f1": 0.9459482392872296, "eval_loss": 0.33080053329467773, "eval_runtime": 496.4252, "eval_samples_per_second": 50.046, "eval_steps_per_second": 25.023, "step": 1800 }, { "epoch": 4.79, "learning_rate": 0.0001734006734006734, "loss": 0.3279, "step": 1900 }, { "epoch": 4.79, "eval_f1": 0.9459482392872296, "eval_loss": 0.3317018449306488, "eval_runtime": 496.5163, "eval_samples_per_second": 50.037, "eval_steps_per_second": 25.018, "step": 1900 }, { "epoch": 5.04, "learning_rate": 0.000164983164983165, "loss": 0.3246, "step": 2000 }, { "epoch": 5.04, "eval_f1": 0.9459482392872296, "eval_loss": 0.33184757828712463, "eval_runtime": 496.5592, "eval_samples_per_second": 50.032, "eval_steps_per_second": 25.016, "step": 2000 }, { "epoch": 5.29, "learning_rate": 0.00015656565656565653, "loss": 0.3373, "step": 2100 }, { "epoch": 5.29, "eval_f1": 0.9459482392872296, "eval_loss": 0.33109256625175476, "eval_runtime": 496.5149, "eval_samples_per_second": 50.037, "eval_steps_per_second": 25.018, "step": 2100 }, { "epoch": 5.55, "learning_rate": 0.00014814814814814812, "loss": 0.3262, "step": 2200 }, { "epoch": 5.55, "eval_f1": 0.9459482392872296, "eval_loss": 0.33351102471351624, "eval_runtime": 496.6308, "eval_samples_per_second": 50.025, "eval_steps_per_second": 25.013, "step": 2200 }, { "epoch": 5.8, "learning_rate": 0.0001397306397306397, "loss": 0.3279, "step": 2300 }, { "epoch": 5.8, "eval_f1": 0.9459482392872296, "eval_loss": 0.3326103985309601, "eval_runtime": 496.8717, "eval_samples_per_second": 50.001, "eval_steps_per_second": 25.0, "step": 2300 }, { "epoch": 6.05, "learning_rate": 0.0001313131313131313, "loss": 0.3298, "step": 2400 }, { "epoch": 6.05, "eval_f1": 0.9459482392872296, "eval_loss": 0.3322770297527313, "eval_runtime": 496.7239, "eval_samples_per_second": 50.016, "eval_steps_per_second": 25.008, "step": 2400 }, { "epoch": 6.3, "learning_rate": 0.0001228956228956229, "loss": 0.3397, "step": 2500 }, { "epoch": 6.3, "eval_f1": 0.9459482392872296, "eval_loss": 0.3311246633529663, "eval_runtime": 496.772, "eval_samples_per_second": 50.011, "eval_steps_per_second": 25.005, "step": 2500 }, { "epoch": 6.55, "learning_rate": 0.00011447811447811446, "loss": 0.3312, "step": 2600 }, { "epoch": 6.55, "eval_f1": 0.9459482392872296, "eval_loss": 0.33860132098197937, "eval_runtime": 496.8085, "eval_samples_per_second": 50.007, "eval_steps_per_second": 25.004, "step": 2600 }, { "epoch": 6.81, "learning_rate": 0.00010606060606060605, "loss": 0.3291, "step": 2700 }, { "epoch": 6.81, "eval_f1": 0.9459482392872296, "eval_loss": 0.3316628634929657, "eval_runtime": 496.6873, "eval_samples_per_second": 50.019, "eval_steps_per_second": 25.01, "step": 2700 }, { "epoch": 7.06, "learning_rate": 9.764309764309764e-05, "loss": 0.3146, "step": 2800 }, { "epoch": 7.06, "eval_f1": 0.9459482392872296, "eval_loss": 0.33230647444725037, "eval_runtime": 496.6634, "eval_samples_per_second": 50.022, "eval_steps_per_second": 25.011, "step": 2800 }, { "epoch": 7.31, "learning_rate": 8.92255892255892e-05, "loss": 0.3296, "step": 2900 }, { "epoch": 7.31, "eval_f1": 0.9459482392872296, "eval_loss": 0.3313485085964203, "eval_runtime": 496.6247, "eval_samples_per_second": 50.026, "eval_steps_per_second": 25.013, "step": 2900 }, { "epoch": 7.56, "learning_rate": 8.08080808080808e-05, "loss": 0.3367, "step": 3000 }, { "epoch": 7.56, "eval_f1": 0.9459482392872296, "eval_loss": 0.33174964785575867, "eval_runtime": 496.735, "eval_samples_per_second": 50.015, "eval_steps_per_second": 25.007, "step": 3000 }, { "epoch": 7.81, "learning_rate": 7.239057239057239e-05, "loss": 0.3232, "step": 3100 }, { "epoch": 7.81, "eval_f1": 0.9459482392872296, "eval_loss": 0.3318324387073517, "eval_runtime": 496.5843, "eval_samples_per_second": 50.03, "eval_steps_per_second": 25.015, "step": 3100 }, { "epoch": 8.07, "learning_rate": 6.397306397306397e-05, "loss": 0.3314, "step": 3200 }, { "epoch": 8.07, "eval_f1": 0.9459482392872296, "eval_loss": 0.3325050175189972, "eval_runtime": 496.7125, "eval_samples_per_second": 50.017, "eval_steps_per_second": 25.008, "step": 3200 }, { "epoch": 8.32, "learning_rate": 5.5555555555555545e-05, "loss": 0.3201, "step": 3300 }, { "epoch": 8.32, "eval_f1": 0.9459482392872296, "eval_loss": 0.33225715160369873, "eval_runtime": 496.6425, "eval_samples_per_second": 50.024, "eval_steps_per_second": 25.012, "step": 3300 }, { "epoch": 8.57, "learning_rate": 4.7138047138047136e-05, "loss": 0.3301, "step": 3400 }, { "epoch": 8.57, "eval_f1": 0.9459482392872296, "eval_loss": 0.3346656262874603, "eval_runtime": 496.595, "eval_samples_per_second": 50.029, "eval_steps_per_second": 25.014, "step": 3400 }, { "epoch": 8.82, "learning_rate": 3.8720538720538714e-05, "loss": 0.3268, "step": 3500 }, { "epoch": 8.82, "eval_f1": 0.9459482392872296, "eval_loss": 0.33254188299179077, "eval_runtime": 496.5109, "eval_samples_per_second": 50.037, "eval_steps_per_second": 25.019, "step": 3500 }, { "epoch": 9.07, "learning_rate": 3.03030303030303e-05, "loss": 0.3361, "step": 3600 }, { "epoch": 9.07, "eval_f1": 0.9459482392872296, "eval_loss": 0.33214762806892395, "eval_runtime": 496.8406, "eval_samples_per_second": 50.004, "eval_steps_per_second": 25.002, "step": 3600 }, { "epoch": 9.33, "learning_rate": 2.1885521885521884e-05, "loss": 0.3395, "step": 3700 }, { "epoch": 9.33, "eval_f1": 0.9459482392872296, "eval_loss": 0.3312663733959198, "eval_runtime": 496.7467, "eval_samples_per_second": 50.013, "eval_steps_per_second": 25.007, "step": 3700 }, { "epoch": 9.58, "learning_rate": 1.3468013468013465e-05, "loss": 0.3231, "step": 3800 }, { "epoch": 9.58, "eval_f1": 0.9459482392872296, "eval_loss": 0.3319169878959656, "eval_runtime": 496.7702, "eval_samples_per_second": 50.011, "eval_steps_per_second": 25.006, "step": 3800 }, { "epoch": 9.83, "learning_rate": 5.05050505050505e-06, "loss": 0.3197, "step": 3900 }, { "epoch": 9.83, "eval_f1": 0.9459482392872296, "eval_loss": 0.3325766921043396, "eval_runtime": 496.6934, "eval_samples_per_second": 50.019, "eval_steps_per_second": 25.009, "step": 3900 }, { "epoch": 9.98, "step": 3960, "total_flos": 1.506420070651024e+19, "train_loss": 0.32019265878080116, "train_runtime": 22716.823, "train_samples_per_second": 11.172, "train_steps_per_second": 0.174 } ], "logging_steps": 100, "max_steps": 3960, "num_train_epochs": 10, "save_steps": 100, "total_flos": 1.506420070651024e+19, "trial_name": null, "trial_params": null }