{ "best_metric": 0.7415140921427528, "best_model_checkpoint": "tiny-llama-lora-new/checkpoint-643", "epoch": 8.995334370139968, "eval_steps": 500, "global_step": 1446, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.8001549186676995, "eval_f1_macro": 0.6790360166213908, "eval_f1_micro": 0.8001549186676995, "eval_f1_weighted": 0.7959404181222782, "eval_loss": 0.6614832282066345, "eval_macro_fpr": 0.01824293967244035, "eval_macro_sensitivity": 0.6677834011062839, "eval_macro_specificity": 0.9848478627893485, "eval_precision": 0.8040294558027004, "eval_precision_macro": 0.7265846774862527, "eval_recall": 0.8001549186676995, "eval_recall_macro": 0.6677834011062839, "eval_runtime": 225.9328, "eval_samples_per_second": 5.714, "eval_steps_per_second": 0.717, "eval_weighted_fpr": 0.017527173913043478, "eval_weighted_sensitivity": 0.8001549186676995, "eval_weighted_specificity": 0.97256302317253, "step": 160 }, { "epoch": 2.0, "eval_accuracy": 0.8063516653756778, "eval_f1_macro": 0.723523893027765, "eval_f1_micro": 0.8063516653756778, "eval_f1_weighted": 0.8039099652383133, "eval_loss": 0.6995529532432556, "eval_macro_fpr": 0.01771710819775641, "eval_macro_sensitivity": 0.7207263437235008, "eval_macro_specificity": 0.9853387258716434, "eval_precision": 0.8110438944279544, "eval_precision_macro": 0.7448100337436813, "eval_recall": 0.8063516653756778, "eval_recall_macro": 0.7207263437235008, "eval_runtime": 230.7469, "eval_samples_per_second": 5.595, "eval_steps_per_second": 0.702, "eval_weighted_fpr": 0.01686454398273071, "eval_weighted_sensitivity": 0.8063516653756778, "eval_weighted_specificity": 0.9737292226989717, "step": 321 }, { "epoch": 3.0, "eval_accuracy": 0.8125484120836561, "eval_f1_macro": 0.7179663090811256, "eval_f1_micro": 0.8125484120836561, "eval_f1_weighted": 0.8085118934271095, "eval_loss": 0.8202366828918457, "eval_macro_fpr": 0.017097652587672894, "eval_macro_sensitivity": 0.7080107913825292, "eval_macro_specificity": 0.985578595986596, "eval_precision": 0.8118501609528374, "eval_precision_macro": 0.7576540712122397, "eval_recall": 0.8125484120836561, "eval_recall_macro": 0.7080107913825292, "eval_runtime": 231.655, "eval_samples_per_second": 5.573, "eval_steps_per_second": 0.699, "eval_weighted_fpr": 0.016211146838156484, "eval_weighted_sensitivity": 0.8125484120836561, "eval_weighted_specificity": 0.9711305277152844, "step": 482 }, { "epoch": 3.11, "learning_rate": 3.958333333333333e-05, "loss": 0.2932, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.8140975987606507, "eval_f1_macro": 0.7415140921427528, "eval_f1_micro": 0.8140975987606507, "eval_f1_weighted": 0.8153735617531811, "eval_loss": 0.9493006467819214, "eval_macro_fpr": 0.016573672675540378, "eval_macro_sensitivity": 0.7326751453453961, "eval_macro_specificity": 0.9859001747376132, "eval_precision": 0.8204052204072106, "eval_precision_macro": 0.759251934556511, "eval_recall": 0.8140975987606507, "eval_recall_macro": 0.7326751453453961, "eval_runtime": 230.2371, "eval_samples_per_second": 5.607, "eval_steps_per_second": 0.704, "eval_weighted_fpr": 0.016049217600641968, "eval_weighted_sensitivity": 0.8140975987606507, "eval_weighted_specificity": 0.974405022303545, "step": 643 }, { "epoch": 5.0, "eval_accuracy": 0.8109992254066615, "eval_f1_macro": 0.7413292975124365, "eval_f1_micro": 0.8109992254066615, "eval_f1_weighted": 0.8086569922767037, "eval_loss": 1.0610005855560303, "eval_macro_fpr": 0.017150663222076427, "eval_macro_sensitivity": 0.7427303328596474, "eval_macro_specificity": 0.9856545654845559, "eval_precision": 0.8110273755487133, "eval_precision_macro": 0.7595846993577862, "eval_recall": 0.8109992254066615, "eval_recall_macro": 0.7427303328596474, "eval_runtime": 232.3513, "eval_samples_per_second": 5.556, "eval_steps_per_second": 0.697, "eval_weighted_fpr": 0.016373641121997046, "eval_weighted_sensitivity": 0.8109992254066615, "eval_weighted_specificity": 0.9738192568616761, "step": 803 }, { "epoch": 6.0, "eval_accuracy": 0.814872192099148, "eval_f1_macro": 0.740834009056896, "eval_f1_micro": 0.814872192099148, "eval_f1_weighted": 0.812828873292886, "eval_loss": 1.1361573934555054, "eval_macro_fpr": 0.016745822161733162, "eval_macro_sensitivity": 0.7380044964762863, "eval_macro_specificity": 0.9859281636821422, "eval_precision": 0.8159522433901665, "eval_precision_macro": 0.7731408058998965, "eval_recall": 0.814872192099148, "eval_recall_macro": 0.7380044964762863, "eval_runtime": 230.3919, "eval_samples_per_second": 5.603, "eval_steps_per_second": 0.703, "eval_weighted_fpr": 0.015968463954032203, "eval_weighted_sensitivity": 0.814872192099148, "eval_weighted_specificity": 0.9740502631329879, "step": 964 }, { "epoch": 6.22, "learning_rate": 2.916666666666667e-05, "loss": 0.0107, "step": 1000 }, { "epoch": 7.0, "eval_accuracy": 0.8102246320681642, "eval_f1_macro": 0.734324336127792, "eval_f1_micro": 0.8102246320681642, "eval_f1_weighted": 0.8084846815925374, "eval_loss": 1.1712960004806519, "eval_macro_fpr": 0.017129374121876983, "eval_macro_sensitivity": 0.730990149259248, "eval_macro_specificity": 0.9855872802214631, "eval_precision": 0.812320444346659, "eval_precision_macro": 0.7734170589513789, "eval_recall": 0.8102246320681642, "eval_recall_macro": 0.730990149259248, "eval_runtime": 232.06, "eval_samples_per_second": 5.563, "eval_steps_per_second": 0.698, "eval_weighted_fpr": 0.016455101081335213, "eval_weighted_sensitivity": 0.8102246320681642, "eval_weighted_specificity": 0.973584571253782, "step": 1125 }, { "epoch": 8.0, "eval_accuracy": 0.8156467854376452, "eval_f1_macro": 0.7374069155892726, "eval_f1_micro": 0.8156467854376452, "eval_f1_weighted": 0.8127779657126307, "eval_loss": 1.1785770654678345, "eval_macro_fpr": 0.016642226736202675, "eval_macro_sensitivity": 0.7348966803697986, "eval_macro_specificity": 0.9859780376275717, "eval_precision": 0.8140580469506681, "eval_precision_macro": 0.7655811603242806, "eval_recall": 0.8156467854376452, "eval_recall_macro": 0.7348966803697986, "eval_runtime": 230.6812, "eval_samples_per_second": 5.596, "eval_steps_per_second": 0.702, "eval_weighted_fpr": 0.01588785046728972, "eval_weighted_sensitivity": 0.8156467854376452, "eval_weighted_specificity": 0.9740237789759322, "step": 1286 }, { "epoch": 9.0, "eval_accuracy": 0.8187451587916343, "eval_f1_macro": 0.7400115374685853, "eval_f1_micro": 0.8187451587916342, "eval_f1_weighted": 0.8156936902580679, "eval_loss": 1.1960150003433228, "eval_macro_fpr": 0.01632755569207043, "eval_macro_sensitivity": 0.7367529624892385, "eval_macro_specificity": 0.9862031650054388, "eval_precision": 0.8170206925865887, "eval_precision_macro": 0.769266125041975, "eval_recall": 0.8187451587916343, "eval_recall_macro": 0.7367529624892385, "eval_runtime": 231.8038, "eval_samples_per_second": 5.569, "eval_steps_per_second": 0.699, "eval_weighted_fpr": 0.015566790846194785, "eval_weighted_sensitivity": 0.8187451587916343, "eval_weighted_specificity": 0.9743023162899509, "step": 1446 } ], "logging_steps": 500, "max_steps": 2400, "num_train_epochs": 15, "save_steps": 500, "total_flos": 1.394492047318057e+17, "trial_name": null, "trial_params": null }