{ "best_metric": 0.7667275846579111, "best_model_checkpoint": "xlnet-base-cased/checkpoint-4501", "epoch": 10.0, "eval_steps": 500, "global_step": 6430, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.78, "learning_rate": 4.871695178849145e-05, "loss": 1.2613, "step": 500 }, { "epoch": 1.0, "eval_accuracy": 0.7676219984508134, "eval_f1_macro": 0.4818756771742453, "eval_f1_micro": 0.7676219984508135, "eval_f1_weighted": 0.7524385212708887, "eval_loss": 0.775787353515625, "eval_macro_fpr": 0.022019799606126652, "eval_macro_sensitivity": 0.5128622254580788, "eval_macro_specificity": 0.9823717840367622, "eval_precision": 0.7672637518290021, "eval_precision_macro": 0.5269420024270713, "eval_recall": 0.7676219984508134, "eval_recall_macro": 0.5128622254580788, "eval_runtime": 65.0712, "eval_samples_per_second": 19.84, "eval_steps_per_second": 2.49, "eval_weighted_fpr": 0.021165514321998025, "eval_weighted_sensitivity": 0.7676219984508134, "eval_weighted_specificity": 0.9679547621006213, "step": 643 }, { "epoch": 1.56, "learning_rate": 4.7420943494038366e-05, "loss": 0.7364, "step": 1000 }, { "epoch": 2.0, "eval_accuracy": 0.8071262587141751, "eval_f1_macro": 0.701878478303997, "eval_f1_micro": 0.8071262587141751, "eval_f1_weighted": 0.8012788916547595, "eval_loss": 0.6754755973815918, "eval_macro_fpr": 0.01739858713969909, "eval_macro_sensitivity": 0.6971761972643127, "eval_macro_specificity": 0.9854830758512745, "eval_precision": 0.8087721671110009, "eval_precision_macro": 0.7425135911700289, "eval_recall": 0.8071262587141751, "eval_recall_macro": 0.6971761972643127, "eval_runtime": 86.774, "eval_samples_per_second": 14.878, "eval_steps_per_second": 1.867, "eval_weighted_fpr": 0.016782368403316036, "eval_weighted_sensitivity": 0.8071262587141751, "eval_weighted_specificity": 0.9751198790549438, "step": 1286 }, { "epoch": 2.33, "learning_rate": 4.612493519958528e-05, "loss": 0.6021, "step": 1500 }, { "epoch": 3.0, "eval_accuracy": 0.8063516653756778, "eval_f1_macro": 0.722931923188587, "eval_f1_micro": 0.8063516653756778, "eval_f1_weighted": 0.8013697737227732, "eval_loss": 0.8442708253860474, "eval_macro_fpr": 0.01757802934678216, "eval_macro_sensitivity": 0.7262014539622089, "eval_macro_specificity": 0.9852110484486459, "eval_precision": 0.8016312862866737, "eval_precision_macro": 0.7269969408457856, "eval_recall": 0.8063516653756778, "eval_recall_macro": 0.7262014539622089, "eval_runtime": 89.8454, "eval_samples_per_second": 14.369, "eval_steps_per_second": 1.803, "eval_weighted_fpr": 0.01686454398273071, "eval_weighted_sensitivity": 0.8063516653756778, "eval_weighted_specificity": 0.9718140613540133, "step": 1929 }, { "epoch": 3.11, "learning_rate": 4.4828926905132196e-05, "loss": 0.5435, "step": 2000 }, { "epoch": 3.89, "learning_rate": 4.353551062726802e-05, "loss": 0.4361, "step": 2500 }, { "epoch": 4.0, "eval_accuracy": 0.8001549186676995, "eval_f1_macro": 0.7051095861561788, "eval_f1_micro": 0.8001549186676995, "eval_f1_weighted": 0.7970808578587494, "eval_loss": 0.8849796056747437, "eval_macro_fpr": 0.017973543700983616, "eval_macro_sensitivity": 0.704754303632947, "eval_macro_specificity": 0.984883284344937, "eval_precision": 0.8001040615771999, "eval_precision_macro": 0.716655759638538, "eval_recall": 0.8001549186676995, "eval_recall_macro": 0.704754303632947, "eval_runtime": 88.029, "eval_samples_per_second": 14.666, "eval_steps_per_second": 1.84, "eval_weighted_fpr": 0.017527173913043478, "eval_weighted_sensitivity": 0.8001549186676995, "eval_weighted_specificity": 0.9730943465063553, "step": 2572 }, { "epoch": 4.67, "learning_rate": 4.223950233281493e-05, "loss": 0.3359, "step": 3000 }, { "epoch": 5.0, "eval_accuracy": 0.801704105344694, "eval_f1_macro": 0.6458763793901992, "eval_f1_micro": 0.801704105344694, "eval_f1_weighted": 0.7961730342415405, "eval_loss": 1.126444935798645, "eval_macro_fpr": 0.01805997413754306, "eval_macro_sensitivity": 0.6681366041180199, "eval_macro_specificity": 0.9849908327913178, "eval_precision": 0.7981459541145973, "eval_precision_macro": 0.6531140613829887, "eval_recall": 0.801704105344694, "eval_recall_macro": 0.6681366041180199, "eval_runtime": 90.8127, "eval_samples_per_second": 14.216, "eval_steps_per_second": 1.784, "eval_weighted_fpr": 0.0173606401736064, "eval_weighted_sensitivity": 0.801704105344694, "eval_weighted_specificity": 0.973158386525071, "step": 3215 }, { "epoch": 5.44, "learning_rate": 4.0943494038361847e-05, "loss": 0.2827, "step": 3500 }, { "epoch": 6.0, "eval_accuracy": 0.7993803253292022, "eval_f1_macro": 0.7042383323872946, "eval_f1_micro": 0.7993803253292022, "eval_f1_weighted": 0.7951558065494785, "eval_loss": 1.1471006870269775, "eval_macro_fpr": 0.01833120632003448, "eval_macro_sensitivity": 0.692160115457962, "eval_macro_specificity": 0.9845339432297603, "eval_precision": 0.8091520232110664, "eval_precision_macro": 0.7389074945114087, "eval_recall": 0.7993803253292022, "eval_recall_macro": 0.692160115457962, "eval_runtime": 89.506, "eval_samples_per_second": 14.424, "eval_steps_per_second": 1.81, "eval_weighted_fpr": 0.017610661589719183, "eval_weighted_sensitivity": 0.7993803253292022, "eval_weighted_specificity": 0.9686288231172028, "step": 3858 }, { "epoch": 6.22, "learning_rate": 3.964748574390876e-05, "loss": 0.2626, "step": 4000 }, { "epoch": 7.0, "learning_rate": 3.835147744945568e-05, "loss": 0.1945, "step": 4500 }, { "epoch": 7.0, "eval_accuracy": 0.814872192099148, "eval_f1_macro": 0.7667275846579111, "eval_f1_micro": 0.814872192099148, "eval_f1_weighted": 0.812156980007075, "eval_loss": 1.1841164827346802, "eval_macro_fpr": 0.016569799909363286, "eval_macro_sensitivity": 0.7598143558862378, "eval_macro_specificity": 0.9859673331635007, "eval_precision": 0.8128843369221012, "eval_precision_macro": 0.7850186311075981, "eval_recall": 0.814872192099148, "eval_recall_macro": 0.7598143558862378, "eval_runtime": 89.1729, "eval_samples_per_second": 14.477, "eval_steps_per_second": 1.817, "eval_weighted_fpr": 0.015968463954032203, "eval_weighted_sensitivity": 0.814872192099148, "eval_weighted_specificity": 0.974637805353365, "step": 4501 }, { "epoch": 7.78, "learning_rate": 3.705546915500259e-05, "loss": 0.1286, "step": 5000 }, { "epoch": 8.0, "eval_accuracy": 0.8079008520526724, "eval_f1_macro": 0.728267610383121, "eval_f1_micro": 0.8079008520526724, "eval_f1_weighted": 0.8067061599230408, "eval_loss": 1.3231384754180908, "eval_macro_fpr": 0.01714064720569306, "eval_macro_sensitivity": 0.7216321376051643, "eval_macro_specificity": 0.9855732952526467, "eval_precision": 0.8105008603379217, "eval_precision_macro": 0.763038482726323, "eval_recall": 0.8079008520526724, "eval_recall_macro": 0.7216321376051643, "eval_runtime": 93.4716, "eval_samples_per_second": 13.812, "eval_steps_per_second": 1.733, "eval_weighted_fpr": 0.0167003367003367, "eval_weighted_sensitivity": 0.8079008520526724, "eval_weighted_specificity": 0.9756985767370285, "step": 5144 }, { "epoch": 8.55, "learning_rate": 3.576205287713841e-05, "loss": 0.1304, "step": 5500 }, { "epoch": 9.0, "eval_accuracy": 0.8102246320681642, "eval_f1_macro": 0.7569552546114842, "eval_f1_micro": 0.8102246320681642, "eval_f1_weighted": 0.808840893500485, "eval_loss": 1.3869109153747559, "eval_macro_fpr": 0.017055465242864547, "eval_macro_sensitivity": 0.7602881393177737, "eval_macro_specificity": 0.9856184320870693, "eval_precision": 0.811846243162855, "eval_precision_macro": 0.7704913288832418, "eval_recall": 0.8102246320681642, "eval_recall_macro": 0.7602881393177737, "eval_runtime": 88.7368, "eval_samples_per_second": 14.549, "eval_steps_per_second": 1.826, "eval_weighted_fpr": 0.016455101081335213, "eval_weighted_sensitivity": 0.8102246320681642, "eval_weighted_specificity": 0.9740518492378762, "step": 5787 }, { "epoch": 9.33, "learning_rate": 3.4466044582685334e-05, "loss": 0.0875, "step": 6000 }, { "epoch": 10.0, "eval_accuracy": 0.7823392718822618, "eval_f1_macro": 0.7192346851166359, "eval_f1_micro": 0.7823392718822618, "eval_f1_weighted": 0.7816836829450283, "eval_loss": 1.690091609954834, "eval_macro_fpr": 0.01985842187936775, "eval_macro_sensitivity": 0.7020361329217759, "eval_macro_specificity": 0.9833585449617043, "eval_precision": 0.7931868181724199, "eval_precision_macro": 0.7600588253545632, "eval_recall": 0.7823392718822618, "eval_recall_macro": 0.7020361329217759, "eval_runtime": 88.4203, "eval_samples_per_second": 14.601, "eval_steps_per_second": 1.832, "eval_weighted_fpr": 0.019485472574717427, "eval_weighted_sensitivity": 0.7823392718822618, "eval_weighted_specificity": 0.9680389025433043, "step": 6430 } ], "logging_steps": 500, "max_steps": 19290, "num_train_epochs": 30, "save_steps": 500, "total_flos": 1.463872668346368e+16, "trial_name": null, "trial_params": null }