|
{ |
|
"best_metric": 0.7667275846579111, |
|
"best_model_checkpoint": "xlnet-base-cased/checkpoint-4501", |
|
"epoch": 11.0, |
|
"eval_steps": 500, |
|
"global_step": 7073, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.78, |
|
"learning_rate": 4.871695178849145e-05, |
|
"loss": 1.2613, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7676219984508134, |
|
"eval_f1_macro": 0.4818756771742453, |
|
"eval_f1_micro": 0.7676219984508135, |
|
"eval_f1_weighted": 0.7524385212708887, |
|
"eval_loss": 0.775787353515625, |
|
"eval_macro_fpr": 0.022019799606126652, |
|
"eval_macro_sensitivity": 0.5128622254580788, |
|
"eval_macro_specificity": 0.9823717840367622, |
|
"eval_precision": 0.7672637518290021, |
|
"eval_precision_macro": 0.5269420024270713, |
|
"eval_recall": 0.7676219984508134, |
|
"eval_recall_macro": 0.5128622254580788, |
|
"eval_runtime": 65.0712, |
|
"eval_samples_per_second": 19.84, |
|
"eval_steps_per_second": 2.49, |
|
"eval_weighted_fpr": 0.021165514321998025, |
|
"eval_weighted_sensitivity": 0.7676219984508134, |
|
"eval_weighted_specificity": 0.9679547621006213, |
|
"step": 643 |
|
}, |
|
{ |
|
"epoch": 1.56, |
|
"learning_rate": 4.7420943494038366e-05, |
|
"loss": 0.7364, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8071262587141751, |
|
"eval_f1_macro": 0.701878478303997, |
|
"eval_f1_micro": 0.8071262587141751, |
|
"eval_f1_weighted": 0.8012788916547595, |
|
"eval_loss": 0.6754755973815918, |
|
"eval_macro_fpr": 0.01739858713969909, |
|
"eval_macro_sensitivity": 0.6971761972643127, |
|
"eval_macro_specificity": 0.9854830758512745, |
|
"eval_precision": 0.8087721671110009, |
|
"eval_precision_macro": 0.7425135911700289, |
|
"eval_recall": 0.8071262587141751, |
|
"eval_recall_macro": 0.6971761972643127, |
|
"eval_runtime": 86.774, |
|
"eval_samples_per_second": 14.878, |
|
"eval_steps_per_second": 1.867, |
|
"eval_weighted_fpr": 0.016782368403316036, |
|
"eval_weighted_sensitivity": 0.8071262587141751, |
|
"eval_weighted_specificity": 0.9751198790549438, |
|
"step": 1286 |
|
}, |
|
{ |
|
"epoch": 2.33, |
|
"learning_rate": 4.612493519958528e-05, |
|
"loss": 0.6021, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.8063516653756778, |
|
"eval_f1_macro": 0.722931923188587, |
|
"eval_f1_micro": 0.8063516653756778, |
|
"eval_f1_weighted": 0.8013697737227732, |
|
"eval_loss": 0.8442708253860474, |
|
"eval_macro_fpr": 0.01757802934678216, |
|
"eval_macro_sensitivity": 0.7262014539622089, |
|
"eval_macro_specificity": 0.9852110484486459, |
|
"eval_precision": 0.8016312862866737, |
|
"eval_precision_macro": 0.7269969408457856, |
|
"eval_recall": 0.8063516653756778, |
|
"eval_recall_macro": 0.7262014539622089, |
|
"eval_runtime": 89.8454, |
|
"eval_samples_per_second": 14.369, |
|
"eval_steps_per_second": 1.803, |
|
"eval_weighted_fpr": 0.01686454398273071, |
|
"eval_weighted_sensitivity": 0.8063516653756778, |
|
"eval_weighted_specificity": 0.9718140613540133, |
|
"step": 1929 |
|
}, |
|
{ |
|
"epoch": 3.11, |
|
"learning_rate": 4.4828926905132196e-05, |
|
"loss": 0.5435, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 3.89, |
|
"learning_rate": 4.353551062726802e-05, |
|
"loss": 0.4361, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8001549186676995, |
|
"eval_f1_macro": 0.7051095861561788, |
|
"eval_f1_micro": 0.8001549186676995, |
|
"eval_f1_weighted": 0.7970808578587494, |
|
"eval_loss": 0.8849796056747437, |
|
"eval_macro_fpr": 0.017973543700983616, |
|
"eval_macro_sensitivity": 0.704754303632947, |
|
"eval_macro_specificity": 0.984883284344937, |
|
"eval_precision": 0.8001040615771999, |
|
"eval_precision_macro": 0.716655759638538, |
|
"eval_recall": 0.8001549186676995, |
|
"eval_recall_macro": 0.704754303632947, |
|
"eval_runtime": 88.029, |
|
"eval_samples_per_second": 14.666, |
|
"eval_steps_per_second": 1.84, |
|
"eval_weighted_fpr": 0.017527173913043478, |
|
"eval_weighted_sensitivity": 0.8001549186676995, |
|
"eval_weighted_specificity": 0.9730943465063553, |
|
"step": 2572 |
|
}, |
|
{ |
|
"epoch": 4.67, |
|
"learning_rate": 4.223950233281493e-05, |
|
"loss": 0.3359, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.801704105344694, |
|
"eval_f1_macro": 0.6458763793901992, |
|
"eval_f1_micro": 0.801704105344694, |
|
"eval_f1_weighted": 0.7961730342415405, |
|
"eval_loss": 1.126444935798645, |
|
"eval_macro_fpr": 0.01805997413754306, |
|
"eval_macro_sensitivity": 0.6681366041180199, |
|
"eval_macro_specificity": 0.9849908327913178, |
|
"eval_precision": 0.7981459541145973, |
|
"eval_precision_macro": 0.6531140613829887, |
|
"eval_recall": 0.801704105344694, |
|
"eval_recall_macro": 0.6681366041180199, |
|
"eval_runtime": 90.8127, |
|
"eval_samples_per_second": 14.216, |
|
"eval_steps_per_second": 1.784, |
|
"eval_weighted_fpr": 0.0173606401736064, |
|
"eval_weighted_sensitivity": 0.801704105344694, |
|
"eval_weighted_specificity": 0.973158386525071, |
|
"step": 3215 |
|
}, |
|
{ |
|
"epoch": 5.44, |
|
"learning_rate": 4.0943494038361847e-05, |
|
"loss": 0.2827, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.7993803253292022, |
|
"eval_f1_macro": 0.7042383323872946, |
|
"eval_f1_micro": 0.7993803253292022, |
|
"eval_f1_weighted": 0.7951558065494785, |
|
"eval_loss": 1.1471006870269775, |
|
"eval_macro_fpr": 0.01833120632003448, |
|
"eval_macro_sensitivity": 0.692160115457962, |
|
"eval_macro_specificity": 0.9845339432297603, |
|
"eval_precision": 0.8091520232110664, |
|
"eval_precision_macro": 0.7389074945114087, |
|
"eval_recall": 0.7993803253292022, |
|
"eval_recall_macro": 0.692160115457962, |
|
"eval_runtime": 89.506, |
|
"eval_samples_per_second": 14.424, |
|
"eval_steps_per_second": 1.81, |
|
"eval_weighted_fpr": 0.017610661589719183, |
|
"eval_weighted_sensitivity": 0.7993803253292022, |
|
"eval_weighted_specificity": 0.9686288231172028, |
|
"step": 3858 |
|
}, |
|
{ |
|
"epoch": 6.22, |
|
"learning_rate": 3.964748574390876e-05, |
|
"loss": 0.2626, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3.835147744945568e-05, |
|
"loss": 0.1945, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.814872192099148, |
|
"eval_f1_macro": 0.7667275846579111, |
|
"eval_f1_micro": 0.814872192099148, |
|
"eval_f1_weighted": 0.812156980007075, |
|
"eval_loss": 1.1841164827346802, |
|
"eval_macro_fpr": 0.016569799909363286, |
|
"eval_macro_sensitivity": 0.7598143558862378, |
|
"eval_macro_specificity": 0.9859673331635007, |
|
"eval_precision": 0.8128843369221012, |
|
"eval_precision_macro": 0.7850186311075981, |
|
"eval_recall": 0.814872192099148, |
|
"eval_recall_macro": 0.7598143558862378, |
|
"eval_runtime": 89.1729, |
|
"eval_samples_per_second": 14.477, |
|
"eval_steps_per_second": 1.817, |
|
"eval_weighted_fpr": 0.015968463954032203, |
|
"eval_weighted_sensitivity": 0.814872192099148, |
|
"eval_weighted_specificity": 0.974637805353365, |
|
"step": 4501 |
|
}, |
|
{ |
|
"epoch": 7.78, |
|
"learning_rate": 3.705546915500259e-05, |
|
"loss": 0.1286, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8079008520526724, |
|
"eval_f1_macro": 0.728267610383121, |
|
"eval_f1_micro": 0.8079008520526724, |
|
"eval_f1_weighted": 0.8067061599230408, |
|
"eval_loss": 1.3231384754180908, |
|
"eval_macro_fpr": 0.01714064720569306, |
|
"eval_macro_sensitivity": 0.7216321376051643, |
|
"eval_macro_specificity": 0.9855732952526467, |
|
"eval_precision": 0.8105008603379217, |
|
"eval_precision_macro": 0.763038482726323, |
|
"eval_recall": 0.8079008520526724, |
|
"eval_recall_macro": 0.7216321376051643, |
|
"eval_runtime": 93.4716, |
|
"eval_samples_per_second": 13.812, |
|
"eval_steps_per_second": 1.733, |
|
"eval_weighted_fpr": 0.0167003367003367, |
|
"eval_weighted_sensitivity": 0.8079008520526724, |
|
"eval_weighted_specificity": 0.9756985767370285, |
|
"step": 5144 |
|
}, |
|
{ |
|
"epoch": 8.55, |
|
"learning_rate": 3.576205287713841e-05, |
|
"loss": 0.1304, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8102246320681642, |
|
"eval_f1_macro": 0.7569552546114842, |
|
"eval_f1_micro": 0.8102246320681642, |
|
"eval_f1_weighted": 0.808840893500485, |
|
"eval_loss": 1.3869109153747559, |
|
"eval_macro_fpr": 0.017055465242864547, |
|
"eval_macro_sensitivity": 0.7602881393177737, |
|
"eval_macro_specificity": 0.9856184320870693, |
|
"eval_precision": 0.811846243162855, |
|
"eval_precision_macro": 0.7704913288832418, |
|
"eval_recall": 0.8102246320681642, |
|
"eval_recall_macro": 0.7602881393177737, |
|
"eval_runtime": 88.7368, |
|
"eval_samples_per_second": 14.549, |
|
"eval_steps_per_second": 1.826, |
|
"eval_weighted_fpr": 0.016455101081335213, |
|
"eval_weighted_sensitivity": 0.8102246320681642, |
|
"eval_weighted_specificity": 0.9740518492378762, |
|
"step": 5787 |
|
}, |
|
{ |
|
"epoch": 9.33, |
|
"learning_rate": 3.4466044582685334e-05, |
|
"loss": 0.0875, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.7823392718822618, |
|
"eval_f1_macro": 0.7192346851166359, |
|
"eval_f1_micro": 0.7823392718822618, |
|
"eval_f1_weighted": 0.7816836829450283, |
|
"eval_loss": 1.690091609954834, |
|
"eval_macro_fpr": 0.01985842187936775, |
|
"eval_macro_sensitivity": 0.7020361329217759, |
|
"eval_macro_specificity": 0.9833585449617043, |
|
"eval_precision": 0.7931868181724199, |
|
"eval_precision_macro": 0.7600588253545632, |
|
"eval_recall": 0.7823392718822618, |
|
"eval_recall_macro": 0.7020361329217759, |
|
"eval_runtime": 88.4203, |
|
"eval_samples_per_second": 14.601, |
|
"eval_steps_per_second": 1.832, |
|
"eval_weighted_fpr": 0.019485472574717427, |
|
"eval_weighted_sensitivity": 0.7823392718822618, |
|
"eval_weighted_specificity": 0.9680389025433043, |
|
"step": 6430 |
|
}, |
|
{ |
|
"epoch": 10.11, |
|
"learning_rate": 3.317003628823225e-05, |
|
"loss": 0.1088, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 10.89, |
|
"learning_rate": 3.187402799377916e-05, |
|
"loss": 0.1075, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.7978311386522076, |
|
"eval_f1_macro": 0.7470393699186935, |
|
"eval_f1_micro": 0.7978311386522076, |
|
"eval_f1_weighted": 0.793529238632398, |
|
"eval_loss": 1.6517162322998047, |
|
"eval_macro_fpr": 0.01832601410957563, |
|
"eval_macro_sensitivity": 0.7566567183934103, |
|
"eval_macro_specificity": 0.9849074579220182, |
|
"eval_precision": 0.8021421826960871, |
|
"eval_precision_macro": 0.7513026067404466, |
|
"eval_recall": 0.7978311386522076, |
|
"eval_recall_macro": 0.7566567183934103, |
|
"eval_runtime": 91.1007, |
|
"eval_samples_per_second": 14.171, |
|
"eval_steps_per_second": 1.778, |
|
"eval_weighted_fpr": 0.017778080512226686, |
|
"eval_weighted_sensitivity": 0.7978311386522076, |
|
"eval_weighted_specificity": 0.9757807301780667, |
|
"step": 7073 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 19290, |
|
"num_train_epochs": 30, |
|
"save_steps": 500, |
|
"total_flos": 1.6102599351810048e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|