File size: 3,414 Bytes
8c8e5fc |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 |
{
"best_metric": 0.722931923188587,
"best_model_checkpoint": "xlnet-base-cased/checkpoint-1929",
"epoch": 3.0,
"eval_steps": 500,
"global_step": 1929,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.78,
"learning_rate": 4.871695178849145e-05,
"loss": 1.2613,
"step": 500
},
{
"epoch": 1.0,
"eval_accuracy": 0.7676219984508134,
"eval_f1_macro": 0.4818756771742453,
"eval_f1_micro": 0.7676219984508135,
"eval_f1_weighted": 0.7524385212708887,
"eval_loss": 0.775787353515625,
"eval_macro_fpr": 0.022019799606126652,
"eval_macro_sensitivity": 0.5128622254580788,
"eval_macro_specificity": 0.9823717840367622,
"eval_precision": 0.7672637518290021,
"eval_precision_macro": 0.5269420024270713,
"eval_recall": 0.7676219984508134,
"eval_recall_macro": 0.5128622254580788,
"eval_runtime": 65.0712,
"eval_samples_per_second": 19.84,
"eval_steps_per_second": 2.49,
"eval_weighted_fpr": 0.021165514321998025,
"eval_weighted_sensitivity": 0.7676219984508134,
"eval_weighted_specificity": 0.9679547621006213,
"step": 643
},
{
"epoch": 1.56,
"learning_rate": 4.7420943494038366e-05,
"loss": 0.7364,
"step": 1000
},
{
"epoch": 2.0,
"eval_accuracy": 0.8071262587141751,
"eval_f1_macro": 0.701878478303997,
"eval_f1_micro": 0.8071262587141751,
"eval_f1_weighted": 0.8012788916547595,
"eval_loss": 0.6754755973815918,
"eval_macro_fpr": 0.01739858713969909,
"eval_macro_sensitivity": 0.6971761972643127,
"eval_macro_specificity": 0.9854830758512745,
"eval_precision": 0.8087721671110009,
"eval_precision_macro": 0.7425135911700289,
"eval_recall": 0.8071262587141751,
"eval_recall_macro": 0.6971761972643127,
"eval_runtime": 86.774,
"eval_samples_per_second": 14.878,
"eval_steps_per_second": 1.867,
"eval_weighted_fpr": 0.016782368403316036,
"eval_weighted_sensitivity": 0.8071262587141751,
"eval_weighted_specificity": 0.9751198790549438,
"step": 1286
},
{
"epoch": 2.33,
"learning_rate": 4.612493519958528e-05,
"loss": 0.6021,
"step": 1500
},
{
"epoch": 3.0,
"eval_accuracy": 0.8063516653756778,
"eval_f1_macro": 0.722931923188587,
"eval_f1_micro": 0.8063516653756778,
"eval_f1_weighted": 0.8013697737227732,
"eval_loss": 0.8442708253860474,
"eval_macro_fpr": 0.01757802934678216,
"eval_macro_sensitivity": 0.7262014539622089,
"eval_macro_specificity": 0.9852110484486459,
"eval_precision": 0.8016312862866737,
"eval_precision_macro": 0.7269969408457856,
"eval_recall": 0.8063516653756778,
"eval_recall_macro": 0.7262014539622089,
"eval_runtime": 89.8454,
"eval_samples_per_second": 14.369,
"eval_steps_per_second": 1.803,
"eval_weighted_fpr": 0.01686454398273071,
"eval_weighted_sensitivity": 0.8063516653756778,
"eval_weighted_specificity": 0.9718140613540133,
"step": 1929
}
],
"logging_steps": 500,
"max_steps": 19290,
"num_train_epochs": 30,
"save_steps": 500,
"total_flos": 4391618005039104.0,
"trial_name": null,
"trial_params": null
}
|