cite-text-analysis's picture
Upload folder using huggingface_hub
21d503a verified
raw
history blame
6.05 kB
{
"best_metric": 0.6299493260025852,
"best_model_checkpoint": "case-analysis-bert-base-uncased/checkpoint-896",
"epoch": 6.0,
"eval_steps": 500,
"global_step": 1344,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.7861915367483296,
"eval_f1_macro": 0.5606209513919795,
"eval_f1_micro": 0.7861915367483298,
"eval_f1_weighted": 0.7596863457967054,
"eval_loss": 0.7283128499984741,
"eval_macro_fpr": 0.1142150114777894,
"eval_macro_sensitivity": 0.5571958513134984,
"eval_macro_specificity": 0.8974437739369907,
"eval_precision": 0.7487100743874461,
"eval_precision_macro": 0.584767668299669,
"eval_recall": 0.7861915367483296,
"eval_recall_macro": 0.5571958513134984,
"eval_runtime": 9.7006,
"eval_samples_per_second": 46.286,
"eval_steps_per_second": 5.876,
"eval_weighted_fpr": 0.08311688311688312,
"eval_weighted_sensitivity": 0.7861915367483296,
"eval_weighted_specificity": 0.8035835589996332,
"step": 224
},
{
"epoch": 2.0,
"eval_accuracy": 0.799554565701559,
"eval_f1_macro": 0.5913567856292314,
"eval_f1_micro": 0.799554565701559,
"eval_f1_weighted": 0.7794312570974847,
"eval_loss": 0.816001296043396,
"eval_macro_fpr": 0.09972743460349152,
"eval_macro_sensitivity": 0.6065148418089594,
"eval_macro_specificity": 0.910318444398066,
"eval_precision": 0.7603126937076594,
"eval_precision_macro": 0.5769576335614072,
"eval_recall": 0.799554565701559,
"eval_recall_macro": 0.6065148418089594,
"eval_runtime": 39.2963,
"eval_samples_per_second": 11.426,
"eval_steps_per_second": 1.451,
"eval_weighted_fpr": 0.07712082262210797,
"eval_weighted_sensitivity": 0.799554565701559,
"eval_weighted_specificity": 0.8417192118907049,
"step": 448
},
{
"epoch": 2.232142857142857,
"grad_norm": 10.089143753051758,
"learning_rate": 4.6302083333333335e-05,
"loss": 0.6512,
"step": 500
},
{
"epoch": 3.0,
"eval_accuracy": 0.7906458797327395,
"eval_f1_macro": 0.5840451851613266,
"eval_f1_micro": 0.7906458797327395,
"eval_f1_weighted": 0.771952482046502,
"eval_loss": 0.8587548136711121,
"eval_macro_fpr": 0.10045553338392213,
"eval_macro_sensitivity": 0.5989408048231577,
"eval_macro_specificity": 0.9104668136432382,
"eval_precision": 0.7597703984690992,
"eval_precision_macro": 0.5770004879708264,
"eval_recall": 0.7906458797327395,
"eval_recall_macro": 0.5989408048231577,
"eval_runtime": 36.0068,
"eval_samples_per_second": 12.47,
"eval_steps_per_second": 1.583,
"eval_weighted_fpr": 0.0811044003451251,
"eval_weighted_sensitivity": 0.7906458797327395,
"eval_weighted_specificity": 0.8512213748402133,
"step": 672
},
{
"epoch": 4.0,
"eval_accuracy": 0.7817371937639198,
"eval_f1_macro": 0.6299493260025852,
"eval_f1_micro": 0.7817371937639198,
"eval_f1_weighted": 0.7804892003577936,
"eval_loss": 1.0820659399032593,
"eval_macro_fpr": 0.09955325556886446,
"eval_macro_sensitivity": 0.6429130620307091,
"eval_macro_specificity": 0.9124114631310538,
"eval_precision": 0.7819490155060428,
"eval_precision_macro": 0.6213857962213225,
"eval_recall": 0.7817371937639198,
"eval_recall_macro": 0.6429130620307091,
"eval_runtime": 32.7545,
"eval_samples_per_second": 13.708,
"eval_steps_per_second": 1.74,
"eval_weighted_fpr": 0.08514335360556038,
"eval_weighted_sensitivity": 0.7817371937639198,
"eval_weighted_specificity": 0.8679086587602954,
"step": 896
},
{
"epoch": 4.464285714285714,
"grad_norm": 0.3640059232711792,
"learning_rate": 4.258184523809524e-05,
"loss": 0.3466,
"step": 1000
},
{
"epoch": 5.0,
"eval_accuracy": 0.8084632516703786,
"eval_f1_macro": 0.619470115868435,
"eval_f1_micro": 0.8084632516703786,
"eval_f1_weighted": 0.7927603955642376,
"eval_loss": 1.0612273216247559,
"eval_macro_fpr": 0.09480480467421379,
"eval_macro_sensitivity": 0.6262706556824204,
"eval_macro_specificity": 0.9138770264258179,
"eval_precision": 0.7999415514782998,
"eval_precision_macro": 0.7128659611992946,
"eval_recall": 0.8084632516703786,
"eval_recall_macro": 0.6262706556824204,
"eval_runtime": 34.7281,
"eval_samples_per_second": 12.929,
"eval_steps_per_second": 1.641,
"eval_weighted_fpr": 0.07319148936170213,
"eval_weighted_sensitivity": 0.8084632516703786,
"eval_weighted_specificity": 0.847044854032893,
"step": 1120
},
{
"epoch": 6.0,
"eval_accuracy": 0.7928730512249443,
"eval_f1_macro": 0.6273476992208005,
"eval_f1_micro": 0.7928730512249443,
"eval_f1_weighted": 0.7896519709076985,
"eval_loss": 1.2559400796890259,
"eval_macro_fpr": 0.09508832825281638,
"eval_macro_sensitivity": 0.6361528640940406,
"eval_macro_specificity": 0.9161350599199577,
"eval_precision": 0.7876580739535682,
"eval_precision_macro": 0.6205792331164909,
"eval_recall": 0.7928730512249443,
"eval_recall_macro": 0.6361528640940406,
"eval_runtime": 38.0322,
"eval_samples_per_second": 11.806,
"eval_steps_per_second": 1.499,
"eval_weighted_fpr": 0.08010335917312661,
"eval_weighted_sensitivity": 0.7928730512249443,
"eval_weighted_specificity": 0.8716671884548861,
"step": 1344
}
],
"logging_steps": 500,
"max_steps": 6720,
"num_input_tokens_seen": 0,
"num_train_epochs": 30,
"save_steps": 500,
"total_flos": 2829020867592192.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}