{ "best_metric": 0.5913567856292314, "best_model_checkpoint": "case-analysis-bert-base-uncased/checkpoint-448", "epoch": 3.0, "eval_steps": 500, "global_step": 672, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7861915367483296, "eval_f1_macro": 0.5606209513919795, "eval_f1_micro": 0.7861915367483298, "eval_f1_weighted": 0.7596863457967054, "eval_loss": 0.7283128499984741, "eval_macro_fpr": 0.1142150114777894, "eval_macro_sensitivity": 0.5571958513134984, "eval_macro_specificity": 0.8974437739369907, "eval_precision": 0.7487100743874461, "eval_precision_macro": 0.584767668299669, "eval_recall": 0.7861915367483296, "eval_recall_macro": 0.5571958513134984, "eval_runtime": 9.7006, "eval_samples_per_second": 46.286, "eval_steps_per_second": 5.876, "eval_weighted_fpr": 0.08311688311688312, "eval_weighted_sensitivity": 0.7861915367483296, "eval_weighted_specificity": 0.8035835589996332, "step": 224 }, { "epoch": 2.0, "eval_accuracy": 0.799554565701559, "eval_f1_macro": 0.5913567856292314, "eval_f1_micro": 0.799554565701559, "eval_f1_weighted": 0.7794312570974847, "eval_loss": 0.816001296043396, "eval_macro_fpr": 0.09972743460349152, "eval_macro_sensitivity": 0.6065148418089594, "eval_macro_specificity": 0.910318444398066, "eval_precision": 0.7603126937076594, "eval_precision_macro": 0.5769576335614072, "eval_recall": 0.799554565701559, "eval_recall_macro": 0.6065148418089594, "eval_runtime": 39.2963, "eval_samples_per_second": 11.426, "eval_steps_per_second": 1.451, "eval_weighted_fpr": 0.07712082262210797, "eval_weighted_sensitivity": 0.799554565701559, "eval_weighted_specificity": 0.8417192118907049, "step": 448 }, { "epoch": 2.232142857142857, "grad_norm": 10.089143753051758, "learning_rate": 4.6302083333333335e-05, "loss": 0.6512, "step": 500 }, { "epoch": 3.0, "eval_accuracy": 0.7906458797327395, "eval_f1_macro": 0.5840451851613266, "eval_f1_micro": 0.7906458797327395, "eval_f1_weighted": 0.771952482046502, "eval_loss": 0.8587548136711121, "eval_macro_fpr": 0.10045553338392213, "eval_macro_sensitivity": 0.5989408048231577, "eval_macro_specificity": 0.9104668136432382, "eval_precision": 0.7597703984690992, "eval_precision_macro": 0.5770004879708264, "eval_recall": 0.7906458797327395, "eval_recall_macro": 0.5989408048231577, "eval_runtime": 36.0068, "eval_samples_per_second": 12.47, "eval_steps_per_second": 1.583, "eval_weighted_fpr": 0.0811044003451251, "eval_weighted_sensitivity": 0.7906458797327395, "eval_weighted_specificity": 0.8512213748402133, "step": 672 } ], "logging_steps": 500, "max_steps": 6720, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 500, "total_flos": 1414510433796096.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }