{ "best_metric": 0.6528931773500395, "best_model_checkpoint": "case-analysis-bert-base-uncased/checkpoint-2912", "epoch": 13.0, "eval_steps": 500, "global_step": 2912, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7861915367483296, "eval_f1_macro": 0.5606209513919795, "eval_f1_micro": 0.7861915367483298, "eval_f1_weighted": 0.7596863457967054, "eval_loss": 0.7283128499984741, "eval_macro_fpr": 0.1142150114777894, "eval_macro_sensitivity": 0.5571958513134984, "eval_macro_specificity": 0.8974437739369907, "eval_precision": 0.7487100743874461, "eval_precision_macro": 0.584767668299669, "eval_recall": 0.7861915367483296, "eval_recall_macro": 0.5571958513134984, "eval_runtime": 9.7006, "eval_samples_per_second": 46.286, "eval_steps_per_second": 5.876, "eval_weighted_fpr": 0.08311688311688312, "eval_weighted_sensitivity": 0.7861915367483296, "eval_weighted_specificity": 0.8035835589996332, "step": 224 }, { "epoch": 2.0, "eval_accuracy": 0.799554565701559, "eval_f1_macro": 0.5913567856292314, "eval_f1_micro": 0.799554565701559, "eval_f1_weighted": 0.7794312570974847, "eval_loss": 0.816001296043396, "eval_macro_fpr": 0.09972743460349152, "eval_macro_sensitivity": 0.6065148418089594, "eval_macro_specificity": 0.910318444398066, "eval_precision": 0.7603126937076594, "eval_precision_macro": 0.5769576335614072, "eval_recall": 0.799554565701559, "eval_recall_macro": 0.6065148418089594, "eval_runtime": 39.2963, "eval_samples_per_second": 11.426, "eval_steps_per_second": 1.451, "eval_weighted_fpr": 0.07712082262210797, "eval_weighted_sensitivity": 0.799554565701559, "eval_weighted_specificity": 0.8417192118907049, "step": 448 }, { "epoch": 2.232142857142857, "grad_norm": 10.089143753051758, "learning_rate": 4.6302083333333335e-05, "loss": 0.6512, "step": 500 }, { "epoch": 3.0, "eval_accuracy": 0.7906458797327395, "eval_f1_macro": 0.5840451851613266, "eval_f1_micro": 0.7906458797327395, "eval_f1_weighted": 0.771952482046502, "eval_loss": 0.8587548136711121, "eval_macro_fpr": 0.10045553338392213, "eval_macro_sensitivity": 0.5989408048231577, "eval_macro_specificity": 0.9104668136432382, "eval_precision": 0.7597703984690992, "eval_precision_macro": 0.5770004879708264, "eval_recall": 0.7906458797327395, "eval_recall_macro": 0.5989408048231577, "eval_runtime": 36.0068, "eval_samples_per_second": 12.47, "eval_steps_per_second": 1.583, "eval_weighted_fpr": 0.0811044003451251, "eval_weighted_sensitivity": 0.7906458797327395, "eval_weighted_specificity": 0.8512213748402133, "step": 672 }, { "epoch": 4.0, "eval_accuracy": 0.7817371937639198, "eval_f1_macro": 0.6299493260025852, "eval_f1_micro": 0.7817371937639198, "eval_f1_weighted": 0.7804892003577936, "eval_loss": 1.0820659399032593, "eval_macro_fpr": 0.09955325556886446, "eval_macro_sensitivity": 0.6429130620307091, "eval_macro_specificity": 0.9124114631310538, "eval_precision": 0.7819490155060428, "eval_precision_macro": 0.6213857962213225, "eval_recall": 0.7817371937639198, "eval_recall_macro": 0.6429130620307091, "eval_runtime": 32.7545, "eval_samples_per_second": 13.708, "eval_steps_per_second": 1.74, "eval_weighted_fpr": 0.08514335360556038, "eval_weighted_sensitivity": 0.7817371937639198, "eval_weighted_specificity": 0.8679086587602954, "step": 896 }, { "epoch": 4.464285714285714, "grad_norm": 0.3640059232711792, "learning_rate": 4.258184523809524e-05, "loss": 0.3466, "step": 1000 }, { "epoch": 5.0, "eval_accuracy": 0.8084632516703786, "eval_f1_macro": 0.619470115868435, "eval_f1_micro": 0.8084632516703786, "eval_f1_weighted": 0.7927603955642376, "eval_loss": 1.0612273216247559, "eval_macro_fpr": 0.09480480467421379, "eval_macro_sensitivity": 0.6262706556824204, "eval_macro_specificity": 0.9138770264258179, "eval_precision": 0.7999415514782998, "eval_precision_macro": 0.7128659611992946, "eval_recall": 0.8084632516703786, "eval_recall_macro": 0.6262706556824204, "eval_runtime": 34.7281, "eval_samples_per_second": 12.929, "eval_steps_per_second": 1.641, "eval_weighted_fpr": 0.07319148936170213, "eval_weighted_sensitivity": 0.8084632516703786, "eval_weighted_specificity": 0.847044854032893, "step": 1120 }, { "epoch": 6.0, "eval_accuracy": 0.7928730512249443, "eval_f1_macro": 0.6273476992208005, "eval_f1_micro": 0.7928730512249443, "eval_f1_weighted": 0.7896519709076985, "eval_loss": 1.2559400796890259, "eval_macro_fpr": 0.09508832825281638, "eval_macro_sensitivity": 0.6361528640940406, "eval_macro_specificity": 0.9161350599199577, "eval_precision": 0.7876580739535682, "eval_precision_macro": 0.6205792331164909, "eval_recall": 0.7928730512249443, "eval_recall_macro": 0.6361528640940406, "eval_runtime": 38.0322, "eval_samples_per_second": 11.806, "eval_steps_per_second": 1.499, "eval_weighted_fpr": 0.08010335917312661, "eval_weighted_sensitivity": 0.7928730512249443, "eval_weighted_specificity": 0.8716671884548861, "step": 1344 }, { "epoch": 6.696428571428571, "grad_norm": 0.05509716644883156, "learning_rate": 3.8869047619047625e-05, "loss": 0.1715, "step": 1500 }, { "epoch": 7.0, "eval_accuracy": 0.7928730512249443, "eval_f1_macro": 0.623650691198171, "eval_f1_micro": 0.7928730512249443, "eval_f1_weighted": 0.7892792124992886, "eval_loss": 1.3700848817825317, "eval_macro_fpr": 0.09905686727492574, "eval_macro_sensitivity": 0.6178801987625516, "eval_macro_specificity": 0.9121558558439, "eval_precision": 0.7889374292245007, "eval_precision_macro": 0.6344745555953697, "eval_recall": 0.7928730512249443, "eval_recall_macro": 0.6178801987625516, "eval_runtime": 38.6276, "eval_samples_per_second": 11.624, "eval_steps_per_second": 1.476, "eval_weighted_fpr": 0.08010335917312661, "eval_weighted_sensitivity": 0.7928730512249443, "eval_weighted_specificity": 0.8557503721506562, "step": 1568 }, { "epoch": 8.0, "eval_accuracy": 0.8106904231625836, "eval_f1_macro": 0.6464437798898967, "eval_f1_micro": 0.8106904231625834, "eval_f1_weighted": 0.8064189899649085, "eval_loss": 1.4005118608474731, "eval_macro_fpr": 0.0921754708102674, "eval_macro_sensitivity": 0.6370398282162988, "eval_macro_specificity": 0.9178527413440807, "eval_precision": 0.8034816923327339, "eval_precision_macro": 0.6578060011883542, "eval_recall": 0.8106904231625836, "eval_recall_macro": 0.6370398282162988, "eval_runtime": 35.6698, "eval_samples_per_second": 12.588, "eval_steps_per_second": 1.598, "eval_weighted_fpr": 0.07221750212404418, "eval_weighted_sensitivity": 0.8106904231625836, "eval_weighted_specificity": 0.860720542213739, "step": 1792 }, { "epoch": 8.928571428571429, "grad_norm": 0.005432427860796452, "learning_rate": 3.514880952380952e-05, "loss": 0.0636, "step": 2000 }, { "epoch": 9.0, "eval_accuracy": 0.8017817371937639, "eval_f1_macro": 0.6263115408785538, "eval_f1_micro": 0.8017817371937639, "eval_f1_weighted": 0.7896240754364972, "eval_loss": 1.473650336265564, "eval_macro_fpr": 0.10259295399855256, "eval_macro_sensitivity": 0.6149052987288282, "eval_macro_specificity": 0.9072211454744684, "eval_precision": 0.788055851480147, "eval_precision_macro": 0.6582800876341822, "eval_recall": 0.8017817371937639, "eval_recall_macro": 0.6149052987288282, "eval_runtime": 34.11, "eval_samples_per_second": 13.163, "eval_steps_per_second": 1.671, "eval_weighted_fpr": 0.07613344739093242, "eval_weighted_sensitivity": 0.8017817371937639, "eval_weighted_specificity": 0.8271028447041098, "step": 2016 }, { "epoch": 10.0, "eval_accuracy": 0.7884187082405345, "eval_f1_macro": 0.6331690370327951, "eval_f1_micro": 0.7884187082405345, "eval_f1_weighted": 0.7909426185077314, "eval_loss": 1.7568920850753784, "eval_macro_fpr": 0.09595908153187079, "eval_macro_sensitivity": 0.6428373560726501, "eval_macro_specificity": 0.91584307980206, "eval_precision": 0.7961677526311304, "eval_precision_macro": 0.6275270485563467, "eval_recall": 0.7884187082405345, "eval_recall_macro": 0.6428373560726501, "eval_runtime": 42.7436, "eval_samples_per_second": 10.504, "eval_steps_per_second": 1.334, "eval_weighted_fpr": 0.08210890233362143, "eval_weighted_sensitivity": 0.7884187082405345, "eval_weighted_specificity": 0.8749536109677053, "step": 2240 }, { "epoch": 11.0, "eval_accuracy": 0.7906458797327395, "eval_f1_macro": 0.6101321036639349, "eval_f1_micro": 0.7906458797327395, "eval_f1_weighted": 0.7845175231806186, "eval_loss": 1.7140623331069946, "eval_macro_fpr": 0.1035198920558284, "eval_macro_sensitivity": 0.6082973730032554, "eval_macro_specificity": 0.9082706582818566, "eval_precision": 0.7824040660397941, "eval_precision_macro": 0.6165716760629552, "eval_recall": 0.7906458797327395, "eval_recall_macro": 0.6082973730032554, "eval_runtime": 37.438, "eval_samples_per_second": 11.993, "eval_steps_per_second": 1.523, "eval_weighted_fpr": 0.0811044003451251, "eval_weighted_sensitivity": 0.7906458797327395, "eval_weighted_specificity": 0.842436753394687, "step": 2464 }, { "epoch": 11.160714285714286, "grad_norm": 0.0017704592319205403, "learning_rate": 3.142857142857143e-05, "loss": 0.0159, "step": 2500 }, { "epoch": 12.0, "eval_accuracy": 0.7951002227171492, "eval_f1_macro": 0.6372747490500124, "eval_f1_micro": 0.7951002227171492, "eval_f1_weighted": 0.7916670590899947, "eval_loss": 1.714410662651062, "eval_macro_fpr": 0.09685632952239012, "eval_macro_sensitivity": 0.6412759206876854, "eval_macro_specificity": 0.9140152346037369, "eval_precision": 0.7913770752065027, "eval_precision_macro": 0.6393393002684569, "eval_recall": 0.7951002227171492, "eval_recall_macro": 0.6412759206876854, "eval_runtime": 34.7517, "eval_samples_per_second": 12.92, "eval_steps_per_second": 1.64, "eval_weighted_fpr": 0.07910576096302666, "eval_weighted_sensitivity": 0.7951002227171492, "eval_weighted_specificity": 0.8609607156977986, "step": 2688 }, { "epoch": 13.0, "eval_accuracy": 0.799554565701559, "eval_f1_macro": 0.6528931773500395, "eval_f1_micro": 0.799554565701559, "eval_f1_weighted": 0.798188843376642, "eval_loss": 1.7243342399597168, "eval_macro_fpr": 0.09420589017594908, "eval_macro_sensitivity": 0.6525655716832187, "eval_macro_specificity": 0.9158469519501292, "eval_precision": 0.7968817042081011, "eval_precision_macro": 0.6534600751896625, "eval_recall": 0.799554565701559, "eval_recall_macro": 0.6525655716832187, "eval_runtime": 35.7184, "eval_samples_per_second": 12.571, "eval_steps_per_second": 1.596, "eval_weighted_fpr": 0.07712082262210797, "eval_weighted_sensitivity": 0.799554565701559, "eval_weighted_specificity": 0.8638332420989578, "step": 2912 } ], "logging_steps": 500, "max_steps": 6720, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 500, "total_flos": 6129545213116416.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }