{ "best_metric": 0.9282467532467532, "best_model_checkpoint": "mpnet-metric/checkpoint-1400", "epoch": 36.36363636363637, "global_step": 1600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 2.27, "eval_accuracy": 0.8194805194805195, "eval_f1": 0.7656701166780793, "eval_loss": 1.9282063245773315, "eval_matthews_correlation": 0.8177401806097793, "eval_runtime": 2.1248, "eval_samples_per_second": 1449.542, "eval_steps_per_second": 9.413, "step": 100 }, { "epoch": 4.55, "eval_accuracy": 0.8603896103896104, "eval_f1": 0.8221385737164676, "eval_loss": 1.785994529724121, "eval_matthews_correlation": 0.8588446795045349, "eval_runtime": 2.1571, "eval_samples_per_second": 1427.834, "eval_steps_per_second": 9.272, "step": 200 }, { "epoch": 6.82, "eval_accuracy": 0.8831168831168831, "eval_f1": 0.8503152420049573, "eval_loss": 1.703816533088684, "eval_matthews_correlation": 0.8817033568232515, "eval_runtime": 2.2955, "eval_samples_per_second": 1341.777, "eval_steps_per_second": 8.713, "step": 300 }, { "epoch": 9.09, "eval_accuracy": 0.8948051948051948, "eval_f1": 0.8658511061420076, "eval_loss": 1.5578949451446533, "eval_matthews_correlation": 0.893469940479661, "eval_runtime": 2.1159, "eval_samples_per_second": 1455.648, "eval_steps_per_second": 9.452, "step": 400 }, { "epoch": 11.36, "learning_rate": 2.91576008814464e-05, "loss": 1.3674, "step": 500 }, { "epoch": 11.36, "eval_accuracy": 0.9084415584415585, "eval_f1": 0.8884952022189863, "eval_loss": 1.6358195543289185, "eval_matthews_correlation": 0.9072261203467101, "eval_runtime": 2.0369, "eval_samples_per_second": 1512.102, "eval_steps_per_second": 9.819, "step": 500 }, { "epoch": 13.64, "eval_accuracy": 0.9191558441558442, "eval_f1": 0.9087017801267994, "eval_loss": 1.6092149019241333, "eval_matthews_correlation": 0.9180607280357055, "eval_runtime": 2.2317, "eval_samples_per_second": 1380.116, "eval_steps_per_second": 8.962, "step": 600 }, { "epoch": 15.91, "eval_accuracy": 0.9237012987012987, "eval_f1": 0.9173470137032593, "eval_loss": 1.6759223937988281, "eval_matthews_correlation": 0.92267900847975, "eval_runtime": 2.1403, "eval_samples_per_second": 1439.027, "eval_steps_per_second": 9.344, "step": 700 }, { "epoch": 18.18, "eval_accuracy": 0.922077922077922, "eval_f1": 0.9224956919233739, "eval_loss": 1.7042781114578247, "eval_matthews_correlation": 0.9210156723561079, "eval_runtime": 2.1182, "eval_samples_per_second": 1454.06, "eval_steps_per_second": 9.442, "step": 800 }, { "epoch": 20.45, "eval_accuracy": 0.9256493506493506, "eval_f1": 0.9250031430609338, "eval_loss": 1.618914246559143, "eval_matthews_correlation": 0.9246330543218574, "eval_runtime": 2.1102, "eval_samples_per_second": 1459.597, "eval_steps_per_second": 9.478, "step": 900 }, { "epoch": 22.73, "learning_rate": 1.758712434118989e-05, "loss": 0.4113, "step": 1000 }, { "epoch": 22.73, "eval_accuracy": 0.9272727272727272, "eval_f1": 0.9262478178442993, "eval_loss": 1.6726940870285034, "eval_matthews_correlation": 0.9262802775880362, "eval_runtime": 2.3947, "eval_samples_per_second": 1286.193, "eval_steps_per_second": 8.352, "step": 1000 }, { "epoch": 25.0, "eval_accuracy": 0.9282467532467532, "eval_f1": 0.9285902214751346, "eval_loss": 1.7208188772201538, "eval_matthews_correlation": 0.9272760959410294, "eval_runtime": 2.0547, "eval_samples_per_second": 1498.986, "eval_steps_per_second": 9.734, "step": 1100 }, { "epoch": 27.27, "eval_accuracy": 0.9272727272727272, "eval_f1": 0.9269182576494233, "eval_loss": 1.7480313777923584, "eval_matthews_correlation": 0.9262735351894748, "eval_runtime": 2.0774, "eval_samples_per_second": 1482.597, "eval_steps_per_second": 9.627, "step": 1200 }, { "epoch": 29.55, "eval_accuracy": 0.9262987012987013, "eval_f1": 0.9262601189689171, "eval_loss": 1.7753738164901733, "eval_matthews_correlation": 0.9252925536787239, "eval_runtime": 2.1885, "eval_samples_per_second": 1407.348, "eval_steps_per_second": 9.139, "step": 1300 }, { "epoch": 31.82, "eval_accuracy": 0.9282467532467532, "eval_f1": 0.9278794105174281, "eval_loss": 1.790648341178894, "eval_matthews_correlation": 0.9272619193360061, "eval_runtime": 2.0054, "eval_samples_per_second": 1535.842, "eval_steps_per_second": 9.973, "step": 1400 }, { "epoch": 34.09, "learning_rate": 6.0166478009333844e-06, "loss": 0.0733, "step": 1500 }, { "epoch": 34.09, "eval_accuracy": 0.9262987012987013, "eval_f1": 0.9263368444227621, "eval_loss": 1.805496335029602, "eval_matthews_correlation": 0.9252900896996127, "eval_runtime": 2.1349, "eval_samples_per_second": 1442.709, "eval_steps_per_second": 9.368, "step": 1500 }, { "epoch": 36.36, "eval_accuracy": 0.9282467532467532, "eval_f1": 0.9281799745185059, "eval_loss": 1.7787483930587769, "eval_matthews_correlation": 0.9272691959664779, "eval_runtime": 2.095, "eval_samples_per_second": 1470.152, "eval_steps_per_second": 9.546, "step": 1600 } ], "max_steps": 1760, "num_train_epochs": 40, "total_flos": 8360620865327346.0, "trial_name": null, "trial_params": null }