{ "best_metric": 0.8271405492730209, "best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/mbert/mbert-base-finetuned-masakhaner-kin/checkpoint-1000", "epoch": 38.80597014925373, "global_step": 2600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 2.99, "eval_accuracy_score": 0.9552972731336612, "eval_f1": 0.8061538461538461, "eval_loss": 0.14030461013317108, "eval_precision": 0.7683284457478006, "eval_recall": 0.8478964401294499, "eval_runtime": 4.2191, "eval_samples_per_second": 71.58, "eval_steps_per_second": 9.007, "step": 200 }, { "epoch": 5.97, "eval_accuracy_score": 0.9608106094471762, "eval_f1": 0.8109375, "eval_loss": 0.17163802683353424, "eval_precision": 0.783987915407855, "eval_recall": 0.8398058252427184, "eval_runtime": 4.2278, "eval_samples_per_second": 71.432, "eval_steps_per_second": 8.988, "step": 400 }, { "epoch": 7.46, "learning_rate": 4.865771812080537e-05, "loss": 0.1428, "step": 500 }, { "epoch": 8.96, "eval_accuracy_score": 0.9573834003874236, "eval_f1": 0.7830940988835726, "eval_loss": 0.2280413955450058, "eval_precision": 0.7720125786163522, "eval_recall": 0.7944983818770227, "eval_runtime": 4.2189, "eval_samples_per_second": 71.582, "eval_steps_per_second": 9.007, "step": 600 }, { "epoch": 11.94, "eval_accuracy_score": 0.9605125912680673, "eval_f1": 0.8210862619808306, "eval_loss": 0.22001390159130096, "eval_precision": 0.8107255520504731, "eval_recall": 0.8317152103559871, "eval_runtime": 4.2196, "eval_samples_per_second": 71.571, "eval_steps_per_second": 9.006, "step": 800 }, { "epoch": 14.93, "learning_rate": 4.697986577181208e-05, "loss": 0.0075, "step": 1000 }, { "epoch": 14.93, "eval_accuracy_score": 0.9640888094173745, "eval_f1": 0.8271405492730209, "eval_loss": 0.20800545811653137, "eval_precision": 0.8258064516129032, "eval_recall": 0.8284789644012945, "eval_runtime": 4.2152, "eval_samples_per_second": 71.645, "eval_steps_per_second": 9.015, "step": 1000 }, { "epoch": 17.91, "eval_accuracy_score": 0.9643868275964834, "eval_f1": 0.8350764279967821, "eval_loss": 0.2207585573196411, "eval_precision": 0.8304, "eval_recall": 0.8398058252427184, "eval_runtime": 4.214, "eval_samples_per_second": 71.666, "eval_steps_per_second": 9.018, "step": 1200 }, { "epoch": 20.9, "eval_accuracy_score": 0.9567873640292058, "eval_f1": 0.8034455755677369, "eval_loss": 0.24622981250286102, "eval_precision": 0.7784522003034902, "eval_recall": 0.8300970873786407, "eval_runtime": 4.2176, "eval_samples_per_second": 71.605, "eval_steps_per_second": 9.01, "step": 1400 }, { "epoch": 22.39, "learning_rate": 4.530201342281879e-05, "loss": 0.004, "step": 1500 }, { "epoch": 23.88, "eval_accuracy_score": 0.9658769184920281, "eval_f1": 0.8436763550667713, "eval_loss": 0.22536174952983856, "eval_precision": 0.8198473282442749, "eval_recall": 0.8689320388349514, "eval_runtime": 4.214, "eval_samples_per_second": 71.666, "eval_steps_per_second": 9.018, "step": 1600 }, { "epoch": 26.87, "eval_accuracy_score": 0.9646848457755923, "eval_f1": 0.8192, "eval_loss": 0.20931068062782288, "eval_precision": 0.810126582278481, "eval_recall": 0.8284789644012945, "eval_runtime": 4.2136, "eval_samples_per_second": 71.672, "eval_steps_per_second": 9.018, "step": 1800 }, { "epoch": 29.85, "learning_rate": 4.36241610738255e-05, "loss": 0.0028, "step": 2000 }, { "epoch": 29.85, "eval_accuracy_score": 0.9623007003427209, "eval_f1": 0.822774659182037, "eval_loss": 0.24018673598766327, "eval_precision": 0.8155802861685215, "eval_recall": 0.8300970873786407, "eval_runtime": 4.2137, "eval_samples_per_second": 71.671, "eval_steps_per_second": 9.018, "step": 2000 }, { "epoch": 32.84, "eval_accuracy_score": 0.9564893458500968, "eval_f1": 0.8009630818619582, "eval_loss": 0.26548677682876587, "eval_precision": 0.7945859872611465, "eval_recall": 0.8074433656957929, "eval_runtime": 4.2161, "eval_samples_per_second": 71.63, "eval_steps_per_second": 9.013, "step": 2200 }, { "epoch": 35.82, "eval_accuracy_score": 0.958128445835196, "eval_f1": 0.8034727703235991, "eval_loss": 0.2520817518234253, "eval_precision": 0.7842835130970724, "eval_recall": 0.8236245954692557, "eval_runtime": 4.2073, "eval_samples_per_second": 71.78, "eval_steps_per_second": 9.032, "step": 2400 }, { "epoch": 37.31, "learning_rate": 4.194630872483222e-05, "loss": 0.0033, "step": 2500 }, { "epoch": 38.81, "eval_accuracy_score": 0.9637907912382655, "eval_f1": 0.8270313757039421, "eval_loss": 0.2613898515701294, "eval_precision": 0.8224, "eval_recall": 0.8317152103559871, "eval_runtime": 4.201, "eval_samples_per_second": 71.887, "eval_steps_per_second": 9.045, "step": 2600 }, { "epoch": 38.81, "step": 2600, "total_flos": 1.0731614329737216e+16, "train_loss": 0.0309662873011369, "train_runtime": 2918.4318, "train_samples_per_second": 164.472, "train_steps_per_second": 5.14 } ], "max_steps": 15000, "num_train_epochs": 224, "total_flos": 1.0731614329737216e+16, "trial_name": null, "trial_params": null }