{ "best_metric": 2.967562437057495, "best_model_checkpoint": "flan-t5-base-flant5-apple-support/checkpoint-5785", "epoch": 5.0, "global_step": 5785, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.43, "learning_rate": 4.567847882454624e-05, "loss": 3.3318, "step": 500 }, { "epoch": 0.86, "learning_rate": 4.135695764909248e-05, "loss": 3.2673, "step": 1000 }, { "epoch": 1.0, "eval_gen_len": 18.972318339100347, "eval_loss": 3.0350406169891357, "eval_rouge1": 12.4094, "eval_rouge2": 2.1794, "eval_rougeL": 9.5255, "eval_rougeLsum": 10.9739, "eval_runtime": 319.5992, "eval_samples_per_second": 14.468, "eval_steps_per_second": 1.809, "step": 1157 }, { "epoch": 1.3, "learning_rate": 3.7035436473638726e-05, "loss": 3.2145, "step": 1500 }, { "epoch": 1.73, "learning_rate": 3.271391529818496e-05, "loss": 3.1854, "step": 2000 }, { "epoch": 2.0, "eval_gen_len": 18.964749134948097, "eval_loss": 2.9991722106933594, "eval_rouge1": 12.4579, "eval_rouge2": 2.1512, "eval_rougeL": 9.5232, "eval_rougeLsum": 11.0049, "eval_runtime": 319.123, "eval_samples_per_second": 14.49, "eval_steps_per_second": 1.811, "step": 2314 }, { "epoch": 2.16, "learning_rate": 2.8392394122731204e-05, "loss": 3.1388, "step": 2500 }, { "epoch": 2.59, "learning_rate": 2.4070872947277444e-05, "loss": 3.1006, "step": 3000 }, { "epoch": 3.0, "eval_gen_len": 18.9435553633218, "eval_loss": 2.9792306423187256, "eval_rouge1": 12.9794, "eval_rouge2": 2.2794, "eval_rougeL": 9.9245, "eval_rougeLsum": 11.5019, "eval_runtime": 317.3217, "eval_samples_per_second": 14.572, "eval_steps_per_second": 1.821, "step": 3471 }, { "epoch": 3.03, "learning_rate": 1.9749351771823683e-05, "loss": 3.1209, "step": 3500 }, { "epoch": 3.46, "learning_rate": 1.5427830596369925e-05, "loss": 3.0729, "step": 4000 }, { "epoch": 3.89, "learning_rate": 1.1106309420916162e-05, "loss": 3.0751, "step": 4500 }, { "epoch": 4.0, "eval_gen_len": 18.91371107266436, "eval_loss": 2.971137762069702, "eval_rouge1": 12.6779, "eval_rouge2": 2.1828, "eval_rougeL": 9.6962, "eval_rougeLsum": 11.221, "eval_runtime": 320.2879, "eval_samples_per_second": 14.437, "eval_steps_per_second": 1.805, "step": 4628 }, { "epoch": 4.32, "learning_rate": 6.784788245462403e-06, "loss": 3.0641, "step": 5000 }, { "epoch": 4.75, "learning_rate": 2.4632670700086435e-06, "loss": 3.0532, "step": 5500 }, { "epoch": 5.0, "eval_gen_len": 18.908737024221452, "eval_loss": 2.967562437057495, "eval_rouge1": 12.7991, "eval_rouge2": 2.244, "eval_rougeL": 9.8075, "eval_rougeLsum": 11.3618, "eval_runtime": 318.8859, "eval_samples_per_second": 14.5, "eval_steps_per_second": 1.813, "step": 5785 } ], "max_steps": 5785, "num_train_epochs": 5, "total_flos": 3.166660376395776e+16, "trial_name": null, "trial_params": null }