{ "best_metric": 1.7180376052856445, "best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/google-flan-t5-small-e-snli-generation-explanation_use_prompt_label-selected-b64/checkpoint-12000", "epoch": 1.3979496738117427, "global_step": 12000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.23, "learning_rate": 0.0004659832246039143, "loss": 1.6051, "step": 2000 }, { "epoch": 0.23, "eval_accuracy": null, "eval_bertscore_f1": 0.9312730214807033, "eval_bleu": 0.39782836950988876, "eval_f1": null, "eval_loss": 1.7780297994613647, "eval_rouge1": 0.5911787258201253, "eval_rouge2": 0.38303308637957223, "eval_rougeL": 0.5377264257708202, "eval_rougeLsum": 0.5395006217014338, "eval_runtime": 168.0702, "eval_samples_per_second": 58.559, "eval_steps_per_second": 0.916, "step": 2000 }, { "epoch": 0.47, "learning_rate": 0.0009319664492078286, "loss": 1.4342, "step": 4000 }, { "epoch": 0.47, "eval_accuracy": null, "eval_bertscore_f1": 0.933153417701039, "eval_bleu": 0.4002469468404885, "eval_f1": null, "eval_loss": 1.7909314632415771, "eval_rouge1": 0.5975097321291585, "eval_rouge2": 0.3847152683676083, "eval_rougeL": 0.5420448625219438, "eval_rougeLsum": 0.5439086899907004, "eval_runtime": 163.5422, "eval_samples_per_second": 60.18, "eval_steps_per_second": 0.942, "step": 4000 }, { "epoch": 0.7, "learning_rate": 0.0009790552803256977, "loss": 1.3804, "step": 6000 }, { "epoch": 0.7, "eval_accuracy": null, "eval_bertscore_f1": 0.9348857560079773, "eval_bleu": 0.41900709929386093, "eval_f1": null, "eval_loss": 1.7246909141540527, "eval_rouge1": 0.616316027086431, "eval_rouge2": 0.4107303410412238, "eval_rougeL": 0.5610382702035865, "eval_rougeLsum": 0.5630504299315114, "eval_runtime": 164.6404, "eval_samples_per_second": 59.779, "eval_steps_per_second": 0.935, "step": 6000 }, { "epoch": 0.93, "learning_rate": 0.0009545298474518076, "loss": 1.3396, "step": 8000 }, { "epoch": 0.93, "eval_accuracy": null, "eval_bertscore_f1": 0.9358202236390555, "eval_bleu": 0.41886081162261424, "eval_f1": null, "eval_loss": 1.7622839212417603, "eval_rouge1": 0.6176280342703749, "eval_rouge2": 0.4078573926320103, "eval_rougeL": 0.5616472881864998, "eval_rougeLsum": 0.563450597865839, "eval_runtime": 154.9703, "eval_samples_per_second": 63.509, "eval_steps_per_second": 0.994, "step": 8000 }, { "epoch": 1.16, "learning_rate": 0.0009300044145779173, "loss": 1.2871, "step": 10000 }, { "epoch": 1.16, "eval_accuracy": null, "eval_bertscore_f1": 0.9358213962977603, "eval_bleu": 0.4193950275310417, "eval_f1": null, "eval_loss": 1.7429882287979126, "eval_rouge1": 0.6213453720058478, "eval_rouge2": 0.4161815104047649, "eval_rougeL": 0.5663236030411948, "eval_rougeLsum": 0.5683627905966635, "eval_runtime": 166.3727, "eval_samples_per_second": 59.156, "eval_steps_per_second": 0.926, "step": 10000 }, { "epoch": 1.4, "learning_rate": 0.0009054789817040271, "loss": 1.2598, "step": 12000 }, { "epoch": 1.4, "eval_accuracy": null, "eval_bertscore_f1": 0.9357474451383859, "eval_bleu": 0.4237575236205067, "eval_f1": null, "eval_loss": 1.7180376052856445, "eval_rouge1": 0.6178787224462856, "eval_rouge2": 0.41096129012621224, "eval_rougeL": 0.5625046403576894, "eval_rougeLsum": 0.5643579355959574, "eval_runtime": 161.2048, "eval_samples_per_second": 61.053, "eval_steps_per_second": 0.955, "step": 12000 } ], "max_steps": 85840, "num_train_epochs": 10, "total_flos": 1.8127294826041344e+16, "trial_name": null, "trial_params": null }