{ "best_metric": null, "best_model_checkpoint": null, "epoch": 3.0, "global_step": 111, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.19, "learning_rate": 0.00011666666666666668, "loss": 1.2176, "step": 7 }, { "epoch": 0.38, "learning_rate": 0.00019595959595959596, "loss": 0.9247, "step": 14 }, { "epoch": 0.57, "learning_rate": 0.00018181818181818183, "loss": 0.6798, "step": 21 }, { "epoch": 0.76, "learning_rate": 0.00016767676767676768, "loss": 0.5238, "step": 28 }, { "epoch": 0.95, "learning_rate": 0.00015353535353535353, "loss": 0.4068, "step": 35 }, { "epoch": 1.14, "learning_rate": 0.0001393939393939394, "loss": 0.3102, "step": 42 }, { "epoch": 1.32, "learning_rate": 0.00012525252525252527, "loss": 0.2554, "step": 49 }, { "epoch": 1.51, "learning_rate": 0.00011111111111111112, "loss": 0.1935, "step": 56 }, { "epoch": 1.7, "learning_rate": 9.696969696969698e-05, "loss": 0.1378, "step": 63 }, { "epoch": 1.89, "learning_rate": 8.282828282828283e-05, "loss": 0.1465, "step": 70 }, { "epoch": 2.08, "learning_rate": 6.86868686868687e-05, "loss": 0.1331, "step": 77 }, { "epoch": 2.27, "learning_rate": 5.4545454545454546e-05, "loss": 0.1259, "step": 84 }, { "epoch": 2.46, "learning_rate": 4.0404040404040405e-05, "loss": 0.1218, "step": 91 }, { "epoch": 2.65, "learning_rate": 2.6262626262626268e-05, "loss": 0.127, "step": 98 }, { "epoch": 2.84, "learning_rate": 1.2121212121212122e-05, "loss": 0.1137, "step": 105 } ], "max_steps": 111, "num_train_epochs": 3, "total_flos": 9089713377902592.0, "trial_name": null, "trial_params": null }