{ "loss": 1.1535, "learning_rate": 7.5e-05, "epoch": 2.7, "train_runtime": 3302.3968, "train_samples_per_second": 4.12, "train_steps_per_second": 0.004, "total_flos": 1.2484302776303616e+17, "train_loss": 1.434487760066986 }