{ "epoch": 10.0, "total_flos": 4.0857422266368e+18, "train_loss": 0.24487185467481612, "train_runtime": 1824.5027, "train_samples_per_second": 21.924, "train_steps_per_second": 1.37 }