{ "epoch": 3.87, "total_flos": 1.8333718891462656e+18, "train_loss": 0.12722260688050566, "train_runtime": 603.2075, "train_samples_per_second": 6.034, "train_steps_per_second": 0.146 }