{ "epoch": 1.0, "total_flos": 4.209776888119296e+16, "train_loss": 0.4081730590820313, "train_runtime": 544.5651, "train_samples": 160000, "train_samples_per_second": 293.812, "train_steps_per_second": 1.148, "train_tokens_per_second": 18803.995 }