{ "epoch": 6.74, "eval_loss": 2.268062114715576, "eval_runtime": 340.6941, "eval_samples": 300000, "eval_samples_per_second": 880.555, "eval_steps_per_second": 55.035, "perplexity": 9.660661408946421, "train_loss": 2.4076748518880207, "train_runtime": 247856.7094, "train_samples": 5700001, "train_samples_per_second": 154.928, "train_steps_per_second": 9.683 }