{ "epoch": 0.18, "eval_loss": 7.917535781860352, "eval_runtime": 1151.6067, "eval_samples": 8626, "eval_samples_per_second": 7.49, "eval_steps_per_second": 7.49, "perplexity": 2744.998429631847, "train_loss": 9.09298583984375, "train_runtime": 7786.6651, "train_samples": 141300, "train_samples_per_second": 3.288, "train_steps_per_second": 0.013 }