{ "epoch": 1.0, "eval_loss": 1.8534812927246094, "eval_runtime": 31.7929, "eval_samples_per_second": 13.745, "eval_steps_per_second": 1.73, "perplexity": 6.381998499391311, "total_flos": 4.13804323012608e+16, "train_loss": 2.0515993006877538, "train_runtime": 708.674, "train_samples_per_second": 6.426, "train_steps_per_second": 3.213 }