{ "epoch": 1.0, "eval_loss": 1.7895774841308594, "eval_runtime": 35.1352, "eval_samples_per_second": 22.143, "eval_steps_per_second": 2.789, "perplexity": 5.986922362210824, "total_flos": 6.253123043328e+16, "train_loss": 1.9996433352507346, "train_runtime": 916.5503, "train_samples_per_second": 7.491, "train_steps_per_second": 3.746 }