{ "epoch": 1.0, "eval_loss": 1.9632289409637451, "eval_runtime": 43.6749, "eval_samples_per_second": 22.255, "eval_steps_per_second": 2.793, "perplexity": 7.122287422001887, "total_flos": 7.999917391872e+16, "train_loss": 2.1433237489238244, "train_runtime": 1165.6218, "train_samples_per_second": 7.536, "train_steps_per_second": 3.768 }