{ "epoch": 3.0, "eval_accuracy": 0.7105720509450737, "eval_loss": 1.2192070484161377, "eval_runtime": 4409.7065, "eval_samples": 134942, "eval_samples_per_second": 30.601, "eval_steps_per_second": 7.65, "perplexity": 3.384502922346475, "train_loss": 1.4532578269084653, "train_runtime": 40248.475, "train_samples": 134942, "train_samples_per_second": 10.058, "train_steps_per_second": 2.515 }