{ "epoch": 3.0, "eval_accuracy": 0.6906063124235521, "eval_loss": 1.4509799480438232, "eval_runtime": 5230.4957, "eval_samples": 432388, "eval_samples_per_second": 82.667, "eval_steps_per_second": 2.584, "perplexity": 4.267294193497874, "train_loss": 3.0939811468297327, "train_runtime": 276726.3152, "train_samples": 3455772, "train_samples_per_second": 37.464, "train_steps_per_second": 1.171 }