{ "epoch": 1.0, "eval_accuracy": 0.36165373273858764, "eval_loss": 3.583437442779541, "eval_runtime": 4627.9586, "eval_samples": 419639, "eval_samples_per_second": 90.675, "eval_steps_per_second": 1.417, "perplexity": 35.99706627518808, "train_loss": 3.8837062227938306, "train_runtime": 230124.717, "train_samples": 7975299, "train_samples_per_second": 34.656, "train_steps_per_second": 1.083 }