{ "epoch": 1.0, "eval_loss": 2.332369565963745, "eval_runtime": 610.6779, "eval_samples_per_second": 135.671, "eval_steps_per_second": 8.481, "perplexity": 10.302324670795207, "total_flos": 6.236990962447417e+18, "train_loss": 2.428118334464832, "train_runtime": 22646.6509, "train_samples_per_second": 29.848, "train_steps_per_second": 1.866 }