{ "epoch": 1.0, "eval_loss": 2.001368999481201, "eval_runtime": 72.9694, "eval_samples_per_second": 80.061, "eval_steps_per_second": 10.018, "perplexity": 7.3991786401925825, "total_flos": 3.458455817609544e+17, "train_loss": 3.4343306545051546, "train_runtime": 789.0664, "train_samples_per_second": 29.473, "train_steps_per_second": 3.684 }