{ "epoch": 0.99968, "eval_loss": 1.097437858581543, "eval_runtime": 230.0389, "eval_samples": 12500, "eval_samples_per_second": 54.339, "eval_steps_per_second": 6.795, "perplexity": 2.9964787778596422, "total_flos": 6.457467788899123e+16, "train_loss": 1.3367621437688184, "train_runtime": 11215.3396, "train_samples": 100000, "train_samples_per_second": 8.916, "train_steps_per_second": 0.139 }