{ "epoch": 12.63, "eval_loss": 0.018954848870635033, "eval_runtime": 3.0784, "eval_samples_per_second": 43.204, "eval_steps_per_second": 0.975, "total_flos": 4.9113822316304794e+17, "train_loss": 0.24218196471532186, "train_runtime": 426.607, "train_samples_per_second": 41.982, "train_steps_per_second": 0.141 }