{ "epoch": 0.9999893708612791, "eval_accuracy": 0.5884871794871794, "eval_loss": 1.992581844329834, "eval_runtime": 128.1327, "eval_samples": 400, "eval_samples_per_second": 3.122, "eval_steps_per_second": 1.046, "num_input_tokens_seen": 3468165120, "perplexity": 7.334445735052817, "total_flos": 4.540784328132526e+18, "train_loss": 2.065564124978859, "train_runtime": 98524.0638, "train_samples": 846729, "train_samples_per_second": 8.594, "train_steps_per_second": 0.09 }