{ | |
"epoch": 50.0, | |
"eval_accuracy": 0.1519208618470086, | |
"eval_loss": 5.8251872062683105, | |
"eval_runtime": 11.1208, | |
"eval_samples": 3852, | |
"eval_samples_per_second": 346.376, | |
"eval_steps_per_second": 86.594, | |
"perplexity": 338.7245384996336, | |
"total_flos": 5161725447936000.0, | |
"train_loss": 6.140905278960581, | |
"train_runtime": 7883.0646, | |
"train_samples": 76378, | |
"train_samples_per_second": 484.444, | |
"train_steps_per_second": 30.28 | |
} |