{
  "epoch": 8.33,
  "eval_accuracy": 0.45301927514806384,
  "eval_loss": 3.091063976287842,
  "eval_runtime": 653.704,
  "eval_samples": 308356,
  "eval_samples_per_second": 471.706,
  "eval_steps_per_second": 3.804,
  "perplexity": 22.00047350954521,
  "train_loss": 4.550724849134638,
  "train_runtime": 197998.9321,
  "train_samples": 5858758,
  "train_samples_per_second": 2958.985,
  "train_steps_per_second": 23.863
}