{
"epoch": 20.0,
"eval_accuracy": 0.4232865945768086,
"eval_loss": 3.037959337234497,
"eval_runtime": 112.5812,
"eval_samples": 52440,
"eval_samples_per_second": 465.797,
"eval_steps_per_second": 7.284,
"perplexity": 20.862626181925105,
"total_flos": 1.29957250203648e+18,
"train_loss": 2.656636161733025,
"train_runtime": 44071.5037,
"train_samples": 497364,
"train_samples_per_second": 225.708,
"train_steps_per_second": 7.054
}