{
  "epoch": 5.05,
  "eval_loss": 1.942165732383728,
  "eval_runtime": 459.5033,
  "eval_samples": 400000,
  "eval_samples_per_second": 870.505,
  "eval_steps_per_second": 54.407,
  "perplexity": 6.97383809440389,
  "train_loss": 2.0860133251953124,
  "train_runtime": 289964.3288,
  "train_samples": 7600000,
  "train_samples_per_second": 132.43,
  "train_steps_per_second": 8.277
}