{ | |
"epoch": 0.18, | |
"eval_loss": 7.917535781860352, | |
"eval_runtime": 1151.6067, | |
"eval_samples": 8626, | |
"eval_samples_per_second": 7.49, | |
"eval_steps_per_second": 7.49, | |
"perplexity": 2744.998429631847, | |
"train_loss": 9.09298583984375, | |
"train_runtime": 7786.6651, | |
"train_samples": 141300, | |
"train_samples_per_second": 3.288, | |
"train_steps_per_second": 0.013 | |
} |