{
  "epoch": 1.0,
  "eval_loss": 1.8534812927246094,
  "eval_runtime": 31.7929,
  "eval_samples_per_second": 13.745,
  "eval_steps_per_second": 1.73,
  "perplexity": 6.381998499391311,
  "total_flos": 4.13804323012608e+16,
  "train_loss": 2.0515993006877538,
  "train_runtime": 708.674,
  "train_samples_per_second": 6.426,
  "train_steps_per_second": 3.213
}