{
    "epoch": 19.86,
    "eval_loss": 2.3477182388305664,
    "eval_runtime": 514.3522,
    "eval_samples": 4906,
    "eval_samples_per_second": 9.538,
    "eval_steps_per_second": 4.769,
    "perplexity": 10.461671434354535,
    "train_loss": 2.42385498046875,
    "train_runtime": 61408.2472,
    "train_samples": 10000,
    "train_samples_per_second": 3.257,
    "train_steps_per_second": 0.407
}