{
"epoch": 2.9964796996010326,
"eval_loss": 2.235288619995117,
"eval_runtime": 115.517,
"eval_samples_per_second": 8.198,
"eval_steps_per_second": 4.103,
"perplexity": 9.349179823068619,
"total_flos": 1.1780062420402176e+18,
"train_loss": 2.428264606566656,
"train_runtime": 11538.2228,
"train_samples_per_second": 2.216,
"train_steps_per_second": 0.138
}