{ | |
"epoch": 3.0, | |
"eval_accuracy": 0.2825701437173418, | |
"eval_loss": 4.0273261070251465, | |
"eval_runtime": 215.7835, | |
"eval_samples": 19045, | |
"eval_samples_per_second": 88.26, | |
"eval_steps_per_second": 2.762, | |
"perplexity": 56.11067653706432, | |
"total_flos": 1.44589665695957e+17, | |
"train_loss": 4.469071887788319, | |
"train_runtime": 13360.3551, | |
"train_samples": 175606, | |
"train_samples_per_second": 39.431, | |
"train_steps_per_second": 1.232 | |
} |