{
"epoch": 1.9985964912280703,
"eval_loss": 0.22910664975643158,
"eval_runtime": 8.378,
"eval_samples": 100,
"eval_samples_per_second": 6.565,
"eval_steps_per_second": 0.836,
"perplexity": 1.2574761413829163,
"raw_train_examples": 78434,
"total_flos": 8.025299762167153e+17,
"train_examples": 39900,
"train_loss": 0.37913749282088366,
"train_runtime": 28381.1385,
"train_samples_per_second": 2.812,
"train_steps_per_second": 0.088
}