{ | |
"epoch": 1.0, | |
"eval_loss": 1.079127550125122, | |
"eval_runtime": 187.0771, | |
"eval_samples": 25000, | |
"eval_samples_per_second": 133.635, | |
"eval_steps_per_second": 16.704, | |
"perplexity": 2.9421115861328713, | |
"total_flos": 3.641341261824e+16, | |
"train_loss": 1.3328714208984376, | |
"train_runtime": 7223.6875, | |
"train_samples": 200000, | |
"train_samples_per_second": 27.687, | |
"train_steps_per_second": 0.433 | |
} |