{ | |
"epoch": 315.7894736842105, | |
"eval_accuracy": 0.8340939202119829, | |
"eval_loss": 1.1156361103057861, | |
"eval_runtime": 0.9791, | |
"eval_samples": 399, | |
"eval_samples_per_second": 407.517, | |
"eval_steps_per_second": 13.277, | |
"perplexity": 3.051508658043527, | |
"total_flos": 6.261324507818496e+16, | |
"train_loss": 0.5399098532358806, | |
"train_runtime": 6604.7234, | |
"train_samples": 3012, | |
"train_samples_per_second": 145.351, | |
"train_steps_per_second": 4.542 | |
} |