{
  "epoch": 19.995451444166477,
  "eval_accuracy": 0.46725332517112805,
  "eval_loss": 2.7611162662506104,
  "eval_runtime": 117.7988,
  "eval_samples": 59192,
  "eval_samples_per_second": 502.484,
  "eval_steps_per_second": 7.852,
  "perplexity": 15.817489627072094,
  "total_flos": 1.470253944471552e+18,
  "train_loss": 2.893489753646781,
  "train_runtime": 41720.7377,
  "train_samples": 562814,
  "train_samples_per_second": 269.801,
  "train_steps_per_second": 1.054
}