{ | |
"epoch": 0.9998717955292536, | |
"eval_accuracy": 0.23258101286435434, | |
"eval_loss": 5.188788890838623, | |
"eval_runtime": 128.0489, | |
"eval_samples": 300, | |
"eval_samples_per_second": 2.343, | |
"eval_steps_per_second": 1.171, | |
"num_input_tokens_seen": 798621696, | |
"perplexity": 179.25132849100459, | |
"total_flos": 4.855554488590664e+17, | |
"train_loss": 5.304058988399935, | |
"train_runtime": 127910.3478, | |
"train_samples": 390002, | |
"train_samples_per_second": 3.049, | |
"train_steps_per_second": 0.048 | |
} |