{
"epoch": 19.991464360935595,
"eval_accuracy": 0.47886644176457666,
"eval_loss": 2.683746337890625,
"eval_runtime": 71.9708,
"eval_samples": 60680,
"eval_samples_per_second": 843.12,
"eval_steps_per_second": 13.186,
"perplexity": 14.639836462706617,
"total_flos": 1.507910045663232e+18,
"train_loss": 2.80528530789056,
"train_runtime": 30473.0676,
"train_samples": 577344,
"train_samples_per_second": 378.921,
"train_steps_per_second": 1.48
}