{
"epoch": 19.991464360935595,
"eval_accuracy": 0.47868057440510814,
"eval_loss": 2.6840312480926514,
"eval_runtime": 71.5689,
"eval_samples": 60680,
"eval_samples_per_second": 847.854,
"eval_steps_per_second": 13.26,
"perplexity": 14.644008095713023,
"total_flos": 1.507910045663232e+18,
"train_loss": 2.8050402250099604,
"train_runtime": 30336.2728,
"train_samples": 577344,
"train_samples_per_second": 380.629,
"train_steps_per_second": 1.487
}