ALM-AHME's picture
End of training
c7616b1
{
"epoch": 4.96,
"eval_accuracy": 0.9805094130675526,
"eval_loss": 0.04738219827413559,
"eval_runtime": 194.8962,
"eval_samples_per_second": 23.166,
"eval_steps_per_second": 1.452,
"total_flos": 8.138660625246413e+18,
"train_loss": 0.23329446437538312,
"train_runtime": 4933.7001,
"train_samples_per_second": 6.065,
"train_steps_per_second": 0.094
}