nano_cls-2-no-bf16 / train_results.json
Flamenco43's picture
End of training
1e811fc verified
{
"epoch": 1.0,
"total_flos": 4.216512416894157e+16,
"train_loss": 0.4463165575703874,
"train_runtime": 453.3701,
"train_samples": 160000,
"train_samples_per_second": 352.913,
"train_steps_per_second": 0.69,
"train_tokens_per_second": 22622.54
}