griffin-c3t-8L-v0.02-fineweb / all_results.json
pszemraj's picture
End of training
2cf6678 verified
raw
history blame contribute delete
537 Bytes
{
"epoch": 0.9998717955292536,
"eval_accuracy": 0.23258101286435434,
"eval_loss": 5.188788890838623,
"eval_runtime": 128.0489,
"eval_samples": 300,
"eval_samples_per_second": 2.343,
"eval_steps_per_second": 1.171,
"num_input_tokens_seen": 798621696,
"perplexity": 179.25132849100459,
"total_flos": 4.855554488590664e+17,
"train_loss": 5.304058988399935,
"train_runtime": 127910.3478,
"train_samples": 390002,
"train_samples_per_second": 3.049,
"train_steps_per_second": 0.048
}