deepseek-coder-1.3b-base-JUnit / all_results.json
iHateNLP's picture
End of training
d4fa5be verified
raw
history blame contribute delete
488 Bytes
{
"epoch": 1.9985964912280703,
"eval_loss": 0.22910664975643158,
"eval_runtime": 8.378,
"eval_samples": 100,
"eval_samples_per_second": 6.565,
"eval_steps_per_second": 0.836,
"perplexity": 1.2574761413829163,
"raw_train_examples": 78434,
"total_flos": 8.025299762167153e+17,
"train_examples": 39900,
"train_loss": 0.37913749282088366,
"train_runtime": 28381.1385,
"train_samples_per_second": 2.812,
"train_steps_per_second": 0.088
}