zephyr-7b-gemma-dpo / eval_results.json
RedaAlami's picture
End of training
ea18965 verified
raw
history blame
No virus
585 Bytes
{
"epoch": 1.9986987638256344,
"eval_logits/chosen": 452.641357421875,
"eval_logits/rejected": 436.01385498046875,
"eval_logps/chosen": -295.9647216796875,
"eval_logps/rejected": -334.555419921875,
"eval_loss": 0.6477869153022766,
"eval_rewards/accuracies": 0.6168639063835144,
"eval_rewards/chosen": -0.34524381160736084,
"eval_rewards/margins": 0.23360556364059448,
"eval_rewards/rejected": -0.5788493752479553,
"eval_runtime": 243.7753,
"eval_samples": 5406,
"eval_samples_per_second": 22.176,
"eval_steps_per_second": 0.693
}