taicheng's picture
End of training
5b5d083 verified
raw
history blame contribute delete
577 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": -2.4359169006347656,
"eval_logits/rejected": -2.4180893898010254,
"eval_logps/chosen": -74.32483673095703,
"eval_logps/rejected": -86.18550872802734,
"eval_loss": 0.6700397729873657,
"eval_rewards/accuracies": 0.3154761791229248,
"eval_rewards/chosen": 0.0016639787936583161,
"eval_rewards/margins": 0.05223553627729416,
"eval_rewards/rejected": -0.05057155340909958,
"eval_runtime": 113.9808,
"eval_samples": 2000,
"eval_samples_per_second": 17.547,
"eval_steps_per_second": 0.553
}