phi-2-dpo-full-hydrox-safe / all_results.json
yihang7's picture
Model save
d9912c7 verified
raw
history blame contribute delete
743 Bytes
{
"epoch": 3.0,
"eval_logits/chosen": -0.3196437656879425,
"eval_logits/rejected": 0.2021237313747406,
"eval_logps/chosen": -275.47796630859375,
"eval_logps/rejected": -644.0859375,
"eval_loss": 0.005032053682953119,
"eval_rewards/accuracies": 0.9991582632064819,
"eval_rewards/chosen": -0.09963408857584,
"eval_rewards/margins": 19.299285888671875,
"eval_rewards/rejected": -19.3989200592041,
"eval_runtime": 525.9739,
"eval_samples": 9500,
"eval_samples_per_second": 18.062,
"eval_steps_per_second": 0.565,
"train_loss": 0.03813637946047515,
"train_runtime": 102663.2378,
"train_samples": 188284,
"train_samples_per_second": 5.502,
"train_steps_per_second": 0.086
}