simpo-train-small-correct / eval_results.json
jz666's picture
End of training
57ae941 verified
{
"epoch": 0.995910949568378,
"eval_logits/chosen": -13.768111228942871,
"eval_logits/rejected": -13.749955177307129,
"eval_logps/chosen": -1.4371137619018555,
"eval_logps/rejected": -1.7012752294540405,
"eval_loss": 4.129865646362305,
"eval_rewards/accuracies": 0.6721311211585999,
"eval_rewards/chosen": -14.371137619018555,
"eval_rewards/margins": 2.6416165828704834,
"eval_rewards/rejected": -17.012752532958984,
"eval_runtime": 65.8969,
"eval_samples": 1941,
"eval_samples_per_second": 29.455,
"eval_steps_per_second": 1.851
}