mistral-7b-dpo / eval_results.json
Jenbenarye's picture
Model save
5d16a7c verified
{
"epoch": 1.0,
"eval_logits/chosen": -3.0213913917541504,
"eval_logits/rejected": -3.038022518157959,
"eval_logps/chosen": -296.33209228515625,
"eval_logps/rejected": -291.47021484375,
"eval_loss": 0.4926324486732483,
"eval_rewards/accuracies": 0.7570000290870667,
"eval_rewards/chosen": -1.3098689317703247,
"eval_rewards/margins": 1.4436919689178467,
"eval_rewards/rejected": -2.753561019897461,
"eval_runtime": 1173.4935,
"eval_samples": 2000,
"eval_samples_per_second": 1.704,
"eval_steps_per_second": 0.213
}