| { | |
| "epoch": 0.9989701338825953, | |
| "eval_logits/chosen": -2.065095901489258, | |
| "eval_logits/rejected": -1.9689290523529053, | |
| "eval_logps/chosen": -335.3676452636719, | |
| "eval_logps/rejected": -427.32891845703125, | |
| "eval_loss": 0.5029041767120361, | |
| "eval_rewards/accuracies": 0.75, | |
| "eval_rewards/chosen": -1.1300084590911865, | |
| "eval_rewards/margins": 0.865437388420105, | |
| "eval_rewards/rejected": -1.995445728302002, | |
| "eval_runtime": 65.1127, | |
| "eval_samples_per_second": 15.358, | |
| "eval_steps_per_second": 0.246 | |
| } |