| { | |
| "epoch": 1.0, | |
| "eval_logps/chosen": -2.755657434463501, | |
| "eval_logps/rejected": -1.0496879816055298, | |
| "eval_loss": 21.31629180908203, | |
| "eval_rewards/accuracies": 0.0, | |
| "eval_rewards/chosen": -27.55657386779785, | |
| "eval_rewards/margins": -17.059694290161133, | |
| "eval_rewards/rejected": -10.496879577636719, | |
| "eval_runtime": 4.3483, | |
| "eval_samples": 12, | |
| "eval_samples_per_second": 2.76, | |
| "eval_steps_per_second": 0.69, | |
| "total_flos": 0.0, | |
| "train_loss": 22.58866818745931, | |
| "train_runtime": 4347.6828, | |
| "train_samples": 5640, | |
| "train_samples_per_second": 1.297, | |
| "train_steps_per_second": 0.13 | |
| } |