{ "run_name": "dpo_fft_LFM2.5-1.2B-Instruct_xinlai__Math-Step-DPO-10K_20260223_022854", "model": "LiquidAI/LFM2.5-1.2B-Instruct", "dataset": "xinlai/Math-Step-DPO-10K", "timestamp": "20260223_022854", "args": { "dataset": "xinlai/Math-Step-DPO-10K", "dataset_split": "train", "instruction_col": "initial_reason_steps", "chosen_col": "chosen", "rejected_col": "rejected", "max_samples": null, "seed": 42, "model_name": "LiquidAI/LFM2.5-1.2B-Instruct", "ref_4bit": false, "num_epochs": 1, "batch_size": 4, "grad_accum": 4, "learning_rate": 2e-06, "beta": 0.2, "max_length": 1024, "max_prompt_length": 768, "warmup_ratio": 0.1, "optim": "paged_adamw_8bit", "logging_steps": 10, "save_steps": 100, "eval_ratio": 0.05, "output_dir": "models", "run_name": null }, "train_metrics": { "train_runtime": 2398.316, "train_samples_per_second": 4.276, "train_steps_per_second": 0.267, "total_flos": 0.0, "train_loss": 0.5289894797128746, "epoch": 1.0 } }