{ "base_model": "Qwen/Qwen2.5-7B-Instruct", "dataset": "2reb/GameTheory-Bench", "train_examples": 2767, "eval_examples": 146, "lora_r": 64, "lora_alpha": 128, "epochs": 3, "batch_size": 2, "grad_accum": 8, "effective_batch": 16, "lr": 0.0002, "train_loss": 0.1613485331888552, "eval_loss": 0.08727391809225082, "runtime_seconds": 6895.8492 }