{
  "model_name_or_path": "Qwen/Qwen3-4B-Instruct-2507",
  "trust_remote_code": true,
  "dropout": 0.1,
  "train_mode": "lora_head",
  "lora_r": 64,
  "lora_alpha": 128,
  "lora_dropout": 0.1,
  "lora_target_modules": null,
  "value_head_type": "mlp"
}