{
  "base_model_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
  "bias": "none",
  "fan_in_fan_out": false,
  "inference_mode": true,
  "init_lora_weights": true,
  "lora_alpha": 32,
  "lora_dropout": 0.05,
  "modules_to_save": ["lm_head", "wte"],
  "peft_type": "LORA",
  "r": 16,
  "target_modules": ["q_proj", "v_proj", "k_proj", "o_proj"],
  "task_type": "CAUSAL_LM"
}