{
  "sft_experiment_id": "E-9",
  "dataset_strategy_id": "baseline",
  "base_model": "unsloth/Qwen3-4B-Instruct-2507",
  "neftune_alpha": 5.0,
  "data_cleaning": true,
  "lora": {
    "r": 64,
    "alpha": 128,
    "dropout": 0.0,
    "target_modules": [
      "q_proj",
      "k_proj",
      "v_proj",
      "o_proj",
      "gate_proj",
      "up_proj",
      "down_proj"
    ]
  },
  "training": {
    "max_seq_len": 512,
    "epochs": 2,
    "lr": 2e-06,
    "per_device_train_bs": 2,
    "grad_accum": 8,
    "warmup_ratio": 0.1,
    "weight_decay": 0.05
  },
  "special": {
    "mask_cot": true,
    "upsampling": true,
    "curriculum": false
  }
}