{ "sft_experiment_id": "E-9", "dataset_strategy_id": "baseline", "base_model": "unsloth/Qwen3-4B-Instruct-2507", "neftune_alpha": 5.0, "data_cleaning": true, "lora": { "r": 64, "alpha": 128, "dropout": 0.0, "target_modules": [ "q_proj", "k_proj", "v_proj", "o_proj", "gate_proj", "up_proj", "down_proj" ] }, "training": { "max_seq_len": 512, "epochs": 2, "lr": 2e-06, "per_device_train_bs": 2, "grad_accum": 8, "warmup_ratio": 0.1, "weight_decay": 0.05 }, "special": { "mask_cot": true, "upsampling": true, "curriculum": false } }