| ### model | |
| model_name_or_path: Qwen/Qwen3-4B-Instruct-2507 | |
| trust_remote_code: true | |
| ### method | |
| stage: sft | |
| do_train: true | |
| finetuning_type: lora | |
| lora_rank: 8 | |
| lora_target: all | |
| ### dataset | |
| dataset: identity,alpaca_en_demo | |
| template: qwen3_nothink | |
| cutoff_len: 2048 | |
| max_samples: 1000 | |
| preprocessing_num_workers: 16 | |
| tokenized_path: saves/qwen3-4b/dataset/sft | |
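| ### output (presumably not used when this config is run only to pre-tokenize the dataset into tokenized_path; kept because the trainer arguments expect an output_dir) | |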
| output_dir: saves/qwen3-4b/lora/sft | |
| overwrite_output_dir: true | |