{
  "model": "Qwen/Qwen3-4B-Instruct-2507",
  "quantization": {
    "load_in_4bit": false
  },
  "dataset": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_train.json",
  "dataset_resolved_path": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_train.json",
  "num_train_samples": 5434,
  "num_val_samples": 679,
  "val_dataset": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_val.json",
  "val_ratio": null,
  "max_samples": null,
  "output_dir": "/root/jb/personas/finance/personal_budgeting/sft_output/2026-03-05_23-01-53",
  "save_artifact_path": "/root/jb/personas/finance/personal_budgeting/sft_output/2026-03-05_23-01-53",
  "lora": {
    "r": 64,
    "lora_alpha": 128,
    "lora_dropout": 0.05
  },
  "training": {
    "num_train_epochs": 2.0,
    "per_device_train_batch_size": 4,
    "gradient_accumulation_steps": 4,
    "learning_rate": 0.0002,
    "max_seq_length": 2048,
    "weight_decay": 0.0,
    "warmup_ratio": 0.05,
    "lr_scheduler_type": "cosine",
    "logging_steps": 20,
    "save_strategy": "steps",
    "save_steps": 500,
    "save_total_limit": 2,
    "eval_strategy": "steps",
    "eval_steps": 500,
    "bf16": true,
    "seed": 3407
  },
  "system_prompt": "You are a finance expert. Based on your financial expertise, provide your response or viewpoint on the given financial question or topic."
}