inv-test / training_config.json
jbae1213's picture
Upload training_config.json with huggingface_hub
a9e9a58 verified
{
"model": "Qwen/Qwen3-4B-Instruct-2507",
"quantization": {
"load_in_4bit": false
},
"dataset": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_train.json",
"dataset_resolved_path": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_train.json",
"num_train_samples": 5434,
"num_val_samples": 679,
"val_dataset": "/root/jb/personas/finance/personal_budgeting/data/qa_pairs_val.json",
"val_ratio": null,
"max_samples": null,
"output_dir": "/root/jb/personas/finance/personal_budgeting/sft_output/2026-03-05_23-01-53",
"save_artifact_path": "/root/jb/personas/finance/personal_budgeting/sft_output/2026-03-05_23-01-53",
"lora": {
"r": 64,
"lora_alpha": 128,
"lora_dropout": 0.05
},
"training": {
"num_train_epochs": 2.0,
"per_device_train_batch_size": 4,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0002,
"max_seq_length": 2048,
"weight_decay": 0.0,
"warmup_ratio": 0.05,
"lr_scheduler_type": "cosine",
"logging_steps": 20,
"save_strategy": "steps",
"save_steps": 500,
"save_total_limit": 2,
"eval_strategy": "steps",
"eval_steps": 500,
"bf16": true,
"seed": 3407
},
"system_prompt": "You are a finance expert. Based on your financial expertise, provide your response or viewpoint on the given financial question or topic."
}