File size: 586 Bytes
{
  "stage": "2_SFT",
  "base_model": "/workspace/nishka-gkc-phi3-base",
  "training_start": "2025-12-29 04:16:19.019832",
  "dataset": {
    "path": "/workspace/pql_sft_training.jsonl",
    "examples": 10038,
    "estimated_tokens": 7000000
  },
  "lora_config": {
    "r": 32,
    "alpha": 64,
    "dropout": 0.05,
    "target_modules": [
      "q_proj",
      "k_proj",
      "v_proj",
      "o_proj",
      "gate_proj",
      "up_proj",
      "down_proj"
    ]
  },
  "training_args": {
    "epochs": 2,
    "batch_size": 2,
    "learning_rate": 0.0001,
    "max_length": 2048
  }
}