wish-engine-toolcall-runbook / artifacts /two-phase-toolcall.hf.config.json
sahilmob's picture
docs: add config and job snapshots
8020510 verified
{
"base_model": "openai/gpt-oss-20b",
"phase1_hub_model_id": "sahilmob/gpt-oss-20b-toolcall-phase1-v2-strict-lora",
"final_hub_model_id": "sahilmob/gpt-oss-20b-toolcall-two-phase-v2-lora",
"output_root": "gpt-oss-20b-toolcall-two-phase-v2-sft",
"phase1": {
"dataset_source": "hub",
"dataset_id": "sahilmob/wish-engine-toolcall-next-v2-strict",
"train_split": "train",
"eval_split": "validation",
"num_train_epochs": 2,
"per_device_train_batch_size": 1,
"gradient_accumulation_steps": 16,
"learning_rate": 1.2e-5
},
"phase2": {
"dataset_source": "hub",
"dataset_id": "sahilmob/wish-engine-toolcall-next-v2",
"train_split": "train",
"eval_split": "validation",
"num_train_epochs": 1,
"per_device_train_batch_size": 1,
"gradient_accumulation_steps": 16,
"learning_rate": 8e-6
},
"lora": {
"r": 16,
"lora_alpha": 32,
"lora_dropout": 0.05,
"bias": "none",
"task_type": "CAUSAL_LM",
"target_modules": [
"q_proj",
"k_proj",
"v_proj",
"o_proj"
]
},
"runtime": {
"trackio_project": "wish-engine-toolcalls-gpt-oss-20b",
"trackio_run_name": "two-phase-toolcall-v2-sft-gpt-oss-20b",
"seed": 42,
"logging_steps": 10,
"save_steps": 100,
"save_total_limit": 2,
"eval_steps": 50,
"warmup_ratio": 0.1,
"lr_scheduler_type": "cosine",
"max_length": 1024,
"strict_chat_template": true,
"skip_trainer_model_move": true,
"force_single_device_model": true
}
}