| { | |
| "model": "phi4-mini", | |
| "use_unsloth_model": true, | |
| "dataset": "UWV/wim-instruct-wiki-to-jsonld-agent-steps", | |
| "max_samples": null, | |
| "filter_n2_only": true, | |
| "max_seq_length": 8192, | |
| "batch_size": 32, | |
| "gradient_accumulation_steps": 1, | |
| "max_steps": 5000, | |
| "learning_rate": 2e-05, | |
| "warmup_steps": 100, | |
| "max_grad_norm": 1.0, | |
| "lora_r": 512, | |
| "lora_alpha": 1024, | |
| "lora_dropout": 0.05, | |
| "target_modules": [ | |
| "q_proj", | |
| "k_proj", | |
| "v_proj", | |
| "o_proj" | |
| ], | |
| "load_in_4bit": true, | |
| "use_gradient_checkpointing": false, | |
| "rope_scaling": null, | |
| "output_dir": "/data/model_outputs/n2_schema_retrieval_model", | |
| "assistant_only_loss": true, | |
| "no_eval": false, | |
| "num_workers": 8, | |
| "full_finetune": false, | |
| "wandb": true, | |
| "seed": 42, | |
| "push_to_hub": false, | |
| "hub_model_id": null | |
| } |