{ "adapter_path": "checkpoints/trip-mutator-4b-v0-mlx-r8-v2", "batch_size": 1, "clear_cache_threshold": 0, "config": null, "data": "data/train", "fine_tune_type": "lora", "grad_accumulation_steps": 1, "grad_checkpoint": false, "iters": 600, "learning_rate": 0.0001, "lora_parameters": { "rank": 8, "dropout": 0.0, "scale": 20.0 }, "lr_schedule": null, "mask_prompt": false, "max_seq_length": 8192, "model": "Qwen/Qwen3-4B-Instruct-2507", "num_layers": 32, "optimizer": "adam", "optimizer_config": { "adam": {}, "adamw": {}, "muon": {}, "sgd": {}, "adafactor": {} }, "project_name": null, "report_to": null, "resume_adapter_file": null, "save_every": 200, "seed": 0, "steps_per_eval": 200, "steps_per_report": 10, "test": false, "test_batches": 500, "train": true, "val_batches": 25 }