| { | |
| "train_file": "/home/user/app/data/synthetic/train.jsonl", | |
| "validation_file": "/home/user/app/data/synthetic/validation.jsonl", | |
| "test_file": null, | |
| "output_dir": "/tmp/tiny-router-r6z0atnx/checkpoint", | |
| "encoder_name": "microsoft/MiniLM-L12-H384-uncased", | |
| "device": "cuda", | |
| "feature_mode": "full_interaction", | |
| "pooling_type": "attention", | |
| "use_head_dependencies": true, | |
| "dependency_hidden_dim": 32, | |
| "max_length": 128, | |
| "recency_max": 3600, | |
| "batch_size": 32, | |
| "epochs": 10, | |
| "encoder_lr": 2e-05, | |
| "head_lr": 2e-05, | |
| "weight_decay": 0.01, | |
| "warmup_ratio": 0.1, | |
| "dropout": 0.1, | |
| "seed": 13, | |
| "patience": 2, | |
| "mixed_precision": false, | |
| "confidence_threshold": 0.8, | |
| "head_loss_weights": "{}" | |
| } |