{
  "model_dir": "models/deberta_v3_mlm",
  "task1_csv": "Data_for_deberta/processed/task1_ready/train.csv",
  "task2_csv": "Data_for_deberta/processed/task2_ready/train.csv",
  "output_dir": "outputs/train_runs",
  "max_length": 384,
  "val_ratio": 0.1,
  "seed": 42,
  "batch_size": 16,
  "max_epochs": 10,
  "min_epochs": 3,
  "early_stop_patience": 2,
  "learning_rate": 1.5e-05,
  "weight_decay": 0.01,
  "warmup_ratio": 0.06,
  "boost_mult": 1.0,
  "focal_gamma_task1": 0.0,
  "rdrop_alpha_task2": 0.7,
  "lambda_task1": 1.0,
  "lambda_task2": 1.0,
  "label_smoothing_task1": 0.02,
  "label_smoothing_task2": 0.05,
  "task2_balance_power": 0.5,
  "task2_balance_min": 0.2,
  "task2_balance_max": 5.0,
  "title_empty_token": "[TITLE_EMPTY]",
  "use_amp": true,
  "cartography": true,
  "cartography_lowmean_q": 0.005,
  "cartography_task2_per_category_cap": 30
}