{
  "train_jsonl": "data/groups_train.jsonl",
  "valid_jsonl": "data/groups_valid.jsonl",
  "run_dir": "runs/planA_strong_adv",
  "backbone": "google/mt5-small",
  "num_latents": 16,
  "latent_dropout": 0.1,
  "latent_noise_std": 0.01,
  "batch_size": 8,
  "grad_accum": 8,
  "epochs": 5,
  "max_doc_len": 256,
  "max_sum_len": 64,
  "eval_every": 400,
  "max_train_examples": 2000,
  "max_valid_examples": 200,
  "lambda_align": 1.0,
  "tau": 0.07,
  "lambda_varcov": 0.1,
  "var_target_std": 0.05,
  "lambda_mean": 1.0,
  "lambda_mean_diff": 0.3,
  "lambda_pair": 0.01,
  "lambda_lang": 10.0,
  "adv_start_step": 300,
  "grl_alpha": 10.0,
  "grl_warmup": 200,
  "lr_model": 0.0003,
  "lr_lang": 0.001
}