File size: 704 Bytes
bed4c06
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
{
  "train_jsonl": "data/groups_train.jsonl",
  "valid_jsonl": "data/groups_valid.jsonl",
  "run_dir": "runs/planA_strong_adv",
  "backbone": "google/mt5-small",
  "num_latents": 16,
  "latent_dropout": 0.1,
  "latent_noise_std": 0.01,
  "batch_size": 8,
  "grad_accum": 8,
  "epochs": 5,
  "max_doc_len": 256,
  "max_sum_len": 64,
  "eval_every": 400,
  "max_train_examples": 2000,
  "max_valid_examples": 200,
  "lambda_align": 1.0,
  "tau": 0.07,
  "lambda_varcov": 0.1,
  "var_target_std": 0.05,
  "lambda_mean": 1.0,
  "lambda_mean_diff": 0.3,
  "lambda_pair": 0.01,
  "lambda_lang": 10.0,
  "adv_start_step": 300,
  "grl_alpha": 10.0,
  "grl_warmup": 200,
  "lr_model": 0.0003,
  "lr_lang": 0.001
}