File size: 578 Bytes
6a0e203
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
{
  "model_type": "sbert_cwl_l2",
  "base_model": "bert-base-uncased",
  "train_split": "train_10",
  "lambda_consistency": 1.0,
  "augmentations": [
    "back_translation",
    "aeda"
  ],
  "cwl_selection": "argmax_l2_distance",
  "augmented_dataset": "SurAyush/stsb_augmented_splits",
  "original_dataset": "SurAyush/stsb_splits",
  "pooling": "mean",
  "val_spearman": 0.8121,
  "test_spearman": 0.7511,
  "baseline_bert": 0.4729,
  "sbert_no_reg": 0.7441,
  "delta_vs_bert": 0.2782,
  "delta_vs_sbert": 0.007,
  "lr": 2e-05,
  "batch_size": 16,
  "early_stop_patience": 2
}