File size: 580 Bytes
88251e5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
{
  "model_type": "sbert_cwl_l2",
  "base_model": "bert-base-uncased",
  "train_split": "train_10",
  "lambda_consistency": 0.25,
  "augmentations": [
    "back_translation",
    "aeda"
  ],
  "cwl_selection": "argmax_l2_distance",
  "augmented_dataset": "SurAyush/stsb_augmented_splits",
  "original_dataset": "SurAyush/stsb_splits",
  "pooling": "mean",
  "val_spearman": 0.8243,
  "test_spearman": 0.7684,
  "baseline_bert": 0.4729,
  "sbert_no_reg": 0.7441,
  "delta_vs_bert": 0.2955,
  "delta_vs_sbert": 0.0243,
  "lr": 2e-05,
  "batch_size": 16,
  "early_stop_patience": 2
}