File size: 578 Bytes
{
  "model_type": "sbert_cwl_l2",
  "base_model": "bert-base-uncased",
  "train_split": "train_10",
  "lambda_consistency": 1.0,
  "augmentations": [
    "back_translation",
    "aeda"
  ],
  "cwl_selection": "argmax_l2_distance",
  "augmented_dataset": "SurAyush/stsb_augmented_splits",
  "original_dataset": "SurAyush/stsb_splits",
  "pooling": "mean",
  "val_spearman": 0.8121,
  "test_spearman": 0.7511,
  "baseline_bert": 0.4729,
  "sbert_no_reg": 0.7441,
  "delta_vs_bert": 0.2782,
  "delta_vs_sbert": 0.007,
  "lr": 2e-05,
  "batch_size": 16,
  "early_stop_patience": 2
}