{
  "model_type": "sbert_cfl_l2",
  "base_model": "bert-base-uncased",
  "train_split": "train_10",
  "lambda_consistency": 0.1,
  "augmentations": "back_translation",
  "cwl_selection": "argmax_l2_distance",
  "augmented_dataset": "SurAyush/stsb_augmented_splits",
  "original_dataset": "SurAyush/stsb_splits",
  "pooling": "mean",
  "val_spearman": 0.8229,
  "test_spearman": 0.7706,
  "baseline_bert": 0.4729,
  "sbert_no_reg": 0.7441,
  "sbert_with_cwl": 0.7733,
  "delta_vs_bert": 0.2977,
  "delta_vs_sbert": 0.0265,
  "cfl_vs_cwl": -0.0027,
  "lr": 2e-05,
  "batch_size": 16,
  "early_stop_patience": 2
}