{
  "model_type": "sbert_cwl_l2",
  "base_model": "bert-base-uncased",
  "train_split": "train_20",
  "lambda_consistency": 0.5,
  "augmentations": [
    "back_translation",
    "aeda"
  ],
  "cwl_selection": "argmax_l2_distance",
  "augmented_dataset": "SurAyush/stsb_augmented_splits",
  "original_dataset": "SurAyush/stsb_splits",
  "pooling": "mean",
  "val_spearman": 0.8372,
  "test_spearman": 0.7874,
  "baseline_bert": 0.4729,
  "sbert_no_reg": 0.7441,
  "delta_vs_bert": 0.3145,
  "delta_vs_sbert": 0.0433,
  "lr": 2e-05,
  "batch_size": 16,
  "early_stop_patience": 2
}