{ "type": "soft_vote_ensemble", "models": [ { "name": "distilbert-base-uncased", "label": "dapt_distilbert", "dir": "dapt_distilbert" }, { "name": "roberta-base", "label": "roberta", "dir": "roberta" }, { "name": "microsoft/deberta-base", "label": "deberta", "dir": "deberta" } ], "label_map": { "DEPRESSED_MOOD": 0, "ANHEDONIA": 1, "APPETITE_CHANGE": 2, "SLEEP_ISSUES": 3, "PSYCHOMOTOR": 4, "FATIGUE": 5, "WORTHLESSNESS": 6, "COGNITIVE_ISSUES": 7, "SUICIDAL_THOUGHTS": 8, "SPECIAL_CASE": 9, "NO_SYMPTOM": 10 }, "label_readable": { "DEPRESSED_MOOD": "Depressed Mood", "ANHEDONIA": "Loss of Interest / Pleasure", "APPETITE_CHANGE": "Appetite / Weight Change", "SLEEP_ISSUES": "Sleep Disturbance", "PSYCHOMOTOR": "Psychomotor Changes", "FATIGUE": "Fatigue / Loss of Energy", "WORTHLESSNESS": "Worthlessness / Guilt", "COGNITIVE_ISSUES": "Difficulty Concentrating", "SUICIDAL_THOUGHTS": "Suicidal Ideation", "SPECIAL_CASE": "Other Clinical Indicator", "NO_SYMPTOM": "No Symptom Detected" }, "num_classes": 11, "pooling": "mean", "max_length": 128, "thresholds": { "DEPRESSED_MOOD": 0.25, "ANHEDONIA": 0.45, "APPETITE_CHANGE": 0.5, "SLEEP_ISSUES": 0.55, "PSYCHOMOTOR": 0.5, "FATIGUE": 0.6000000000000001, "WORTHLESSNESS": 0.4, "COGNITIVE_ISSUES": 0.15000000000000002, "SUICIDAL_THOUGHTS": 0.05, "SPECIAL_CASE": 0.55, "NO_SYMPTOM": 0.15000000000000002 }, "cv_performance": { "ensemble_micro_f1": "0.813 \u00b1 0.010", "ensemble_macro_f1": "0.770 \u00b1 0.017", "threshold_tuned_micro_f1": 0.82, "threshold_tuned_macro_f1": 0.792, "note": "Threshold-tuned metrics have a slight optimistic bias (thresholds were tuned on the eval data). True performance likely lies between the raw ensemble and threshold-tuned metrics." 
}, "training_config": { "data": "cleaned_v2 (train + val) + augmented_v2 (196 samples)", "total_samples": 1792, "epochs": 7, "lr": 3e-05, "loss": "CrossEntropyLoss (effective-number weights, label_smoothing=0.1)", "pooling": "mean" }, "data_provenance": { "original_dataset": "ReDSM5 (CIKM 2025), 1,484 Reddit posts, 2,058 annotations", "cleaning": "Conflict resolution (53 sentences), deduplication (20), confident learning (66 relabeled, 96 removed), manual fixes (9)", "augmentation": "196 samples via Gemini 2.5 Flash paraphrasing, filtered to similarity within [0.70, 0.95]", "dapt": "Domain-adaptive pre-training on 39K Reddit mental health posts (perplexity 16.90\u21927.59)" } }