Ellie5757575757 committed on
Commit
d73663e
·
verified ·
1 Parent(s): 1d2b5c4

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +97 -64
config.json CHANGED
@@ -1,71 +1,104 @@
1
  {
2
- "architectures": [
3
- "BertForSequenceClassification"
4
- ],
5
- "attention_probs_dropout_prob": 0.1,
6
- "classifier_dropout": null,
7
- "gradient_checkpointing": false,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.1,
10
- "hidden_size": 768,
11
- "initializer_range": 0.02,
12
- "intermediate_size": 3072,
13
- "layer_norm_eps": 1e-12,
14
- "max_position_embeddings": 512,
15
- "model_type": "bert",
16
- "num_attention_heads": 12,
17
- "num_hidden_layers": 12,
18
- "pad_token_id": 0,
19
- "position_embedding_type": "absolute",
20
- "transformers_version": "4.30.0",
21
- "type_vocab_size": 2,
22
- "use_cache": true,
23
- "vocab_size": 28996,
24
- "torch_dtype": "float32",
25
  "id2label": {
26
- "0": "Normal",
27
- "1": "Mild Aphasia",
28
- "2": "Moderate Aphasia",
29
- "3": "Severe Aphasia"
 
 
 
 
 
30
  },
 
31
  "label2id": {
32
- "Normal": 0,
33
- "Mild Aphasia": 1,
34
- "Moderate Aphasia": 2,
35
- "Severe Aphasia": 3
 
 
 
 
 
36
  },
37
- "num_labels": 4,
38
- "problem_type": "single_label_classification",
39
- "finetuning_task": "aphasia_classification",
40
- "_name_or_path": "dmis-lab/biobert-base-cased-v1.1",
41
- "base_model": "dmis-lab/biobert-base-cased-v1.1",
42
- "task_specific_params": {
43
- "aphasia_classification": {
44
- "max_length": 512,
45
- "do_lower_case": false,
46
- "early_stopping": true,
47
- "num_beams": 1
48
- }
 
 
 
49
  },
50
- "custom_config": {
51
- "model_version": "1.0",
52
- "training_data": "aphasia_corpus",
53
- "evaluation_metrics": {
54
- "accuracy": 0.85,
55
- "f1_score": 0.83,
56
- "precision": 0.84,
57
- "recall": 0.82
58
- },
59
- "feature_extraction": {
60
- "linguistic_features": true,
61
- "syntactic_complexity": true,
62
- "semantic_coherence": true,
63
- "discourse_markers": true
64
- },
65
- "preprocessing": {
66
- "cha_format": true,
67
- "json_structured": true,
68
- "text_normalization": true
69
- }
70
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
  }
 
1
  {
2
+ "model_name": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
3
+ "model_type": "StableAphasiaClassifier",
4
+ "num_labels": 9,
5
+ "architectures": ["StableAphasiaClassifier"],
6
+
7
+ "_name_or_path": "microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract-fulltext",
8
+ "problem_type": "single_label_classification",
9
+
10
+ "aphasia_types_mapping": {
11
+ "BROCA": 0,
12
+ "TRANSMOTOR": 1,
13
+ "NOTAPHASICBYWAB": 2,
14
+ "CONDUCTION": 3,
15
+ "WERNICKE": 4,
16
+ "ANOMIC": 5,
17
+ "GLOBAL": 6,
18
+ "ISOLATION": 7,
19
+ "TRANSSENSORY": 8
20
+ },
21
+
 
 
 
22
  "id2label": {
23
+ "0": "BROCA",
24
+ "1": "TRANSMOTOR",
25
+ "2": "NOTAPHASICBYWAB",
26
+ "3": "CONDUCTION",
27
+ "4": "WERNICKE",
28
+ "5": "ANOMIC",
29
+ "6": "GLOBAL",
30
+ "7": "ISOLATION",
31
+ "8": "TRANSSENSORY"
32
  },
33
+
34
  "label2id": {
35
+ "BROCA": 0,
36
+ "TRANSMOTOR": 1,
37
+ "NOTAPHASICBYWAB": 2,
38
+ "CONDUCTION": 3,
39
+ "WERNICKE": 4,
40
+ "ANOMIC": 5,
41
+ "GLOBAL": 6,
42
+ "ISOLATION": 7,
43
+ "TRANSSENSORY": 8
44
  },
45
+
46
+ "model_config": {
47
+ "max_length": 512,
48
+ "hidden_size": 768,
49
+ "pos_vocab_size": 150,
50
+ "pos_emb_dim": 64,
51
+ "grammar_dim": 3,
52
+ "grammar_hidden_dim": 64,
53
+ "duration_hidden_dim": 128,
54
+ "prosody_dim": 32,
55
+ "num_attention_heads": 8,
56
+ "attention_dropout": 0.3,
57
+ "classifier_hidden_dims": [512, 256],
58
+ "dropout_rate": 0.3,
59
+ "activation_fn": "tanh"
60
  },
61
+
62
+ "training_config": {
63
+ "learning_rate": 0.0005,
64
+ "weight_decay": 0.01,
65
+ "warmup_ratio": 0.1,
66
+ "batch_size": 10,
67
+ "gradient_accumulation_steps": 4,
68
+ "use_focal_loss": true,
69
+ "focal_alpha": 1.0,
70
+ "focal_gamma": 2.0,
71
+ "use_mixup": false,
72
+ "mixup_alpha": 0.2,
73
+ "use_label_smoothing": true,
74
+ "label_smoothing": 0.1
75
+ },
76
+
77
+ "adaptive_lr_config": {
78
+ "adaptive_lr": true,
79
+ "lr_patience": 3,
80
+ "lr_factor": 0.8,
81
+ "lr_increase_factor": 1.2,
82
+ "min_lr": 1e-06,
83
+ "max_lr": 0.001,
84
+ "oscillation_amplitude": 0.1
85
+ },
86
+
87
+ "tokenizer_config": {
88
+ "pad_token": "[PAD]",
89
+ "unk_token": "[UNK]",
90
+ "sep_token": "[SEP]",
91
+ "cls_token": "[CLS]",
92
+ "mask_token": "[MASK]",
93
+ "additional_special_tokens": [
94
+ "[DIALOGUE]",
95
+ "[TURN]",
96
+ "[PAUSE]",
97
+ "[REPEAT]",
98
+ "[HESITATION]"
99
+ ]
100
+ },
101
+
102
+ "torch_dtype": "float32",
103
+ "transformers_version": "4.36.0"
104
  }