init models research purposes

Files changed (4) hide show

AlteredShield.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:abbe88b5f9a0ee32941ce9495e381c471ba5e31b88e20f1a0b7cd5d382d4ada6
+size 899265658

BaseShield.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c2caf179c7ae25b2c6bfae58d3210d29c4eec1791e67cc39188d96094fc5590c
+size 879191355

alter_config.json ADDED Viewed

+{
+    "model_type": "ConcatModelWithRationale",
+    "hatebert_model": "GroNLP/hateBERT",
+    "rationale_model": "bert-base-uncased",
+    "cnn_num_filters": 128,
+    "cnn_kernel_sizes": [2, 3, 4],
+    "adapter_dim": 128,
+    "max_length": 128,
+    "num_labels": 2,
+    "architecture": {
+        "temporal_cnn": "TemporalCNN",
+        "msa_cnn": "MultiScaleAttentionCNN",
+        "projection": "ProjectionMLP"
+    },
+    "training_info": {
+        "batch_size": 8,
+        "learning_rate": 1e-5,
+        "weight_decay": 0.05,
+        "dropout": 0.5,
+        "best_val_loss": 0.27
+    }
+}

base_config.json ADDED Viewed

+{
+  "model_type": "BaseShield",
+  "architecture": "HateBERT + Rationale BERT with CLS Concatenation",
+  "version": "1.0.0",
+  "model_config": {
+    "hatebert_model": "GroNLP/hateBERT",
+    "rationale_model": "bert-base-uncased",
+    "hidden_size": 768,
+    "freeze_additional_model": true,
+    "num_labels": 2,
+    "projection_config": {
+      "input_size": 1536,
+      "hidden_size": 256,
+      "output_size": 2,
+      "dropout": 0.3
+    }
+  },
+  "training_config": {
+    "batch_size": 8,
+    "learning_rate": 1e-5,
+    "weight_decay": 0.0,
+    "epochs": 3,
+    "max_length": 128,
+    "optimizer": "AdamW",
+    "warmup_steps": 100,
+    "early_stopping": {
+      "enabled": true,
+      "patience": 3,
+      "metric": "loss"
+    }
+  }
+}