Update alter_config.json

#3
by niel-2ru - opened
Files changed (1) hide show
  1. alter_config.json +28 -17
alter_config.json CHANGED
@@ -1,22 +1,33 @@
1
  {
2
- "model_type": "ConcatModelWithRationale",
3
- "hatebert_model": "GroNLP/hateBERT",
4
- "rationale_model": "bert-base-uncased",
5
- "cnn_num_filters": 128,
6
- "cnn_kernel_sizes": [2, 3, 4],
 
 
 
7
  "adapter_dim": 128,
8
  "max_length": 128,
9
  "num_labels": 2,
10
- "architecture": {
11
- "temporal_cnn": "TemporalCNN",
12
- "msa_cnn": "MultiScaleAttentionCNN",
13
- "projection": "ProjectionMLP"
14
- },
15
- "training_info": {
16
- "batch_size": 8,
17
- "learning_rate": 1e-5,
18
- "weight_decay": 0.05,
19
- "dropout": 0.5,
20
- "best_val_loss": 0.27
21
- }
 
 
 
 
 
 
 
 
22
  }
 
1
  {
2
+ "model_type": "ConcatModelWithRationale",
3
+ "hatebert_model": "GroNLP/hateBERT",
4
+ "rationale_model": "bert-base-uncased",
5
+
6
+ "training_config": {
7
+ "cnn_filters": 128,
8
+ "cnn_kernels": [2, 3, 4],
9
+ "cnn_dropout": 0.3,
10
  "adapter_dim": 128,
11
  "max_length": 128,
12
  "num_labels": 2,
13
+
14
+ "batch_size": 8,
15
+ "learning_rate": 2e-5,
16
+ "weight_decay": 0.05,
17
+ "best_val_f1": 0.00
18
+ },
19
+
20
+ "architecture": {
21
+ "temporal_cnn": "TemporalCNN (max+mean pooling)",
22
+ "msa_cnn": "MultiScaleAttentionCNN (token attention pooling)",
23
+ "selector": "Gumbel-Sigmoid Token Selector",
24
+ "projection": "ProjectionMLP (concat CLS + CNN + rationale pooled)"
25
+ },
26
+
27
+ "notes": {
28
+ "trained_with": "ConcatModelWithRationale",
29
+ "framework": "PyTorch + Transformers",
30
+ "encoder_main": "HateBERT",
31
+ "encoder_rationale": "BERT-base-uncased"
32
+ }
33
  }