AmritJain committed on
Commit
3097927
·
verified ·
1 Parent(s): 1aabcde

Upload config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yaml +81 -0
config.yaml ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Giant-Killer NLP Configuration
2
+ # Dendritic Optimization Hackathon
3
+
4
+ # Model Configuration
5
+ model:
6
+ name: "prajjwal1/bert-tiny" # 2 layers, 128 hidden size, ~4M params
7
+ num_labels: 2 # Binary classification (toxic/non-toxic)
8
+ hidden_dropout_prob: 0.1
9
+ attention_probs_dropout_prob: 0.1
10
+
11
+ # Data Configuration
12
+ data:
13
+ dataset_name: "jigsaw_toxicity_pred" # Jigsaw Toxic Comment Classification Challenge dataset
14
+ max_length: 128 # For fast real-time processing
15
+ train_split: "train"
16
+ val_split: "validation"
17
+ test_split: "test"
18
+ batch_size: 32
19
+ num_workers: 4
20
+
21
+ # Training Configuration
22
+ training:
23
+ epochs: 10
24
+ learning_rate: 2.0e-5
25
+ weight_decay: 0.01
26
+ warmup_steps: 500
27
+ max_grad_norm: 1.0
28
+
29
+ # Scheduler configuration (handled by the Perforated AI tracker)
30
+ scheduler:
31
+ step_size: 1
32
+ gamma: 0.1
33
+
34
+ # Early stopping
35
+ early_stopping:
36
+ patience: 3
37
+ min_delta: 0.001
38
+
39
+ # Perforated AI Configuration
40
+ perforated_ai:
41
+ enabled: true
42
+ # Dendrite learning starts after base model plateaus
43
+ dendrite_learning:
44
+ enabled: true
45
+ correlation_threshold: 0.95
46
+
47
+ # Evaluation Configuration
48
+ evaluation:
49
+ metrics:
50
+ - accuracy
51
+ - f1
52
+ - precision
53
+ - recall
54
+ - auc_roc
55
+
56
+ # Benchmarking configuration
57
+ benchmark:
58
+ num_samples: 100
59
+ device: "cpu" # Benchmark on CPU for edge deployment
60
+ warm_up_runs: 10
61
+
62
+ # Quantization Configuration
63
+ quantization:
64
+ enabled: true
65
+ dtype: "qint8"
66
+ # Layers to quantize
67
+ layers:
68
+ - torch.nn.Linear
69
+ - torch.nn.Embedding
70
+
71
+ # Logging Configuration
72
+ logging:
73
+ level: "INFO"
74
+ tensorboard: true
75
+ log_dir: "logs/"
76
+ save_dir: "checkpoints/"
77
+ save_every_n_epochs: 1
78
+
79
+ # Reproducibility
80
+ seed: 42
81
+ deterministic: true