AbstractPhil committed on
Commit
5ef26d3
·
verified ·
1 Parent(s): 7b6206c

Update david_config.json - Run 20251104_122236

Browse files
weights/David-partial_shared-geometric_attention/20251104_122236/david_config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "david_clip_vit_b16_geometric",
3
+ "uid": "c.david.clip_vit_b16_geometric",
4
+ "feature_dim": 512,
5
+ "num_classes": 1000,
6
+ "scales": [
7
+ 256,
8
+ 512,
9
+ 768,
10
+ 1024
11
+ ],
12
+ "sharing_mode": "partial_shared",
13
+ "fusion_mode": "geometric_attention",
14
+ "use_belly": true,
15
+ "belly_expand": 2.0,
16
+ "projection_temperature": 0.07,
17
+ "shared_feature_dim": 768,
18
+ "shared_layers": 2,
19
+ "shared_dropout": 0.1,
20
+ "fusion_temperature": 1.0,
21
+ "fusion_dropout": 0.1,
22
+ "tree_depth": 3,
23
+ "num_experts": 3,
24
+ "compression_ratio": 4,
25
+ "expert_dropout": 0.1,
26
+ "attention_dropout": 0.1,
27
+ "geometric_num_heads": 4,
28
+ "geometric_use_cayley": true,
29
+ "geometric_use_angular": true,
30
+ "geometric_scale_dim_aware": true,
31
+ "cantor_num_heads": 4,
32
+ "cantor_depth": 8,
33
+ "cantor_local_window": 3,
34
+ "cantor_use_scale_embeddings": true,
35
+ "progressive_training": false,
36
+ "scale_warmup_epochs": {
37
+ "256": 0,
38
+ "512": 0,
39
+ "768": 0,
40
+ "1024": 0
41
+ }
42
+ }