david-shared-space / weights /David-partial_shared-hierarchical_tree /20251012_191456 /david_config.json
{
  "name": "david_balanced",
  "uid": "c.david.balanced",
  "feature_dim": 512,
  "num_classes": 1000,
  "scales": [
    256,
    512,
    768,
    1024
  ],
  "sharing_mode": "partial_shared",
  "fusion_mode": "hierarchical_tree",
  "use_belly": true,
  "belly_expand": 2.0,
  "shared_feature_dim": 768,
  "shared_layers": 2,
  "shared_dropout": 0.1,
  "fusion_temperature": 1.0,
  "fusion_dropout": 0.1,
  "tree_depth": 3,
  "num_experts": 3,
  "compression_ratio": 4,
  "expert_dropout": 0.1,
  "attention_dropout": 0.1,
  "progressive_training": true,
  "scale_warmup_epochs": {
    "256": 0,
    "512": 2,
    "768": 5,
    "1024": 8
  }
}