| { |
| "model_name": "David-decoupled-deep_efficiency", |
| "run_id": "20251013_004438", |
| "timestamp": "2025-10-13T00:54:25.416777", |
| "best_val_acc": 60.18533333333333, |
| "best_epoch": 1, |
| "final_train_acc": 56.824520144524485, |
| "final_train_loss": 4.0311296205286915, |
| "scale_accuracies": { |
| "128": 60.18533333333333, |
| "256": 68.56666666666666, |
| "384": 71.02133333333333, |
| "448": 71.97066666666667, |
| "512": 72.43066666666667, |
| "576": 72.69866666666667, |
| "640": 73.09866666666667, |
| "768": 73.37733333333334, |
| "896": 73.866 |
| }, |
| "architecture": { |
| "preset": "gated_expert_team", |
| "sharing_mode": "decoupled", |
| "fusion_mode": "deep_efficiency", |
| "scales": [ |
| 128, |
| 256, |
| 384, |
| 448, |
| 512, |
| 576, |
| 640, |
| 768, |
| 896 |
| ], |
| "feature_dim": 512, |
| "num_classes": 1000, |
| "use_belly": true, |
| "belly_expand": 4 |
| }, |
| "training": { |
| "dataset": "AbstractPhil/imagenet-clip-features-orderly", |
| "model_variant": [ |
| "clip_vit_b16", |
| "clip_vit_laion_b32", |
| "clip_vit_b32" |
| ], |
| "num_epochs": 10, |
| "batch_size": 1024, |
| "learning_rate": 0.01, |
| "rose_weight": "0.1\u21920.8", |
| "cayley_loss": false, |
| "optimizer": "AdamW", |
| "scheduler": "cosine_restarts" |
| }, |
| "files": { |
| "weights_safetensors": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc60.19.safetensors", |
| "weights_pytorch": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model.pth", |
| "config": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json", |
| "training_config": "weights/David-decoupled-deep_efficiency/20251013_004438/train_config.json", |
| "tensorboard": "runs/David-decoupled-deep_efficiency/20251013_004438/" |
| } |
| } |