| { |
| "model_name": "David-decoupled-cantor_scale", |
| "run_id": "20251104_144102", |
| "timestamp": "2025-11-04T14:53:17.199658", |
| "best_val_acc": 85.094, |
| "best_epoch": 2, |
| "final_train_acc": 88.92135061237137, |
| "final_train_loss": 1.0967776605571407, |
| "scale_accuracies": { |
| "384": 83.518, |
| "512": 84.012, |
| "768": 84.434, |
| "1024": 84.376, |
| "1280": 84.022, |
| "1536": 84.16, |
| "1792": 84.126, |
| "2048": 84.176 |
| }, |
| "architecture": { |
| "preset": "clip_vit_bigg14_cantor_decoupled", |
| "sharing_mode": "decoupled", |
| "fusion_mode": "cantor_scale", |
| "scales": [ |
| 384, |
| 512, |
| 768, |
| 1024, |
| 1280, |
| 1536, |
| 1792, |
| 2048 |
| ], |
| "feature_dim": 1280, |
| "num_classes": 1000, |
| "use_belly": true, |
| "belly_expand": 2.0 |
| }, |
| "training": { |
| "dataset": "AbstractPhil/imagenet-clip-features-orderly", |
| "model_variant": "clip_vit_laion_bigg14", |
| "num_epochs": 5, |
| "batch_size": 512, |
| "learning_rate": 0.001, |
| "rose_weight": "0.1\u21920.5", |
| "cayley_loss": false, |
| "optimizer": "AdamW", |
| "scheduler": "cosine_restarts" |
| }, |
| "files": { |
| "weights_safetensors": "weights/David-decoupled-cantor_scale/20251104_144102/best_model_acc85.09.safetensors", |
| "weights_pytorch": "weights/David-decoupled-cantor_scale/20251104_144102/best_model.pth", |
| "config": "weights/David-decoupled-cantor_scale/20251104_144102/david_config.json", |
| "training_config": "weights/David-decoupled-cantor_scale/20251104_144102/train_config.json", |
| "tensorboard": "runs/David-decoupled-cantor_scale/20251104_144102/" |
| } |
| } |