| { | |
| "model_name": "David-partial_shared-deep_efficiency", | |
| "run_id": "20251012_181608", | |
| "timestamp": "2025-10-12T18:19:44.592213", | |
| "best_val_acc": 83.662, | |
| "best_epoch": 0, | |
| "final_train_acc": 82.10982643168299, | |
| "final_train_loss": 1.8410232910713829, | |
| "scale_accuracies": { | |
| "384": 83.27, | |
| "512": 83.312, | |
| "768": 83.59, | |
| "1024": 83.496, | |
| "1280": 83.662, | |
| "1536": 83.514, | |
| "1792": 83.398, | |
| "2048": 83.598 | |
| }, | |
| "architecture": { | |
| "preset": "clip_vit_bigg14", | |
| "sharing_mode": "partial_shared", | |
| "fusion_mode": "deep_efficiency", | |
| "scales": [ | |
| 384, | |
| 512, | |
| 768, | |
| 1024, | |
| 1280, | |
| 1536, | |
| 1792, | |
| 2048 | |
| ], | |
| "feature_dim": 1280, | |
| "num_classes": 1000, | |
| "use_belly": true, | |
| "belly_expand": 2.0 | |
| }, | |
| "training": { | |
| "dataset": "AbstractPhil/imagenet-clip-features-orderly", | |
| "model_variant": "clip_vit_laion_bigg14", | |
| "num_epochs": 10, | |
| "batch_size": 1024, | |
| "learning_rate": 0.001, | |
| "rose_weight": "0.1\u21920.5", | |
| "cayley_loss": false, | |
| "optimizer": "AdamW", | |
| "scheduler": "cosine_restarts" | |
| }, | |
| "files": { | |
| "weights_safetensors": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model_acc83.66.safetensors", | |
| "weights_pytorch": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model.pth", | |
| "config": "weights/David-partial_shared-deep_efficiency/20251012_181608/david_config.json", | |
| "training_config": "weights/David-partial_shared-deep_efficiency/20251012_181608/train_config.json", | |
| "tensorboard": "runs/David-partial_shared-deep_efficiency/20251012_181608/" | |
| } | |
| } |