{ "model_name": "David-decoupled-deep_efficiency", "run_id": "20251013_004438", "timestamp": "2025-10-13T01:08:55.162112", "best_val_acc": 61.802, "best_epoch": 4, "final_train_acc": 59.30749074866899, "final_train_loss": 3.694623793321019, "scale_accuracies": { "128": 61.802, "256": 70.146, "384": 72.66, "448": 73.44666666666667, "512": 73.876, "576": 74.25133333333333, "640": 74.45733333333334, "768": 74.82, "896": 75.262 }, "architecture": { "preset": "gated_expert_team", "sharing_mode": "decoupled", "fusion_mode": "deep_efficiency", "scales": [ 128, 256, 384, 448, 512, 576, 640, 768, 896 ], "feature_dim": 512, "num_classes": 1000, "use_belly": true, "belly_expand": 4 }, "training": { "dataset": "AbstractPhil/imagenet-clip-features-orderly", "model_variant": [ "clip_vit_b16", "clip_vit_laion_b32", "clip_vit_b32" ], "num_epochs": 10, "batch_size": 1024, "learning_rate": 0.01, "rose_weight": "0.1\u21920.8", "cayley_loss": false, "optimizer": "AdamW", "scheduler": "cosine_restarts" }, "files": { "weights_safetensors": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc61.80.safetensors", "weights_pytorch": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model.pth", "config": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json", "training_config": "weights/David-decoupled-deep_efficiency/20251013_004438/train_config.json", "tensorboard": "runs/David-decoupled-deep_efficiency/20251013_004438/" } }