{ "model_name": "David-decoupled-deep_efficiency", "run_id": "20251013_004438", "timestamp": "2025-10-13T01:13:44.834572", "best_val_acc": 62.246, "best_epoch": 5, "final_train_acc": 59.79954213619302, "final_train_loss": 3.6294693627380346, "scale_accuracies": { "128": 62.246, "256": 70.442, "384": 72.89, "448": 73.616, "512": 74.13, "576": 74.53733333333334, "640": 74.72066666666667, "768": 75.086, "896": 75.43733333333333 }, "architecture": { "preset": "gated_expert_team", "sharing_mode": "decoupled", "fusion_mode": "deep_efficiency", "scales": [ 128, 256, 384, 448, 512, 576, 640, 768, 896 ], "feature_dim": 512, "num_classes": 1000, "use_belly": true, "belly_expand": 4 }, "training": { "dataset": "AbstractPhil/imagenet-clip-features-orderly", "model_variant": [ "clip_vit_b16", "clip_vit_laion_b32", "clip_vit_b32" ], "num_epochs": 10, "batch_size": 1024, "learning_rate": 0.01, "rose_weight": "0.1\u21920.8", "cayley_loss": false, "optimizer": "AdamW", "scheduler": "cosine_restarts" }, "files": { "weights_safetensors": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc62.25.safetensors", "weights_pytorch": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model.pth", "config": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json", "training_config": "weights/David-decoupled-deep_efficiency/20251013_004438/train_config.json", "tensorboard": "runs/David-decoupled-deep_efficiency/20251013_004438/" } }