| { | |
| "model_name": "David-fully_shared-weighted_sum", | |
| "run_id": "20251012_231445", | |
| "timestamp": "2025-10-12T23:51:39.621670", | |
| "best_val_acc": 66.5, | |
| "best_epoch": 7, | |
| "final_train_acc": 63.52585832552145, | |
| "final_train_loss": 4.081520883974777, | |
| "scale_accuracies": { | |
| "256": 65.83333333333333, | |
| "512": 66.44466666666666 | |
| }, | |
| "architecture": { | |
| "preset": "small_fast", | |
| "sharing_mode": "fully_shared", | |
| "fusion_mode": "weighted_sum", | |
| "scales": [ | |
| 256, | |
| 512 | |
| ], | |
| "feature_dim": 512, | |
| "num_classes": 1000, | |
| "use_belly": false, | |
| "belly_expand": 2.0 | |
| }, | |
| "training": { | |
| "dataset": "AbstractPhil/imagenet-clip-features-orderly", | |
| "model_variant": [ | |
| "clip_vit_b16", | |
| "clip_vit_laion_b32", | |
| "clip_vit_b32" | |
| ], | |
| "num_epochs": 10, | |
| "batch_size": 1024, | |
| "learning_rate": 0.01, | |
| "rose_weight": "0.2\u21920.6", | |
| "cayley_loss": false, | |
| "optimizer": "AdamW", | |
| "scheduler": "cosine_restarts" | |
| }, | |
| "files": { | |
| "weights_safetensors": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model_acc66.50.safetensors", | |
| "weights_pytorch": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model.pth", | |
| "config": "weights/David-fully_shared-weighted_sum/20251012_231445/david_config.json", | |
| "training_config": "weights/David-fully_shared-weighted_sum/20251012_231445/train_config.json", | |
| "tensorboard": "runs/David-fully_shared-weighted_sum/20251012_231445/" | |
| } | |
| } |