| { |
| "repository": "AbstractPhil/gated-david", |
| "updated": "2025-11-04T13:41:00.647211", |
| "models": [ |
| { |
| "model_name": "David-partial_shared-deep_efficiency", |
| "run_id": "20251012_181608", |
| "timestamp": "2025-10-12T18:49:28.035826", |
| "best_val_acc": 84.726, |
| "best_epoch": 2, |
| "num_scales": 8, |
| "scales": [ |
| 384, |
| 512, |
| 768, |
| 1024, |
| 1280, |
| 1536, |
| 1792, |
| 2048 |
| ], |
| "parameters": 60814373, |
| "sharing_mode": "partial_shared", |
| "fusion_mode": "deep_efficiency", |
| "preset": "clip_vit_bigg14", |
| "weights_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model_acc84.73.safetensors", |
| "config_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/david_config.json", |
| "history_path": "weights/David-partial_shared-deep_efficiency/20251012_181608/training_history.json" |
| }, |
| { |
| "model_name": "David-partial_shared-deep_efficiency", |
| "run_id": "20251012_161107", |
| "timestamp": "2025-10-12T16:46:37.288111", |
| "best_val_acc": 84.66, |
| "best_epoch": 9, |
| "num_scales": 8, |
| "scales": [ |
| 384, |
| 512, |
| 768, |
| 1024, |
| 1280, |
| 1536, |
| 1792, |
| 2048 |
| ], |
| "parameters": 60814373, |
| "sharing_mode": "partial_shared", |
| "fusion_mode": "deep_efficiency", |
| "preset": "clip_vit_bigg14", |
| "weights_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/best_model_acc84.66.safetensors", |
| "config_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/david_config.json", |
| "history_path": "weights/David-partial_shared-deep_efficiency/20251012_161107/training_history.json" |
| }, |
| { |
| "model_name": "David-partial_shared-cantor_scale", |
| "run_id": "20251104_133602", |
| "timestamp": "2025-11-04T13:41:00.647154", |
| "best_val_acc": 81.278, |
| "best_epoch": 0, |
| "num_scales": 5, |
| "scales": [ |
| 384, |
| 768, |
| 1024, |
| 1280, |
| 1536 |
| ], |
| "parameters": 32436998, |
| "sharing_mode": "partial_shared", |
| "fusion_mode": "cantor_scale", |
| "preset": "clip_vit_l14_cantor", |
| "weights_path": "weights/David-partial_shared-cantor_scale/20251104_133602/best_model_acc81.28.safetensors", |
| "config_path": "weights/David-partial_shared-cantor_scale/20251104_133602/david_config.json", |
| "history_path": "weights/David-partial_shared-cantor_scale/20251104_133602/training_history.json" |
| }, |
| { |
| "model_name": "David-decoupled-cantor_scale", |
| "run_id": "20251104_125328", |
| "timestamp": "2025-11-04T13:32:58.081861", |
| "best_val_acc": 78.866, |
| "best_epoch": 4, |
| "num_scales": 4, |
| "scales": [ |
| 512, |
| 4096, |
| 8192, |
| 16384 |
| ], |
| "parameters": 751239941, |
| "sharing_mode": "decoupled", |
| "fusion_mode": "cantor_scale", |
| "preset": "clip_vit_b16_cantor_decoupled_massive", |
| "weights_path": "weights/David-decoupled-cantor_scale/20251104_125328/best_model_acc78.87.safetensors", |
| "config_path": "weights/David-decoupled-cantor_scale/20251104_125328/david_config.json", |
| "history_path": "weights/David-decoupled-cantor_scale/20251104_125328/training_history.json" |
| }, |
| { |
| "model_name": "David-partial_shared-cantor_scale", |
| "run_id": "20251104_124032", |
| "timestamp": "2025-11-04T12:50:54.398340", |
| "best_val_acc": 78.182, |
| "best_epoch": 4, |
| "num_scales": 4, |
| "scales": [ |
| 256, |
| 512, |
| 768, |
| 1024 |
| ], |
| "parameters": 12895621, |
| "sharing_mode": "partial_shared", |
| "fusion_mode": "cantor_scale", |
| "preset": "clip_vit_b16_cantor", |
| "weights_path": "weights/David-partial_shared-cantor_scale/20251104_124032/best_model_acc78.18.safetensors", |
| "config_path": "weights/David-partial_shared-cantor_scale/20251104_124032/david_config.json", |
| "history_path": "weights/David-partial_shared-cantor_scale/20251104_124032/training_history.json" |
| }, |
| { |
| "model_name": "David-partial_shared-geometric_attention", |
| "run_id": "20251104_122236", |
| "timestamp": "2025-11-04T12:32:30.016304", |
| "best_val_acc": 78.06, |
| "best_epoch": 4, |
| "num_scales": 4, |
| "scales": [ |
| 256, |
| 512, |
| 768, |
| 1024 |
| ], |
| "parameters": 12599556, |
| "sharing_mode": "partial_shared", |
| "fusion_mode": "geometric_attention", |
| "preset": "clip_vit_b16_geometric", |
| "weights_path": "weights/David-partial_shared-geometric_attention/20251104_122236/best_model_acc78.06.safetensors", |
| "config_path": "weights/David-partial_shared-geometric_attention/20251104_122236/david_config.json", |
| "history_path": "weights/David-partial_shared-geometric_attention/20251104_122236/training_history.json" |
| }, |
| { |
| "model_name": "David-hierarchical-progressive", |
| "run_id": "20251012_145649", |
| "timestamp": "2025-10-12T15:15:00.402465", |
| "best_val_acc": 76.864, |
| "best_epoch": 9, |
| "num_scales": 4, |
| "scales": [ |
| 256, |
| 512, |
| 768, |
| 1024 |
| ], |
| "parameters": 10493184, |
| "sharing_mode": "hierarchical", |
| "fusion_mode": "progressive", |
| "preset": "hierarchical_refinement", |
| "weights_path": "weights/David-hierarchical-progressive/20251012_145649/best_model_acc76.86.safetensors", |
| "config_path": "weights/David-hierarchical-progressive/20251012_145649/david_config.json", |
| "history_path": "weights/David-hierarchical-progressive/20251012_145649/training_history.json" |
| }, |
| { |
| "model_name": "David-partial_shared-hierarchical_tree", |
| "run_id": "20251012_152245", |
| "timestamp": "2025-10-12T15:40:37.893214", |
| "best_val_acc": 75.532, |
| "best_epoch": 8, |
| "num_scales": 4, |
| "scales": [ |
| 256, |
| 512, |
| 768, |
| 1024 |
| ], |
| "parameters": 8758271, |
| "sharing_mode": "partial_shared", |
| "fusion_mode": "hierarchical_tree", |
| "preset": "balanced", |
| "weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/best_model_acc75.53.safetensors", |
| "config_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/david_config.json", |
| "history_path": "weights/David-partial_shared-hierarchical_tree/20251012_152245/training_history.json" |
| }, |
| { |
| "model_name": "David-hierarchical-progressive", |
| "run_id": "20251012_151647", |
| "timestamp": "2025-10-12T15:18:31.111538", |
| "best_val_acc": 72.232, |
| "best_epoch": 0, |
| "num_scales": 4, |
| "scales": [ |
| 256, |
| 512, |
| 768, |
| 1024 |
| ], |
| "parameters": 10493184, |
| "sharing_mode": "hierarchical", |
| "fusion_mode": "progressive", |
| "preset": "hierarchical_refinement", |
| "weights_path": "weights/David-hierarchical-progressive/20251012_151647/best_model_acc72.23.safetensors", |
| "config_path": "weights/David-hierarchical-progressive/20251012_151647/david_config.json", |
| "history_path": "weights/David-hierarchical-progressive/20251012_151647/training_history.json" |
| }, |
| { |
| "model_name": "David-fully_shared-weighted_sum", |
| "run_id": "20251012_135249", |
| "timestamp": "2025-10-12T14:09:57.535871", |
| "best_val_acc": 71.994, |
| "best_epoch": 9, |
| "num_scales": 2, |
| "scales": [ |
| 256, |
| 512 |
| ], |
| "parameters": 656898, |
| "sharing_mode": "fully_shared", |
| "fusion_mode": "weighted_sum", |
| "preset": "small_fast", |
| "weights_path": "weights/David-fully_shared-weighted_sum/20251012_135249/best_model_acc71.99.safetensors", |
| "config_path": "weights/David-fully_shared-weighted_sum/20251012_135249/david_config.json", |
| "history_path": "weights/David-fully_shared-weighted_sum/20251012_135249/training_history.json" |
| }, |
| { |
| "model_name": "David-fully_shared-weighted_sum", |
| "run_id": "20251012_141246", |
| "timestamp": "2025-10-12T14:29:34.375797", |
| "best_val_acc": 71.726, |
| "best_epoch": 9, |
| "num_scales": 2, |
| "scales": [ |
| 256, |
| 512 |
| ], |
| "parameters": 656898, |
| "sharing_mode": "fully_shared", |
| "fusion_mode": "weighted_sum", |
| "preset": "small_fast", |
| "weights_path": "weights/David-fully_shared-weighted_sum/20251012_141246/best_model_acc71.73.safetensors", |
| "config_path": "weights/David-fully_shared-weighted_sum/20251012_141246/david_config.json", |
| "history_path": "weights/David-fully_shared-weighted_sum/20251012_141246/training_history.json" |
| } |
| ], |
| "total_models": 11 |
| } |