File size: 5,576 Bytes
c0ba5ce 85649e3 c0ba5ce c524138 4da7c34 5a84698 c0ba5ce 5a84698 c524138 5357e1d b6e86ee 33a6a8b 578b5db 5357e1d 578b5db b6e86ee 95a78e9 b6e86ee 95a78e9 b6e86ee 125a191 2ae4c30 3f3060f 125a191 3f3060f 125a191 78aacb2 37c0db4 7df61e3 37c0db4 78aacb2 37c0db4 ded51dc 37c0db4 ded51dc 37c0db4 b6ae463 85649e3 c9bda7c b6ae463 c9bda7c b6ae463 c0ba5ce b6ae463 c0ba5ce |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 |
{
"repository": "AbstractPhil/david-shared-space",
"updated": "2025-10-13T01:33:24.619384",
"models": [
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_194945",
"timestamp": "2025-10-12T20:21:46.311771",
"best_val_acc": 75.74,
"best_epoch": 9,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/best_model_acc75.74.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_194945/training_history.json"
},
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_210041",
"timestamp": "2025-10-12T21:45:34.243260",
"best_val_acc": 74.22733333333333,
"best_epoch": 7,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/best_model_acc74.23.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_210041/training_history.json"
},
{
"model_name": "David-partial_shared-hierarchical_tree",
"run_id": "20251012_191456",
"timestamp": "2025-10-12T19:48:30.099231",
"best_val_acc": 73.695,
"best_epoch": 9,
"num_scales": 4,
"scales": [
256,
512,
768,
1024
],
"parameters": 8758271,
"sharing_mode": "partial_shared",
"fusion_mode": "hierarchical_tree",
"preset": "balanced",
"weights_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/best_model_acc73.69.safetensors",
"config_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/david_config.json",
"history_path": "weights/David-partial_shared-hierarchical_tree/20251012_191456/training_history.json"
},
{
"model_name": "David-decoupled-deep_efficiency",
"run_id": "20251012_221046",
"timestamp": "2025-10-12T22:58:06.100595",
"best_val_acc": 66.84133333333334,
"best_epoch": 9,
"num_scales": 5,
"scales": [
256,
512,
768,
1024,
1280
],
"parameters": 14877593,
"sharing_mode": "decoupled",
"fusion_mode": "deep_efficiency",
"preset": "high_accuracy",
"weights_path": "weights/David-decoupled-deep_efficiency/20251012_221046/best_model_acc66.84.safetensors",
"config_path": "weights/David-decoupled-deep_efficiency/20251012_221046/david_config.json",
"history_path": "weights/David-decoupled-deep_efficiency/20251012_221046/training_history.json"
},
{
"model_name": "David-fully_shared-weighted_sum",
"run_id": "20251012_235237",
"timestamp": "2025-10-13T00:38:45.818425",
"best_val_acc": 66.52333333333333,
"best_epoch": 9,
"num_scales": 2,
"scales": [
256,
512
],
"parameters": 656898,
"sharing_mode": "fully_shared",
"fusion_mode": "weighted_sum",
"preset": "small_fast",
"weights_path": "weights/David-fully_shared-weighted_sum/20251012_235237/best_model_acc66.52.safetensors",
"config_path": "weights/David-fully_shared-weighted_sum/20251012_235237/david_config.json",
"history_path": "weights/David-fully_shared-weighted_sum/20251012_235237/training_history.json"
},
{
"model_name": "David-fully_shared-weighted_sum",
"run_id": "20251012_231445",
"timestamp": "2025-10-12T23:51:38.341849",
"best_val_acc": 66.5,
"best_epoch": 7,
"num_scales": 2,
"scales": [
256,
512
],
"parameters": 656898,
"sharing_mode": "fully_shared",
"fusion_mode": "weighted_sum",
"preset": "small_fast",
"weights_path": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model_acc66.50.safetensors",
"config_path": "weights/David-fully_shared-weighted_sum/20251012_231445/david_config.json",
"history_path": "weights/David-fully_shared-weighted_sum/20251012_231445/training_history.json"
},
{
"model_name": "David-decoupled-deep_efficiency",
"run_id": "20251013_004438",
"timestamp": "2025-10-13T01:33:24.619350",
"best_val_acc": 62.938,
"best_epoch": 9,
"num_scales": 9,
"scales": [
128,
256,
384,
448,
512,
576,
640,
768,
896
],
"parameters": 22133801,
"sharing_mode": "decoupled",
"fusion_mode": "deep_efficiency",
"preset": "gated_expert_team",
"weights_path": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc62.94.safetensors",
"config_path": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json",
"history_path": "weights/David-decoupled-deep_efficiency/20251013_004438/training_history.json"
}
],
"total_models": 7
} |