File size: 1,744 Bytes
81834f9
c1a9009
 
2e27ed0
2e45494
 
 
 
81834f9
2e45494
 
 
 
 
 
 
 
 
81834f9
 
c1a9009
 
 
81834f9
c1a9009
81834f9
c1a9009
 
 
 
 
 
 
81834f9
 
 
c1a9009
 
81834f9
 
 
 
8fa679e
1f29e6a
 
81834f9
 
 
 
6568c35
1f29e6a
81834f9
 
 
 
2e45494
c1a9009
 
 
 
81834f9
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
{
  "model_name": "David-decoupled-deep_efficiency",
  "run_id": "20251013_004438",
  "timestamp": "2025-10-13T01:33:26.455926",
  "best_val_acc": 62.938,
  "best_epoch": 9,
  "final_train_acc": 61.07410925611831,
  "final_train_loss": 3.4686684005744417,
  "scale_accuracies": {
    "128": 62.938,
    "256": 71.08266666666667,
    "384": 73.44466666666666,
    "448": 74.28533333333333,
    "512": 74.61,
    "576": 75.04333333333334,
    "640": 75.17533333333333,
    "768": 75.57533333333333,
    "896": 75.904
  },
  "architecture": {
    "preset": "gated_expert_team",
    "sharing_mode": "decoupled",
    "fusion_mode": "deep_efficiency",
    "scales": [
      128,
      256,
      384,
      448,
      512,
      576,
      640,
      768,
      896
    ],
    "feature_dim": 512,
    "num_classes": 1000,
    "use_belly": true,
    "belly_expand": 4
  },
  "training": {
    "dataset": "AbstractPhil/imagenet-clip-features-orderly",
    "model_variant": [
      "clip_vit_b16",
      "clip_vit_laion_b32",
      "clip_vit_b32"
    ],
    "num_epochs": 10,
    "batch_size": 1024,
    "learning_rate": 0.01,
    "rose_weight": "0.1\u21920.8",
    "cayley_loss": false,
    "optimizer": "AdamW",
    "scheduler": "cosine_restarts"
  },
  "files": {
    "weights_safetensors": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model_acc62.94.safetensors",
    "weights_pytorch": "weights/David-decoupled-deep_efficiency/20251013_004438/best_model.pth",
    "config": "weights/David-decoupled-deep_efficiency/20251013_004438/david_config.json",
    "training_config": "weights/David-decoupled-deep_efficiency/20251013_004438/train_config.json",
    "tensorboard": "runs/David-decoupled-deep_efficiency/20251013_004438/"
  }
}