AbstractPhil committed on
Commit
d6ebac0
·
verified ·
1 Parent(s): 242d1f5

Update metrics - Run 20251012_231445

Browse files
Files changed (1) hide show
  1. best_model.json +21 -27
best_model.json CHANGED
@@ -1,33 +1,27 @@
1
  {
2
- "model_name": "David-decoupled-deep_efficiency",
3
- "run_id": "20251012_221046",
4
- "timestamp": "2025-10-12T22:58:07.451985",
5
- "best_val_acc": 66.84133333333334,
6
- "best_epoch": 9,
7
- "final_train_acc": 66.11519029135155,
8
- "final_train_loss": 3.1497012801670814,
9
  "scale_accuracies": {
10
- "256": 66.84133333333334,
11
- "512": 72.716,
12
- "768": 74.34333333333333,
13
- "1024": 75.08933333333333,
14
- "1280": 75.36933333333333
15
  },
16
  "architecture": {
17
- "preset": "high_accuracy",
18
- "sharing_mode": "decoupled",
19
- "fusion_mode": "deep_efficiency",
20
  "scales": [
21
  256,
22
- 512,
23
- 768,
24
- 1024,
25
- 1280
26
  ],
27
  "feature_dim": 512,
28
  "num_classes": 1000,
29
- "use_belly": true,
30
- "belly_expand": 2.5
31
  },
32
  "training": {
33
  "dataset": "AbstractPhil/imagenet-clip-features-orderly",
@@ -39,16 +33,16 @@
39
  "num_epochs": 10,
40
  "batch_size": 1024,
41
  "learning_rate": 0.01,
42
- "rose_weight": "0.2\u21920.8",
43
  "cayley_loss": false,
44
  "optimizer": "AdamW",
45
  "scheduler": "cosine_restarts"
46
  },
47
  "files": {
48
- "weights_safetensors": "weights/David-decoupled-deep_efficiency/20251012_221046/best_model_acc66.84.safetensors",
49
- "weights_pytorch": "weights/David-decoupled-deep_efficiency/20251012_221046/best_model.pth",
50
- "config": "weights/David-decoupled-deep_efficiency/20251012_221046/david_config.json",
51
- "training_config": "weights/David-decoupled-deep_efficiency/20251012_221046/train_config.json",
52
- "tensorboard": "runs/David-decoupled-deep_efficiency/20251012_221046/"
53
  }
54
  }
 
1
  {
2
+ "model_name": "David-fully_shared-weighted_sum",
3
+ "run_id": "20251012_231445",
4
+ "timestamp": "2025-10-12T23:19:29.286511",
5
+ "best_val_acc": 63.041333333333334,
6
+ "best_epoch": 0,
7
+ "final_train_acc": 54.91727464101089,
8
+ "final_train_loss": 5.311051666323785,
9
  "scale_accuracies": {
10
+ "256": 62.11666666666667,
11
+ "512": 62.967333333333336
 
 
 
12
  },
13
  "architecture": {
14
+ "preset": "small_fast",
15
+ "sharing_mode": "fully_shared",
16
+ "fusion_mode": "weighted_sum",
17
  "scales": [
18
  256,
19
+ 512
 
 
 
20
  ],
21
  "feature_dim": 512,
22
  "num_classes": 1000,
23
+ "use_belly": false,
24
+ "belly_expand": 2.0
25
  },
26
  "training": {
27
  "dataset": "AbstractPhil/imagenet-clip-features-orderly",
 
33
  "num_epochs": 10,
34
  "batch_size": 1024,
35
  "learning_rate": 0.01,
36
+ "rose_weight": "0.2\u21920.6",
37
  "cayley_loss": false,
38
  "optimizer": "AdamW",
39
  "scheduler": "cosine_restarts"
40
  },
41
  "files": {
42
+ "weights_safetensors": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model_acc63.04.safetensors",
43
+ "weights_pytorch": "weights/David-fully_shared-weighted_sum/20251012_231445/best_model.pth",
44
+ "config": "weights/David-fully_shared-weighted_sum/20251012_231445/david_config.json",
45
+ "training_config": "weights/David-fully_shared-weighted_sum/20251012_231445/train_config.json",
46
+ "tensorboard": "runs/David-fully_shared-weighted_sum/20251012_231445/"
47
  }
48
  }