AbstractPhil committed on
Commit
d03de48
·
verified ·
1 Parent(s): 89458a5

Update metrics - Run 20251104_122236

Browse files
Files changed (1) hide show
  1. best_model.json +23 -31
best_model.json CHANGED
@@ -1,44 +1,36 @@
1
  {
2
- "model_name": "David-partial_shared-deep_efficiency",
3
- "run_id": "20251012_181608",
4
- "timestamp": "2025-10-12T18:49:29.551461",
5
- "best_val_acc": 84.726,
6
- "best_epoch": 2,
7
- "final_train_acc": 96.34231915121136,
8
- "final_train_loss": 0.356455498800491,
9
  "scale_accuracies": {
10
- "384": 84.386,
11
- "512": 84.67,
12
- "768": 84.52,
13
- "1024": 84.71,
14
- "1280": 84.726,
15
- "1536": 84.566,
16
- "1792": 84.584,
17
- "2048": 84.59
18
  },
19
  "architecture": {
20
- "preset": "clip_vit_bigg14",
21
  "sharing_mode": "partial_shared",
22
- "fusion_mode": "deep_efficiency",
23
  "scales": [
24
- 384,
25
  512,
26
  768,
27
- 1024,
28
- 1280,
29
- 1536,
30
- 1792,
31
- 2048
32
  ],
33
- "feature_dim": 1280,
34
  "num_classes": 1000,
35
  "use_belly": true,
36
  "belly_expand": 2.0
37
  },
38
  "training": {
39
  "dataset": "AbstractPhil/imagenet-clip-features-orderly",
40
- "model_variant": "clip_vit_laion_bigg14",
41
- "num_epochs": 10,
42
  "batch_size": 1024,
43
  "learning_rate": 0.001,
44
  "rose_weight": "0.1\u21920.5",
@@ -47,10 +39,10 @@
47
  "scheduler": "cosine_restarts"
48
  },
49
  "files": {
50
- "weights_safetensors": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model_acc84.73.safetensors",
51
- "weights_pytorch": "weights/David-partial_shared-deep_efficiency/20251012_181608/best_model.pth",
52
- "config": "weights/David-partial_shared-deep_efficiency/20251012_181608/david_config.json",
53
- "training_config": "weights/David-partial_shared-deep_efficiency/20251012_181608/train_config.json",
54
- "tensorboard": "runs/David-partial_shared-deep_efficiency/20251012_181608/"
55
  }
56
  }
 
1
  {
2
+ "model_name": "David-partial_shared-geometric_attention",
3
+ "run_id": "20251104_122236",
4
+ "timestamp": "2025-11-04T12:24:29.877506",
5
+ "best_val_acc": 76.112,
6
+ "best_epoch": 0,
7
+ "final_train_acc": 71.75278476576433,
8
+ "final_train_loss": 3.1981250359989204,
9
  "scale_accuracies": {
10
+ "256": 74.25,
11
+ "512": 75.164,
12
+ "768": 75.256,
13
+ "1024": 75.82
 
 
 
 
14
  },
15
  "architecture": {
16
+ "preset": "clip_vit_b16_geometric",
17
  "sharing_mode": "partial_shared",
18
+ "fusion_mode": "geometric_attention",
19
  "scales": [
20
+ 256,
21
  512,
22
  768,
23
+ 1024
 
 
 
 
24
  ],
25
+ "feature_dim": 512,
26
  "num_classes": 1000,
27
  "use_belly": true,
28
  "belly_expand": 2.0
29
  },
30
  "training": {
31
  "dataset": "AbstractPhil/imagenet-clip-features-orderly",
32
+ "model_variant": "clip_vit_b16",
33
+ "num_epochs": 5,
34
  "batch_size": 1024,
35
  "learning_rate": 0.001,
36
  "rose_weight": "0.1\u21920.5",
 
39
  "scheduler": "cosine_restarts"
40
  },
41
  "files": {
42
+ "weights_safetensors": "weights/David-partial_shared-geometric_attention/20251104_122236/best_model_acc76.11.safetensors",
43
+ "weights_pytorch": "weights/David-partial_shared-geometric_attention/20251104_122236/best_model.pth",
44
+ "config": "weights/David-partial_shared-geometric_attention/20251104_122236/david_config.json",
45
+ "training_config": "weights/David-partial_shared-geometric_attention/20251104_122236/train_config.json",
46
+ "tensorboard": "runs/David-partial_shared-geometric_attention/20251104_122236/"
47
  }
48
  }