AbstractPhil committed on
Commit
5e37977
·
verified ·
1 Parent(s): 9c604d8

Upload weights and configs - Run 20251012_060013

Browse files
weights/best_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c8c1b0b0d1d118d7f880b490776a34704118f99f16b630e4db415a1ae617aec
3
- size 325845164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f43bed2fac2969dcf5527abfb501d2730cd33ac87f0e9cd365432e486a8c1bc4
3
+ size 2628344
weights/best_model_metadata.json CHANGED
The diff for this file is too large to render. See raw diff
 
weights/david_config.json CHANGED
@@ -1,45 +1,29 @@
1
  {
2
- "name": "david_clip_vit_l14_deep",
3
- "uid": "c.david.clip_vit_l14_deep",
4
- "feature_dim": 768,
5
  "num_classes": 1000,
6
  "scales": [
7
  256,
8
- 512,
9
- 768,
10
- 1024,
11
- 1280,
12
- 1536,
13
- 1792,
14
- 2048,
15
- 2304,
16
- 2560
17
  ],
18
- "sharing_mode": "partial_shared",
19
- "fusion_mode": "deep_efficiency",
20
- "use_belly": true,
21
  "belly_expand": 2.0,
22
- "shared_feature_dim": 1024,
23
- "shared_layers": 4,
24
  "shared_dropout": 0.1,
25
  "fusion_temperature": 1.0,
26
  "fusion_dropout": 0.1,
27
  "tree_depth": 3,
28
- "num_experts": 4,
29
  "compression_ratio": 4,
30
  "expert_dropout": 0.1,
31
  "attention_dropout": 0.1,
32
- "progressive_training": true,
33
  "scale_warmup_epochs": {
34
  "256": 0,
35
- "512": 1,
36
- "768": 2,
37
- "1024": 3,
38
- "1280": 4,
39
- "1536": 5,
40
- "1792": 6,
41
- "2048": 7,
42
- "2304": 8,
43
- "2560": 9
44
  }
45
  }
 
1
  {
2
+ "name": "david_small_fast",
3
+ "uid": "c.david.small_fast",
4
+ "feature_dim": 512,
5
  "num_classes": 1000,
6
  "scales": [
7
  256,
8
+ 512
 
 
 
 
 
 
 
 
9
  ],
10
+ "sharing_mode": "fully_shared",
11
+ "fusion_mode": "weighted_sum",
12
+ "use_belly": false,
13
  "belly_expand": 2.0,
14
+ "shared_feature_dim": 512,
15
+ "shared_layers": 1,
16
  "shared_dropout": 0.1,
17
  "fusion_temperature": 1.0,
18
  "fusion_dropout": 0.1,
19
  "tree_depth": 3,
20
+ "num_experts": 3,
21
  "compression_ratio": 4,
22
  "expert_dropout": 0.1,
23
  "attention_dropout": 0.1,
24
+ "progressive_training": false,
25
  "scale_warmup_epochs": {
26
  "256": 0,
27
+ "512": 0
 
 
 
 
 
 
 
 
28
  }
29
  }
weights/train_config.json CHANGED
@@ -1,27 +1,16 @@
1
  {
2
  "name": "david_training",
3
- "run_id": "20251012_050214",
4
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
5
- "model_variant": "clip_vit_l14",
6
  "num_classes": 1000,
7
- "preset": "clip_vit_l14_deep",
8
  "custom_config_path": null,
9
  "num_classes_override": null,
10
  "use_belly_override": null,
11
  "belly_expand_override": null,
12
- "progressive_training_override": true,
13
- "scale_warmup_epochs_override": {
14
- "256": 0,
15
- "512": 1,
16
- "768": 2,
17
- "1024": 3,
18
- "1280": 4,
19
- "1536": 5,
20
- "1792": 6,
21
- "2048": 7,
22
- "2304": 8,
23
- "2560": 9
24
- },
25
  "num_epochs": 10,
26
  "batch_size": 1024,
27
  "learning_rate": 0.01,
 
1
  {
2
  "name": "david_training",
3
+ "run_id": "20251012_060013",
4
  "dataset_name": "AbstractPhil/imagenet-clip-features-orderly",
5
+ "model_variant": "clip_vit_b16",
6
  "num_classes": 1000,
7
+ "preset": "small_fast",
8
  "custom_config_path": null,
9
  "num_classes_override": null,
10
  "use_belly_override": null,
11
  "belly_expand_override": null,
12
+ "progressive_training_override": false,
13
+ "scale_warmup_epochs_override": null,
 
 
 
 
 
 
 
 
 
 
 
14
  "num_epochs": 10,
15
  "batch_size": 1024,
16
  "learning_rate": 0.01,