AbstractPhil committed on
Commit
b4ffd15
·
verified ·
1 Parent(s): 7c9fe6a

Update beatrix-dualstream-base (Epoch 0, Acc: 0.0816)

Browse files
README.md CHANGED
@@ -10,25 +10,25 @@ license: mit
10
 
11
  # ViT-Beatrix Dual-Stream Family
12
 
13
- ## Current Experiment: beatrix-trainD-pretrained-geometry
14
 
15
- **Model Path**: `weights/beatrix-trainD-pretrained-geometry/20251009_001904_frozen_geometry/`
16
 
17
 
18
  ## Architecture
19
 
20
  - **Visual Dimension**: 512
21
- - **Geometric Dimension**: 256
22
- - **Geometric Tokens**: 8
23
- - **Dual Blocks**: 8 layers
24
- - **k-simplex**: 4
25
 
26
  ## Performance
27
 
28
- - **Best Accuracy**: 0.3331
29
- - **Current Epoch**: 10
30
  - **Dataset**: CIFAR-100
31
 
32
  ---
33
 
34
- *Last updated: Epoch 10 | Best Accuracy: 0.3331*
 
10
 
11
  # ViT-Beatrix Dual-Stream Family
12
 
13
+ ## Current Experiment: beatrix-dualstream-base
14
 
15
+ **Model Path**: `weights/beatrix-dualstream-base/20251009_011847/`
16
 
17
 
18
  ## Architecture
19
 
20
  - **Visual Dimension**: 512
21
+ - **Geometric Dimension**: 512
22
+ - **Geometric Tokens**: 16
23
+ - **Dual Blocks**: 16 layers
24
+ - **k-simplex**: 12
25
 
26
  ## Performance
27
 
28
+ - **Best Accuracy**: 0.0816
29
+ - **Current Epoch**: 0
30
  - **Dataset**: CIFAR-100
31
 
32
  ---
33
 
34
+ *Last updated: Epoch 0 | Best Accuracy: 0.0816*
weights/beatrix-dualstream-base/20251009_011847/config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "num_classes": 100,
3
+ "img_size": 32,
4
+ "patch_size": 4,
5
+ "visual_dim": 512,
6
+ "geom_dim": 512,
7
+ "k_simplex": 12,
8
+ "depth": 16,
9
+ "num_heads": 8,
10
+ "mlp_ratio": 4.0,
11
+ "dropout": 0.0,
12
+ "num_geom_tokens": 16,
13
+ "freeze_geometric_stream": false,
14
+ "geometric_checkpoint_path": null,
15
+ "pe_levels": 24,
16
+ "pe_features_per_level": 2,
17
+ "pe_smooth_tau": 0.25,
18
+ "simplex_init_method": "regular",
19
+ "simplex_init_scale": 1.0,
20
+ "batch_size": 512,
21
+ "num_epochs": 100,
22
+ "learning_rate": 0.0001,
23
+ "weight_decay": 0.005,
24
+ "warmup_epochs": 10,
25
+ "task_loss_weight": 0.5,
26
+ "flow_loss_weight": 1.0,
27
+ "coherence_loss_weight": 0.3,
28
+ "multiscale_loss_weight": 0.2,
29
+ "use_adaptive_augmentation": false,
30
+ "overfit_threshold": 0.05,
31
+ "augmentation_cooldown_epochs": 5,
32
+ "min_accuracy_for_augmentation": 0.45,
33
+ "mixup_alpha": 0.2,
34
+ "cutmix_alpha": 1.0,
35
+ "use_cutmix_schedule": false,
36
+ "cutmix_schedule": [
37
+ [
38
+ 0,
39
+ 0.2
40
+ ],
41
+ [
42
+ 20,
43
+ 0.5
44
+ ],
45
+ [
46
+ 40,
47
+ 1.0
48
+ ],
49
+ [
50
+ 60,
51
+ 1.2
52
+ ],
53
+ [
54
+ 80,
55
+ 1.5
56
+ ],
57
+ [
58
+ 100,
59
+ 1.8
60
+ ],
61
+ [
62
+ 120,
63
+ 2.0
64
+ ]
65
+ ],
66
+ "device": "cuda",
67
+ "num_workers": 4,
68
+ "pin_memory": true,
69
+ "save_dir": "./checkpoints_dualstream",
70
+ "save_every": 10,
71
+ "use_safetensors": true,
72
+ "timestamp_dirs": true,
73
+ "push_to_hub": true,
74
+ "hub_model_id": "AbstractPhil/vit-beatrix-dualstream",
75
+ "hub_model_name": "beatrix-dualstream-base",
76
+ "hub_upload_best_only": true,
77
+ "hub_upload_every_n_epochs": 10,
78
+ "use_tensorboard": true,
79
+ "log_dir": "./logs_dualstream",
80
+ "log_every": 50,
81
+ "monitor_stream_health": true,
82
+ "log_stream_norms": true
83
+ }
weights/beatrix-dualstream-base/20251009_011847/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42536611e612c2a8f345a107bc036e88fc4a6e812c5d3d402947063695fc1314
3
+ size 538890112