AbstractPhil committed on
Commit
2fd7fca
·
verified ·
1 Parent(s): 5f751ad

Update beatrix-trainD-frozen-geometry (Epoch 0, Acc: 0.0697) - frozen_geometry

Browse files
README.md CHANGED
@@ -12,7 +12,7 @@ license: mit
12
 
13
  ## Current Experiment: beatrix-trainD-frozen-geometry
14
 
15
- **Model Path**: `weights/beatrix-trainD-frozen-geometry/20251008_203147_frozen_geometry/`
16
 
17
 
18
  ## Architecture
@@ -25,10 +25,10 @@ license: mit
25
 
26
  ## Performance
27
 
28
- - **Best Accuracy**: 0.4962
29
- - **Current Epoch**: 90
30
  - **Dataset**: CIFAR-100
31
 
32
  ---
33
 
34
- *Last updated: Epoch 90 | Best Accuracy: 0.4962*
 
12
 
13
  ## Current Experiment: beatrix-trainD-frozen-geometry
14
 
15
+ **Model Path**: `weights/beatrix-trainD-frozen-geometry/20251008_222447_frozen_geometry/`
16
 
17
 
18
  ## Architecture
 
25
 
26
  ## Performance
27
 
28
+ - **Best Accuracy**: 0.0697
29
+ - **Current Epoch**: 0
30
  - **Dataset**: CIFAR-100
31
 
32
  ---
33
 
34
+ *Last updated: Epoch 0 | Best Accuracy: 0.0697*
weights/beatrix-trainD-frozen-geometry/20251008_222447_frozen_geometry/config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "num_classes": 100,
3
+ "img_size": 32,
4
+ "patch_size": 4,
5
+ "visual_dim": 512,
6
+ "geom_dim": 256,
7
+ "k_simplex": 4,
8
+ "depth": 8,
9
+ "num_heads": 8,
10
+ "mlp_ratio": 4.0,
11
+ "dropout": 0.0,
12
+ "num_geom_tokens": 8,
13
+ "freeze_geometric_stream": true,
14
+ "geometric_checkpoint_path": "./checkpoints_dualstream/20251008_163456_chaos_native/model_epoch_149.safetensors",
15
+ "pe_levels": 12,
16
+ "pe_features_per_level": 2,
17
+ "pe_smooth_tau": 0.25,
18
+ "simplex_init_method": "regular",
19
+ "simplex_init_scale": 1.0,
20
+ "batch_size": 512,
21
+ "num_epochs": 100,
22
+ "learning_rate": 0.0001,
23
+ "weight_decay": 0.005,
24
+ "warmup_epochs": 10,
25
+ "task_loss_weight": 1.0,
26
+ "flow_loss_weight": 0.0,
27
+ "coherence_loss_weight": 0.0,
28
+ "multiscale_loss_weight": 0.0,
29
+ "use_adaptive_augmentation": true,
30
+ "overfit_threshold": 0.05,
31
+ "augmentation_cooldown_epochs": 5,
32
+ "min_accuracy_for_augmentation": 0.45,
33
+ "mixup_alpha": 0.2,
34
+ "cutmix_alpha": 1.0,
35
+ "use_cutmix_schedule": false,
36
+ "cutmix_schedule": [
37
+ [
38
+ 0,
39
+ 0.2
40
+ ],
41
+ [
42
+ 20,
43
+ 0.5
44
+ ],
45
+ [
46
+ 40,
47
+ 1.0
48
+ ],
49
+ [
50
+ 60,
51
+ 1.2
52
+ ],
53
+ [
54
+ 80,
55
+ 1.5
56
+ ],
57
+ [
58
+ 100,
59
+ 1.8
60
+ ],
61
+ [
62
+ 120,
63
+ 2.0
64
+ ]
65
+ ],
66
+ "device": "cuda",
67
+ "num_workers": 4,
68
+ "pin_memory": true,
69
+ "save_dir": "./checkpoints_dualstream",
70
+ "save_every": 10,
71
+ "use_safetensors": true,
72
+ "timestamp_dirs": true,
73
+ "push_to_hub": true,
74
+ "hub_model_id": "AbstractPhil/vit-beatrix-dualstream",
75
+ "hub_model_name": "beatrix-trainD-frozen-geometry",
76
+ "hub_upload_best_only": true,
77
+ "hub_upload_every_n_epochs": 10,
78
+ "use_tensorboard": true,
79
+ "log_dir": "./logs_dualstream",
80
+ "log_every": 50,
81
+ "monitor_stream_health": true,
82
+ "log_stream_norms": true
83
+ }
weights/beatrix-trainD-frozen-geometry/20251008_222447_frozen_geometry/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:120d9b47480dbbd419b5a02a357f4a867a004c30be2f917563bd6d746b7d56fa
3
+ size 164567960