File size: 1,584 Bytes
ec4601d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
{
  "num_classes": 100,
  "img_size": 32,
  "patch_size": 4,
  "visual_dim": 512,
  "geom_dim": 256,
  "k_simplex": 4,
  "depth": 8,
  "num_heads": 8,
  "mlp_ratio": 4.0,
  "dropout": 0.0,
  "num_geom_tokens": 8,
  "pe_levels": 12,
  "pe_features_per_level": 2,
  "pe_smooth_tau": 0.25,
  "simplex_init_method": "regular",
  "simplex_init_scale": 1.0,
  "batch_size": 512,
  "num_epochs": 150,
  "learning_rate": 0.0001,
  "weight_decay": 0.005,
  "warmup_epochs": 10,
  "task_loss_weight": 0.5,
  "flow_loss_weight": 1.5,
  "coherence_loss_weight": 0.5,
  "multiscale_loss_weight": 0.3,
  "use_adaptive_augmentation": false,
  "overfit_threshold": 0.05,
  "augmentation_cooldown_epochs": 5,
  "min_accuracy_for_augmentation": 0.45,
  "mixup_alpha": 0.2,
  "cutmix_alpha": 1.0,
  "use_cutmix_schedule": true,
  "cutmix_schedule": [
    [
      0,
      0.2
    ],
    [
      20,
      0.5
    ],
    [
      40,
      1.0
    ],
    [
      60,
      1.2
    ],
    [
      80,
      1.5
    ],
    [
      100,
      1.8
    ],
    [
      120,
      2.0
    ]
  ],
  "device": "cuda",
  "num_workers": 4,
  "pin_memory": true,
  "save_dir": "./checkpoints_dualstream",
  "save_every": 10,
  "use_safetensors": true,
  "timestamp_dirs": true,
  "push_to_hub": true,
  "hub_model_id": "AbstractPhil/vit-beatrix-dualstream",
  "hub_model_name": "beatrix-trainC-chaos-native",
  "hub_upload_best_only": true,
  "hub_upload_every_n_epochs": 10,
  "use_tensorboard": true,
  "log_dir": "./logs_dualstream",
  "log_every": 50,
  "monitor_stream_health": true,
  "log_stream_norms": true
}