KBlueLeaf committed on
Commit
bb82075
·
verified ·
1 Parent(s): 987ec21

Upload r1a40xe8/config.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. r1a40xe8/config.py +81 -0
r1a40xe8/config.py ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Sweep: tt3d regression, imgnet_B pretrained decoder (no dual aug)."""
2
+ import random
3
+ from kohakuengine import Config
4
+
5
+ SEED = 42  # NOTE(review): never passed to `random` in this file, so RUN_ID below is not derived from it — confirm where SEED is consumed
6
+ RUN_ID = "".join(random.choices("abcdefghijklmnopqrstuvwxyz0123456789", k=8))  # 8 characters drawn from [a-z0-9]; evaluated once, when this module is imported
7
+ RUN_NAME = "H100_tt3d_reg_decB_video"  # fixed human-readable label, unlike the random RUN_ID
8
+ BASE_MODEL_NAME = "facebook/dinov3-vitb16-pretrain-lvd1689m"  # presumably a Hugging Face hub id for the backbone — confirm against the loader
9
+ ENCODER_AE_PATH = None  # no encoder autoencoder checkpoint path is set in this config
10
+ ENCODER_AE_BACKEND = "latentmaid"
11
+ ENCODER_AE_MODE = "video"  # encoder side is "video" while the decoder side below is "image"
12
+ DECODER_AE_PATH = "latent_models/latentmaid_image_vae/latentmaid_2222_eq.pt"  # relative path; the base directory it resolves against is not visible here
13
+ DECODER_AE_BACKEND = "image_vae"
14
+ DECODER_AE_MODE = "image"
15
+ LATENT_MEAN = [-0.69, -0.48, -0.60, 0.28]  # 4 entries, same count as MOTION_DECODER_CONFIG["image_dim"] — presumably per latent channel; confirm
16
+ LATENT_STD = [12.38, 11.22, 7.93, 21.22]  # 4 entries, paired index-by-index with LATENT_MEAN — presumably; confirm
17
+ T_PATCH = 1  # same value as MOTION_ENCODER_CONFIG["temporal_patch_size"]; whether the two must agree is not visible here
18
+ TOKEN_COUNTS = [1]
19
+ BACKBONE_ARCH = "ttvidt"
20
+ BACKBONE_CONFIG = None  # no explicit backbone config is supplied; fallback behavior is defined by the consumer
21
+
22
+ MOTION_ENCODER_CONFIG = {  # motion-encoder options; the meaning of each key is defined by the consumer, not by this file
23
+ "temporal_patch_size": 1,
24
+ "temporal_patch_overlap": 0,
25
+ "motion_layers_period": 1,
26
+ "num_motion_tokens": 8,  # same value as FRAME_COUNT below; whether that is required is not visible here
27
+ "motion_ffn_type": "gelu",
28
+ "tt_mode": "3d",  # corresponds to the "tt3d" named in the module docstring and RUN_NAME
29
+ "tt_downsample": 4,
30
+ }
31
+ MOTION_DECODER_CONFIG = {  # motion-decoder options; the meaning of each key is defined by the consumer, not by this file
32
+ "image_dim": 4,  # same count as the entries in LATENT_MEAN / LATENT_STD
33
+ "patch_size": 2,
34
+ "decoder_style": "dit",
35
+ "num_layers": 16,
36
+ "hidden_size": 1024,
37
+ "intermediate_size": 4096,  # 4x hidden_size
38
+ "num_heads": 16,  # 1024 / 16 = 64 per head if heads split hidden_size evenly — confirm
39
+ "decode_mode": "diffusion",  # NOTE(review): TRAIN_MODE below is "regression" — confirm the two settings are independent
40
+ "qk_norm": True,  # presumably matches the "qknorm" in the DECODER_PRETRAINED name — confirm
41
+ "attn_bias": False,
42
+ "use_final_norm": False,  # presumably matches the "nofinal" in the DECODER_PRETRAINED name — confirm
43
+ }
44
+ FRAME_COUNT = 8
45
+ SAMPLE_FPS = 6
46
+ DATASET_FOLDERS = [  # absolute, machine-specific paths; both end in "-tar", in line with DATASET_TYPE = "tar" below
47
+ "/mnt/shared/p03/kohaku/openvid384/OpenVid384px-tar",
48
+ "/mnt/shared/p03/kohaku/moments_in_time/Moments_in_Time_Raw/training-tar",
49
+ ]
50
+ TRAIN_MODE = "regression"  # NOTE(review): MOTION_DECODER_CONFIG["decode_mode"] is "diffusion" — confirm the two settings are independent
51
+ UNFREEZE_BACKBONE = True
52
+ GRAD_CKPT = False
53
+ GRAD_CLIP_VAL = 0.1
54
+ DECODER_PRETRAINED = "KBlueLeaf/dit-testing/pretrain_video_B_qknorm_nofinal"  # NOTE(review): module docstring says "imgnet_B" but this names "video_B" (as does RUN_NAME) — confirm which is intended
55
+
56
+ LEARNING_RATE = 5e-4
57
+ BASE_DIM = 256  # NOTE(review): how this interacts with LEARNING_RATE (e.g. width-based scaling) is not visible here — confirm
58
+ WEIGHT_DECAY = 0.01
59
+ BETAS = (0.9, 0.98)
60
+ BASE_SCHEDULER_CONFIG = {  # only an "lr" schedule is configured here
61
+ "lr": {
62
+ "mode": "cosine",
63
+ "end": -1,  # NOTE(review): sentinel value; its meaning is defined by the scheduler, presumably "run to the last step" — confirm
64
+ "min_value": 0.01,  # presumably a fraction of the base lr rather than an absolute lr — confirm
65
+ "warmup": 10000,  # presumably counted in optimizer steps — confirm
66
+ }
67
+ }
68
+
69
+ GPUS = [0, 1, 2, 3]  # four device indices
70
+ EPOCH = 8
71
+ BATCH_SIZE = 8  # NOTE(review): unclear from this file whether this is per device or global — confirm
72
+ GRAD_ACC = 1
73
+ NUM_WORKERS = 24
74
+ DATASET_TYPE = "tar"
75
+
76
+ LOG_INTERVAL = 2500
77
+ CKPT_INTERVAL = 5000  # twice LOG_INTERVAL; the unit (steps vs. samples) is not visible here
78
+
79
+ def config_gen():  # takes no arguments; prints the run id, then returns whatever Config.from_globals() produces
80
+ print("Run with run_id:", RUN_ID)  # writes the randomly generated RUN_ID to stdout
81
+ return Config.from_globals()  # presumably snapshots this module's globals into a Config — confirm against kohakuengine