Xrenya committed on
Commit
bfca611
·
verified ·
1 Parent(s): 7f5b039

Create ELF-M-owt.yml

Browse files
Files changed (1) hide show
  1. ELF-M-owt.yml +67 -0
ELF-M-owt.yml ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Dataset
2
+ data_path: "embedded-language-flows/openwebtext-t5"
3
+ max_length: 1024
4
+
5
+ # Encoder
6
+ encoder_model_name: t5-small
7
+ encoder_checkpoint: "embedded-language-flows/t5_small_encoder_jax/t5_small_encoder_jax.pkl"
8
+ latent_mean: 0.0
9
+ latent_std: 0.2
10
+
11
+ # Model architecture
12
+ model: ELF-M # "ELF-B" or "ELF-M"
13
+ bottleneck_dim: 128
14
+ num_time_tokens: 4
15
+ num_self_cond_cfg_tokens: 4
16
+ num_model_mode_tokens: 4
17
+
18
+ # Denoiser objective
19
+ denoiser_p_mean: -1.5
20
+ denoiser_p_std: 0.8
21
+ denoiser_noise_scale: 2.0
22
+ t_eps: 0.05
23
+ time_schedule: "logit_normal"
24
+
25
+ # Decoder objective
26
+ decoder_prob: 0.2
27
+ decoder_noise_scale: 5.0
28
+ decoder_p_mean: 0.8
29
+ decoder_p_std: 0.8
30
+
31
+ # Conditioning / CFG
32
+ self_cond_prob: 0.5
33
+
34
+ # Training (optimizer + schedule)
35
+ epochs: 4
36
+ global_batch_size: 512
37
+ blr: 0.001
38
+ weight_decay: 0.0
39
+ warmup_epochs: 0.5
40
+ warmup_steps: -1 # -1 falls back to warmup_epochs
41
+ optimizer: muon # "adamw" or "muon"
42
+
43
+ # EMA
44
+ ema_decay1: 0.9999
45
+
46
+ # Sampling
47
+ sampling_configs_path: "configs/sampling_configs/uncond_sampling_configs.yml"
48
+ num_samples: 1000
49
+
50
+ # Logging & Checkpointing
51
+ log_freq: 100
52
+ save_freq: 1
53
+ save_last_freq: 1
54
+ eval_freq: 1
55
+
56
+ # Output
57
+ output_dir: "outputs/elf_m-owt"
58
+ resume: null
59
+
60
+ # Wandb
61
+ use_wandb: true
62
+ wandb_project: elf
63
+ wandb_entity: null
64
+ wandb_run_name: elf_m-owt
65
+
66
+ # Misc
67
+ seed: 42