lillian039 committed on
Commit
2724e1c
·
verified ·
1 Parent(s): 2d0296c

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint_0/ocdbt.process_0/d/961934ef67f08ca0e602c89e25310435 filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint_0/ocdbt.process_0/d/a42ffa565d5d5a8a129cb64352df601c filter=lfs diff=lfs merge=lfs -text
38
+ checkpoint_0/ocdbt.process_0/d/c1ffccc6374a2d6988433b8927c8b6f5 filter=lfs diff=lfs merge=lfs -text
39
+ checkpoint_0/ocdbt.process_0/d/e6b21145a10013010c4aa83a68b552ad filter=lfs diff=lfs merge=lfs -text
ELF-M-owt.yml ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Dataset
2
+ data_path: "embedded-language-flows/openwebtext-t5"
3
+ max_length: 1024
4
+
5
+ # Encoder
6
+ encoder_model_name: t5-small
7
+ encoder_checkpoint: "embedded-language-flows/t5_small_encoder_jax/t5_small_encoder_jax.pkl"
8
+ latent_mean: 0.0
9
+ latent_std: 0.2
10
+
11
+ # Model architecture
12
+ model: ELF-M # options: ELF-B, ELF-M
13
+ bottleneck_dim: 128
14
+ num_time_tokens: 4
15
+ num_self_cond_cfg_tokens: 4
16
+ num_model_mode_tokens: 4
17
+
18
+ # Denoiser objective
19
+ denoiser_p_mean: -1.5
20
+ denoiser_p_std: 0.8
21
+ denoiser_noise_scale: 2.0
22
+ t_eps: 0.05
23
+ time_schedule: "logit_normal"
24
+
25
+ # Decoder objective
26
+ decoder_prob: 0.2
27
+ decoder_noise_scale: 5.0
28
+ decoder_p_mean: 0.8
29
+ decoder_p_std: 0.8
30
+
31
+ # Conditioning / CFG
32
+ self_cond_prob: 0.5
33
+
34
+ # Training (optimizer + schedule)
35
+ epochs: 4
36
+ global_batch_size: 512
37
+ blr: 0.001
38
+ weight_decay: 0.0
39
+ warmup_epochs: 0.5
40
+ warmup_steps: -1 # -1 falls back to warmup_epochs
41
+ optimizer: muon # "adamw" or "muon"
42
+
43
+ # EMA
44
+ ema_decay1: 0.9999
45
+
46
+ # Sampling
47
+ sampling_configs_path: "configs/sampling_configs/uncond_sampling_configs.yml"
48
+ num_samples: 1000
49
+
50
+ # Logging & Checkpointing
51
+ log_freq: 100
52
+ save_freq: 1
53
+ save_last_freq: 1
54
+ eval_freq: 1
55
+
56
+ # Output
57
+ output_dir: "outputs/elf_m-owt"
58
+ resume: null
59
+
60
+ # Wandb
61
+ use_wandb: true
62
+ wandb_project: elf
63
+ wandb_entity: null
64
+ wandb_run_name: elf_m-owt
65
+
66
+ # Misc
67
+ seed: 42
checkpoint_0/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"init_timestamp_nsecs": 1778513483615276684, "commit_timestamp_nsecs": 1778513494595536170}
checkpoint_0/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint_0/d/9b67b2b1a3556c070ef179edfd9b3f83 ADDED
Binary file (28.3 kB). View file
 
checkpoint_0/manifest.ocdbt ADDED
Binary file (120 Bytes). View file
 
checkpoint_0/ocdbt.process_0/d/28c37ec0597e779fcbb5c3ca25c1ebe1 ADDED
Binary file (28.3 kB). View file
 
checkpoint_0/ocdbt.process_0/d/961934ef67f08ca0e602c89e25310435 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6a5dc2b3989acc8e21a70346bcdd644180ccf010273e612af98c4f88d98de98
3
+ size 2162982912
checkpoint_0/ocdbt.process_0/d/a42ffa565d5d5a8a129cb64352df601c ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a27ed82c50f8be44e8b58c4ac438ba24de7592fd96e643201c1cbf128ce65ec
3
+ size 122421248
checkpoint_0/ocdbt.process_0/d/c1ffccc6374a2d6988433b8927c8b6f5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88e7ad8dc94c7baa8fba1fdf7896bd72dc6fdeb7624642b71ca74c193647ef83
3
+ size 8445952
checkpoint_0/ocdbt.process_0/d/e6b21145a10013010c4aa83a68b552ad ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aef9f7e9ab4bb8bf30a8f678b3ed65dfa92c595110f3ef1c9032770f2931923b
3
+ size 245628928
checkpoint_0/ocdbt.process_0/d/eca55eb1012f96c9cf85c23fa87fef6a ADDED
Binary file (205 Bytes). View file
 
checkpoint_0/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (322 Bytes). View file