lillian039 committed on
Commit
6322864
·
verified ·
1 Parent(s): f41b07e

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint_0/ocdbt.process_0/d/0e7ab4f3f368d144d7c4c258982b46ab filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint_0/ocdbt.process_0/d/2633e0ceb216c7296fd0fbd3f73f684c filter=lfs diff=lfs merge=lfs -text
38
+ checkpoint_0/ocdbt.process_0/d/a81aa518a0f3a1c96445302e15102b43 filter=lfs diff=lfs merge=lfs -text
ELF-B-owt.yml ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Dataset
2
+ data_path: "embedded-language-flows/openwebtext-t5"
3
+ max_length: 1024
4
+
5
+ # Encoder
6
+ encoder_model_name: t5-small
7
+ encoder_checkpoint: "embedded-language-flows/t5_small_encoder_jax/t5_small_encoder_jax.pkl"
8
+ latent_mean: 0.0
9
+ latent_std: 0.2
10
+
11
+ # Model architecture
12
+ model: ELF-B # ELF-B, ELF-M
13
+ bottleneck_dim: 128
14
+ num_time_tokens: 4
15
+ num_self_cond_cfg_tokens: 4
16
+ num_model_mode_tokens: 4
17
+
18
+ # Denoiser objective
19
+ denoiser_p_mean: -1.5
20
+ denoiser_p_std: 0.8
21
+ denoiser_noise_scale: 2.0
22
+ t_eps: 0.05
23
+ time_schedule: "logit_normal"
24
+
25
+ # Decoder objective
26
+ decoder_prob: 0.2
27
+ decoder_noise_scale: 5.0
28
+ decoder_p_mean: 0.8
29
+ decoder_p_std: 0.8
30
+
31
+ # Conditioning / CFG
32
+ self_cond_prob: 0.5
33
+
34
+ # Training (optimizer + schedule)
35
+ epochs: 5
36
+ global_batch_size: 512
37
+ blr: 0.001
38
+ weight_decay: 0.0
39
+ warmup_epochs: 0.5
40
+ warmup_steps: -1 # -1 falls back to warmup_epochs
41
+ optimizer: muon # "adamw" or "muon"
42
+
43
+ # EMA
44
+ ema_decay1: 0.9999
45
+
46
+ # Sampling
47
+ sampling_configs_path: "configs/sampling_configs/uncond_sampling_configs.yml"
48
+ num_samples: 1000
49
+
50
+ # Logging & Checkpointing
51
+ log_freq: 100
52
+ save_freq: 1
53
+ save_last_freq: 1
54
+ eval_freq: 1
55
+
56
+ # Output
57
+ output_dir: "outputs/elf_b-owt"
58
+ resume: null
59
+
60
+ # Wandb
61
+ use_wandb: true
62
+ wandb_project: elf
63
+ wandb_entity: null
64
+ wandb_run_name: elf_b-owt
65
+
66
+ # Misc
67
+ seed: 42
checkpoint_0/_CHECKPOINT_METADATA ADDED
@@ -0,0 +1 @@
 
 
1
+ {"init_timestamp_nsecs": 1778512720445321844, "commit_timestamp_nsecs": 1778512721871004161}
checkpoint_0/_METADATA ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint_0/d/b2956458b381bb217a79647c7089da38 ADDED
Binary file (14.7 kB). View file
 
checkpoint_0/manifest.ocdbt ADDED
Binary file (118 Bytes). View file
 
checkpoint_0/ocdbt.process_0/d/0e7ab4f3f368d144d7c4c258982b46ab ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac82f340836e6de299f1ad9cc250a64df48be839c80dbc4cd8336fbfd69243d9
3
+ size 441221120
checkpoint_0/ocdbt.process_0/d/2633e0ceb216c7296fd0fbd3f73f684c ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05379428f522f8c535397455c4c46086b80f51806dc5ca660c11743844c41932
3
+ size 33722368
checkpoint_0/ocdbt.process_0/d/a81aa518a0f3a1c96445302e15102b43 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea4f8854c3627f38ae3b33cd50ddb6107d4dbacc4b5c5fe34e9762ead4f5891c
3
+ size 301690880
checkpoint_0/ocdbt.process_0/d/cfc804c81b4c74de303f6af62fad5fb0 ADDED
Binary file (205 Bytes). View file
 
checkpoint_0/ocdbt.process_0/manifest.ocdbt ADDED
Binary file (278 Bytes). View file