| data_path: embedded-language-flows/xsum_train_t5 | |
| eval_data_path: embedded-language-flows/xsum_validation_t5 | |
| max_length: 1088 | |
| max_input_length: 1024 | |
| pad_token: eos | |
| encoder_model_name: t5-small | |
| encoder_checkpoint: embedded-language-flows/t5_small_encoder_jax/t5_small_encoder_jax.pkl | |
| latent_mean: 0.0 | |
| latent_std: 0.2 | |
| model: ELF-B | |
| bottleneck_dim: 128 | |
| num_time_tokens: 4 | |
| num_self_cond_cfg_tokens: 4 | |
| num_model_mode_tokens: 4 | |
| denoiser_p_mean: -1.5 | |
| denoiser_p_std: 0.8 | |
| denoiser_noise_scale: 2.0 | |
| t_eps: 0.05 | |
| time_schedule: logit_normal | |
| decoder_prob: 0.2 | |
| decoder_noise_scale: 1.0 | |
| decoder_p_mean: 0.8 | |
| decoder_p_std: 0.8 | |
| label_drop_prob: 0.1 | |
| self_cond_prob: 0.5 | |
| epochs: 1 | |
| global_batch_size: 64 | |
| blr: 0.001 | |
| weight_decay: 0.0 | |
| warmup_steps: 5000 | |
| optimizer: muon | |
| ema_decay1: 0.9999 | |
| sampling_configs_path: configs/sampling_configs/cond_sampling_configs.yml | |
| num_samples: 100 | |
| log_freq: 100 | |
| save_freq: 1 | |
| eval_freq: 1 | |
| output_dir: /home/linluqiu/ELF/src/outputs/elf_b-xsum | |
| hf_repo_id: linluqiu/test | |
| resume: /home/linluqiu/ELF/src/outputs/elf_b-xsum | |
| use_wandb: true | |
| wandb_project: elf | |
| wandb_entity: null | |
| wandb_run_name: elf_b-xsum | |
| seed: 42 | |
| sampling_configs: | |
| - sampling_method: ode | |
| num_sampling_steps: | |
| - 4 | |
| cfgs: | |
| - 1 | |
| self_cond_cfg_scales: | |
| - 1 | |
| time_schedule: logit_normal | |
| batch_size: 16 | |
| lr: 0.00025 | |