| total_params: 5930596 | |
| image_size: 256 | |
| num_train_steps: -1 | |
| num_epochs: 50 | |
| batch_size: 1 | |
| lr: 0.0001 | |
| lr_warmup_steps: 10 | |
| lr_scheduler: cosine_with_restarts | |
| gradient_accumulation_steps: 2000 | |
| save_results_every: 500 | |
| save_model_every: 5000 | |
| dim: 32 | |
| vq_codebook_size: 128 | |
| vq_codebook_dim: 128 | |
| seq_len: 1024 | |
| channels: 3 | |
| layers: 4 | |
| discr_layers: 4 | |
| scheduler_power: 8.0 | |
| num_cycles: 800 | |
| only_save_last_checkpoint: false | |
| validation_image_scale: 1.0 | |
| no_center_crop: false | |
| no_flip: false | |
| random_crop: true | |
| dataset_save_path: H:/cached_datasets/INE | |
| clear_previous_experiments: false | |
| max_grad_norm: null | |
| discr_max_grad_norm: null | |
| seed: 42 | |
| valid_frac: 0.05 | |
| use_ema: false | |
| ema_beta: 0.995 | |
| ema_update_after_step: 1 | |
| ema_update_every: 1 | |
| apply_grad_penalty_every: 4 | |
| image_column: image | |
| caption_column: caption | |
| log_with: wandb | |
| mixed_precision: 'no' | |
| use_8bit_adam: false | |
| results_dir: results\Muse-v0.12_test | |
| logging_dir: null | |
| resume_path: results\Muse-v0.12_test\vae.6270000.pt | |
| dataset_name: null | |
| streaming: false | |
| train_data_dir: H:/dataset | |
| checkpoint_limit: null | |
| cond_drop_prob: 0.5 | |
| taming_model_path: null | |
| taming_config_path: null | |
| optimizer: Adam | |
| weight_decay: 0.001 | |
| cache_path: null | |
| no_cache: true | |
| latest_checkpoint: true | |
| do_not_save_config: false | |
| use_l2_recon_loss: false | |
| debug: false | |
| config_path: null | |
| validation_folder_at_end_of_epoch: samples/validation | |
| exclude_folders: null | |
| webdataset: null | |
| project_name: muse_vae | |
| run_name: null | |
| wandb_user: null | |
| hf_split_name: train | |