---
# Training run configuration: model locations, UNet motion-module options,
# noise-scheduler parameters, dataset sampling, validation prompts, and
# optimisation / checkpoint cadence.

image_finetune: false

output_dir: "outputs"
pretrained_model_path: "runwayml/stable-diffusion-v1-5"

# Additional UNet options.
# NOTE(review): motion_module_type and motion_module_kwargs are nested under
# this mapping on the assumption that they are UNet options — confirm against
# the code that consumes this file.
unet_additional_kwargs:
  use_motion_module: true
  motion_module_resolutions: [1, 2, 4, 8]
  unet_use_cross_frame_attention: false
  unet_use_temporal_attention: false

  motion_module_type: Vanilla
  motion_module_kwargs:
    num_attention_heads: 8
    num_transformer_block: 1
    attention_block_types: ["Temporal_Self", "Temporal_Self"]
    temporal_position_encoding: true
    temporal_position_encoding_max_len: 24
    temporal_attention_dim_div: 1
    zero_initialize: true

noise_scheduler_kwargs:
  num_train_timesteps: 1000
  beta_start: 0.00085
  beta_end: 0.012
  beta_schedule: "linear"
  steps_offset: 1
  clip_sample: false

train_data:
  csv_path: "data/output.csv"
  video_folder: "data/output"
  sample_size: 256
  sample_stride: 4
  sample_n_frames: 5

validation_data:
  prompts:
    - "Snow rocky mountains peaks canyon. Snow blanketed rocky mountains surround and shadow deep canyons."
    - "A drone view of celebration with Christmas tree and fireworks, starry sky - background."
    - "Robot dancing in times square."
    - "Pacific coast, carmel by the sea ocean and waves."
  num_inference_steps: 20
  guidance_scale: 12.5
  temporal_context: 24
  use_inv_latent: true
  num_inv_steps: 50

# Entries end with "." — presumably matched against parameter-name prefixes;
# verify against the training script.
trainable_modules:
  - "motion_modules."

unet_checkpoint_path: ""

# The explicit "." in the mantissa is kept on purpose: YAML 1.1 parsers only
# resolve exponent notation as a float when a decimal point is present.
learning_rate: 3.e-5
train_batch_size: 1

max_train_epoch: -1
max_train_steps: 300
checkpointing_epochs: -1
# NOTE(review): larger than max_train_steps (300) — confirm that no
# step-based checkpoint within a run is intended.
checkpointing_steps: 1000

validation_steps: 100

global_seed: 42
mixed_precision_training: true
enable_xformers_memory_efficient_attention: true

# NOTE(review): debug flag is enabled — confirm this is intended for real runs.
is_debug: true