---
# Video fine-tuning run configuration ("talking-man" experiment).
# Nesting below is reconstructed: width/height occur once for training and
# once for validation, so they belong under train_data / validation_data.

# Base model checkpoint directory and experiment output directory.
pretrained_model_path: checkpoints/CompVis/stable-diffusion-v1-4
output_dir: /home/user/app/experiments/talking-man

# Training clip, its caption, and frame-sampling settings.
train_data:
  # NOTE(review): this points into a /tmp/gradio upload directory, which is
  # presumably ephemeral -- confirm the file still exists before re-running.
  # Quoted because the file name contains a space.
  video_path: '/tmp/gradio/f79f070ba10b1b7872faa157ada00e09644ef2f2/Untitled Video.mp4'
  # Folded scalar: the lines below are joined with single spaces into one
  # string with no trailing newline.
  prompt: >-
    A person of East Asian ethnicity standing in a well-lit office environment
    with large windows, speaking directly to the camera, wearing a white shirt,
    and conveying a calm and professional demeanor. The background is slightly
    blurred, showcasing greenery and modern office decor, with minimal
    distractions
  n_sample_frames: 8
  width: 512
  height: 512
  sample_start_idx: 0
  sample_frame_rate: 1

# Prompts and sampling settings used for validation.
validation_data:
  prompts:
    - >-
      A person of East Asian descent is standing in a bright office setting
      with large windows, addressing the camera directly. They are dressed in a
      white shirt and project a calm, professional demeanor. The background is
      slightly out of focus, highlighting greenery and modern office
      furnishings, with minimal visual distractions
  # Same value as train_data.n_sample_frames above.
  video_length: 8
  width: 512
  height: 512
  num_inference_steps: 50
  guidance_scale: 7.5

validation_steps: 100

# Names of the modules selected for training.
trainable_modules:
  - attn1.to_q
  - attn2.to_q
  - attn_temp

# Optimisation schedule.
train_batch_size: 1
max_train_steps: 300
learning_rate: 3.5e-05
scale_lr: false
lr_scheduler: constant
lr_warmup_steps: 0

# Adam optimiser hyper-parameters and gradient clipping.
adam_beta1: 0.9
adam_beta2: 0.999
adam_weight_decay: 0.01
adam_epsilon: 1.0e-08
max_grad_norm: 1.0

gradient_accumulation_steps: 1
gradient_checkpointing: true

# NOTE(review): checkpointing_steps (1000) is larger than max_train_steps
# (300). If checkpoints are only written on multiples of checkpointing_steps,
# no intermediate checkpoint will be saved during this run -- confirm intent.
checkpointing_steps: 1000
resume_from_checkpoint: null

# Precision, memory options, and random seed.
mixed_precision: fp16
use_8bit_adam: false
enable_xformers_memory_efficient_attention: true
seed: 31118