#!/usr/bin/env bash
#
# Launches scripts/wan2.1/train_distill.py through `accelerate launch`.
#
# Every path below is relative, so run this from the directory that contains
# models/, datasets/, config/ and scripts/.
#
# Exported variables:
#   MODEL_NAME         passed as --pretrained_model_name_or_path
#   DATASET_NAME       passed as --train_data_dir
#   DATASET_META_NAME  passed as --train_data_meta
#   NCCL_DEBUG         inherited by the launched processes (see note below)
#
# The script's exit status is the exit status of `accelerate launch`, because
# it is the last command executed.

export MODEL_NAME="models/Diffusion_Transformer/Wan2.1-T2V-1.3B/"
export DATASET_NAME="datasets/internal_datasets/"
export DATASET_META_NAME="datasets/internal_datasets/metadata.json"

# Must be exported: a plain `NCCL_DEBUG=INFO` assignment only creates a shell
# variable, which child processes do not inherit unless it was already present
# in the caller's environment.
export NCCL_DEBUG=INFO

# --mixed_precision appears twice on purpose: the one before the script path is
# consumed by `accelerate launch`, the one after it is forwarded to the
# training script. The variable expansions are quoted so that paths with
# spaces or glob characters are passed as a single argument.
accelerate launch --mixed_precision="bf16" scripts/wan2.1/train_distill.py \
  --config_path="config/wan2.1/wan_civitai.yaml" \
  --pretrained_model_name_or_path="$MODEL_NAME" \
  --train_data_dir="$DATASET_NAME" \
  --train_data_meta="$DATASET_META_NAME" \
  --image_sample_size=640 \
  --video_sample_size=640 \
  --token_sample_size=640 \
  --video_sample_stride=2 \
  --video_sample_n_frames=81 \
  --train_batch_size=1 \
  --video_repeat=1 \
  --gradient_accumulation_steps=1 \
  --dataloader_num_workers=8 \
  --num_train_epochs=100 \
  --checkpointing_steps=50 \
  --learning_rate=2e-06 \
  --learning_rate_critic=2e-07 \
  --lr_scheduler="constant_with_warmup" \
  --lr_warmup_steps=100 \
  --seed=42 \
  --output_dir="output_dir_distill" \
  --gradient_checkpointing \
  --mixed_precision="bf16" \
  --adam_weight_decay=3e-2 \
  --adam_epsilon=1e-10 \
  --vae_mini_batch=1 \
  --max_grad_norm=0.05 \
  --random_hw_adapt \
  --training_with_video_token_length \
  --enable_bucket \
  --uniform_sampling \
  --train_mode="normal" \
  --trainable_modules "." \
  --low_vram