export MODEL_NAME="models/Diffusion_Transformer/Wan2.2-T2V-A14B" export DATASET_NAME="datasets/internal_datasets/" export DATASET_META_NAME="datasets/internal_datasets/metadata.json" # NCCL_IB_DISABLE=1 and NCCL_P2P_DISABLE=1 are used in multi nodes without RDMA. # export NCCL_IB_DISABLE=1 # export NCCL_P2P_DISABLE=1 NCCL_DEBUG=INFO accelerate launch --mixed_precision="bf16" scripts/wan2.2/train.py \ --config_path="config/wan2.2/wan_civitai_t2v.yaml" \ --pretrained_model_name_or_path=$MODEL_NAME \ --train_data_dir=$DATASET_NAME \ --train_data_meta=$DATASET_META_NAME \ --image_sample_size=640 \ --video_sample_size=640 \ --token_sample_size=640 \ --video_sample_stride=2 \ --video_sample_n_frames=81 \ --train_batch_size=1 \ --video_repeat=1 \ --gradient_accumulation_steps=1 \ --dataloader_num_workers=8 \ --num_train_epochs=100 \ --checkpointing_steps=50 \ --learning_rate=2e-05 \ --lr_scheduler="constant_with_warmup" \ --lr_warmup_steps=100 \ --seed=42 \ --output_dir="output_dir" \ --gradient_checkpointing \ --mixed_precision="bf16" \ --adam_weight_decay=3e-2 \ --adam_epsilon=1e-10 \ --vae_mini_batch=1 \ --max_grad_norm=0.05 \ --random_hw_adapt \ --training_with_video_token_length \ --enable_bucket \ --uniform_sampling \ --low_vram \ --boundary_type="low" \ --train_mode="normal" \ --trainable_modules "." # The Training Shell Code for Image to Video # You need to use "config/wan2.2/wan_civitai_i2v.yaml" # # export MODEL_NAME="models/Diffusion_Transformer/Wan2.2-I2V-A14B" # export DATASET_NAME="datasets/internal_datasets/" # export DATASET_META_NAME="datasets/internal_datasets/metadata.json" # # NCCL_IB_DISABLE=1 and NCCL_P2P_DISABLE=1 are used in multi nodes without RDMA. # # export NCCL_IB_DISABLE=1 # # export NCCL_P2P_DISABLE=1 # NCCL_DEBUG=INFO # accelerate launch --mixed_precision="bf16" scripts/wan2.2/train.py \ # --config_path="config/wan2.2/wan_civitai_i2v.yaml" \ # --pretrained_model_name_or_path=$MODEL_NAME \ # --train_data_dir=$DATASET_NAME \ # --train_data_meta=$DATASET_META_NAME \ # --image_sample_size=640 \ # --video_sample_size=640 \ # --token_sample_size=640 \ # --video_sample_stride=2 \ # --video_sample_n_frames=81 \ # --train_batch_size=1 \ # --video_repeat=1 \ # --gradient_accumulation_steps=1 \ # --dataloader_num_workers=8 \ # --num_train_epochs=100 \ # --checkpointing_steps=50 \ # --learning_rate=2e-05 \ # --lr_scheduler="constant_with_warmup" \ # --lr_warmup_steps=100 \ # --seed=42 \ # --output_dir="output_dir" \ # --gradient_checkpointing \ # --mixed_precision="bf16" \ # --adam_weight_decay=3e-2 \ # --adam_epsilon=1e-10 \ # --vae_mini_batch=1 \ # --max_grad_norm=0.05 \ # --random_hw_adapt \ # --training_with_video_token_length \ # --enable_bucket \ # --uniform_sampling \ # --low_vram \ # --boundary_type="low" \ # --train_mode="i2v" \ # --trainable_modules "."