# Reward-LoRA training launcher for Wan2.2-Fun-A14B-InP.
#
# Exports the base-model path and the training prompt file, then starts
# scripts/wan2.2_fun/train_reward_lora.py through `accelerate launch`
# (8 processes, bf16 mixed precision, DeepSpeed).
#
# NOTE(review): all paths are relative — presumably to the repository root;
# confirm the intended working directory before running.
export MODEL_NAME="models/Diffusion_Transformer/Wan2.2-Fun-A14B-InP"
export TRAIN_PROMPT_PATH="MovieGenVideoBench_train.txt"

# Train HPSv2.1 reward LoRA for the low noise model of Wan2.2-Fun-A14B-InP
# (no comments may be placed between the continuation lines below: a comment
# line would terminate the command).
accelerate launch \
  --mixed_precision="bf16" \
  --num-processes=8 \
  --use_deepspeed \
  --deepspeed_config_file config/zero_stage2_config.json \
  scripts/wan2.2_fun/train_reward_lora.py \
    --config_path="config/wan2.2/wan_civitai_i2v.yaml" \
    --pretrained_model_name_or_path="$MODEL_NAME" \
    --train_batch_size=1 \
    --gradient_accumulation_steps=1 \
    --max_train_steps=10000 \
    --checkpointing_steps=100 \
    --learning_rate=1e-05 \
    --seed=42 \
    --output_dir="output_dir" \
    --gradient_checkpointing \
    --mixed_precision="bf16" \
    --adam_weight_decay=3e-2 \
    --adam_epsilon=1e-10 \
    --max_grad_norm=0.3 \
    --boundary_type="low" \
    --lora_skip_name="ffn" \
    --low_vram \
    --use_deepspeed \
    --prompt_path="$TRAIN_PROMPT_PATH" \
    --train_sample_height=256 \
    --train_sample_width=256 \
    --num_inference_steps=40 \
    --video_length=81 \
    --num_decoded_latents=1 \
    --reward_fn="HPSReward" \
    --reward_fn_kwargs='{"version": "v2.1"}' \
    --backprop_strategy="tail" \
    --backprop_num_steps=1 \
    --backprop

# Train MPS reward LoRA for the high noise model of Wan2.2-Fun-A14B-InP
# Alternative run, kept commented out. Compared with the command above it uses
# config/zero_stage3_config_cpu_offload.json, --boundary_type="high" and
# --reward_fn="MPSReward", and passes no --reward_fn_kwargs.
# accelerate launch \
#   --mixed_precision="bf16" \
#   --num-processes=8 \
#   --use_deepspeed \
#   --deepspeed_config_file config/zero_stage3_config_cpu_offload.json \
#   scripts/wan2.2_fun/train_reward_lora.py \
#     --config_path="config/wan2.2/wan_civitai_i2v.yaml" \
#     --pretrained_model_name_or_path="$MODEL_NAME" \
#     --train_batch_size=1 \
#     --gradient_accumulation_steps=1 \
#     --max_train_steps=10000 \
#     --checkpointing_steps=100 \
#     --learning_rate=1e-05 \
#     --seed=42 \
#     --output_dir="output_dir" \
#     --gradient_checkpointing \
#     --mixed_precision="bf16" \
#     --adam_weight_decay=3e-2 \
#     --adam_epsilon=1e-10 \
#     --max_grad_norm=0.3 \
#     --boundary_type="high" \
#     --lora_skip_name="ffn" \
#     --low_vram \
#     --use_deepspeed \
#     --prompt_path="$TRAIN_PROMPT_PATH" \
#     --train_sample_height=256 \
#     --train_sample_width=256 \
#     --num_inference_steps=40 \
#     --video_length=81 \
#     --num_decoded_latents=1 \
#     --reward_fn="MPSReward" \
#     --backprop_strategy="tail" \
#     --backprop_num_steps=1 \
#     --backprop