yongqiang
initialize this repo
ba96580
export MODEL_NAME="models/Diffusion_Transformer/Wan2.2-Fun-A14B-InP"
export TRAIN_PROMPT_PATH="MovieGenVideoBench_train.txt"
# Train HPSv2.1 reward LoRA for the low noise model of Wan2.2-Fun-A14B-InP
accelerate launch --mixed_precision="bf16" --num-processes=8 --use_deepspeed --deepspeed_config_file config/zero_stage2_config.json scripts/wan2.2_fun/train_reward_lora.py \
--config_path="config/wan2.2/wan_civitai_i2v.yaml" \
--pretrained_model_name_or_path=$MODEL_NAME \
--train_batch_size=1 \
--gradient_accumulation_steps=1 \
--max_train_steps=10000 \
--checkpointing_steps=100 \
--learning_rate=1e-05 \
--seed=42 \
--output_dir="output_dir" \
--gradient_checkpointing \
--mixed_precision="bf16" \
--adam_weight_decay=3e-2 \
--adam_epsilon=1e-10 \
--max_grad_norm=0.3 \
--boundary_type="low" \
--lora_skip_name="ffn" \
--low_vram \
--use_deepspeed \
--prompt_path=$TRAIN_PROMPT_PATH \
--train_sample_height=256 \
--train_sample_width=256 \
--num_inference_steps=40 \
--video_length=81 \
--num_decoded_latents=1 \
--reward_fn="HPSReward" \
--reward_fn_kwargs='{"version": "v2.1"}' \
--backprop_strategy="tail" \
--backprop_num_steps=1 \
--backprop
# Train MPS reward LoRA for the high noise model of Wan2.2-Fun-A14B-InP
# accelerate launch --mixed_precision="bf16" --num-processes=8 --use_deepspeed --deepspeed_config_file config/zero_stage3_config_cpu_offload.json scripts/wan2.2_fun/train_reward_lora.py \
# --config_path="config/wan2.2/wan_civitai_i2v.yaml" \
# --pretrained_model_name_or_path=$MODEL_NAME \
# --train_batch_size=1 \
# --gradient_accumulation_steps=1 \
# --max_train_steps=10000 \
# --checkpointing_steps=100 \
# --learning_rate=1e-05 \
# --seed=42 \
# --output_dir="output_dir" \
# --gradient_checkpointing \
# --mixed_precision="bf16" \
# --adam_weight_decay=3e-2 \
# --adam_epsilon=1e-10 \
# --max_grad_norm=0.3 \
# --boundary_type="high" \
# --lora_skip_name="ffn" \
# --low_vram \
# --use_deepspeed \
# --prompt_path=$TRAIN_PROMPT_PATH \
# --train_sample_height=256 \
# --train_sample_width=256 \
# --num_inference_steps=40 \
# --video_length=81 \
# --num_decoded_latents=1 \
# --reward_fn="MPSReward" \
# --backprop_strategy="tail" \
# --backprop_num_steps=1 \
# --backprop