AXERA-TECH
/

Z-Image-Turbo

Model card Files Files and versions

Z-Image-Turbo / VideoX-Fun /scripts /wan2.2_fun /train_reward_lora.sh

yongqiang

initialize this repo

ba96580 about 2 months ago

history blame contribute delete

2.32 kB

	export MODEL_NAME="models/Diffusion_Transformer/Wan2.2-Fun-A14B-InP"
	export TRAIN_PROMPT_PATH="MovieGenVideoBench_train.txt"

	# Train HPSv2.1 reward LoRA for the low noise model of Wan2.2-Fun-A14B-InP
	accelerate launch --mixed_precision="bf16" --num-processes=8 --use_deepspeed --deepspeed_config_file config/zero_stage2_config.json scripts/wan2.2_fun/train_reward_lora.py \
	--config_path="config/wan2.2/wan_civitai_i2v.yaml" \
	--pretrained_model_name_or_path=$MODEL_NAME \
	--train_batch_size=1 \
	--gradient_accumulation_steps=1 \
	--max_train_steps=10000 \
	--checkpointing_steps=100 \
	--learning_rate=1e-05 \
	--seed=42 \
	--output_dir="output_dir" \
	--gradient_checkpointing \
	--mixed_precision="bf16" \
	--adam_weight_decay=3e-2 \
	--adam_epsilon=1e-10 \
	--max_grad_norm=0.3 \
	--boundary_type="low" \
	--lora_skip_name="ffn" \
	--low_vram \
	--use_deepspeed \
	--prompt_path=$TRAIN_PROMPT_PATH \
	--train_sample_height=256 \
	--train_sample_width=256 \
	--num_inference_steps=40 \
	--video_length=81 \
	--num_decoded_latents=1 \
	--reward_fn="HPSReward" \
	--reward_fn_kwargs='{"version": "v2.1"}' \
	--backprop_strategy="tail" \
	--backprop_num_steps=1 \
	--backprop

	# Train MPS reward LoRA for the high noise model of Wan2.2-Fun-A14B-InP
	# accelerate launch --mixed_precision="bf16" --num-processes=8 --use_deepspeed --deepspeed_config_file config/zero_stage3_config_cpu_offload.json scripts/wan2.2_fun/train_reward_lora.py \
	# --config_path="config/wan2.2/wan_civitai_i2v.yaml" \
	# --pretrained_model_name_or_path=$MODEL_NAME \
	# --train_batch_size=1 \
	# --gradient_accumulation_steps=1 \
	# --max_train_steps=10000 \
	# --checkpointing_steps=100 \
	# --learning_rate=1e-05 \
	# --seed=42 \
	# --output_dir="output_dir" \
	# --gradient_checkpointing \
	# --mixed_precision="bf16" \
	# --adam_weight_decay=3e-2 \
	# --adam_epsilon=1e-10 \
	# --max_grad_norm=0.3 \
	# --boundary_type="high" \
	# --lora_skip_name="ffn" \
	# --low_vram \
	# --use_deepspeed \
	# --prompt_path=$TRAIN_PROMPT_PATH \
	# --train_sample_height=256 \
	# --train_sample_width=256 \
	# --num_inference_steps=40 \
	# --video_length=81 \
	# --num_decoded_latents=1 \
	# --reward_fn="MPSReward" \
	# --backprop_strategy="tail" \
	# --backprop_num_steps=1 \
	# --backprop