43 / Meissonic /train /run_overfit.sh
BryanW's picture
Upload folder using huggingface_hub
3d1c0e1 verified
#!/bin/bash
# Overfitting experiment script
# This script runs a small overfitting experiment to verify implementation correctness
accelerate launch --multi_gpu --gpu_ids '0,1,2,3,4,5,6,7' --main_process_port 25011 --num_processes 8 train/train_overfit.py \
--text_encoder_architecture umt5-base \
--video_tokenizer_model_id "Cosmos-1.0-Tokenizer-DV8x16x16" \
--instance_data_dir "/mnt/VideoGen/dataset/OpenVid1M/video_reorg/OpenVid1M_reorganized.csv" \
--max_samples 256 \
--num_frames 8 \
--video_height 64 \
--video_width 112 \
--dataloader_num_workers 8 \
--train_batch_size 1 \
--gradient_accumulation_steps 1 \
--learning_rate 5e-4 \
--max_train_steps 3000 \
--lr_warmup_steps 100 \
--gradient_checkpointing \
--mixed_precision bf16 \
--seed 42 \
--output_dir "./output_overfit" \
--logging_steps 50 \
--save_steps 500 \
--inference_steps 500 \
--num_inference_samples 4 \
--num_inference_steps 48 \
--wan_pretrained_path Wan-AI/Wan2.1-T2V-1.3B # Optional: path to pretrained Wan weights