tantanbei
/

shangche_wan

Model card Files Files and versions

tantanbei committed on Jun 12, 2025

Commit

5c9418c

·

verified ·

1 Parent(s): b49baf9

Create train_wan_1_3b.toml

Files changed (1) hide show

train_wan_1_3b.toml +50 -0

train_wan_1_3b.toml ADDED Viewed

	@@ -0,0 +1,50 @@

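+# Training configuration for Wan2.1 T2V 1.3B (see ckpt_path under [model]). The guidance of 512x512x81 sized videos (or varying aspect ratios of the same size) with 24GB VRAM was written for Wan 14b t2v; TODO confirm it still holds for this 1.3B setup and these batch settings.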
+# Output directory for this training run; change this to a path on your own machine.
+output_dir = '/data/data/model_training/shangche_wan2_1_lora/output'
+# Path to the dataset configuration TOML; change this to your own dataset config as well.
+dataset = '/data/app/diffusion-pipe/examples/dataset.toml'
+# training settings
+epochs = 1000
+micro_batch_size_per_gpu = 5
+pipeline_stages = 1
+gradient_accumulation_steps = 2
+gradient_clipping = 1
+warmup_steps = 30
+# eval settings
+eval_every_n_epochs = 1
+eval_before_first_step = true
+eval_micro_batch_size_per_gpu = 5
+eval_gradient_accumulation_steps = 2
+# misc settings
+save_every_n_epochs = 1
+checkpoint_every_n_minutes = 120
+activation_checkpointing = 'unsloth'
+partition_method = 'parameters'
+save_dtype = 'bfloat16'
+caching_batch_size = 1
+steps_per_print = 1
+video_clip_mode = 'single_beginning'
+# blocks_to_swap = 32
+[model]
+type = 'wan'
+ckpt_path = '/data/app/diffusion-pipe/submodules/Wan2_1/Wan2.1-T2V-1.3B'
+dtype = 'bfloat16'
+transformer_dtype = 'float8'
+timestep_sample_method = 'logit_normal'
+[adapter]
+type = 'lora'
+rank = 32
+dtype = 'bfloat16'
+[optimizer]
+type = 'AdamW8bitKahan'
+lr = 1e-5
+betas = [0.9, 0.99]
+weight_decay = 0.01
+stabilize = false