bobcastell committed on
Commit
de1859d
·
verified ·
1 Parent(s): 0f7e230

Upload 20251103_03-44-07/backup/config_orig/hunyuan_video.toml with huggingface_hub

Browse files
20251103_03-44-07/backup/config_orig/hunyuan_video.toml ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ output_dir = "/root/diffusion-pipe/hunyuan-video-lora"
2
+ dataset = "/root/config/dataset_hunyuan.toml"
3
+ epochs = 1
4
+ micro_batch_size_per_gpu = 8
5
+ pipeline_stages = 1
6
+ gradient_accumulation_steps = 8
7
+ gradient_clipping = 1.0
8
+ warmup_steps = 50
9
+ eval_every_n_epochs = 1
10
+ save_every_n_epochs = 1
11
+ activation_checkpointing = true
12
+ caching_batch_size = 4
13
+ steps_per_print = 1
14
+ video_clip_mode = "single_middle"
15
+ checkpoint_every_n_epochs = 1
16
+
17
+ [model]
18
+ type = "hunyuan-video"
19
+ dtype = "bfloat16"
20
+ transformer_dtype = "float8"
21
+ timestep_sample_method = "logit_normal"
22
+ transformer_path = "/root/diffusion-pipe/ckpts/hunyuan-video-t2v-720p/transformers/hunyuan_video_720_cfgdistill_fp8_e4m3fn.safetensors"
23
+ vae_path = "/root/diffusion-pipe/ckpts/hunyuan-video-t2v-720p/vae/hunyuan_video_vae_bf16.safetensors"
24
+ clip_path = "/root/diffusion-pipe/ckpts/text_encoder_2/clip-vit-large-patch14"
25
+ llm_path = "/root/diffusion-pipe/ckpts/text_encoder/llava-llama-3-8b-text-encoder-tokenizer"
26
+
27
+ [adapter]
28
+ type = "lora"
29
+ rank = 32
30
+ dtype = "bfloat16"
31
+
32
+ [optimizer]
33
+ type = "adamw_optimi"
34
+ lr = 0.0001
35
+ weight_decay = 0.01
36
+ betas = [ 0.9, 0.99,]
37
+ eps = 1e-8