bobcastell committed on
Commit
fb2ef32
·
verified ·
1 Parent(s): 7a7aab9

Upload 20251209_01-41-16/hunyuan_video.toml with huggingface_hub

Browse files
20251209_01-41-16/hunyuan_video.toml ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ output_dir = "/root/diffusion-pipe/hunyuan-video-lora"
2
+ dataset = "/root/config/dataset.toml"
3
+ epochs = 200
4
+ micro_batch_size_per_gpu = 8
5
+ pipeline_stages = 1
6
+ gradient_accumulation_steps = 4
7
+ gradient_clipping = 1
8
+ warmup_steps = 100
9
+ eval_every_n_epochs = 5
10
+ eval_before_first_step = true
11
+ eval_micro_batch_size_per_gpu = 1
12
+ eval_gradient_accumulation_steps = 1
13
+ save_every_n_epochs = 100
14
+ activation_checkpointing = true
15
+ partition_method = "parameters"
16
+ save_dtype = "bfloat16"
17
+ caching_batch_size = 4
18
+ steps_per_print = 1
19
+ video_clip_mode = "single_middle"
20
+ checkpoint_every_n_epochs = 100
21
+
22
+ [model]
23
+ type = "hunyuan-video"
24
+ dtype = "bfloat16"
25
+ transformer_dtype = "float8"
26
+ timestep_sample_method = "logit_normal"
27
+ transformer_path = "/root/diffusion-pipe/ckpts/hunyuan-video-t2v-720p/transformers/hunyuan_video_720_cfgdistill_bf16.safetensors"
28
+ vae_path = "/root/diffusion-pipe/ckpts/hunyuan-video-t2v-720p/vae/hunyuan_video_vae_bf16.safetensors"
29
+ clip_path = "/root/diffusion-pipe/ckpts/text_encoder_2/clip-vit-large-patch14"
30
+ llm_path = "/root/diffusion-pipe/ckpts/text_encoder/llava-llama-3-8b-text-encoder-tokenizer"
31
+
32
+ [adapter]
33
+ type = "lora"
34
+ rank = 64
35
+ dtype = "bfloat16"
36
+
37
+ [optimizer]
38
+ type = "adamw_optimi"
39
+ lr = 0.0001
40
+ betas = [ 0.9, 0.99,]
41
+ weight_decay = 0.01
42
+ eps = 1e-8