ziyc committed on
Commit
578092d
·
verified ·
1 Parent(s): e52bdc2
train-sink_0-attn_size_6-T_21/checkpoint_model_000600/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f11ecc60838c609d0ff1e1ba57ce3bd47aa13c68e9d50ccc1c046eee721506c
3
+ size 17028883814
train-sink_0-attn_size_6-T_21/config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ generator_ckpt: checkpoints/ode_init.pt
2
+ generator_fsdp_wrap_strategy: size
3
+ real_score_fsdp_wrap_strategy: size
4
+ fake_score_fsdp_wrap_strategy: size
5
+ real_name: Wan2.1-T2V-14B
6
+ text_encoder_fsdp_wrap_strategy: size
7
+ denoising_step_list:
8
+ - 1000
9
+ - 750
10
+ - 500
11
+ - 250
12
+ warp_denoising_step: true # when warp_denoising_step is true, the `- 0` entry must be removed from denoising_step_list
13
+ ts_schedule: false
14
+ num_train_timestep: 1000
15
+ timestep_shift: 5.0
16
+ guidance_scale: 3.0
17
+ denoising_loss_type: flow
18
+ mixed_precision: true
19
+ seed: 0
20
+ wandb_host: WANDB_HOST
21
+ wandb_key: WANDB_KEY
22
+ wandb_entity: WANDB_ENTITY
23
+ wandb_project: WANDB_PROJECT
24
+ sharding_strategy: hybrid_full
25
+ lr: 2.0e-06
26
+ lr_critic: 4.0e-07
27
+ beta1: 0.0
28
+ beta2: 0.999
29
+ beta1_critic: 0.0
30
+ beta2_critic: 0.999
31
+ data_path: prompts/vidprom_filtered_extended.txt
32
+ batch_size: 1
33
+ ema_weight: 0.99
34
+ ema_start_step: 200
35
+ total_batch_size: 64
36
+ log_iters: 50
37
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
38
+ dfake_gen_update_ratio: 5
39
+ image_or_video_shape:
40
+ - 1
41
+ - 21
42
+ - 16
43
+ - 60
44
+ - 104
45
+ distribution_loss: dmd
46
+ trainer: score_distillation
47
+ gradient_checkpointing: true
48
+ num_frame_per_block: 3
49
+ load_raw_video: false
50
+ model_kwargs:
51
+ timestep_shift: 5.0
train-sink_1-attn_size_12-T_21/checkpoint_model_000600/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ace61408300eb77a97438a7817d4609b1c80dc757998e5d4e696b6ad235be1f4
3
+ size 17028883814
train-sink_1-attn_size_12-T_21/config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ generator_ckpt: checkpoints/ode_init.pt
2
+ generator_fsdp_wrap_strategy: size
3
+ real_score_fsdp_wrap_strategy: size
4
+ fake_score_fsdp_wrap_strategy: size
5
+ real_name: Wan2.1-T2V-14B
6
+ text_encoder_fsdp_wrap_strategy: size
7
+ denoising_step_list:
8
+ - 1000
9
+ - 750
10
+ - 500
11
+ - 250
12
+ warp_denoising_step: true # when warp_denoising_step is true, the `- 0` entry must be removed from denoising_step_list
13
+ ts_schedule: false
14
+ num_train_timestep: 1000
15
+ timestep_shift: 5.0
16
+ guidance_scale: 3.0
17
+ denoising_loss_type: flow
18
+ mixed_precision: true
19
+ seed: 0
20
+ wandb_host: WANDB_HOST
21
+ wandb_key: WANDB_KEY
22
+ wandb_entity: WANDB_ENTITY
23
+ wandb_project: WANDB_PROJECT
24
+ sharding_strategy: hybrid_full
25
+ lr: 2.0e-06
26
+ lr_critic: 4.0e-07
27
+ beta1: 0.0
28
+ beta2: 0.999
29
+ beta1_critic: 0.0
30
+ beta2_critic: 0.999
31
+ data_path: prompts/vidprom_filtered_extended.txt
32
+ batch_size: 1
33
+ ema_weight: 0.99
34
+ ema_start_step: 200
35
+ total_batch_size: 64
36
+ log_iters: 50
37
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
38
+ dfake_gen_update_ratio: 5
39
+ image_or_video_shape:
40
+ - 1
41
+ - 21
42
+ - 16
43
+ - 60
44
+ - 104
45
+ distribution_loss: dmd
46
+ trainer: score_distillation
47
+ gradient_checkpointing: true
48
+ num_frame_per_block: 3
49
+ load_raw_video: false
50
+ model_kwargs:
51
+ timestep_shift: 5.0
train-sink_1-attn_size_12-T_42/checkpoint_model_000500/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:399da0c195dffbdcb9827778d0ff5a399fe5794ee324619c3d974142acbd6c4e
3
+ size 17028883814
train-sink_1-attn_size_12-T_42/config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ generator_ckpt: checkpoints/ode_init.pt
2
+ generator_fsdp_wrap_strategy: size
3
+ real_score_fsdp_wrap_strategy: size
4
+ fake_score_fsdp_wrap_strategy: size
5
+ real_name: Wan2.1-T2V-14B
6
+ text_encoder_fsdp_wrap_strategy: size
7
+ denoising_step_list:
8
+ - 1000
9
+ - 750
10
+ - 500
11
+ - 250
12
+ warp_denoising_step: true # when warp_denoising_step is true, the `- 0` entry must be removed from denoising_step_list
13
+ ts_schedule: false
14
+ num_train_timestep: 1000
15
+ timestep_shift: 5.0
16
+ guidance_scale: 3.0
17
+ denoising_loss_type: flow
18
+ mixed_precision: true
19
+ seed: 0
20
+ wandb_host: WANDB_HOST
21
+ wandb_key: WANDB_KEY
22
+ wandb_entity: WANDB_ENTITY
23
+ wandb_project: WANDB_PROJECT
24
+ sharding_strategy: hybrid_full
25
+ lr: 2.0e-06
26
+ lr_critic: 4.0e-07
27
+ beta1: 0.0
28
+ beta2: 0.999
29
+ beta1_critic: 0.0
30
+ beta2_critic: 0.999
31
+ data_path: prompts/vidprom_filtered_extended.txt
32
+ batch_size: 1
33
+ ema_weight: 0.99
34
+ ema_start_step: 200
35
+ total_batch_size: 64
36
+ log_iters: 50
37
+ negative_prompt: '色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走'
38
+ dfake_gen_update_ratio: 5
39
+ image_or_video_shape:
40
+ - 1
41
+ - 21
42
+ - 16
43
+ - 60
44
+ - 104
45
+ distribution_loss: dmd
46
+ trainer: score_distillation
47
+ gradient_checkpointing: true
48
+ num_frame_per_block: 3
49
+ load_raw_video: false
50
+ model_kwargs:
51
+ timestep_shift: 5.0