Tuyabei committed on
Commit
984f84f
·
verified ·
1 Parent(s): d5b18ba

Upload config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yaml +103 -0
config.yaml ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ target: lvdm.models.ddpm3d.LatentVisualDiffusion
3
+ params:
4
+ rescale_betas_zero_snr: True
5
+ parameterization: "v"
6
+ linear_start: 0.00085
7
+ linear_end: 0.012
8
+ num_timesteps_cond: 1
9
+ timesteps: 1000
10
+ first_stage_key: video
11
+ cond_stage_key: caption
12
+ cond_stage_trainable: False
13
+ conditioning_key: hybrid
14
+ image_size: [40, 64]
15
+ channels: 4
16
+ scale_by_std: False
17
+ scale_factor: 0.18215
18
+ use_ema: False
19
+ uncond_type: 'empty_seq'
20
+ use_dynamic_rescale: true
21
+ base_scale: 0.7
22
+ fps_condition_type: 'fps'
23
+ perframe_ae: True
24
+ unet_config:
25
+ target: lvdm.modules.networks.openaimodel3d.UNetModel
26
+ params:
27
+ in_channels: 8
28
+ out_channels: 4
29
+ model_channels: 320
30
+ attention_resolutions:
31
+ - 4
32
+ - 2
33
+ - 1
34
+ num_res_blocks: 2
35
+ channel_mult:
36
+ - 1
37
+ - 2
38
+ - 4
39
+ - 4
40
+ dropout: 0.1
41
+ num_head_channels: 64
42
+ transformer_depth: 1
43
+ context_dim: 1024
44
+ use_linear: true
45
+ use_checkpoint: True
46
+ temporal_conv: True
47
+ temporal_attention: True
48
+ temporal_selfatt_only: false
49
+ use_relative_position: false
50
+ use_causal_attention: False
51
+ temporal_length: 16
52
+ addition_attention: true
53
+ image_cross_attention: true
54
+ default_fs: 24
55
+ fs_condition: true
56
+
57
+ first_stage_config:
58
+ target: lvdm.models.autoencoder.AutoencoderKL
59
+ params:
60
+ embed_dim: 4
61
+ monitor: val/rec_loss
62
+ ddconfig:
63
+ double_z: True
64
+ z_channels: 4
65
+ resolution: 256
66
+ in_channels: 3
67
+ out_ch: 3
68
+ ch: 128
69
+ ch_mult:
70
+ - 1
71
+ - 2
72
+ - 4
73
+ - 4
74
+ num_res_blocks: 2
75
+ attn_resolutions: []
76
+ dropout: 0.0
77
+ lossconfig:
78
+ target: torch.nn.Identity
79
+
80
+ cond_stage_config:
81
+ target: lvdm.modules.encoders.condition.FrozenOpenCLIPEmbedder
82
+ params:
83
+ freeze: true
84
+ layer: "penultimate"
85
+
86
+ img_cond_stage_config:
87
+ target: lvdm.modules.encoders.condition.FrozenOpenCLIPImageEmbedderV2
88
+ params:
89
+ freeze: true
90
+
91
+ image_proj_stage_config:
92
+ target: lvdm.modules.encoders.resampler.Resampler
93
+ params:
94
+ dim: 1024
95
+ depth: 4
96
+ dim_head: 64
97
+ heads: 12
98
+ num_queries: 16
99
+ embedding_dim: 1280
100
+ output_dim: 1024
101
+ ff_mult: 4
102
+ video_length: 16
103
+