HReynaud commited on
Commit
d308cfc
·
1 Parent(s): 941c72f
lvfm/FMvT-S2-16f8/config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DiffuserSTDiT",
3
+ "_diffusers_version": "0.30.3",
4
+ "_name_or_path": "experiments/lvfm_STDiT-S_16f8_all/checkpoint-1000000/denoiser_ema",
5
+ "caption_channels": 1,
6
+ "class_dropout_prob": 0.0,
7
+ "decay": 0.9999,
8
+ "depth": 12,
9
+ "drop_path": 0.0,
10
+ "enable_flashattn": false,
11
+ "hidden_size": 384,
12
+ "in_channels": 32,
13
+ "input_size": [
14
+ 64,
15
+ 14,
16
+ 14
17
+ ],
18
+ "inv_gamma": 1.0,
19
+ "min_decay": 0.0,
20
+ "mlp_ratio": 4.0,
21
+ "model_max_length": 1,
22
+ "no_temporal_pos_emb": false,
23
+ "num_heads": 6,
24
+ "optimization_step": 1,
25
+ "out_channels": 16,
26
+ "patch_size": [
27
+ 1,
28
+ 2,
29
+ 2
30
+ ],
31
+ "power": 0.6666666666666666,
32
+ "space_scale": 1.0,
33
+ "time_scale": 1.0,
34
+ "update_after_step": 0,
35
+ "use_ema_warmup": false
36
+ }
lvfm/FMvT-S2-16f8/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:334747fe2ce2230479f477c3b0c9762474558d4bab31045f9b64086e2b5b6293
3
+ size 147609372
lvfm/FMvT-S2-4f4/config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DiffuserSTDiT",
3
+ "_diffusers_version": "0.30.3",
4
+ "_name_or_path": "experiments/lvfm_STDiT-S2_4f4_all/checkpoint-980000/denoiser_ema",
5
+ "caption_channels": 1,
6
+ "class_dropout_prob": 0.0,
7
+ "decay": 0.9999,
8
+ "depth": 12,
9
+ "drop_path": 0.0,
10
+ "enable_flashattn": false,
11
+ "hidden_size": 384,
12
+ "in_channels": 8,
13
+ "input_size": [
14
+ 64,
15
+ 28,
16
+ 28
17
+ ],
18
+ "inv_gamma": 1.0,
19
+ "min_decay": 0.0,
20
+ "mlp_ratio": 4.0,
21
+ "model_max_length": 1,
22
+ "no_temporal_pos_emb": false,
23
+ "num_heads": 6,
24
+ "optimization_step": 20001,
25
+ "out_channels": 4,
26
+ "patch_size": [
27
+ 1,
28
+ 2,
29
+ 2
30
+ ],
31
+ "power": 0.6666666666666666,
32
+ "space_scale": 1.0,
33
+ "time_scale": 1.0,
34
+ "update_after_step": 0,
35
+ "use_ema_warmup": false
36
+ }
lvfm/FMvT-S2-4f4/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d8179f081db6c3af1e9b66476b76b0f63775ed27d7338bad48f79b7063b0cad
3
+ size 147613788
lvfm/FMvT-S4-4f4/config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "DiffuserSTDiT",
3
+ "_diffusers_version": "0.30.3",
4
+ "_name_or_path": "experiments/lvfm_STDiT-S4_4f4_all/checkpoint-950000/denoiser_ema",
5
+ "caption_channels": 1,
6
+ "class_dropout_prob": 0.0,
7
+ "decay": 0.9999,
8
+ "depth": 12,
9
+ "drop_path": 0.0,
10
+ "enable_flashattn": false,
11
+ "hidden_size": 384,
12
+ "in_channels": 8,
13
+ "input_size": [
14
+ 64,
15
+ 28,
16
+ 28
17
+ ],
18
+ "inv_gamma": 1.0,
19
+ "min_decay": 0.0,
20
+ "mlp_ratio": 4.0,
21
+ "model_max_length": 1,
22
+ "no_temporal_pos_emb": false,
23
+ "num_heads": 6,
24
+ "optimization_step": 50001,
25
+ "out_channels": 4,
26
+ "patch_size": [
27
+ 1,
28
+ 4,
29
+ 4
30
+ ],
31
+ "power": 0.6666666666666666,
32
+ "space_scale": 1.0,
33
+ "time_scale": 1.0,
34
+ "update_after_step": 0,
35
+ "use_ema_warmup": false
36
+ }
lvfm/FMvT-S4-4f4/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f005f889f06011c343ba866c6742b70553698792a1582d1b674923dcfe61ca0
3
+ size 147609364
lvfm/STUNet-S-16f8/config.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNetSTIC",
3
+ "_diffusers_version": "0.30.3",
4
+ "_name_or_path": "experiments/lvfm_UNetSTIC-S_16f8_all/checkpoint-80000/denoiser_ema",
5
+ "addition_time_embed_dim": 1,
6
+ "block_out_channels": [
7
+ 64,
8
+ 128,
9
+ 192,
10
+ 256
11
+ ],
12
+ "cross_attention_dim": 1,
13
+ "decay": 0.9999,
14
+ "down_block_types": [
15
+ "CrossAttnDownBlockSpatioTemporal",
16
+ "CrossAttnDownBlockSpatioTemporal",
17
+ "CrossAttnDownBlockSpatioTemporal",
18
+ "DownBlockSpatioTemporal"
19
+ ],
20
+ "in_channels": 32,
21
+ "inv_gamma": 1.0,
22
+ "layers_per_block": 2,
23
+ "min_decay": 0.0,
24
+ "num_attention_heads": [
25
+ 8,
26
+ 16,
27
+ 16,
28
+ 32
29
+ ],
30
+ "num_frames": 64,
31
+ "optimization_step": 20001,
32
+ "out_channels": 16,
33
+ "power": 0.6666666666666666,
34
+ "projection_class_embeddings_input_dim": 1,
35
+ "sample_size": 14,
36
+ "transformer_layers_per_block": 1,
37
+ "up_block_types": [
38
+ "UpBlockSpatioTemporal",
39
+ "CrossAttnUpBlockSpatioTemporal",
40
+ "CrossAttnUpBlockSpatioTemporal",
41
+ "CrossAttnUpBlockSpatioTemporal"
42
+ ],
43
+ "update_after_step": 0,
44
+ "use_ema_warmup": false
45
+ }
lvfm/STUNet-S-16f8/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0b9557a143942a9035d4864c3160bad58e7aea97cd6a3596ed5d845bee77121
3
+ size 183327136
lvfm/STUNet-S-4f4/config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNetSTIC",
3
+ "_diffusers_version": "0.30.3",
4
+ "addition_time_embed_dim": 1,
5
+ "block_out_channels": [
6
+ 64,
7
+ 128,
8
+ 192,
9
+ 256
10
+ ],
11
+ "cross_attention_dim": 1,
12
+ "decay": 0.9999,
13
+ "down_block_types": [
14
+ "CrossAttnDownBlockSpatioTemporal",
15
+ "CrossAttnDownBlockSpatioTemporal",
16
+ "CrossAttnDownBlockSpatioTemporal",
17
+ "DownBlockSpatioTemporal"
18
+ ],
19
+ "in_channels": 8,
20
+ "inv_gamma": 1.0,
21
+ "layers_per_block": 2,
22
+ "min_decay": 0.0,
23
+ "num_attention_heads": [
24
+ 8,
25
+ 16,
26
+ 16,
27
+ 32
28
+ ],
29
+ "num_frames": 64,
30
+ "optimization_step": 50001,
31
+ "out_channels": 4,
32
+ "power": 0.6666666666666666,
33
+ "projection_class_embeddings_input_dim": 1,
34
+ "sample_size": 28,
35
+ "transformer_layers_per_block": 1,
36
+ "up_block_types": [
37
+ "UpBlockSpatioTemporal",
38
+ "CrossAttnUpBlockSpatioTemporal",
39
+ "CrossAttnUpBlockSpatioTemporal",
40
+ "CrossAttnUpBlockSpatioTemporal"
41
+ ],
42
+ "update_after_step": 0,
43
+ "use_ema_warmup": false
44
+ }
lvfm/STUNet-S-4f4/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:905c3805763567fb7cb113cda48d8cee3296ccecefe213dc9525ba7dbe909a58
3
+ size 183244088