OzzyGT HF Staff committed on
Commit
215ef71
·
verified ·
1 Parent(s): 082d6ca

Upload 2 files

Browse files
vae/config.json CHANGED
@@ -2,38 +2,54 @@
2
  "_class_name": "AutoencoderKLLTX2Video",
3
  "_diffusers_version": "0.37.0.dev0",
4
  "block_out_channels": [
 
 
5
  32,
6
- 64
7
  ],
8
  "decoder_block_out_channels": [
 
 
9
  32
10
  ],
11
  "decoder_causal": false,
12
  "decoder_inject_noise": [
 
 
13
  false,
14
  false
15
  ],
16
  "decoder_layers_per_block": [
 
 
17
  1,
18
  1
19
  ],
20
  "decoder_spatial_padding_mode": "reflect",
21
  "decoder_spatio_temporal_scaling": [
 
 
22
  true
23
  ],
24
  "down_block_types": [
 
 
25
  "LTX2VideoDownBlock3D",
26
  "LTX2VideoDownBlock3D"
27
  ],
28
  "downsample_type": [
29
  "spatial",
30
- "temporal"
 
 
31
  ],
32
  "encoder_causal": true,
33
  "encoder_spatial_padding_mode": "zeros",
34
  "in_channels": 3,
35
  "latent_channels": 4,
36
  "layers_per_block": [
 
 
37
  1,
38
  1,
39
  1
@@ -45,15 +61,21 @@
45
  "scaling_factor": 1.0,
46
  "spatial_compression_ratio": 32,
47
  "spatio_temporal_scaling": [
 
 
48
  true,
49
  true
50
  ],
51
  "temporal_compression_ratio": 8,
52
  "timestep_conditioning": false,
53
  "upsample_factor": [
 
 
54
  2
55
  ],
56
  "upsample_residual": [
 
 
57
  true
58
  ]
59
  }
 
2
  "_class_name": "AutoencoderKLLTX2Video",
3
  "_diffusers_version": "0.37.0.dev0",
4
  "block_out_channels": [
5
+ 16,
6
+ 16,
7
  32,
8
+ 32
9
  ],
10
  "decoder_block_out_channels": [
11
+ 8,
12
+ 16,
13
  32
14
  ],
15
  "decoder_causal": false,
16
  "decoder_inject_noise": [
17
+ false,
18
+ false,
19
  false,
20
  false
21
  ],
22
  "decoder_layers_per_block": [
23
+ 1,
24
+ 1,
25
  1,
26
  1
27
  ],
28
  "decoder_spatial_padding_mode": "reflect",
29
  "decoder_spatio_temporal_scaling": [
30
+ true,
31
+ true,
32
  true
33
  ],
34
  "down_block_types": [
35
+ "LTX2VideoDownBlock3D",
36
+ "LTX2VideoDownBlock3D",
37
  "LTX2VideoDownBlock3D",
38
  "LTX2VideoDownBlock3D"
39
  ],
40
  "downsample_type": [
41
  "spatial",
42
+ "temporal",
43
+ "spatiotemporal",
44
+ "spatiotemporal"
45
  ],
46
  "encoder_causal": true,
47
  "encoder_spatial_padding_mode": "zeros",
48
  "in_channels": 3,
49
  "latent_channels": 4,
50
  "layers_per_block": [
51
+ 1,
52
+ 1,
53
  1,
54
  1,
55
  1
 
61
  "scaling_factor": 1.0,
62
  "spatial_compression_ratio": 32,
63
  "spatio_temporal_scaling": [
64
+ true,
65
+ true,
66
  true,
67
  true
68
  ],
69
  "temporal_compression_ratio": 8,
70
  "timestep_conditioning": false,
71
  "upsample_factor": [
72
+ 2,
73
+ 2,
74
  2
75
  ],
76
  "upsample_residual": [
77
+ true,
78
+ true,
79
  true
80
  ]
81
  }
vae/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e6671690f82856448442ec433c4037a5691d03c2985a06558b0d59c2b55f69c
3
- size 1052218
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0291ee2b34c08e6bd93aab7a4cbc63cc0e41dd10e7e721e4e1f6cbd8e574d292
3
+ size 777842