{
  "_class_name": "AutoencoderDC",
  "_diffusers_version": "0.33.1",
  "attention_head_dim": 2,
  "decoder_act_fns": "silu",
  "decoder_block_out_channels": [
    8,
    8
  ],
  "decoder_block_types": [
    "ResBlock",
    "EfficientViTBlock"
  ],
  "decoder_layers_per_block": [
    1,
    1
  ],
  "decoder_norm_types": "rms_norm",
  "decoder_qkv_multiscales": [
    [],
    [
      5
    ]
  ],
  "downsample_block_type": "conv",
  "encoder_block_out_channels": [
    8,
    8
  ],
  "encoder_block_types": [
    "ResBlock",
    "EfficientViTBlock"
  ],
  "encoder_layers_per_block": [
    1,
    1
  ],
  "encoder_qkv_multiscales": [
    [],
    [
      5
    ]
  ],
  "in_channels": 3,
  "latent_channels": 4,
  "scaling_factor": 0.41407,
  "upsample_block_type": "interpolate"
}