{
  "in_channels": 3,
  "out_channels": 3,
  "down_block_types": [
    "DownBlock2D",
    "DownBlock2D",
    "AttnDownBlock2D",
    "DownBlock2D"
  ],
  "up_block_types": [
    "UpBlock2D",
    "AttnUpBlock2D",
    "UpBlock2D",
    "UpBlock2D"
  ],
  "block_out_channels": [
    128, 256, 384, 512
  ],
  "layers_per_block": 2,
  "norm_num_groups": 32,
  "cross_attention_dim": null,
  "attention_head_dim": 8,
  "resnet_time_scale_shift": "default",
  "class_embed_type": null,
  "num_class_embeds": null,
  "use_linear_projection": false,
  "only_cross_attention": false,
  "mid_block_scale_factor": 1,
  "out_bias": true,
  "flip_sin_to_cos": true,
  "freq_shift": 0
}