{ "in_channels": 3, "hidden_size_x": 32, "z_channels": 1152, "max_freqs": 8, "num_res_blocks": 3, "patch_size": 16 }