{ "model_type": "inl-vae", "image_size": 256, "base_channels": 128, "latent_dim": 4, "channel_mult": [ 1, 2, 4, 4 ], "num_res_blocks": 2, "training_steps": 15000, "torch_dtype": "float16" }