{ "model_type": "mmdit", "latent_dim": 16, "latent_size": 16, "hidden_dim": 512, "n_layers": 16, "n_heads": 8, "text_embed_dim": 768, "patch_size": 128, "sine_encoding_frequency": 10000, "num_classes": 1081 }