{
  "model_type": "mmdit",
  "latent_dim": 16,
  "latent_size": 16,
  "hidden_dim": 512,
  "n_layers": 16,
  "n_heads": 8,
  "text_embed_dim": 768,
  "patch_size": 128,
  "sine_encoding_frequency": 10000,
  "num_classes": 1081
}
{
  "model_type": "mmdit",
  "latent_dim": 16,
  "latent_size": 16,
  "hidden_dim": 512,
  "n_layers": 16,
  "n_heads": 8,
  "text_embed_dim": 768,
  "patch_size": 128,
  "sine_encoding_frequency": 10000,
  "num_classes": 1081
}