{
  "model_type": "humanoid-multimodal",
  "hidden_size": 512,
  "num_layers": 8,
  "num_attention_heads": 8,
  "modalities": ["vision", "imu", "force"],
  "description": "Multimodal sensor fusion model for humanoid control"
}