{ "input_dim": 960, "output_dim": 960, "architecture": "Linear-GELU-Linear", "audio_encoder": "dymn10_as", "base_vlm": "SmolVLM2-500M" }