{ "architectures": [ "SpeechDecoderModel" ], "backbone": "gru", "backbone_kwargs": { "bidirectional": false, "input_dropout": 0.2, "mlp_head": false, "n_layers": 5, "n_units": 768, "patch_size": 14, "patch_stride": 4, "rnn_dropout": 0.4 }, "dtype": "float32", "model_type": "neural-speech-decoder", "n_classes": 41, "n_days": 24, "n_phoneme_classes": 41, "neural_dim": 256, "prediction": "direct", "transformers_version": "5.5.3" }