{ "model_type": "sensevoice", "vocab_size": 25055, "input_size": 560, "encoder_conf": { "output_size": 512, "attention_heads": 4, "linear_units": 2048, "num_blocks": 50, "tp_blocks": 20, "dropout_rate": 0.1, "attention_dropout_rate": 0.1, "kernel_size": 11, "sanm_shift": 0, "normalize_before": true }, "frontend_conf": { "fs": 16000, "window": "hamming", "n_mels": 80, "frame_length": 25, "frame_shift": 10, "lfr_m": 7, "lfr_n": 6 } }