{
  "model_type": "echo_tts",
  "sample_rate": 44100,
  "max_text_length": 768,
  "max_speaker_latent_length": 6400,
  "audio_downsample_factor": 2048,
  "normalize_text": true,
  "delete_blockwise_modules": false,
  "pca_filename": "pca_state.safetensors",
  "fish_codec_repo": "jordand/fish-s1-dac-min",
  "model_path": "mlx_echo_tts_base",
  "dit": {
    "latent_size": 80,
    "model_size": 2048,
    "num_layers": 24,
    "num_heads": 16,
    "intermediate_size": 5888,
    "norm_eps": 1e-05,
    "text_vocab_size": 256,
    "text_model_size": 1280,
    "text_num_layers": 14,
    "text_num_heads": 10,
    "text_intermediate_size": 3328,
    "speaker_patch_size": 4,
    "speaker_model_size": 1280,
    "speaker_num_layers": 14,
    "speaker_num_heads": 10,
    "speaker_intermediate_size": 3328,
    "timestep_embed_size": 512,
    "adaln_rank": 256
  },
  "sampler": {
    "num_steps": 40,
    "cfg_scale_text": 3.0,
    "cfg_scale_speaker": 8.0,
    "cfg_min_t": 0.5,
    "cfg_max_t": 1.0,
    "truncation_factor": null,
    "rescale_k": null,
    "rescale_sigma": null,
    "speaker_kv_scale": null,
    "speaker_kv_max_layers": null,
    "speaker_kv_min_t": null,
    "sequence_length": 640
  }
}