{ "dim": 1024, "depth": 22, "heads": 16, "ff_mult": 2, "text_dim": 512, "text_mask_padding": false, "conv_layers": 4, "pe_attn_head": 1, "mel_spec_type": "vocos" }