{
  "data": {
    "text_cleaners": [
      "cjke_cleaners2"
    ],
    "sampling_rate": 22050,
    "filter_length": 1024,
    "hop_length": 256,
    "win_length": 1024,
    "n_mel_channels": 80,
    "add_blank": true,
    "cleaned_text": true,
    "n_speakers": 10
  },
  "model": {
    "inter_channels": 192,
    "hidden_channels": 192,
    "filter_channels": 768,
    "n_heads": 2,
    "n_layers": 6,
    "n_layers_trans_flow": 3,
    "kernel_size": 3,
    "p_dropout": 0.1,
    "resblock": "1",
    "resblock_kernel_sizes": [
      3,
      7,
      11
    ],
    "resblock_dilation_sizes": [
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ]
    ],
    "upsample_rates": [
      8,
      8,
      2,
      2
    ],
    "upsample_initial_channel": 512,
    "upsample_kernel_sizes": [
      16,
      16,
      4,
      4
    ],
    "n_layers_q": 3,
    "use_spectral_norm": false,
    "gin_channels": 256
  },
  "symbols": [
    "_",
    ",",
    ".",
    "!",
    "?",
    "-",
    "~",
    "\u2026",
    "N",
    "Q",
    "a",
    "b",
    "d",
    "e",
    "f",
    "g",
    "h",
    "i",
    "j",
    "k",
    "l",
    "m",
    "n",
    "o",
    "p",
    "s",
    "t",
    "u",
    "v",
    "w",
    "x",
    "y",
    "z",
    "\u0251",
    "\u00e6",
    "\u0283",
    "\u0291",
    "\u00e7",
    "\u026f",
    "\u026a",
    "\u0254",
    "\u025b",
    "\u0279",
    "\u00f0",
    "\u0259",
    "\u026b",
    "\u0265",
    "\u0278",
    "\u028a",
    "\u027e",
    "\u0292",
    "\u03b8",
    "\u03b2",
    "\u014b",
    "\u0266",
    "\u207c",
    "\u02b0",
    "`",
    "^",
    "#",
    "*",
    "=",
    "\u02c8",
    "\u02cc",
    "\u2192",
    "\u2193",
    "\u2191",
    " "
  ],
  "speakers": {
    "default": 0
  }
}