| { |
| "type": "bigvgan", |
| "has_bwe_generator": true, |
| "vocoder": { |
| "upsample_initial_channel": 1536, |
| "resblock": "AMP1", |
| "upsample_rates": [5, 2, 2, 2, 2, 2], |
| "upsample_kernel_sizes": [11, 4, 4, 4, 4, 4], |
| "resblock_kernel_sizes": [3, 7, 11], |
| "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]], |
| "stereo": true, |
| "activation": "snakebeta", |
| "use_tanh_at_final": false, |
| "apply_final_activation": true, |
| "use_bias_at_final": false |
| }, |
| "bwe": { |
| "upsample_initial_channel": 512, |
| "resblock": "AMP1", |
| "upsample_rates": [6, 5, 2, 2, 2], |
| "upsample_kernel_sizes": [12, 11, 4, 4, 4], |
| "resblock_kernel_sizes": [3, 7, 11], |
| "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]], |
| "stereo": true, |
| "activation": "snakebeta", |
| "use_tanh_at_final": false, |
| "apply_final_activation": false, |
| "use_bias_at_final": false, |
| "input_sampling_rate": 16000, |
| "output_sampling_rate": 48000, |
| "hop_length": 80 |
| } |
| } |
|
|