{
  "model_type": "hifigan",
  "sample_rate": 22050,
  "num_mels": 80,
  "num_freq": 1025,
  "n_fft": 1024,
  "hop_size": 256,
  "win_size": 1024,
  "fmin": 0.0,
  "fmax": 8000.0,
  "upsample_rates": [8, 8, 2, 2],
  "upsample_kernel_sizes": [16, 16, 4, 4],
  "upsample_initial_channel": 512,
  "resblock_kernel_sizes": [3, 7, 11],
  "resblock_dilation_sizes": [
    [1, 3, 5],
    [1, 3, 5],
    [1, 3, 5]
  ],
  "resblock_type": "1",
  "use_spectral_norm": false,
  "version": "1.0",
  "authors": ["Arjit"],
  "description": "HiFi-GAN vocoder for high-fidelity audio waveform generation from mel-spectrograms"
}