LTX-2.3-dev / vocoder / config.json
prince-canuma's picture
Upload folder using huggingface_hub
e3bb663 verified
{
  "type": "bigvgan",
  "has_bwe_generator": true,
  "vocoder": {
    "upsample_initial_channel": 1536,
    "resblock": "AMP1",
    "upsample_rates": [5, 2, 2, 2, 2, 2],
    "upsample_kernel_sizes": [11, 4, 4, 4, 4, 4],
    "resblock_kernel_sizes": [3, 7, 11],
    "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]],
    "stereo": true,
    "activation": "snakebeta",
    "use_tanh_at_final": false,
    "apply_final_activation": true,
    "use_bias_at_final": false
  },
  "bwe": {
    "upsample_initial_channel": 512,
    "resblock": "AMP1",
    "upsample_rates": [6, 5, 2, 2, 2],
    "upsample_kernel_sizes": [12, 11, 4, 4, 4],
    "resblock_kernel_sizes": [3, 7, 11],
    "resblock_dilation_sizes": [[1, 3, 5], [1, 3, 5], [1, 3, 5]],
    "stereo": true,
    "activation": "snakebeta",
    "use_tanh_at_final": false,
    "apply_final_activation": false,
    "use_bias_at_final": false,
    "input_sampling_rate": 16000,
    "output_sampling_rate": 48000,
    "hop_length": 80
  }
}