# Settings for a VAD-based audio trimmer. `_target_` is the dotted path of the
# class these keys are passed to (presumably via Hydra-style instantiation;
# confirm against the code that loads this file).
_target_: nemo.collections.tts.data.audio_trimming.VadAudioTrimmer

# Name of the VAD model to load, and the settings it is run with.
# NOTE(review): sample rate is presumably in Hz and the threshold a
# probability in [0, 1]; verify against the target class.
model_name: "vad_multilingual_marblenet"
vad_sample_rate: 16000
vad_threshold: 0.5
device: "cpu"

# Trimming parameters.
# NOTE(review): window/hop lengths are presumably in audio samples and
# speech_frame_threshold a frame count; verify against the target class.
speech_frame_threshold: 3
trim_win_length: 4096
trim_hop_length: 1024

# Must be a plain number: a trailing `|` here would turn the value into the
# string "0.2 |" instead of the float 0.2.
pad_seconds: 0.2