Upload noise_removal.py
Browse filesupdated noise removal logic
- noise_removal.py +22 -0
noise_removal.py
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from speechbrain.pretrained import SpectralMaskEnhancement
|
| 2 |
+
import torchaudio
|
| 3 |
+
|
| 4 |
+
model = SpectralMaskEnhancement.from_hparams(source="speechbrain/metricgan-plus-voicebank", )
|
| 5 |
+
|
| 6 |
+
from speechbrain.pretrained import SpectralMaskEnhancement
|
| 7 |
+
import torchaudio
|
| 8 |
+
import torch
|
| 9 |
+
|
| 10 |
+
model = SpectralMaskEnhancement.from_hparams(source="speechbrain/metricgan-plus-voicebank")
|
| 11 |
+
|
| 12 |
+
def remove_noise(input_path, output_path):
|
| 13 |
+
enhanced = model.enhance_file(input_path)
|
| 14 |
+
waveform, sample_rate = enhanced
|
| 15 |
+
|
| 16 |
+
if waveform.dim() == 0:
|
| 17 |
+
raise ValueError(f"Enhanced waveform is empty for file: {input_path}")
|
| 18 |
+
elif waveform.dim() == 1:
|
| 19 |
+
waveform = waveform.unsqueeze(0)
|
| 20 |
+
|
| 21 |
+
torchaudio.save(output_path, waveform, sample_rate)
|
| 22 |
+
|