Spaces:

Geek7
/

ancztxi2

Sleeping

Geek7 committed on Oct 5, 2024

Commit

41eafd2

verified ·

1 Parent(s): 0da2786

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,3 +1,32 @@
 import gradio as gr
-gr.Interface.load("models/speechbrain/mtl-mimic-voicebank").launch()

 import gradio as gr
+import torchaudio
+from speechbrain.inference.enhancement import WaveformEnhancement
+import torch
+# Instantiate the pretrained SpeechBrain waveform-enhancement model once at
+# import time so every request handled by this app reuses the same object.
+_MODEL_SOURCE = "speechbrain/mtl-mimic-voicebank"
+enhance_model = WaveformEnhancement.from_hparams(
+    source=_MODEL_SOURCE,
+    savedir="pretrained_models/mtl-mimic-voicebank",
+)
+def enhance_audio(input_audio):
+    """Enhance an uploaded recording and return the path of the result.
+
+    Args:
+        input_audio: Filesystem path of the uploaded audio (the input
+            component is declared with ``type="filepath"``), or ``None``
+            when the form is submitted without a file.
+
+    Returns:
+        Path of a newly written WAV file containing the enhanced audio,
+        sampled at the rate the model operates on, or ``None`` when no
+        input was provided.
+    """
+    # Function-scope import keeps this block self-contained.
+    import tempfile
+
+    # Submitting without a file hands us None; return nothing instead of
+    # failing inside torchaudio.load.
+    if input_audio is None:
+        return None
+    # The model card states the model is trained on 16 kHz recordings and
+    # that input passed to enhance_batch must already be at that rate.
+    model_sample_rate = 16000
+    # Load the uploaded audio file
+    waveform, sample_rate = torchaudio.load(input_audio)
+    if sample_rate != model_sample_rate:
+        waveform = torchaudio.functional.resample(
+            waveform, sample_rate, model_sample_rate
+        )
+    # Enhance the audio. The loaded tensor is passed as-is, so its first
+    # dimension (channels, by torchaudio's default layout) acts as the batch.
+    # no_grad avoids building an autograd graph during inference.
+    with torch.no_grad():
+        enhanced_waveform = enhance_model.enhance_batch(waveform)
+    # Save to a unique temporary file: a single fixed filename would let
+    # overlapping requests overwrite each other's output.
+    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as handle:
+        output_path = handle.name
+    torchaudio.save(output_path, enhanced_waveform.cpu(), model_sample_rate)
+    return output_path
+# Build the Gradio UI: one audio upload in, one enhanced audio file out.
+# Both components exchange audio with enhance_audio as file paths.
+_audio_input = gr.Audio(type="filepath")
+_audio_output = gr.Audio(type="filepath")
+demo = gr.Interface(fn=enhance_audio, inputs=_audio_input, outputs=_audio_output)
+# Start serving the interface.
+demo.launch()