Spaces:

N4DerAX20
/

VO-Cleaner-App

Sleeping

App Files Files Community

N4DerAX20 committed on Jul 3, 2025

Commit

1a53a31

verified ·

1 Parent(s): 7a6fe93

Upload 2 files

Browse files

Files changed (2) hide show

app.py +28 -19
requirements.txt +3 -1

app.py CHANGED Viewed

@@ -1,34 +1,43 @@
 import gradio as gr
 import torchaudio
-from speechbrain.inference.enhance import Denoise
-# Load new model (this one works with SpeechBrain 1.0+)
-denoiser = Denoise.from_hparams(
-    source="speechbrain/denoise",
-    savedir="denoise_model"
-)
 def enhance_vo(file, denoise_strength):
-    # Load original audio
-    orig, fs = torchaudio.load(file)
-    # Denoise audio
-    cleaned = denoiser.enhance(orig, fs)
-    # Blend original and cleaned based on slider value (dry/wet mix)
-    blend_ratio = denoise_strength / 100.0
-    output = (1 - blend_ratio) * orig + blend_ratio * cleaned
-    # Normalize to avoid clipping
     output = output / output.abs().max()
-    # Save output
     output_path = "enhanced_output.wav"
-    torchaudio.save(output_path, output, fs)
     return output_path
-# Gradio app
 interface = gr.Interface(
     fn=enhance_vo,
     inputs=[
@@ -36,8 +45,8 @@ interface = gr.Interface(
         gr.Slider(0, 100, value=100, label="Noise Reduction Strength (%)")
     ],
     outputs=gr.Audio(type="filepath", label="Enhanced Audio (WAV)"),
-    title="VO Audio Enhancer",
-    description="Upload your voiceover (MP3/WAV), adjust the noise reduction level, and download the enhanced file."
 )
 interface.launch()

 import gradio as gr
+import requests
+import soundfile as sf
+import io
+import torch
 import torchaudio
+API_URL = "https://hf.space/embed/akhaliq/denoise-audio/+/api/predict"
 def enhance_vo(file, denoise_strength):
     """Denoise an audio file with the remote model and blend it with the original.

     The file is uploaded to ``API_URL``, the denoised result is downloaded
     from the URL found in the JSON reply, and the two signals are mixed
     according to ``denoise_strength`` (dry/wet mix), peak-normalized, and
     written to ``enhanced_output.wav``.

     Args:
         file: Path to the input audio file.
         denoise_strength: Wet percentage; 0 keeps the original signal and
             100 keeps only the denoised signal.

     Returns:
         Path of the written WAV file.

     Raises:
         RuntimeError: If the remote call fails or its reply cannot be used.
     """
     # (connect, read) timeouts: requests waits forever by default, which
     # would block the worker if the remote service stalls.
     timeout = (10, 120)

     # Step 1: Read audio and send to remote model
     with open(file, "rb") as f:
         response = requests.post(API_URL, files={"data": f}, timeout=timeout)
     if response.status_code != 200:
         raise RuntimeError("Denoising model failed to process audio.")

     # Step 2: Get denoised audio back
     try:
         url = response.json()["data"][0]["url"]
     except (KeyError, IndexError, TypeError, ValueError) as err:
         raise RuntimeError(
             "Denoising model returned an unexpected response."
         ) from err
     audio_response = requests.get(url, timeout=timeout)
     if audio_response.status_code != 200:
         raise RuntimeError("Failed to download denoised audio.")

     # Step 3: Load both original and denoised audio
     orig_waveform, sr = torchaudio.load(file)
     denoised_waveform, denoised_sr = torchaudio.load(
         io.BytesIO(audio_response.content)
     )

     # Step 4: Align the denoised signal with the original so the two can be
     # mixed sample-for-sample (rate, channel count, then length).
     if denoised_sr != sr:
         denoised_waveform = torchaudio.functional.resample(
             denoised_waveform, denoised_sr, sr
         )
     if denoised_waveform.shape[0] != orig_waveform.shape[0]:
         # Downmix to mono, then repeat across the original's channels.
         mono = denoised_waveform.mean(dim=0, keepdim=True)
         denoised_waveform = mono.expand(orig_waveform.shape[0], -1)
     n_samples = orig_waveform.shape[-1]
     if denoised_waveform.shape[-1] > n_samples:
         denoised_waveform = denoised_waveform[..., :n_samples]
     elif denoised_waveform.shape[-1] < n_samples:
         missing = n_samples - denoised_waveform.shape[-1]
         denoised_waveform = torch.nn.functional.pad(
             denoised_waveform, (0, missing)
         )

     # Step 5: Blend based on slider value
     blend_ratio = denoise_strength / 100.0
     output = (1 - blend_ratio) * orig_waveform + blend_ratio * denoised_waveform

     # Normalize to avoid clipping; skip empty or silent audio, where the
     # peak is undefined or zero and the division would produce NaNs.
     if output.numel() > 0:
         peak = output.abs().max()
         if peak > 0:
             output = output / peak

     # Step 6: Save to file
     output_path = "enhanced_output.wav"
     torchaudio.save(output_path, output, sr)
     return output_path
+# Gradio app UI
 interface = gr.Interface(
     fn=enhance_vo,
     inputs=[
         gr.Slider(0, 100, value=100, label="Noise Reduction Strength (%)")
     ],
     outputs=gr.Audio(type="filepath", label="Enhanced Audio (WAV)"),
+    title="Adobe-style VO Enhancer (Online Model)",
+    description="Upload VO audio (MP3/WAV), adjust slider, and download cleaned WAV file."
 )
 interface.launch()

requirements.txt CHANGED Viewed

@@ -1,3 +1,5 @@
 gradio
 torchaudio
-speechbrain>=1.0.0

 gradio
+requests
 torchaudio
+soundfile