Spaces:

musicgowdam
/

Audio_stem_Extractor-1

Build error

musicgowdam committed on Oct 5, 2025

Commit

981b156

verified ·

1 Parent(s): 66719e8

Upload 3 files

Files changed (3) hide show

README.md CHANGED Viewed

@@ -1,14 +1,13 @@
 ---
-title: Audio Stem Extractor-1
-emoji: 📈
-colorFrom: gray
-colorTo: indigo
 sdk: gradio
-sdk_version: 5.49.0
 app_file: app.py
 pinned: false
-license: mit
-short_description: Audio_stem_Extractor_2
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Vocal Extractor
+emoji: 🎤️
+colorFrom: red
+colorTo: red
 sdk: gradio
+sdk_version: 5.47.2
 app_file: app.py
 pinned: false
+short_description: Extracting Vocal part from songs
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

app.py ADDED Viewed

+import os
+import subprocess
+import sys
+import tempfile
+
+import gradio as gr
+from pydub import AudioSegment
+from scipy.io.wavfile import write
+def wav_to_mp3(wav_path, mp3_path, bitrate="128k"):  # 128k is a good default for quality/compression
+    audio = AudioSegment.from_wav(wav_path)
+    audio.export(mp3_path, format="mp3", bitrate=bitrate)
+def inference(audio):
+    os.makedirs("out", exist_ok=True)
+    write('test.wav', audio[0], audio[1])
+    os.system("python3 -m demucs.separate -n htdemucs --two-stems=vocals test.wav -o out")
+    vocals_wav = "./out/htdemucs/test/vocals.wav"
+    no_vocals_wav = "./out/htdemucs/test/no_vocals.wav"
+    vocals_mp3 = "./out/htdemucs/test/vocals.mp3"
+    no_vocals_mp3 = "./out/htdemucs/test/no_vocals.mp3"
+    wav_to_mp3(vocals_wav, vocals_mp3)
+    wav_to_mp3(no_vocals_wav, no_vocals_mp3)
+    return vocals_mp3, no_vocals_mp3
+title = "Demucs Music Source Separation (v4)"
+article = "<p style='text-align: center'><a href='https://arxiv.org/abs/1911.13254' target='_blank'>Music Source Separation in the Waveform Domain</a> | <a href='https://github.com/facebookresearch/demucs' target='_blank'>Github Repo</a> | <a href='https://www.thafx.com' target='_blank'>//THAFX</a></p>"
+gr.Interface(
+    inference,
+    gr.Audio(type="numpy", label="Input"),
+    [gr.Audio(type="filepath", label="Vocals"),gr.Audio(type="filepath", label="No Vocals / Instrumental")],
+    title=title,
+    article=article,
+    ).launch()

requirements.txt ADDED Viewed

+git+https://github.com/facebookresearch/demucs#egg=demucs
+scipy
+invisible-watermark
+fonts
+font-roboto
+numpy<1.26
+pydub