SESA_Fast_Separation

Running

App Files Community

ASesYusuf1 committed on May 15, 2025

Commit

67568d2

verified ·

1 Parent(s): 88bba59

Update gui.py

Browse files

Files changed (1) hide show

gui.py +17 -25

gui.py CHANGED Viewed

@@ -46,7 +46,7 @@ client_utils._json_schema_to_python_type = patched_json_schema_to_python_type
 device = "cuda" if torch.cuda.is_available() else "cpu"
 use_autocast = device == "cuda"
-# Model dictionaries organized by category
 ROFORMER_MODELS = {
     "Vocals": {
         'MelBand Roformer | Big Beta 6X by unwa': 'melband_roformer_big_beta6x.ckpt',
@@ -120,7 +120,7 @@ ROFORMER_MODELS = {
     "Karaoke": {
         'Mel-Roformer-Karaoke-Aufr33-Viperx': 'mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt',
         'MelBand Roformer | Karaoke by Gabox': 'mel_band_roformer_karaoke_gabox.ckpt',
-        "MelBand Roformer | Karaoke by becruily": 'mel_band_roformer_karaoke_becruily.ckpt',
     },
     "General Purpose": {
         'BS-Roformer-Viperx-1297': 'model_bs_roformer_ep_317_sdr_12.9755.ckpt',
@@ -140,7 +140,7 @@ ROFORMER_MODELS = {
 OUTPUT_FORMATS = ['wav', 'flac', 'mp3', 'ogg', 'opus', 'm4a', 'aiff', 'ac3']
-# CSS for UI styling (unchanged from previous)
 CSS = """
 /* Modern ve Etkileşimli Tema */
 #app-container {
@@ -355,8 +355,8 @@ button:hover {
 """
 # Functions
-def download_audio(url, out_dir="ytdl"):
-    """Download audio from a URL using yt-dlp."""
     if not url or not validators.url(url):
         raise ValueError("Invalid or missing URL.")
@@ -368,10 +368,15 @@ def download_audio(url, out_dir="ytdl"):
         'format': 'bestaudio/best',
         'postprocessors': [{'key': 'FFmpegExtractAudio', 'preferredcodec': 'wav', 'preferredquality': '192'}],
         'outtmpl': os.path.join(out_dir, '%(title)s.%(ext)s'),
     }
     try:
         with YoutubeDL(ydl_opts) as ydl:
-            ydl.download([url])
             info_dict = ydl.extract_info(url, download=True)
             return ydl.prepare_filename(info_dict).rsplit('.', 1)[0] + '.wav'
     except Exception as e:
@@ -516,7 +521,7 @@ def create_interface():
                 with gr.Group(elem_classes="dubbing-theme"):
                     gr.Markdown("### General Settings")
                     model_file_dir = gr.Textbox(value="/tmp/audio-separator-models/", label="📂 Model Cache", placeholder="Path to model directory", interactive=True)
-                    output_dir = gr.Textbox(value="output+*6", label="📤 Output Directory", placeholder="Where to save results", interactive=True)
                     output_format = gr.Dropdown(value="wav", choices=OUTPUT_FORMATS, label="🎶 Output Format", interactive=True)
                     norm_threshold = gr.Slider(0.1, 1.0, value=0.9, step=0.1, label="🔊 Normalization Threshold", interactive=True)
                     amp_threshold = gr.Slider(0.1, 1.0, value=0.3, step=0.1, label="📈 Amplification Threshold", interactive=True)
@@ -529,6 +534,7 @@ def create_interface():
                     with gr.Row():
                         roformer_audio = gr.Audio(label="🎧 Upload Audio", type="filepath", interactive=True)
                         url_ro = gr.Textbox(label="🔗 Or Paste URL", placeholder="YouTube or audio URL", interactive=True)
                         download_roformer = gr.Button("⬇️ Download", variant="secondary")
                     roformer_exclude_stems = gr.Textbox(label="🚫 Exclude Stems", placeholder="e.g., vocals, drums (comma-separated)", interactive=True)
                     with gr.Row():
@@ -552,6 +558,7 @@ def create_interface():
                     with gr.Row():
                         ensemble_audio = gr.Audio(label="🎧 Upload Audio", type="filepath", interactive=True)
                         url_ensemble = gr.Textbox(label="🔗 Or Paste URL", placeholder="YouTube or audio URL", interactive=True)
                         download_ensemble = gr.Button("⬇️ Download", variant="secondary")
                     ensemble_exclude_stems = gr.Textbox(label="🚫 Exclude Stems", placeholder="e.g., vocals, drums (comma-separated)", interactive=True)
                     with gr.Row():
@@ -571,7 +578,7 @@ def create_interface():
         # Event Handlers
         roformer_category.change(update_roformer_models, inputs=[roformer_category], outputs=[roformer_model])
-        download_roformer.click(fn=download_audio, inputs=[url_ro], outputs=[roformer_audio])
         roformer_button.click(
             roformer_separator,
             inputs=[
@@ -582,7 +589,7 @@ def create_interface():
             outputs=[roformer_stem1, roformer_stem2]
         )
         ensemble_category.change(update_ensemble_models, inputs=[ensemble_category], outputs=[ensemble_models])
-        download_ensemble.click(fn=download_audio, inputs=[url_ensemble], outputs=[ensemble_audio])
         ensemble_button.click(
             fn=auto_ensemble_process,
             inputs=[
@@ -594,19 +601,4 @@ def create_interface():
             outputs=[ensemble_output, ensemble_status]
         )
-    return app
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser(description="Music Source Separation Web UI")
-    parser.add_argument("--port", type=int, default=7860, help="Port to run the UI on")
-    args = parser.parse_args()
-    app = create_interface()
-    try:
-        # For Hugging Face Spaces
-        app.launch(server_name="0.0.0.0", server_port=args.port, share=True)
-    except Exception as e:
-        logger.error(f"Failed to launch app: {e}")
-        raise
-    finally:
-        app.close()

 device = "cuda" if torch.cuda.is_available() else "cpu"
 use_autocast = device == "cuda"
+# Model dictionaries organized by category (unchanged)
 ROFORMER_MODELS = {
     "Vocals": {
         'MelBand Roformer | Big Beta 6X by unwa': 'melband_roformer_big_beta6x.ckpt',
     "Karaoke": {
         'Mel-Roformer-Karaoke-Aufr33-Viperx': 'mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt',
         'MelBand Roformer | Karaoke by Gabox': 'mel_band_roformer_karaoke_gabox.ckpt',
+        'MelBand Roformer | Karaoke by becruily': 'mel_band_roformer_karaoke_becruily.ckpt',
     },
     "General Purpose": {
         'BS-Roformer-Viperx-1297': 'model_bs_roformer_ep_317_sdr_12.9755.ckpt',
 OUTPUT_FORMATS = ['wav', 'flac', 'mp3', 'ogg', 'opus', 'm4a', 'aiff', 'ac3']
+# CSS for UI styling (unchanged)
 CSS = """
 /* Modern ve Etkileşimli Tema */
 #app-container {
 """
 # Functions
+def download_audio(url, cookies_file=None, out_dir="ytdl"):
+    """Download audio from a URL using yt-dlp with cookies support."""
     if not url or not validators.url(url):
         raise ValueError("Invalid or missing URL.")
         'format': 'bestaudio/best',
         'postprocessors': [{'key': 'FFmpegExtractAudio', 'preferredcodec': 'wav', 'preferredquality': '192'}],
         'outtmpl': os.path.join(out_dir, '%(title)s.%(ext)s'),
+        'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36',
+        'geo_bypass': True,
+        'force_ipv4': True,
+        'referer': 'https://www.youtube.com/',
+        'noplaylist': True,
+        'cookiefile': cookies_file if cookies_file else None,
     }
     try:
         with YoutubeDL(ydl_opts) as ydl:
             info_dict = ydl.extract_info(url, download=True)
             return ydl.prepare_filename(info_dict).rsplit('.', 1)[0] + '.wav'
     except Exception as e:
                 with gr.Group(elem_classes="dubbing-theme"):
                     gr.Markdown("### General Settings")
                     model_file_dir = gr.Textbox(value="/tmp/audio-separator-models/", label="📂 Model Cache", placeholder="Path to model directory", interactive=True)
+                    output_dir = gr.Textbox(value="output", label="📤 Output Directory", placeholder="Where to save results", interactive=True)
                     output_format = gr.Dropdown(value="wav", choices=OUTPUT_FORMATS, label="🎶 Output Format", interactive=True)
                     norm_threshold = gr.Slider(0.1, 1.0, value=0.9, step=0.1, label="🔊 Normalization Threshold", interactive=True)
                     amp_threshold = gr.Slider(0.1, 1.0, value=0.3, step=0.1, label="📈 Amplification Threshold", interactive=True)
                     with gr.Row():
                         roformer_audio = gr.Audio(label="🎧 Upload Audio", type="filepath", interactive=True)
                         url_ro = gr.Textbox(label="🔗 Or Paste URL", placeholder="YouTube or audio URL", interactive=True)
+                        cookies_ro = gr.File(label="🍪 Cookies File", file_types=[".txt"], interactive=True)
                         download_roformer = gr.Button("⬇️ Download", variant="secondary")
                     roformer_exclude_stems = gr.Textbox(label="🚫 Exclude Stems", placeholder="e.g., vocals, drums (comma-separated)", interactive=True)
                     with gr.Row():
                     with gr.Row():
                         ensemble_audio = gr.Audio(label="🎧 Upload Audio", type="filepath", interactive=True)
                         url_ensemble = gr.Textbox(label="🔗 Or Paste URL", placeholder="YouTube or audio URL", interactive=True)
+                        cookies_ensemble = gr.File(label="🍪 Cookies File", file_types=[".txt"], interactive=True)
                         download_ensemble = gr.Button("⬇️ Download", variant="secondary")
                     ensemble_exclude_stems = gr.Textbox(label="🚫 Exclude Stems", placeholder="e.g., vocals, drums (comma-separated)", interactive=True)
                     with gr.Row():
         # Event Handlers
         roformer_category.change(update_roformer_models, inputs=[roformer_category], outputs=[roformer_model])
+        download_roformer.click(fn=download_audio, inputs=[url_ro, cookies_ro], outputs=[roformer_audio])
         roformer_button.click(
             roformer_separator,
             inputs=[
             outputs=[roformer_stem1, roformer_stem2]
         )
         ensemble_category.change(update_ensemble_models, inputs=[ensemble_category], outputs=[ensemble_models])
+        download_ensemble.click(fn=download_audio, inputs=[url_ensemble, cookies_ensemble], outputs=[ensemble_audio])
         ensemble_button.click(
             fn=auto_ensemble_process,
             inputs=[
             outputs=[ensemble_output, ensemble_status]
         )
+    return app