SESA_Fast_Separation

Running

App Files Community

ASesYusuf1 committed on Apr 25, 2025

Commit

6a76931

verified ·

1 Parent(s): 003791d

Update gui.py

Browse files

Files changed (1) hide show

gui.py +245 -169

gui.py CHANGED Viewed

@@ -9,7 +9,8 @@ from audio_separator.separator import Separator
 import numpy as np
 import librosa
 import soundfile as sf
-from ensemble import ensemble_files  # ensemble.py'dan import
 device = "cuda" if torch.cuda.is_available() else "cpu"
 use_autocast = device == "cuda"
@@ -21,7 +22,9 @@ logger = logging.getLogger(__name__)
 # Model dictionaries organized by category
 ROFORMER_MODELS = {
     "Vocals": {
         'MelBand Roformer | Vocals by Kimberley Jensen': 'vocals_mel_band_roformer.ckpt',
         'MelBand Roformer | Vocals by becruily': 'mel_band_roformer_vocals_becruily.ckpt',
         'MelBand Roformer | Vocals Fullness by Aname': 'mel_band_roformer_vocal_fullness_aname.ckpt',
         'BS Roformer | Vocals by Gabox': 'bs_roformer_vocals_gabox.ckpt',
@@ -34,6 +37,13 @@ ROFORMER_MODELS = {
         'BS Roformer | Male-Female by aufr33': 'bs_roformer_male_female_by_aufr33_sdr_7.2889.ckpt',
     },
     "Instrumentals": {
         'MelBand Roformer Kim | Inst V1 by Unwa': 'melband_roformer_inst_v1.ckpt',
         'MelBand Roformer Kim | Inst V1 (E) by Unwa': 'melband_roformer_inst_v1e.ckpt',
         'MelBand Roformer Kim | Inst V2 by Unwa': 'melband_roformer_inst_v2.ckpt',
@@ -76,6 +86,7 @@ ROFORMER_MODELS = {
     "Karaoke": {
         'Mel-Roformer-Karaoke-Aufr33-Viperx': 'mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt',
         'MelBand Roformer | Karaoke by Gabox': 'mel_band_roformer_karaoke_gabox.ckpt',
     },
     "General Purpose": {
         'BS-Roformer-Viperx-1297': 'model_bs_roformer_ep_317_sdr_12.9755.ckpt',
@@ -102,29 +113,30 @@ ROFORMER_MODELS = {
 OUTPUT_FORMATS = ['wav', 'flac', 'mp3', 'ogg', 'opus', 'm4a', 'aiff', 'ac3']
-# CSS
 CSS = """
-/* İnce ve Ortalanmış Tema */
 #app-container {
-    max-width: 600px;
     width: 100%;
     margin: 0 auto;
-    padding: 0.2rem;
     box-sizing: border-box;
     display: flex;
     flex-direction: column;
     align-items: center;
     min-height: 100vh;
-    background-color: #2d0b0b;
     position: relative;
 }
 body {
     background: url('/content/logo.jpg') no-repeat center center fixed;
     background-size: cover;
     margin: 0;
     padding: 0;
-    font-family: 'Poppins', sans-serif;
-    color: #C0C0C0;
     display: flex;
     justify-content: center;
 }
@@ -135,163 +147,180 @@ body::after {
     left: 0;
     width: 100%;
     height: 100%;
-    background: rgba(45, 11, 11, 0.85);
     z-index: -1;
 }
 .logo-container {
     position: fixed;
-    top: 0.2rem;
     left: 50%;
     transform: translateX(-50%);
     z-index: 2000;
 }
 .logo-img {
-    width: 60px;
     height: auto;
 }
 .header-text {
     text-align: center;
-    padding: 2rem 0.3rem 0.3rem;
-    color: #ff4040;
-    font-size: 1.4rem;
-    font-weight: 700;
-    text-shadow: 0 0 5px rgba(255, 64, 64, 0.4);
-    z-index: 1500;
 }
 .dubbing-theme {
-    background: linear-gradient(to bottom, #800000, #2d0b0b);
-    border-radius: 6px;
-    padding: 0.4rem;
-    box-shadow: 0 3px 10px rgba(255, 64, 64, 0.2);
     width: 100%;
 }
 .footer {
     text-align: center;
-    padding: 0.2rem;
-    color: #ff4040;
-    font-size: 10px;
     position: fixed;
     bottom: 0;
     width: 100%;
-    max-width: 600px;
-    background: rgba(45, 11, 11, 0.7);
     z-index: 1001;
     left: 50%;
     transform: translateX(-50%);
 }
 button {
-    background: #800000 !important;
-    border: 1px solid #ff4040 !important;
-    color: #C0C0C0 !important;
-    border-radius: 4px !important;
-    padding: 4px 8px !important;
-    font-size: 0.75rem !important;
-    transition: all 0.2s ease !important;
 }
 button:hover {
-    transform: scale(1.03) !important;
-    background: #ff4040 !important;
-    box-shadow: 0 3px 12px rgba(255, 64, 64, 0.5) !important;
 }
 .compact-upload.horizontal {
-    display: inline-flex !important;
     align-items: center !important;
-    gap: 4px !important;
-    max-width: 200px !important;
-    height: 28px !important;
-    padding: 0 5px !important;
-    border: 1px solid #ff4040 !important;
-    background: rgba(128, 0, 0, 0.5) !important;
-    border-radius: 4px !important;
-    color: #C0C0C0 !important;
 }
 .compact-upload.horizontal:hover {
-    border-color: #ff6b6b !important;
-    background: rgba(128, 0, 0, 0.7) !important;
 }
 .compact-upload.horizontal button {
-    padding: 2px 6px !important;
-    font-size: 0.6rem !important;
-    height: 20px !important;
-    min-width: 40px !important;
 }
 .gr-tab {
-    background: rgba(128, 0, 0, 0.5) !important;
-    border-radius: 5px 5px 0 0 !important;
-    padding: 0.3rem 0.6rem !important;
-    margin: 0 1px !important;
-    color: #C0C0C0 !important;
-    border: 1px solid #ff4040 !important;
-    z-index: 1500;
-    font-size: 0.8rem !important;
 }
 .gr-tab-selected {
-    background: #800000 !important;
-    color: #ffffff !important;
-    border: 1px solid #ff6b6b !important;
-    box-shadow: 0 2px 5px rgba(255, 64, 64, 0.5) !important;
 }
 .compact-grid {
-    gap: 0.15rem !important;
-    max-height: 30vh;
     overflow-y: auto;
-    padding: 0.3rem;
-    background: rgba(128, 0, 0, 0.3) !important;
-    border-radius: 5px;
-    border: 1px solid #ff4040 !important;
     width: 100%;
 }
 .compact-dropdown {
-    padding: 4px 6px !important;
-    border-radius: 5px !important;
-    border: 1px solid #ff4040 !important;
-    background: rgba(128, 0, 0, 0.5) !important;
-    color: #C0C0C0 !important;
     width: 100%;
-    font-size: 0.8rem !important;
 }
 .gr-slider input[type="range"] {
     -webkit-appearance: none !important;
     width: 100% !important;
-    height: 5px !important;
-    background: #ff4040 !important;
-    border-radius: 2px !important;
     outline: none !important;
 }
 .gr-slider input[type="range"]::-webkit-slider-thumb {
     -webkit-appearance: none !important;
-    width: 12px !important;
-    height: 12px !important;
-    background: #800000 !important;
-    border: 1px solid #ff6b6b !important;
     border-radius: 50% !important;
     cursor: pointer !important;
 }
 .gr-slider input[type="range"]::-moz-range-thumb {
-    width: 12px !important;
-    height: 12px !important;
-    background: #800000 !important;
-    border: 1px solid #ff6b6b !important;
     border-radius: 50% !important;
     cursor: pointer !important;
 }
 @media (max-width: 768px) {
     #app-container {
         max-width: 100%;
-        padding: 0.1rem;
     }
     .header-text {
-        font-size: 1.2rem;
-        padding: 1.5rem 0.3rem 0.2rem;
     }
     .logo-img {
-        width: 40px;
     }
     .compact-upload.horizontal {
         max-width: 100% !important;
     }
     .compact-grid {
-        max-height: 25vh;
     }
     .footer {
         max-width: 100%;
@@ -300,14 +329,19 @@ button:hover {
 """
 # Functions
-def download_audio(url, output_dir="ytdl"):
     if not url:
         raise ValueError("No URL provided.")
-    os.makedirs(output_dir, exist_ok=True)
     ydl_opts = {
         'format': 'bestaudio/best',
         'postprocessors': [{'key': 'FFmpegExtractAudio', 'preferredcodec': 'wav', 'preferredquality': '192'}],
-        'outtmpl': os.path.join(output_dir, '%(title)s.%(ext)s'),
     }
     try:
         with YoutubeDL(ydl_opts) as ydl:
@@ -317,9 +351,15 @@ def download_audio(url, output_dir="ytdl"):
     except Exception as e:
         raise RuntimeError(f"Download failed: {e}")
-def roformer_separator(audio, model_key, seg_size, override_seg_size, overlap, pitch_shift, model_dir, out_dir, out_format, norm_thresh, amp_thresh, batch_size, single_stem="", progress=gr.Progress(track_tqdm=True)):
     if not audio:
         raise ValueError("No audio file provided.")
     base_name = os.path.splitext(os.path.basename(audio))[0]
     for category, models in ROFORMER_MODELS.items():
         if model_key in models:
@@ -333,32 +373,45 @@ def roformer_separator(audio, model_key, seg_size, override_seg_size, overlap, p
         separator = Separator(
             log_level=logging.INFO,
             model_file_dir=model_dir,
-            output_dir=out_dir,
             output_format=out_format,
             normalization_threshold=norm_thresh,
             amplification_threshold=amp_thresh,
             use_autocast=use_autocast,
-            output_single_stem=single_stem if single_stem.strip() else None,
             mdxc_params={"segment_size": seg_size, "override_model_segment_size": override_seg_size, "batch_size": batch_size, "overlap": overlap, "pitch_shift": pitch_shift}
         )
         progress(0.2, desc="Loading model...")
         separator.load_model(model_filename=model)
         progress(0.7, desc="Separating audio...")
         separation = separator.separate(audio)
-        stems = [os.path.join(out_dir, file_name) for file_name in separation]
-        return stems[0], stems[1] if len(stems) > 1 and not single_stem.strip() else None
     except Exception as e:
         logger.error(f"Separation failed: {e}")
         raise RuntimeError(f"Separation failed: {e}")
-def auto_ensemble_process(audio, model_keys, seg_size, overlap, out_format, use_tta, model_dir, out_dir, norm_thresh, amp_thresh, batch_size, ensemble_method, only_instrumental, progress=gr.Progress()):
     if not audio or not model_keys:
         raise ValueError("Audio or models missing.")
     base_name = os.path.splitext(os.path.basename(audio))[0]
     logger.info(f"Ensemble for {base_name} with {model_keys}")
-    all_stems = []
     total_models = len(model_keys)
     for i, model_key in enumerate(model_keys):
         for category, models in ROFORMER_MODELS.items():
             if model_key in models:
@@ -366,10 +419,11 @@ def auto_ensemble_process(audio, model_keys, seg_size, overlap, out_format, use_
                 break
         else:
             continue
         separator = Separator(
             log_level=logging.INFO,
             model_file_dir=model_dir,
-            output_dir=out_dir,
             output_format=out_format,
             normalization_threshold=norm_thresh,
             amplification_threshold=amp_thresh,
@@ -380,22 +434,36 @@ def auto_ensemble_process(audio, model_keys, seg_size, overlap, out_format, use_
         separator.load_model(model_filename=model)
         progress(0.5 + (0.4 / total_models) * i, desc=f"Separating with {model_key}")
         separation = separator.separate(audio)
-        stems = [os.path.join(out_dir, file_name) for file_name in separation]
-        if only_instrumental:
-            instrumental_stem = next((stem for stem in stems if "instrumental" in stem.lower()), None)
-            if instrumental_stem:
-                all_stems.append(instrumental_stem)
         else:
-            all_stems.append(stems[0])
     if not all_stems:
-        raise ValueError("No valid stems for ensemble.")
-    output_file = os.path.join(out_dir, f"{base_name}_ensemble_{'instrumental_' if only_instrumental else ''}{ensemble_method}.{out_format}")
-    with open(output_file, 'w') as f:
-        f.write("Simulated ensemble output")
     progress(1.0, desc="Ensemble complete")
-    return output_file, f"Ensemble completed with {ensemble_method}"
 def update_roformer_models(category):
     """Build a Gradio update that lists the model names in one category.

     Args:
         category: Key of ``ROFORMER_MODELS`` (for example ``"Vocals"``).

     Returns:
         The ``gr.update(...)`` result whose ``choices`` are the display
         names stored under ``ROFORMER_MODELS[category]``.

     Raises:
         KeyError: If ``category`` is not a key of ``ROFORMER_MODELS``.
     """
     return gr.update(choices=list(ROFORMER_MODELS[category].keys()))
@@ -405,70 +473,84 @@ def update_ensemble_models(category):
 # Define the interface as a function
 def create_interface():
-    with gr.Blocks(title="🎵 Audio-Separator 🎵", css=CSS, elem_id="app-container") as app:
-        gr.Markdown("<h1 class='header-text'>🎵 Audio-Separator 🎵</h1>")
         with gr.Tabs():
             with gr.Tab("⚙️ Settings"):
-                model_file_dir = gr.Textbox(value="/tmp/audio-separator-models/", label="📂 Model Cache", placeholder="/tmp/audio-separator-models/")
-                output_dir = gr.Textbox(value="output", label="📤 Output Dir", placeholder="output")
-                output_format = gr.Dropdown(value="wav", choices=OUTPUT_FORMATS, label="🎶 Format")
-                norm_threshold = gr.Slider(0.1, 1, value=0.9, step=0.1, label="🔊 Norm Thresh")
-                amp_threshold = gr.Slider(0.1, 1, value=0.6, step=0.1, label="📈 Amp Thresh")
-                batch_size = gr.Slider(1, 16, value=1, step=1, label="⚡ Batch Size")
             with gr.Tab("🎤 Roformer"):
-                roformer_audio = gr.Audio(label="🎧 Input Audio", type="filepath")
-                roformer_single_stem = gr.Textbox(label="🎼 Single Stem", placeholder="e.g., Instrumental")
-                roformer_category = gr.Dropdown(label="📚 Category", choices=list(ROFORMER_MODELS.keys()), value="General Purpose")
-                roformer_model = gr.Dropdown(label="🛠️ Model", choices=list(ROFORMER_MODELS["General Purpose"].keys()))
-                with gr.Row():
-                    roformer_seg_size = gr.Slider(32, 4000, value=256, step=32, label="📏 Seg Size")
-                    roformer_overlap = gr.Slider(2, 10, value=8, step=1, label="🔄 Overlap")
-                with gr.Row():
-                    roformer_pitch_shift = gr.Slider(-12, 12, value=0, step=1, label="🎵 Pitch")
-                    roformer_override_seg_size = gr.Checkbox(value=False, label="🔧 Override Seg")
-                with gr.Row():
-                    url_ro = gr.Textbox(label="🔗 URL", placeholder="Audio/Video URL")
-                    download_roformer = gr.Button("⬇️ Download")
-                roformer_button = gr.Button("✂️ Separate!", variant="primary")
-                with gr.Row():
-                    roformer_stem1 = gr.Audio(label="🎸 Stem 1", type="filepath", interactive=False)
-                    roformer_stem2 = gr.Audio(label="🥁 Stem 2", type="filepath", interactive=False)
             with gr.Tab("🎚️ Auto Ensemble"):
-                ensemble_audio = gr.Audio(label="🎧 Input Audio", type="filepath")
-                ensemble_category = gr.Dropdown(label="📚 Category", choices=list(ROFORMER_MODELS.keys()), value="Instrumentals")
-                ensemble_models = gr.Dropdown(label="🛠️ Models", choices=list(ROFORMER_MODELS["Instrumentals"].keys()), multiselect=True)
-                with gr.Row():
-                    ensemble_seg_size = gr.Slider(32, 4000, value=256, step=32, label="📏 Seg Size")
-                    ensemble_overlap = gr.Slider(0.1, 0.9, value=0.2, step=0.1, label="🔄 Overlap")
-                with gr.Row():
-                    ensemble_use_tta = gr.Checkbox(value=False, label="🔍 TTA")
-                    only_instrumental = gr.Checkbox(value=False, label="🎸 Only Instr")
-                ensemble_method = gr.Dropdown(label="⚙️ Method", choices=['avg_wave', 'median_wave', 'max_wave', 'min_wave'], value='avg_wave')
-                with gr.Row():
-                    url_ensemble = gr.Textbox(label="🔗 URL", placeholder="Audio/Video URL")
-                    download_ensemble = gr.Button("⬇️ Download")
-                ensemble_button = gr.Button("🎛️ Run Ensemble!", variant="primary")
-                ensemble_output = gr.Audio(label="🎶 Output", type="filepath", interactive=False)
-                ensemble_status = gr.Textbox(label="📢 Status", interactive=False)
-        gr.HTML("<div class='footer'>Powered by Audio-Separator 🌟🎶</div>")
-        # Event Handlers
         roformer_category.change(update_roformer_models, inputs=[roformer_category], outputs=[roformer_model])
         download_roformer.click(fn=download_audio, inputs=[url_ro], outputs=[roformer_audio])
         roformer_button.click(
             roformer_separator,
-            inputs=[roformer_audio, roformer_model, roformer_seg_size, roformer_override_seg_size, roformer_overlap, roformer_pitch_shift, model_file_dir, output_dir, output_format, norm_threshold, amp_threshold, batch_size, roformer_single_stem],
             outputs=[roformer_stem1, roformer_stem2]
         )
         ensemble_category.change(update_ensemble_models, inputs=[ensemble_category], outputs=[ensemble_models])
         download_ensemble.click(fn=download_audio, inputs=[url_ensemble], outputs=[ensemble_audio])
         ensemble_button.click(
-            auto_ensemble_process,
-            inputs=[ensemble_audio, ensemble_models, ensemble_seg_size, ensemble_overlap, output_format, ensemble_use_tta, model_file_dir, output_dir, norm_threshold, amp_threshold, batch_size, ensemble_method, only_instrumental],
             outputs=[ensemble_output, ensemble_status]
         )
@@ -480,13 +562,7 @@ if __name__ == "__main__":
     parser.add_argument("--ngrok-token", type=str, default=None, help="Ngrok token for tunneling")
     args = parser.parse_args()
-    app = create_interface()  # app değişkenini burada tanımlıyoruz
-    if args.ngrok_token:
-        from pyngrok import ngrok
-        ngrok.set_auth_token(args.ngrok_token)
-        public_url = ngrok.connect(args.port, "http")
-        print(f"Ngrok URL: {public_url}")
-        app.launch(server_name="0.0.0.0", server_port=args.port)
-    else:
-        app.launch(server_name="0.0.0.0", server_port=args.port, share=True)

 import numpy as np
 import librosa
 import soundfile as sf
+from ensemble import ensemble_files
+import shutil
 device = "cuda" if torch.cuda.is_available() else "cpu"
 use_autocast = device == "cuda"
 # Model dictionaries organized by category
 ROFORMER_MODELS = {
     "Vocals": {
+        'MelBand Roformer | Big Beta 6X by unwa': 'melband_roformer_big_beta6x.ckpt',
         'MelBand Roformer | Vocals by Kimberley Jensen': 'vocals_mel_band_roformer.ckpt',
+        'MelBand Roformer Kim | FT 3 by unwa': 'mel_band_roformer_kim_ft3_unwa.ckpt',
         'MelBand Roformer | Vocals by becruily': 'mel_band_roformer_vocals_becruily.ckpt',
         'MelBand Roformer | Vocals Fullness by Aname': 'mel_band_roformer_vocal_fullness_aname.ckpt',
         'BS Roformer | Vocals by Gabox': 'bs_roformer_vocals_gabox.ckpt',
         'BS Roformer | Male-Female by aufr33': 'bs_roformer_male_female_by_aufr33_sdr_7.2889.ckpt',
     },
     "Instrumentals": {
+        'MelBand Roformer | FVX by Gabox': 'mel_band_roformer_instrumental_fvx_gabox.ckpt',
+        'MelBand Roformer | INSTV8N by Gabox': 'mel_band_roformer_instrumental_instv8n_gabox.ckpt',
+        'MelBand Roformer | INSTV8 by Gabox': 'mel_band_roformer_instrumental_instv8_gabox.ckpt',
+        'MelBand Roformer | INSTV7N by Gabox': 'mel_band_roformer_instrumental_instv7n_gabox.ckpt',
+        'MelBand Roformer | Instrumental Bleedless V3 by Gabox': 'mel_band_roformer_instrumental_bleedless_v3_gabox.ckpt',
+        'MelBand Roformer Kim | Inst V1 (E) Plus by Unwa': 'melband_roformer_inst_v1e_plus.ckpt',
+        'MelBand Roformer Kim | Inst V1 Plus by Unwa': 'melband_roformer_inst_v1_plus.ckpt',
         'MelBand Roformer Kim | Inst V1 by Unwa': 'melband_roformer_inst_v1.ckpt',
         'MelBand Roformer Kim | Inst V1 (E) by Unwa': 'melband_roformer_inst_v1e.ckpt',
         'MelBand Roformer Kim | Inst V2 by Unwa': 'melband_roformer_inst_v2.ckpt',
     "Karaoke": {
         'Mel-Roformer-Karaoke-Aufr33-Viperx': 'mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt',
         'MelBand Roformer | Karaoke by Gabox': 'mel_band_roformer_karaoke_gabox.ckpt',
+        "MelBand Roformer | Karaoke by becruily": 'mel_band_roformer_karaoke_becruily.ckpt',
     },
     "General Purpose": {
         'BS-Roformer-Viperx-1297': 'model_bs_roformer_ep_317_sdr_12.9755.ckpt',
 OUTPUT_FORMATS = ['wav', 'flac', 'mp3', 'ogg', 'opus', 'm4a', 'aiff', 'ac3']
+# CSS (unchanged, stays the same)
 CSS = """
+/* Modern ve Etkileşimli Tema */
 #app-container {
+    max-width: 900px;
     width: 100%;
     margin: 0 auto;
+    padding: 1rem;
     box-sizing: border-box;
     display: flex;
     flex-direction: column;
     align-items: center;
     min-height: 100vh;
+    background: linear-gradient(135deg, #1a0b2e, #2e1a47);
     position: relative;
+    overflow: hidden;
 }
 body {
     background: url('/content/logo.jpg') no-repeat center center fixed;
     background-size: cover;
     margin: 0;
     padding: 0;
+    font-family: 'Roboto', sans-serif;
+    color: #e0e0e0;
     display: flex;
     justify-content: center;
 }
     left: 0;
     width: 100%;
     height: 100%;
+    background: rgba(26, 11, 46, 0.8);
     z-index: -1;
 }
 .logo-container {
     position: fixed;
+    top: 1rem;
     left: 50%;
     transform: translateX(-50%);
     z-index: 2000;
 }
 .logo-img {
+    width: 80px;
     height: auto;
+    transition: transform 0.3s ease;
+}
+.logo-img:hover {
+    transform: scale(1.1);
 }
 .header-text {
     text-align: center;
+    padding: 3rem 0 1rem;
+    color: #ff6b6b;
+    font-size: 2rem;
+    font-weight: 800;
+    text-shadow: 0 0 10px rgba(255, 107, 107, 0.7);
+    animation: glow 2s infinite alternate;
+}
+@keyframes glow {
+    0% { text-shadow: 0 0 10px rgba(255, 107, 107, 0.7); }
+    100% { text-shadow: 0 0 20px rgba(255, 107, 107, 1); }
 }
 .dubbing-theme {
+    background: rgba(46, 26, 71, 0.9);
+    border-radius: 12px;
+    padding: 1rem;
+    box-shadow: 0 5px 20px rgba(255, 107, 107, 0.3);
     width: 100%;
+    transition: transform 0.3s ease;
+}
+.dubbing-theme:hover {
+    transform: translateY(-5px);
 }
 .footer {
     text-align: center;
+    padding: 0.5rem;
+    color: #ff6b6b;
+    font-size: 12px;
     position: fixed;
     bottom: 0;
     width: 100%;
+    max-width: 900px;
+    background: rgba(26, 11, 46, 0.7);
     z-index: 1001;
     left: 50%;
     transform: translateX(-50%);
 }
 button {
+    background: #ff6b6b !important;
+    border: none !important;
+    color: #fff !important;
+    border-radius: 8px !important;
+    padding: 8px 16px !important;
+    font-size: 1rem !important;
+    font-weight: 600 !important;
+    transition: all 0.3s ease !important;
+    box-shadow: 0 2px 8px rgba(255, 107, 107, 0.4) !important;
 }
 button:hover {
+    transform: scale(1.05) !important;
+    background: #ff8787 !important;
+    box-shadow: 0 4px 12px rgba(255, 107, 107, 0.6) !important;
 }
 .compact-upload.horizontal {
+    display: flex !important;
     align-items: center !important;
+    gap: 8px !important;
+    max-width: 300px !important;
+    padding: 6px 10px !important;
+    border: 2px dashed #ff6b6b !important;
+    background: rgba(46, 26, 71, 0.7) !important;
+    border-radius: 8px !important;
+    color: #e0e0e0 !important;
+    transition: border-color 0.3s ease !important;
 }
 .compact-upload.horizontal:hover {
+    border-color: #ff8787 !important;
 }
 .compact-upload.horizontal button {
+    padding: 4px 10px !important;
+    font-size: 0.8rem !important;
 }
 .gr-tab {
+    background: rgba(46, 26, 71, 0.7) !important;
+    border-radius: 8px 8px 0 0 !important;
+    padding: 0.5rem 1rem !important;
+    margin: 0 2px !important;
+    color: #e0e0e0 !important;
+    border: 2px solid #ff6b6b !important;
+    font-size: 1rem !important;
+    transition: all 0.3s ease !important;
 }
 .gr-tab-selected {
+    background: #ff6b6b !important;
+    color: #fff !important;
+    border: 2px solid #ff8787 !important;
+    box-shadow: 0 2px 8px rgba(255, 107, 107, 0.5) !important;
 }
 .compact-grid {
+    gap: 0.5rem !important;
+    max-height: 40vh;
     overflow-y: auto;
+    padding: 1rem;
+    background: rgba(46, 26, 71, 0.7) !important;
+    border-radius: 10px;
+    border: 2px solid #ff6b6b !important;
     width: 100%;
 }
 .compact-dropdown {
+    padding: 8px 12px !important;
+    border-radius: 8px !important;
+    border: 2px solid #ff6b6b !important;
+    background: rgba(46, 26, 71, 0.7) !important;
+    color: #e0e0e0 !important;
     width: 100%;
+    font-size: 1rem !important;
+    transition: border-color 0.3s ease !important;
+}
+.compact-dropdown:hover {
+    border-color: #ff8787 !important;
 }
 .gr-slider input[type="range"] {
     -webkit-appearance: none !important;
     width: 100% !important;
+    height: 6px !important;
+    background: #ff6b6b !important;
+    border-radius: 3px !important;
     outline: none !important;
 }
 .gr-slider input[type="range"]::-webkit-slider-thumb {
     -webkit-appearance: none !important;
+    width: 16px !important;
+    height: 16px !important;
+    background: #fff !important;
+    border: 2px solid #ff6b6b !important;
     border-radius: 50% !important;
     cursor: pointer !important;
+    box-shadow: 0 2px 6px rgba(0, 0, 0, 0.2) !important;
 }
 .gr-slider input[type="range"]::-moz-range-thumb {
+    width: 16px !important;
+    height: 16px !important;
+    background: #fff !important;
+    border: 2px solid #ff6b6b !important;
     border-radius: 50% !important;
     cursor: pointer !important;
+    box-shadow: 0 2px 6px rgba(0, 0, 0, 0.2) !important;
 }
 @media (max-width: 768px) {
     #app-container {
         max-width: 100%;
+        padding: 0.5rem;
     }
     .header-text {
+        font-size: 1.5rem;
+        padding: 2rem 0 0.5rem;
     }
     .logo-img {
+        width: 60px;
     }
     .compact-upload.horizontal {
         max-width: 100% !important;
     }
     .compact-grid {
+        max-height: 30vh;
     }
     .footer {
         max-width: 100%;
 """
 # Functions
+def download_audio(url, out_dir="ytdl"):
     if not url:
         raise ValueError("No URL provided.")
+    # ytdl klasörünü temizle
+    if os.path.exists(out_dir):
+        shutil.rmtree(out_dir)
+    os.makedirs(out_dir, exist_ok=True)
     ydl_opts = {
         'format': 'bestaudio/best',
         'postprocessors': [{'key': 'FFmpegExtractAudio', 'preferredcodec': 'wav', 'preferredquality': '192'}],
+        'outtmpl': os.path.join(out_dir, '%(title)s.%(ext)s'),
     }
     try:
         with YoutubeDL(ydl_opts) as ydl:
     except Exception as e:
         raise RuntimeError(f"Download failed: {e}")
+def roformer_separator(audio, model_key, seg_size, override_seg_size, overlap, pitch_shift, model_dir, output_dir, out_format, norm_thresh, amp_thresh, batch_size, exclude_stems="", progress=gr.Progress(track_tqdm=True)):
     if not audio:
         raise ValueError("No audio file provided.")
+    # output klasörünü temizle
+    if os.path.exists(output_dir):
+        shutil.rmtree(output_dir)
+    os.makedirs(output_dir, exist_ok=True)
     base_name = os.path.splitext(os.path.basename(audio))[0]
     for category, models in ROFORMER_MODELS.items():
         if model_key in models:
         separator = Separator(
             log_level=logging.INFO,
             model_file_dir=model_dir,
+            output_dir=output_dir,
             output_format=out_format,
             normalization_threshold=norm_thresh,
             amplification_threshold=amp_thresh,
             use_autocast=use_autocast,
             mdxc_params={"segment_size": seg_size, "override_model_segment_size": override_seg_size, "batch_size": batch_size, "overlap": overlap, "pitch_shift": pitch_shift}
         )
         progress(0.2, desc="Loading model...")
         separator.load_model(model_filename=model)
         progress(0.7, desc="Separating audio...")
         separation = separator.separate(audio)
+        stems = [os.path.join(output_dir, file_name) for file_name in separation]
+        # Exclude stems filtresi
+        if exclude_stems.strip():
+            excluded = [s.strip().lower() for s in exclude_stems.split(',')]
+            filtered_stems = [stem for stem in stems if not any(ex in os.path.basename(stem).lower() for ex in excluded)]
+            return filtered_stems[0] if filtered_stems else None, filtered_stems[1] if len(filtered_stems) > 1 else None
+        return stems[0], stems[1] if len(stems) > 1 else None
     except Exception as e:
         logger.error(f"Separation failed: {e}")
         raise RuntimeError(f"Separation failed: {e}")
+def auto_ensemble_process(audio, model_keys, seg_size, overlap, out_format, use_tta, model_dir, output_dir, norm_thresh, amp_thresh, batch_size, ensemble_method, exclude_stems="", weights=None, progress=gr.Progress()):
     if not audio or not model_keys:
         raise ValueError("Audio or models missing.")
+    # output klasörünü temizle
+    if os.path.exists(output_dir):
+        shutil.rmtree(output_dir)
+    os.makedirs(output_dir, exist_ok=True)
     base_name = os.path.splitext(os.path.basename(audio))[0]
     logger.info(f"Ensemble for {base_name} with {model_keys}")
+    all_stems = []  # Tüm modellerden kalan stem'ler burada toplanacak
     total_models = len(model_keys)
+    # Her model için ayrıştırma yap
     for i, model_key in enumerate(model_keys):
         for category, models in ROFORMER_MODELS.items():
             if model_key in models:
                 break
         else:
             continue
         separator = Separator(
             log_level=logging.INFO,
             model_file_dir=model_dir,
+            output_dir=output_dir,
             output_format=out_format,
             normalization_threshold=norm_thresh,
             amplification_threshold=amp_thresh,
         separator.load_model(model_filename=model)
         progress(0.5 + (0.4 / total_models) * i, desc=f"Separating with {model_key}")
         separation = separator.separate(audio)
+        stems = [os.path.join(output_dir, file_name) for file_name in separation]
+        # Exclude stems filtresi
+        if exclude_stems.strip():
+            excluded = [s.strip().lower() for s in exclude_stems.split(',')]
+            filtered_stems = [stem for stem in stems if not any(ex in os.path.basename(stem).lower() for ex in excluded)]
+            all_stems.extend(filtered_stems)
         else:
+            all_stems.extend(stems)  # Eğer exclude_stems yoksa tüm stem'leri al
     if not all_stems:
+        raise ValueError("No valid stems for ensemble after exclusion.")
+    # Weights kontrolü
+    if weights is None or len(weights) != len(model_keys):
+        weights = [1.0] * len(model_keys)
+    # Tüm kalan stem'leri birleştir
+    output_file = os.path.join(output_dir, f"{base_name}_ensemble_{ensemble_method}.{out_format}")
+    ensemble_args = [
+        "--files", *all_stems,
+        "--type", ensemble_method,
+        "--weights", *[str(w) for w in weights[:len(all_stems)]],  # Stem sayısına göre weights kes
+        "--output", output_file
+    ]
+    progress(0.9, desc="Running ensemble...")
+    ensemble_files(ensemble_args)
     progress(1.0, desc="Ensemble complete")
+    return output_file, f"Ensemble completed with {ensemble_method}, excluded: {exclude_stems if exclude_stems else 'None'}"
 def update_roformer_models(category):
     """Build a Gradio update that lists the model names in one category.

     Args:
         category: Key of ``ROFORMER_MODELS`` (for example ``"Vocals"``).

     Returns:
         The ``gr.update(...)`` result whose ``choices`` are the display
         names stored under ``ROFORMER_MODELS[category]``.

     Raises:
         KeyError: If ``category`` is not a key of ``ROFORMER_MODELS``.
     """
     return gr.update(choices=list(ROFORMER_MODELS[category].keys()))
 # Define the interface as a function
 def create_interface():
+    with gr.Blocks(title="🎵 SESA Fast Separation 🎵", css=CSS, elem_id="app-container") as app:
+        gr.Markdown("<h1 class='header-text'>🎵 SESA Fast Separation 🎵</h1>")
         with gr.Tabs():
+            # Settings Sekmesi
             with gr.Tab("⚙️ Settings"):
+                with gr.Group(elem_classes="dubbing-theme"):
+                    gr.Markdown("### General Settings")
+                    model_file_dir = gr.Textbox(value="/tmp/audio-separator-models/", label="📂 Model Cache", placeholder="Path to model directory", interactive=True)
+                    output_dir = gr.Textbox(value="output", label="📤 Output Directory", placeholder="Where to save results", interactive=True)
+                    output_format = gr.Dropdown(value="wav", choices=OUTPUT_FORMATS, label="🎶 Output Format", interactive=True)
+                    norm_threshold = gr.Slider(0.1, 1, value=0.9, step=0.1, label="🔊 Normalization Threshold", interactive=True)
+                    amp_threshold = gr.Slider(0.1, 1, value=0.3, step=0.1, label="📈 Amplification Threshold", interactive=True)
+                    batch_size = gr.Slider(1, 16, value=4, step=1, label="⚡ Batch Size", interactive=True)
+            # Roformer Sekmesi
             with gr.Tab("🎤 Roformer"):
+                with gr.Group(elem_classes="dubbing-theme"):
+                    gr.Markdown("### Audio Separation")
+                    with gr.Row():
+                        roformer_audio = gr.Audio(label="🎧 Upload Audio", type="filepath", interactive=True)
+                        url_ro = gr.Textbox(label="🔗 Or Paste URL", placeholder="YouTube or audio URL", interactive=True)
+                        download_roformer = gr.Button("⬇️ download", variant="secondary")
+                    roformer_exclude_stems = gr.Textbox(label="🚫 Exclude Stems", placeholder="e.g., vocals, drums (comma-separated)", interactive=True)
+                    with gr.Row():
+                        roformer_category = gr.Dropdown(label="📚 Category", choices=list(ROFORMER_MODELS.keys()), value="General Purpose", interactive=True)
+                        roformer_model = gr.Dropdown(label="🛠️ Model", choices=list(ROFORMER_MODELS["General Purpose"].keys()), interactive=True)
+                    with gr.Row():
+                        roformer_seg_size = gr.Slider(32, 4000, value=256, step=32, label="📏 Segment Size", interactive=True)
+                        roformer_overlap = gr.Slider(2, 10, value=8, step=1, label="🔄 Overlap", interactive=True)
+                    with gr.Row():
+                        roformer_pitch_shift = gr.Slider(-12, 12, value=0, step=1, label="🎵 Pitch Shift", interactive=True)
+                        roformer_override_seg_size = gr.Checkbox(value=False, label="🔧 Override Segment Size", interactive=True)
+                    roformer_button = gr.Button("✂️ Separate Now!", variant="primary")
+                    with gr.Row():
+                        roformer_stem1 = gr.Audio(label="🎸 Stem 1", type="filepath", interactive=False)
+                        roformer_stem2 = gr.Audio(label="🥁 Stem 2", type="filepath", interactive=False)
+            # Auto Ensemble Sekmesi
             with gr.Tab("🎚️ Auto Ensemble"):
+                with gr.Group(elem_classes="dubbing-theme"):
+                    gr.Markdown("### Ensemble Processing")
+                    with gr.Row():
+                        ensemble_audio = gr.Audio(label="🎧 Upload Audio", type="filepath", interactive=True)
+                        url_ensemble = gr.Textbox(label="🔗 Or Paste URL", placeholder="YouTube or audio URL", interactive=True)
+                        download_ensemble = gr.Button("⬇️ download", variant="secondary")
+                    ensemble_exclude_stems = gr.Textbox(label="🚫 Exclude Stems", placeholder="e.g., vocals, drums (comma-separated)", interactive=True)
+                    with gr.Row():
+                        ensemble_category = gr.Dropdown(label="📚 Category", choices=list(ROFORMER_MODELS.keys()), value="Instrumentals", interactive=True)
+                        ensemble_models = gr.Dropdown(label="🛠️ Models", choices=list(ROFORMER_MODELS["Instrumentals"].keys()), multiselect=True, interactive=True)
+                    with gr.Row():
+                        ensemble_seg_size = gr.Slider(32, 4000, value=256, step=32, label="📏 Segment Size", interactive=True)
+                        ensemble_overlap = gr.Slider(2, 10, value=8, step=1, label="🔄 Overlap", interactive=True)
+                        ensemble_use_tta = gr.Checkbox(value=False, label="🔍 Use TTA", interactive=True)
+                    ensemble_method = gr.Dropdown(label="⚙️ Ensemble Method", choices=['avg_wave', 'median_wave', 'max_wave', 'min_wave', 'avg_fft', 'median_fft', 'max_fft', 'min_fft'], value='avg_wave', interactive=True)
+                    ensemble_weights = gr.Textbox(label="⚖️ Weights", placeholder="e.g., 1.0, 1.0 (comma-separated)", interactive=True)
+                    ensemble_button = gr.Button("🎛️ Run Ensemble!", variant="primary")
+                    ensemble_output = gr.Audio(label="🎶 Ensemble Result", type="filepath", interactive=False)
+                    ensemble_status = gr.Textbox(label="📢 Status", interactive=False)
+        gr.HTML("<div class='footer'>Powered by Audio-Separator 🌟🎶 | Made with ❤️</div>")
+        # Event Handlers (Aynı kalıyor)
         roformer_category.change(update_roformer_models, inputs=[roformer_category], outputs=[roformer_model])
         download_roformer.click(fn=download_audio, inputs=[url_ro], outputs=[roformer_audio])
         roformer_button.click(
             roformer_separator,
+            inputs=[roformer_audio, roformer_model, roformer_seg_size, roformer_override_seg_size, roformer_overlap, roformer_pitch_shift, model_file_dir, output_dir, output_format, norm_threshold, amp_threshold, batch_size, roformer_exclude_stems],
             outputs=[roformer_stem1, roformer_stem2]
         )
         ensemble_category.change(update_ensemble_models, inputs=[ensemble_category], outputs=[ensemble_models])
         download_ensemble.click(fn=download_audio, inputs=[url_ensemble], outputs=[ensemble_audio])
         ensemble_button.click(
+            lambda *args: auto_ensemble_process(
+                *args[:-1],
+                weights=[float(w.strip()) for w in args[-1].split(',')] if args[-1] else None
+            ),
+            inputs=[ensemble_audio, ensemble_models, ensemble_seg_size, ensemble_overlap, output_format, ensemble_use_tta, model_file_dir, output_dir, norm_threshold, amp_threshold, batch_size, ensemble_method, ensemble_exclude_stems, ensemble_weights],
             outputs=[ensemble_output, ensemble_status]
         )
     parser.add_argument("--ngrok-token", type=str, default=None, help="Ngrok token for tunneling")
     args = parser.parse_args()
+    # Build the UI and serve it on 0.0.0.0 at the requested port with Gradio's share option enabled.
+    # NOTE(review): the parsed --ngrok-token value is not used by the lines below — confirm this is intended.
+    app = create_interface()
+    app.launch(server_name="0.0.0.0", server_port=args.port, share=True)
+    # Runs once launch() has returned.
+    app.close()