DRVC

Sleeping

App Files Files Community

Singhp08 committed on Apr 12

Commit

8ffa95c

verified ·

1 Parent(s): 1bf63c5

Update app.py

Browse files

Files changed (1) hide show

app.py +113 -42

app.py CHANGED Viewed

@@ -23,6 +23,7 @@ import threading
 import argparse
 import sys
 parser = argparse.ArgumentParser(description="Run the app with optional sharing")
 parser.add_argument('--share', action='store_true', help='Enable sharing mode')
 parser.add_argument('--theme', type=str, default="aliabid94/new-theme", help='Set the theme')
@@ -33,12 +34,10 @@ IS_ZERO_GPU = os.getenv("SPACES_ZERO_GPU")
 logging.getLogger("infer_rvc_python").setLevel(logging.ERROR)
 converter = BaseLoader(only_cpu=False, hubert_path=None, rmvpe_path=None)
 converter.hu_bert_model = load_hu_bert(Config(only_cpu=False), converter.hubert_path)
-# ========== डिफ़ॉल्ट मॉडल डाउनलोड को हटा दिया गया है ==========
-# पहले यहाँ test_model डाउनलोड होता था, जिससे स्पेस हैंग हो जाता था। अब नहीं होगा।
 title = "<center><strong><font size='7'>RVC⚡ZERO</font></strong></center>"
 description = "This demo is provided for educational and research purposes only." if IS_ZERO_GPU else ""
 RESOURCES = "- You can also try `RVC⚡ZERO` in Colab’s free tier [link](https://github.com/R3gm/rvc_zero_ui?tab=readme-ov-file#rvczero)."
@@ -47,6 +46,7 @@ delete_cache_time = (3200, 3200) if IS_ZERO_GPU else (86400, 86400)
 PITCH_ALGO_OPT = ["pm", "harvest", "crepe", "rmvpe", "rmvpe+"]
 async def get_voices_list(proxy=None):
     from edge_tts import list_voices
     voices = await list_voices(proxy=proxy)
@@ -62,6 +62,7 @@ async def get_voices_list(proxy=None):
         for v in voices
     ]
 def find_files(directory):
     file_paths = []
     for fname in os.listdir(directory):
@@ -150,31 +151,56 @@ def get_my_model(url_data, progress=gr.Progress(track_tqdm=True)):
     finally:
         threading.Thread(target=clear_files, args=(directory,)).start()
-# ========== logs/ फोल्डर से मॉडल स्कैन ==========
 def scan_models():
     logs_dir = "logs"
     if not os.path.isdir(logs_dir):
         return []
     models = []
-    for model_name in os.listdir(logs_dir):
-        model_path = os.path.join(logs_dir, model_name)
-        if not os.path.isdir(model_path):
-            continue
-        pth_files = [f for f in os.listdir(model_path) if f.endswith(".pth")]
-        idx_files = [f for f in os.listdir(model_path) if f.endswith(".index")]
-        if pth_files and idx_files:
-            pth_path = os.path.join(model_path, pth_files[0])
-            idx_path = os.path.join(model_path, idx_files[0])
-            models.append((model_name, pth_path, idx_path))
     return models
-def update_model_paths(model_name):
-    for name, pth, idx in scan_models():
-        if name == model_name:
-            return pth, idx
     return None, None
-# ========== ऑडियो इफेक्ट ==========
 def add_audio_effects(audio_list, type_output):
     result = []
     for audio_path in audio_list:
@@ -244,13 +270,13 @@ def run(
     type_output,
     steps,
 ):
-    # डीबग जानकारी प्रिंट करें
     print("DEBUG: file_m =", file_m)
     print("DEBUG: file_index =", file_index)
     if not audio_files:
         raise ValueError("Please provide audio files")
     if isinstance(audio_files, str):
         audio_files = [audio_files]
@@ -290,14 +316,36 @@ def run(
     return result
-# ========== UI कम्पोनेंट ==========
-def audio_conf():
-    return gr.File(label="Audio files", file_count="multiple", type="filepath")
 def model_dropdown_conf():
     models = scan_models()
-    choices = [name for name, _, _ in models]
-    return gr.Dropdown(label="Select Model", choices=choices, value=choices[0] if choices else None, interactive=True)
 def hidden_model_path_conf():
     return gr.Textbox(visible=False)
@@ -324,16 +372,16 @@ def consonant_protec_conf():
     return gr.Slider(0, 0.5, value=0.5, label="Consonant breath protection")
 def button_conf():
-    return gr.Button("Inference", variant="primary")
 def output_conf():
-    return gr.File(label="Result", file_count="multiple", interactive=False)
 def active_tts_conf():
-    return gr.Checkbox(False, label="TTS", container=False)
 def tts_voice_conf(voices):
-    return gr.Dropdown(label="tts voice", choices=voices, visible=False)
 def tts_text_conf():
     return gr.Textbox(placeholder="Write the text here...", label="Text", visible=False, lines=3)
@@ -354,11 +402,12 @@ def format_output_gui():
     return gr.Dropdown(choices=["wav", "mp3", "flac"], value="wav", label="Format output")
 def denoise_conf():
-    return gr.Checkbox(False, label="Denoise", container=False)
 def effects_conf():
-    return gr.Checkbox(False, label="Reverb", container=False)
 def infer_tts_audio(tts_voice, tts_text, play_tts):
     out_dir = "output"
     folder_tts = "USER_" + str(random.randint(10000, 99999))
@@ -373,7 +422,7 @@ def show_components_tts(val):
     return (gr.update(visible=val),) * 4
 def down_active_conf():
-    return gr.Checkbox(False, label="URL-to-Model", container=False)
 def down_url_conf():
     return gr.Textbox(placeholder="Write the url here...", label="Enter URL", visible=False)
@@ -384,6 +433,7 @@ def down_button_conf():
 def show_components_down(val):
     return (gr.update(visible=val),) * 3
 CSS = """
 #audio_tts {
   visibility: hidden; height: 0px; width: 0px; max-width: 0px; max-height: 0px;
@@ -395,6 +445,7 @@ def get_gui(theme, voices):
         gr.Markdown(title)
         gr.Markdown(description)
         active_tts = active_tts_conf()
         with gr.Row():
             with gr.Column(scale=1):
@@ -407,9 +458,17 @@ def get_gui(theme, voices):
                 tts_play = sound_gui()
         active_tts.change(show_components_tts, [active_tts], [tts_voice, tts_text, tts_button, tts_active_play])
-        aud = audio_conf()
-        tts_button.click(infer_tts_audio, [tts_voice, tts_text, tts_active_play], [aud, tts_play])
         down_active = down_active_conf()
         down_info = gr.Markdown(
             "Provide a link to a zip file, or separate links with comma for .pth and .index files.",
@@ -430,14 +489,12 @@ def get_gui(theme, voices):
         down_button.click(update_from_url, [down_url], [hidden_model, hidden_index])
         model_dropdown = model_dropdown_conf()
-        def on_model_select(name):
-            return update_model_paths(name)
-        model_dropdown.change(on_model_select, [model_dropdown], [hidden_model, hidden_index])
-        with gr.Accordion("Advanced settings", open=False):
             algo = pitch_algo_conf()
             algo_lvl = pitch_lvl_conf()
             idx_inf = index_inf_conf()
@@ -453,10 +510,24 @@ def get_gui(theme, voices):
         btn = button_conf()
         out = output_conf()
         btn.click(
-            run,
             inputs=[
-                aud, hidden_model, algo, algo_lvl, hidden_index,
                 idx_inf, res_fc, env_r, cons,
                 denoise_gui, effects_gui, fmt_out, steps_gui
             ],

 import argparse
 import sys
+# ---------- Command-line arguments ----------
 parser = argparse.ArgumentParser(description="Run the app with optional sharing")
 parser.add_argument('--share', action='store_true', help='Enable sharing mode')
 parser.add_argument('--theme', type=str, default="aliabid94/new-theme", help='Set the theme')
 # Only records at ERROR level or above are emitted by the "infer_rvc_python" logger.
 logging.getLogger("infer_rvc_python").setLevel(logging.ERROR)
+# ---------- RVC converter initialization ----------
 converter = BaseLoader(only_cpu=False, hubert_path=None, rmvpe_path=None)
 # The HuBERT model is loaded once at import time and attached to the shared converter.
 converter.hu_bert_model = load_hu_bert(Config(only_cpu=False), converter.hubert_path)
 title = "<center><strong><font size='7'>RVC⚡ZERO</font></strong></center>"
 # The disclaimer is an empty string unless IS_ZERO_GPU is set.
 description = "This demo is provided for educational and research purposes only." if IS_ZERO_GPU else ""
 RESOURCES = "- You can also try `RVC⚡ZERO` in Colab’s free tier [link](https://github.com/R3gm/rvc_zero_ui?tab=readme-ov-file#rvczero)."
 PITCH_ALGO_OPT = ["pm", "harvest", "crepe", "rmvpe", "rmvpe+"]
+# ========== एज TTS वॉइस लिस्ट ==========
 async def get_voices_list(proxy=None):
     from edge_tts import list_voices
     voices = await list_voices(proxy=proxy)
         for v in voices
     ]
+# ========== फ़ाइल सर्च हेल्पर्स ==========
 def find_files(directory):
     file_paths = []
     for fname in os.listdir(directory):
     finally:
         threading.Thread(target=clear_files, args=(directory,)).start()
+# ==================== नया मॉडल स्कैनिंग लॉजिक (फिक्स) ====================
 def scan_models():
     """Find every model stored anywhere under the ``logs`` folder.

     Each ``.pth`` file counts as one model. Its companion index is the
     ``.index`` file with the same base name, looked up first in the
     ``.pth`` file's own directory and then anywhere else under ``logs``.
     Only regular directory entries reported as files by ``os.walk`` are
     considered, so a sub-directory that happens to be named ``*.index``
     is never returned as an index.

     The tree is walked exactly once, in sorted order, so the result is
     deterministic across runs and platforms.

     Returns:
         A list of ``(unique_key, pth_path, idx_path)`` tuples.
         ``unique_key`` is the ``.pth`` path relative to ``logs`` with path
         separators replaced by ``_``, which keeps equally named models in
         different folders distinct. ``idx_path`` is ``""`` when no
         matching index exists. The list is empty when the ``logs`` folder
         does not exist.
     """
     logs_dir = "logs"
     if not os.path.isdir(logs_dir):
         return []

     pth_entries = []      # (directory, base name, full .pth path)
     index_in_dir = {}     # (directory, base name) -> index path
     index_anywhere = {}   # base name -> first index path met during the walk
     for root, dirs, files in os.walk(logs_dir):
         # Sorting ``dirs`` in place steers os.walk into a stable traversal order.
         dirs.sort()
         for file in sorted(files):
             stem = os.path.splitext(file)[0]
             full_path = os.path.join(root, file)
             if file.endswith(".pth"):
                 pth_entries.append((root, stem, full_path))
             elif file.endswith(".index"):
                 index_in_dir[(root, stem)] = full_path
                 index_anywhere.setdefault(stem, full_path)

     models = []
     for root, stem, pth_path in pth_entries:
         # Prefer the index sitting next to the model, then any index of that name.
         idx_path = index_in_dir.get((root, stem)) or index_anywhere.get(stem, "")
         # Folder + file name forms the key, so duplicate model names do not clash.
         unique_key = os.path.relpath(pth_path, logs_dir).replace(os.sep, "_")
         models.append((unique_key, pth_path, idx_path))
     return models
+def update_model_paths(selected_key):
+    """
+    ड्रॉपडाउन से चुने गए मॉडल के लिए .pth और .index के पूरे पाथ लौटाता है।
+    """
+    models = scan_models()
+    for key, pth, idx in models:
+        if key == selected_key:
+            return pth, idx if idx else None
     return None, None
+# ========== ऑडियो इफेक्ट्स ==========
 def add_audio_effects(audio_list, type_output):
     result = []
     for audio_path in audio_list:
     type_output,
     steps,
 ):
     print("DEBUG: file_m =", file_m)
     print("DEBUG: file_index =", file_index)
     if not audio_files:
         raise ValueError("Please provide audio files")
+    # यदि एकल ऑडियो फ़ाइल (gr.Audio से) आई है तो उसे लिस्ट में बदलें
     if isinstance(audio_files, str):
         audio_files = [audio_files]
     return result
+# ========== UI कम्पोनेंट्स ==========
+def audio_input_conf():
+    """
+    दो तरह के इनपुट:
+    1. gr.Audio - माइक्रोफ़ोन से रिकॉर्ड या एकल फ़ाइल अपलोड
+    2. gr.File - एक साथ कई फ़ाइलें अपलोड करने के लिए
+    """
+    return gr.Audio(
+        label="🎤 Record or Upload Audio",
+        type="filepath",
+        sources=["microphone", "upload"]
+    )
+def multi_audio_conf():
+    return gr.File(
+        label="📁 Upload Multiple Audio Files (Optional)",
+        file_count="multiple",
+        file_types=[".wav", ".mp3", ".flac", ".m4a", ".ogg"],
+        type="filepath"
+    )
 def model_dropdown_conf():
     """Build the model selector from the models found by ``scan_models()``.

     The choices are the model keys in the order ``scan_models()`` returns
     them. The first key is preselected, or nothing when no model exists.
     """
     model_keys = [entry[0] for entry in scan_models()]
     default_key = model_keys[0] if model_keys else None
     dropdown_settings = {
         "label": "🤖 Select Model",
         "choices": model_keys,
         "value": default_key,
         "interactive": True,
     }
     return gr.Dropdown(**dropdown_settings)
 def hidden_model_path_conf():
     """Build a textbox created with ``visible=False``.

     NOTE(review): presumably holds the selected model path for later
     callbacks - confirm against the call site.
     """
     hidden_box = gr.Textbox(visible=False)
     return hidden_box
     return gr.Slider(0, 0.5, value=0.5, label="Consonant breath protection")
 def button_conf():
     """Build the primary-styled button labelled for inference."""
     inference_button = gr.Button("🚀 Inference", variant="primary")
     return inference_button
 def output_conf():
     """Build the non-interactive, multi-file component that shows results."""
     result_settings = {
         "label": "✅ Result",
         "file_count": "multiple",
         "interactive": False,
     }
     return gr.File(**result_settings)
 def active_tts_conf():
     """Build the TTS checkbox, initially unchecked and without a container."""
     tts_toggle = gr.Checkbox(False, label="🔊 TTS", container=False)
     return tts_toggle
 def tts_voice_conf(voices):
     """Build the initially hidden dropdown listing ``voices`` as choices."""
     voice_settings = {
         "label": "TTS Voice",
         "choices": voices,
         "visible": False,
     }
     return gr.Dropdown(**voice_settings)
 def tts_text_conf():
     """Build the initially hidden three-line textbox for the TTS text."""
     text_settings = {
         "placeholder": "Write the text here...",
         "label": "Text",
         "visible": False,
         "lines": 3,
     }
     return gr.Textbox(**text_settings)
     return gr.Dropdown(choices=["wav", "mp3", "flac"], value="wav", label="Format output")
 def denoise_conf():
     """Build the denoise checkbox, initially unchecked and without a container."""
     denoise_toggle = gr.Checkbox(False, label="🧹 Denoise", container=False)
     return denoise_toggle
 def effects_conf():
     """Build the reverb checkbox, initially unchecked and without a container."""
     reverb_toggle = gr.Checkbox(False, label="🎚️ Reverb", container=False)
     return reverb_toggle
+# ---------- TTS ----------
 def infer_tts_audio(tts_voice, tts_text, play_tts):
     out_dir = "output"
     folder_tts = "USER_" + str(random.randint(10000, 99999))
     return (gr.update(visible=val),) * 4
 def down_active_conf():
     """Build the URL-to-Model checkbox, initially unchecked and without a container."""
     url_toggle = gr.Checkbox(False, label="🌐 URL-to-Model", container=False)
     return url_toggle
 def down_url_conf():
     """Build the initially hidden textbox where a URL is entered."""
     url_settings = {
         "placeholder": "Write the url here...",
         "label": "Enter URL",
         "visible": False,
     }
     return gr.Textbox(**url_settings)
 def show_components_down(val):
     """Return three identical visibility updates, each set to ``val``."""
     visibility = gr.update(visible=val)
     # The same update object is repeated once per target component.
     return (visibility, visibility, visibility)
+# ---------- मुख्य GUI ----------
 CSS = """
 #audio_tts {
   visibility: hidden; height: 0px; width: 0px; max-width: 0px; max-height: 0px;
         gr.Markdown(title)
         gr.Markdown(description)
+        # ---- TTS सेक्शन ----
         active_tts = active_tts_conf()
         with gr.Row():
             with gr.Column(scale=1):
                 tts_play = sound_gui()
         active_tts.change(show_components_tts, [active_tts], [tts_voice, tts_text, tts_button, tts_active_play])
+        # ---- ऑडियो इनपुट (रिकॉर्ड + मल्टीपल) ----
+        gr.Markdown("## 📥 Input Audio")
+        with gr.Row():
+            audio_record = audio_input_conf()
+            audio_multi = multi_audio_conf()
+        # TTS आउटपुट को ऑडियो इनपुट में जोड़ें
+        tts_button.click(infer_tts_audio, [tts_voice, tts_text, tts_active_play], [audio_multi, tts_play])
+        # ---- URL से मॉडल लोडिंग ----
         down_active = down_active_conf()
         down_info = gr.Markdown(
             "Provide a link to a zip file, or separate links with comma for .pth and .index files.",
         down_button.click(update_from_url, [down_url], [hidden_model, hidden_index])
+        # ---- मॉडल चयन (ड्रॉपडाउन) ----
         model_dropdown = model_dropdown_conf()
+        model_dropdown.change(update_model_paths, [model_dropdown], [hidden_model, hidden_index])
+        # ---- एडवांस्ड सेटिंग्स ----
+        with gr.Accordion("⚙️ Advanced settings", open=False):
             algo = pitch_algo_conf()
             algo_lvl = pitch_lvl_conf()
             idx_inf = index_inf_conf()
         btn = button_conf()
         out = output_conf()
+        # ---- रन फ़ंक्शन: ऑडियो स्रोतों को मर्ज करना ----
+        def combined_audio_inputs(record_audio, multi_files):
+            """
+            यदि multi_files में फ़ाइलें हैं तो उन्हें प्राथमिकता दें,
+            अन्यथा record_audio का उपयोग करें।
+            """
+            if multi_files:
+                return multi_files
+            elif record_audio:
+                return record_audio
+            else:
+                return None
         btn.click(
+            lambda rec, multi, *rest: run(combined_audio_inputs(rec, multi), *rest),
             inputs=[
+                audio_record, audio_multi,
+                hidden_model, algo, algo_lvl, hidden_index,
                 idx_inf, res_fc, env_r, cons,
                 denoise_gui, effects_gui, fmt_out, steps_gui
             ],