rvc_zero

Running on Zero

App Files Files Community

Amirox committed on Jan 20

Commit

fe4a50f

1 Parent(s): 1950609

Add run_with_urls function for audio conversion via URLs and integrate MCP-friendly interface in Gradio

Browse files

Files changed (1) hide show

app.py +115 -0

app.py CHANGED Viewed

@@ -466,6 +466,87 @@ def run(
     return result
 def audio_conf():
     return gr.File(
         label="Audio files",
@@ -889,6 +970,40 @@ def get_gui(theme):
         )
         gr.Markdown(RESOURCES)
     return app

     return result
def run_with_urls(
    audio_url: str,
    model_url: str,
    index_url: str = None,
    pitch_alg: str = "rmvpe+",
    pitch_lvl: int = 0,
    index_inf: float = 0.75,
    r_m_f: int = 3,
    e_r: float = 0.25,
    c_b_p: float = 0.5,
    active_noise_reduce: bool = False,
    audio_effects: bool = False,
    type_output: str = "wav",
    steps: int = 1,
):
    """
    Convert audio using RVC voice conversion with URL inputs (MCP-friendly).
    Args:
        audio_url: URL to audio or video file. Supported: wav, mp3, ogg, flac, m4a, mp4, mkv, webm, avi, mov.
        model_url: URL to the model file (.pth) or zip file containing model.
        index_url: Optional URL to the index file (.index). Leave empty if using zip.
        pitch_alg: Pitch algorithm - one of: pm, harvest, crepe, rmvpe, rmvpe+
        pitch_lvl: Pitch level adjustment (-24 to 24, default: 0)
        index_inf: Index influence (0.0 to 1.0, default: 0.75)
        r_m_f: Respiration median filtering (0 to 7, default: 3)
        e_r: Envelope ratio (0.0 to 1.0, default: 0.25)
        c_b_p: Consonant breath protection (0.0 to 0.5, default: 0.5)
        active_noise_reduce: Apply noise reduction (default: False)
        audio_effects: Apply reverb and compression effects (default: False)
        type_output: Output format - one of: wav, mp3, flac (default: wav)
        steps: Number of conversion steps (1 to 3, default: 1)
    Returns:
        List of paths to converted audio files.
    Raises:
        ValueError: If audio_url or model_url is blank, or if the download yields no file with a supported extension.
    """
    # Local import: keeps this function self-contained without touching the
    # file-level import block.
    import tempfile

    # Normalise every URL the same way and fail fast, before any directory is
    # created or any download is attempted. `or ""` tolerates None inputs.
    audio_url = (audio_url or "").strip()
    model_url = (model_url or "").strip()
    if not audio_url:
        raise ValueError("An audio URL is required.")
    if not model_url:
        raise ValueError("A model URL is required.")
    # A blank textbox arrives as "" rather than the declared default; map it
    # back to None so both call paths hand the same "no index" value to run().
    index_url = (index_url or "").strip() or None

    # Supported audio and video formats (ffmpeg will extract audio from video)
    SUPPORTED_FORMATS = (
        # Audio formats
        '.wav', '.mp3', '.ogg', '.flac', '.m4a', '.aac', '.wma', '.opus',
        # Video formats (audio will be extracted)
        '.mp4', '.mkv', '.webm', '.avi', '.mov', '.wmv', '.flv', '.m4v'
    )

    # mkdtemp guarantees a folder unique to this call. A random 5-digit name
    # combined with exist_ok=True could be shared by two concurrent requests,
    # mixing their downloads and letting one request's cleanup delete the
    # other's input.
    out_dir = "downloads"
    os.makedirs(out_dir, exist_ok=True)
    audio_dir = tempfile.mkdtemp(dir=out_dir)

    try:
        # Download audio/video file
        download_manager(url=audio_url, path=audio_dir, extension="")

        # endswith accepts the tuple directly; sort so the processing order
        # does not depend on the arbitrary order os.listdir returns.
        audio_files = sorted(
            os.path.join(audio_dir, name)
            for name in os.listdir(audio_dir)
            if name.lower().endswith(SUPPORTED_FORMATS)
        )
        if not audio_files:
            raise ValueError(f"No audio/video file found after downloading from {audio_url}. Supported formats: {SUPPORTED_FORMATS}")

        # Call the main run function with URLs for model/index
        return run(
            audio_files=audio_files,
            file_m=model_url,
            pitch_alg=pitch_alg,
            pitch_lvl=pitch_lvl,
            file_index=index_url,
            index_inf=index_inf,
            r_m_f=r_m_f,
            e_r=e_r,
            c_b_p=c_b_p,
            active_noise_reduce=active_noise_reduce,
            audio_effects=audio_effects,
            type_output=type_output,
            steps=steps,
        )
    finally:
        # Cleanup audio download folder on a background thread so the caller
        # is not blocked; runs on success and on failure alike.
        threading.Thread(target=clear_files, args=(audio_dir,)).start()
 def audio_conf():
     return gr.File(
         label="Audio files",
         )
         gr.Markdown(RESOURCES)
+        # MCP-friendly interface (collapsed by default in the UI, exposed for API/MCP calls)
+        with gr.Accordion("API / MCP Interface", open=False, visible=True):
+            gr.Markdown("Use this interface for API calls or MCP integration with URL inputs.")
+            with gr.Row():
+                mcp_audio_url = gr.Textbox(label="Audio URL", placeholder="https://example.com/audio.wav")
+                mcp_model_url = gr.Textbox(label="Model URL (.pth or .zip)", placeholder="https://huggingface.co/.../model.pth")
+                mcp_index_url = gr.Textbox(label="Index URL (optional)", placeholder="https://huggingface.co/.../model.index")
+            with gr.Row():
+                mcp_pitch_alg = gr.Dropdown(PITCH_ALGO_OPT, value="rmvpe+", label="Pitch Algorithm")
+                mcp_pitch_lvl = gr.Slider(minimum=-24, maximum=24, value=0, step=1, label="Pitch Level")
+                mcp_index_inf = gr.Slider(minimum=0, maximum=1, value=0.75, label="Index Influence")
+            with gr.Row():
+                mcp_r_m_f = gr.Slider(minimum=0, maximum=7, value=3, step=1, label="Respiration Filter")
+                mcp_e_r = gr.Slider(minimum=0, maximum=1, value=0.25, label="Envelope Ratio")
+                mcp_c_b_p = gr.Slider(minimum=0, maximum=0.5, value=0.5, label="Consonant Protection")
+            with gr.Row():
+                mcp_noise_reduce = gr.Checkbox(value=False, label="Noise Reduce")
+                mcp_effects = gr.Checkbox(value=False, label="Audio Effects")
+                mcp_format = gr.Dropdown(["wav", "mp3", "flac"], value="wav", label="Output Format")
+                mcp_steps = gr.Slider(minimum=1, maximum=3, value=1, step=1, label="Steps")
+            mcp_button = gr.Button("Convert (URL)", variant="secondary")
+            mcp_output = gr.File(label="Result", file_count="multiple")
+            mcp_button.click(
+                fn=run_with_urls,
+                inputs=[
+                    mcp_audio_url, mcp_model_url, mcp_index_url,
+                    mcp_pitch_alg, mcp_pitch_lvl, mcp_index_inf,
+                    mcp_r_m_f, mcp_e_r, mcp_c_b_p,
+                    mcp_noise_reduce, mcp_effects, mcp_format, mcp_steps
+                ],
+                outputs=[mcp_output],
+            )
     return app