cctvoi

Runtime error

App Files Files Community

Vgjkmhf committed on Dec 5, 2025

Commit

4b76478

verified ·

1 Parent(s): 92f6db2

Update app.py

Browse files

Files changed (1) hide show

app.py +215 -92

app.py CHANGED Viewed

@@ -1,146 +1,269 @@
 import os
 import sys
 import time
-import inspect
 import traceback
 import numpy as np
 import soundfile as sf
 import librosa
 import gradio as gr
-from scipy.signal import iirpeak, lfilter
-# 1. Setup
 try:
     import imageio_ffmpeg
     import static_ffmpeg
     from rvc_python.infer import RVCInference
-    static_ffmpeg.add_paths()
-    ffmpeg_path = imageio_ffmpeg.get_ffmpeg_exe()
-    os.environ["PATH"] += os.pathsep + os.path.dirname(ffmpeg_path)
-    print("✅ System Ready")
 except ImportError as e:
-    print(f"❌ Import Error: {e}")
     sys.exit(1)
-TEMP_DIR = "/tmp/rvc_studio"
 os.makedirs(TEMP_DIR, exist_ok=True)
 os.environ["TEMP"] = TEMP_DIR
-# 2. DSP Functions
def anti_muffle_filter(y, sr):
    """Notch out the 600 Hz region of *y* (Q = 1.5).

    The previous implementation called ``iirpeak(..., ftype='notch')``;
    ``iirpeak`` has no ``ftype`` parameter, so the call always raised
    ``TypeError`` and the signal was returned untouched.  ``iirnotch`` is the
    SciPy designer for a notch filter.

    Args:
        y: 1-D array of audio samples.
        sr: Sample rate of *y* in Hz.

    Returns:
        The filtered samples, or *y* itself when the filter cannot be
        designed or applied (for example when 600 Hz is not below ``sr / 2``).
    """
    # Imported here because the file-level import only brings in iirpeak/lfilter.
    from scipy.signal import iirnotch

    try:
        b, a = iirnotch(600, Q=1.5, fs=sr)
        return lfilter(b, a, y)
    except Exception:
        # Best effort: an unusable sample rate or input must not abort the run.
        return y
def clarity_boost(y, sr):
    """Blend *y* with an 8 kHz resonant-peak copy of itself (70 % / 30 %).

    The previous implementation passed ``ftype='peak'`` to ``iirpeak``, which
    has no such parameter; the resulting ``TypeError`` was swallowed and the
    boost never ran.

    Args:
        y: 1-D array of audio samples.
        sr: Sample rate of *y* in Hz.

    Returns:
        ``0.7 * y + 0.3 * peak_filtered(y)``, or *y* itself when the filter
        cannot be designed or applied (for example when 8 kHz is above
        ``sr / 2``).
    """
    try:
        b, a = iirpeak(8000, Q=0.7, fs=sr)
        boosted = lfilter(b, a, y)
        return (y * 0.7) + (boosted * 0.3)
    except Exception:
        # Best effort: fall back to the unprocessed signal.
        return y
 def preprocess_audio(input_path):
     try:
-        y, sr = librosa.load(input_path, sr=None, mono=True)
-        y = librosa.util.normalize(y) * 0.90
-        y = anti_muffle_filter(y, sr)
         processed_path = os.path.join(TEMP_DIR, "preprocessed.wav")
         sf.write(processed_path, y, sr)
-        return processed_path, f"✅ Preprocess Done (SR: {sr}Hz)"
     except Exception as e:
-        return input_path, f"⚠️ Preprocess Warning: {e}"
def postprocess_audio(input_path):
    """Apply the clarity boost to the converted audio and save the result.

    The file is loaded as mono at its native sample rate, run through
    ``clarity_boost``, peak-normalised and scaled by 0.95, then written to
    ``postprocessed.wav`` inside ``TEMP_DIR``.

    Returns:
        ``(path, message)``: the written file and a success message, or the
        original *input_path* and a warning when any step raises.
    """
    try:
        samples, rate = librosa.load(input_path, sr=None, mono=True)
        boosted = clarity_boost(samples, rate)
        levelled = librosa.util.normalize(boosted) * 0.95
        post_path = os.path.join(TEMP_DIR, "postprocessed.wav")
        sf.write(post_path, levelled, rate)
    except Exception as e:
        return input_path, f"⚠️ Postprocess Warning: {e}"
    return post_path, "✅ Postprocess Done"
-# 3. Pipeline
 def rvc_process_pipeline(
-    audio_path, model_file, index_file, pitch_change, f0_method,
-    index_rate, protect_val, filter_radius, resample_sr, envelope_mix, hop_length
 ):
-    if not audio_path or not model_file:
-        return None, "❌ Input missing"
     try:
-        clean_audio, log1 = preprocess_audio(audio_path)
-        rvc = RVCInference(device="cpu")
-        rvc.load_model(model_file.name)
-        rvc_out_path = os.path.join(TEMP_DIR, "rvc_output.wav")
-        if os.path.exists(rvc_out_path): os.remove(rvc_out_path)
-        sig = inspect.signature(rvc.infer_file)
-        params = sig.parameters
-        kwargs = {"input_path": clean_audio, "output_path": rvc_out_path}
-        if "pitch" in params: kwargs["pitch"] = int(pitch_change)
-        elif "f0_up_key" in params: kwargs["f0_up_key"] = int(pitch_change)
-        if "method" in params: kwargs["method"] = f0_method
-        elif "f0_method" in params: kwargs["f0_method"] = f0_method
-        if "index_path" in params and index_file: kwargs["index_path"] = index_file.name
-        if "index_rate" in params: kwargs["index_rate"] = float(index_rate)
-        if "protect" in params: kwargs["protect"] = float(protect_val)
-        if "filter_radius" in params: kwargs["filter_radius"] = int(filter_radius)
-        if "resample_sr" in params: kwargs["resample_sr"] = int(resample_sr)
-        if "rms_mix_rate" in params: kwargs["rms_mix_rate"] = float(envelope_mix)
-        if "hop_length" in params: kwargs["hop_length"] = int(hop_length)
-        print(f"Running: {kwargs}")
-        rvc.infer_file(**kwargs)
-        log2 = "✅ RVC Done"
-        final_output, log3 = postprocess_audio(rvc_out_path)
-        # --- اصلاح خط مشکل‌دار ---
-        full_log = "
-".join([str(log1), str(log2), str(log3)])
-        return final_output, full_log
     except Exception as e:
-        err = f"❌ Error: {traceback.format_exc()}"
-        print(err)
-        return None, err
-# 4. UI
# Gradio interface: inputs and the start button in the first column; result,
# log box and tuning sliders in the second.
with gr.Blocks(title="RVC Studio Pro", theme=gr.themes.Soft()) as demo:
    gr.Markdown("# 🎙️ RVC Studio Pro")
    with gr.Row():
        with gr.Column(scale=1):
            audio_in = gr.Audio(label="Input", type="filepath")
            with gr.Row():
                model_in = gr.File(label="Model", file_types=[".pth"])
                index_in = gr.File(label="Index", file_types=[".index"])
            pitch = gr.Slider(minimum=-24, maximum=24, value=0, step=1, label="Pitch")
            method = gr.Dropdown(
                choices=["rmvpe", "harvest", "crepe", "pm"],
                value="harvest",
                label="Algo",
            )
            btn = gr.Button("✨ Start", variant="primary")
        with gr.Column(scale=1):
            audio_out = gr.Audio(label="Output")
            status = gr.Textbox(label="Logs", lines=5)
            with gr.Accordion("Settings", open=True):
                with gr.Tab("Quality"):
                    index_rate = gr.Slider(minimum=0, maximum=1, value=0.3, label="Index Rate")
                    protect = gr.Slider(minimum=0, maximum=0.5, value=0.45, label="Protect")
                    filter_radius = gr.Slider(minimum=0, maximum=7, value=3, label="Filter Radius")
                with gr.Tab("Clarity"):
                    envelope_mix = gr.Slider(minimum=0, maximum=1, value=0.25, label="Vol Mix")
                    hop_length = gr.Slider(minimum=32, maximum=256, value=64, step=32, label="Hop Length")
                    resample_sr = gr.Slider(minimum=0, maximum=48000, value=40000, step=8000, label="Resample SR")

    # Listed in the positional order of rvc_process_pipeline's parameters.
    pipeline_inputs = [
        audio_in, model_in, index_in, pitch, method,
        index_rate, protect, filter_radius, resample_sr, envelope_mix, hop_length,
    ]
    btn.click(rvc_process_pipeline, inputs=pipeline_inputs, outputs=[audio_out, status])

if __name__ == "__main__":
    demo.queue().launch(server_name="0.0.0.0", server_port=7860)

 import os
 import sys
 import time
 import traceback
+import inspect
+import logging
+import shutil
+import subprocess
 import numpy as np
 import soundfile as sf
 import librosa
 import gradio as gr
+import scipy.signal as signal  # اضافه شده برای پردازش سیگنال حرفه‌ای
+from datetime import datetime
+# ==========================================
+# 1. تنظیمات اولیه و کتابخانه‌ها
+# ==========================================
print(">>> در حال راه‌اندازی سیستم RVC Pro Max...")

# Import the third-party stack; a missing package ends the process with
# exit code 1 after printing a hint to check requirements.txt.
try:
    import imageio_ffmpeg
    import static_ffmpeg
    from rvc_python.infer import RVCInference
    print("✅ کتابخانه‌های RVC با موفقیت بارگذاری شدند.")
except ImportError as e:
    print(f"❌ خطای بحرانی در ایمپورت: {e}")
    print("لطفاً requirements.txt را بررسی کنید.")
    sys.exit(1)

# Append the FFmpeg directory to PATH; a failure here is only a warning.
try:
    static_ffmpeg.add_paths()
    ffmpeg_exe = imageio_ffmpeg.get_ffmpeg_exe()
    os.environ["PATH"] = os.pathsep.join(
        (os.environ["PATH"], os.path.dirname(ffmpeg_exe))
    )
    print(f"✅ FFmpeg یافت شد: {ffmpeg_exe}")
except Exception as e:
    print(f"⚠️ هشدار FFmpeg: {e}")

# Scratch directory for intermediate files, exported as TEMP and TMPDIR.
TEMP_DIR = "/tmp/rvc_temp"
os.makedirs(TEMP_DIR, exist_ok=True)
os.environ.update({"TEMP": TEMP_DIR, "TMPDIR": TEMP_DIR})
+# ==========================================
+# 2. توابع پردازش صدا (Audio DSP)
+# ==========================================
def log_message(message):
    """Return *message* prefixed with the current local time as ``[HH:MM:SS]``."""
    return f"[{datetime.now():%H:%M:%S}] {message}"
def apply_clarity_eq(y, sr):
    """Apply a three-stage EQ intended to reduce nasal tone and add clarity.

    Stages, applied in order:
      1. Low cut: 4th-order Butterworth high-pass at 60 Hz.
      2. Mid cut: 2nd-order Butterworth band-stop over 800-1200 Hz, mixed
         30 % wet / 70 % dry so the cut stays gentle.
      3. High boost: the signal above 5 kHz (2nd-order Butterworth
         high-pass) added back at 15 %.

    A stage is skipped when its upper frequency is not below the Nyquist
    frequency (``sr / 2``), because the filter cannot be designed there.

    Args:
        y: 1-D array of audio samples.
        sr: Sample rate of *y* in Hz.

    Returns:
        The equalised samples.  If a stage raises, the error is printed and
        the signal as processed so far is returned.
    """
    try:
        nyquist = sr / 2.0

        # 1. High-pass: remove very low-frequency content.
        if 60 < nyquist:
            sos_hp = signal.butter(4, 60, 'hp', fs=sr, output='sos')
            y = signal.sosfilt(sos_hp, y)

        # 2. Soft mid cut around 1 kHz; dry/wet mix keeps it from sounding hollow.
        if 1200 < nyquist:
            sos_mid = signal.butter(2, [800, 1200], 'bandstop', fs=sr, output='sos')
            y_filtered = signal.sosfilt(sos_mid, y)
            y = (y * 0.7) + (y_filtered * 0.3)

        # 3. High boost: add 15 % of the content above 5 kHz back in.
        if 5000 < nyquist:
            sos_high = signal.butter(2, 5000, 'hp', fs=sr, output='sos')
            y_high = signal.sosfilt(sos_high, y)
            y = y + (y_high * 0.15)

        return y
    except Exception as e:
        print(f"EQ Error: {e}")
        return y
 def preprocess_audio(input_path):
     try:
+        y, sr = librosa.load(input_path, sr=None)
+        if y.ndim > 1:
+            y = librosa.to_mono(y)
+        # نرمال‌سازی استاندارد
+        y = librosa.util.normalize(y)
         processed_path = os.path.join(TEMP_DIR, "preprocessed.wav")
         sf.write(processed_path, y, sr)
+        return processed_path, f"✅ صدا پیش‌پردازش شد (SR: {sr}Hz)"
     except Exception as e:
+        return input_path, f"⚠️ پیش‌پردازش ناموفق: {e}"
def post_process_audio(input_path, clarity_boost=True):
    """Final processing pass: optional clarity EQ, then normalisation.

    The result is written next to the input as ``<stem>_final.wav``.  The
    name is built with ``os.path.splitext`` so that only the extension is
    replaced: ``str.replace(".wav", ...)`` rewrote every ``.wav`` occurrence
    in the path and, for a name without ``.wav``, produced the input path
    itself and overwrote the input.

    Args:
        input_path: Path of the audio file to process.
        clarity_boost: When true, run ``apply_clarity_eq`` on the samples.

    Returns:
        The path of the written file, or *input_path* when any step raises
        (the error is printed).
    """
    try:
        y, sr = librosa.load(input_path, sr=None)
        if clarity_boost:
            y = apply_clarity_eq(y, sr)
        # Final normalisation with headroom to avoid clipping.
        y = librosa.util.normalize(y) * 0.95
        stem, _ext = os.path.splitext(input_path)
        output_path = f"{stem}_final.wav"
        sf.write(output_path, y, sr)
        return output_path
    except Exception as e:
        # Best effort: report the problem and hand back the unprocessed file.
        print(f"Post-process Error: {e}")
        return input_path
def cleanup_temp():
    """Empty the scratch directory ``TEMP_DIR`` and make sure it exists.

    Unlike the previous version, the directory is also created when it was
    missing, and a failure to recreate it is printed rather than silently
    ignored.  The function still never raises.
    """
    try:
        # ignore_errors: a missing directory or an undeletable file is not fatal.
        shutil.rmtree(TEMP_DIR, ignore_errors=True)
        os.makedirs(TEMP_DIR, exist_ok=True)
    except OSError as e:
        print(f"Cleanup Error: {e}")
+# ==========================================
+# 3. موتور تبدیل صدا (RVC Engine)
+# ==========================================
 def rvc_process_pipeline(
+    audio_path, model_file, index_file,
+    pitch_change, f0_method, index_rate,
+    protect_val, filter_radius, resample_sr,
+    envelope_mix, hop_length,
+    enable_clarity
 ):
+    logs = []
+    logs.append(log_message("🚀 شروع عملیات تبدیل..."))
+    if not audio_path: return None, "❌ فایل صوتی انتخاب نشده است."
+    if not model_file: return None, "❌ فایل مدل انتخاب نشده است."
     try:
+        cleanup_temp()
+        model_path = model_file.name
+        index_path = index_file.name if index_file else None
+        # 1. پیش‌پردازش
+        clean_audio, msg = preprocess_audio(audio_path)
+        logs.append(log_message(msg))
+        # 2. لود مدل
+        logs.append(log_message(f"📂 مدل: {os.path.basename(model_path)}"))
+        rvc = RVCInference(device="cpu") # اگر GPU دارید "cuda" بگذارید
+        rvc.load_model(model_path)
+        output_temp = os.path.join(TEMP_DIR, f"rvc_out_{int(time.time())}.wav")
+        # 3. تنظیم پارامترها (بهینه‌سازی شده برای کیفیت)
+        kwargs = {
+            "input_path": clean_audio,
+            "output_path": output_temp,
+            "pitch": int(pitch_change),
+            "method": f0_method,
+            "index_path": index_path,
+            "index_rate": float(index_rate),
+            "protect": float(protect_val),
+            "filter_radius": int(filter_radius),
+            "resample_sr": int(resample_sr),
+            "rms_mix_rate": float(envelope_mix),
+            "hop_length": int(hop_length)
+        }
+        # بررسی پارامترهای معتبر تابع (برای جلوگیری از ارور نسخه‌های قدیمی)
+        sig = inspect.signature(rvc.infer_file)
+        valid_keys = sig.parameters.keys()
+        filtered_kwargs = {k: v for k, v in kwargs.items() if k in valid_keys or k == "pitch" or k == "method"}
+        # هندل کردن تغییر نام پارامترها در نسخه‌های مختلف
+        if "f0_up_key" in valid_keys and "pitch" in filtered_kwargs:
+            filtered_kwargs["f0_up_key"] = filtered_kwargs.pop("pitch")
+        if "f0_method" in valid_keys and "method" in filtered_kwargs:
+            filtered_kwargs["f0_method"] = filtered_kwargs.pop("method")
+        logs.append(log_message(f"⚙️ متد: {f0_method} | شفاف‌سازی: {'فعال' if enable_clarity else 'غیرفعال'}"))
+        # 4. اجرای تبدیل
+        start_time = time.time()
+        rvc.infer_file(**filtered_kwargs)
+        # 5. پس‌پردازش (شفاف‌سازی)
+        final_output = output_temp
+        if enable_clarity:
+            logs.append(log_message("✨ در حال اعمال فیلتر شفاف‌سازی و رفع تودماغی..."))
+            final_output = post_process_audio(output_temp, clarity_boost=True)
+        duration = time.time() - start_time
+        logs.append(log_message(f"✅ تمام شد! ({duration:.2f}s)"))
+        return final_output, "
+".join(logs)
     except Exception as e:
+        return None, f"❌ خطا: {traceback.format_exc()}"
+# ==========================================
+# 4. رابط کاربری (Gradio)
+# ==========================================
# Extra CSS: gradient styling for the run button and the UI font.
custom_css = """
#run_btn {background: linear-gradient(90deg, #FF5722 0%, #FF8A65 100%); color: white; border: none;}
.gradio-container {font-family: 'Tahoma', sans-serif;}
"""

# Gradio interface: inputs, algorithm choice and the run button in the first
# column; quality settings, result player and log box in the second.
with gr.Blocks(title="RVC Pro Persian", theme=gr.themes.Soft(), css=custom_css) as demo:
    gr.Markdown("## 🎙️ RVC Pro: مبدل صدای حرفه‌ای (رفع گنگی و تودماغی)")
    with gr.Row():
        with gr.Column():
            audio_input = gr.Audio(label="ورودی صدا", type="filepath")
            with gr.Row():
                model_input = gr.File(label="مدل (.pth)", file_types=[".pth"])
                index_input = gr.File(label="ایندکس (.index)", file_types=[".index"])
            # All offered pitch-extraction algorithms
            algo_dropdown = gr.Dropdown(
                choices=["rmvpe", "fcpe", "crepe", "harvest", "pm"],
                value="rmvpe",
                label="الگوریتم (RMVPE پیشنهاد می‌شود)",
                info="RMVPE: بهترین کیفیت | PM: سریع | Harvest: برای نت‌های پایین"
            )
            pitch_slider = gr.Slider(-24, 24, value=0, step=1, label="تغییر گام (Pitch)")
            btn_run = gr.Button("🚀 تبدیل صدا", elem_id="run_btn", variant="primary")
        with gr.Column():
            with gr.Accordion("تنظیمات کیفیت (رفع نویز و خش)", open=True):
                enable_clarity = gr.Checkbox(value=True, label="✨ فعال‌سازی شفاف‌کننده صدا (رفع تودماغی)")
                with gr.Row():
                    index_rate = gr.Slider(0, 1, value=0.4, step=0.05, label="تاثیر ایندکس", info="بیشتر = شبیه‌تر به مدل (اما شاید نویزی)")
                    # NOTE(review): the info text here contained U+FFFD
                    # replacement characters; the last word was restored as
                    # "مدل" (model) — confirm against the original file.
                    envelope_mix = gr.Slider(0, 1, value=0.25, step=0.05, label="میکس حجم (Volume Mix)", info="کمتر = شفاف‌تر (حجم مدل)")
                with gr.Row():
                    protect_val = gr.Slider(0, 0.5, value=0.33, step=0.01, label="محافظت (Protect)", info="0.33 استاندارد است")
                    filter_radius = gr.Slider(0, 7, value=3, step=1, label="فیلتر نرم‌کننده", info="3 = متعادل")
                with gr.Row():
                    resample_sr = gr.Slider(0, 48000, value=0, step=1000, label="ری‌سمپل", info="0 = بدون تغییر (پیشنهادی)")
                    hop_len = gr.Slider(1, 512, value=128, step=1, label="Hop Length", info="128 استاندارد")
            output_audio = gr.Audio(label="خروجی نهایی", type="filepath")
            logs = gr.Textbox(label="گزارش", lines=5)

    # Inputs are listed in the positional order of rvc_process_pipeline's
    # parameters; its two return values feed the player and the log box.
    btn_run.click(
        rvc_process_pipeline,
        inputs=[
            audio_input, model_input, index_input,
            pitch_slider, algo_dropdown, index_rate,
            protect_val, filter_radius, resample_sr,
            envelope_mix, hop_len, enable_clarity
        ],
        outputs=[output_audio, logs]
    )

if __name__ == "__main__":
    demo.queue().launch(server_name="0.0.0.0", server_port=7860)