Spaces:

OrangyDev
/

cctvoi

Runtime error

App Files Files Community

Vgjkmhf committed on Dec 5, 2025

Commit

3c44ab0

verified ·

1 Parent(s): 4b76478

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -81

app.py CHANGED Viewed

@@ -10,11 +10,11 @@ import numpy as np
 import soundfile as sf
 import librosa
 import gradio as gr
-import scipy.signal as signal  # اضافه شده برای پردازش سیگنال حرفه‌ای
 from datetime import datetime
 # ==========================================
-# 1. تنظیمات اولیه و کتابخانه‌ها
 # ==========================================
 print(">>> در حال راه‌اندازی سیستم RVC Pro Max...")
@@ -25,7 +25,6 @@ try:
     print("✅ کتابخانه‌های RVC با موفقیت بارگذاری شدند.")
 except ImportError as e:
     print(f"❌ خطای بحرانی در ایمپورت: {e}")
-    print("لطفاً requirements.txt را بررسی کنید.")
     sys.exit(1)
 # تنظیم مسیر FFmpeg
@@ -33,7 +32,6 @@ try:
     static_ffmpeg.add_paths()
     ffmpeg_exe = imageio_ffmpeg.get_ffmpeg_exe()
     os.environ["PATH"] += os.pathsep + os.path.dirname(ffmpeg_exe)
-    print(f"✅ FFmpeg یافت شد: {ffmpeg_exe}")
 except Exception as e:
     print(f"⚠️ هشدار FFmpeg: {e}")
@@ -43,7 +41,7 @@ os.environ["TEMP"] = TEMP_DIR
 os.environ["TMPDIR"] = TEMP_DIR
 # ==========================================
-# 2. توابع پردازش صدا (Audio DSP)
 # ==========================================
 def log_message(message):
@@ -51,33 +49,23 @@ def log_message(message):
     return f"[{timestamp}] {message}"
 def apply_clarity_eq(y, sr):
-    """
-    اعمال EQ برای رفع تودماغی و شفاف‌سازی صدا
-    1. Low-Cut: حذف هام (Hum) زیر 60Hz
-    2. Mid-Cut: کاهش فرکانس‌های تودماغی (800Hz - 1.2kHz)
-    3. High-Boost: افزایش فرکانس‌های شفاف (Air) بالای 6kHz
-    """
     try:
-        # 1. High-pass filter (حذف نویز خیلی بم)
         sos_hp = signal.butter(4, 60, 'hp', fs=sr, output='sos')
         y = signal.sosfilt(sos_hp, y)
-        # 2. Notch/Bell filter برای کاهش تودماغی (حدود 1000Hz)
-        # استفاده از فیلتر Peaking EQ معکوس
-        b, a = signal.iirpeak(1000, 1.0, fs=sr)
-        # اعمال معکوس (کاهش دامنه در این فرکانس) - پیاده‌سازی ساده‌تر با فیلتر باترورث بند-استاپ نرم
-        # اما اینجا یک ترفند ساده‌تر می‌زنیم: کاهش ملایم میدرنج
-        # یک فیلتر ساده برای کاهش ناحیه 1k
         sos_mid = signal.butter(2, [800, 1200], 'bandstop', fs=sr, output='sos')
-        # میکس کردن سیگنال فیلتر شده با اصلی (Dry/Wet) برای اینکه صدا توخالی نشود
         y_filtered = signal.sosfilt(sos_mid, y)
-        y = (y * 0.7) + (y_filtered * 0.3) # تاثیر ملایم
-        # 3. High Shelf Boost (شفافیت)
-        # بوست کردن فرکانس‌های بالای 5000 هرتز
         sos_high = signal.butter(2, 5000, 'hp', fs=sr, output='sos')
         y_high = signal.sosfilt(sos_high, y)
-        y = y + (y_high * 0.15) # افزودن 15% فرکانس بالا به سیگنال اصلی
         return y
     except Exception as e:
@@ -89,27 +77,19 @@ def preprocess_audio(input_path):
         y, sr = librosa.load(input_path, sr=None)
         if y.ndim > 1:
             y = librosa.to_mono(y)
-        # نرمال‌سازی استاندارد
         y = librosa.util.normalize(y)
         processed_path = os.path.join(TEMP_DIR, "preprocessed.wav")
         sf.write(processed_path, y, sr)
         return processed_path, f"✅ صدا پیش‌پردازش شد (SR: {sr}Hz)"
     except Exception as e:
-        return input_path, f"⚠️ پیش‌پردازش ناموفق: {e}"
 def post_process_audio(input_path, clarity_boost=True):
-    """پردازش نهایی برای کیفیت استودیویی"""
     try:
         y, sr = librosa.load(input_path, sr=None)
         if clarity_boost:
             y = apply_clarity_eq(y, sr)
-        # نرمال‌سازی نهایی (جلوگیری از Clipping)
         y = librosa.util.normalize(y) * 0.95
         output_path = input_path.replace(".wav", "_final.wav")
         sf.write(output_path, y, sr)
         return output_path
@@ -118,14 +98,13 @@ def post_process_audio(input_path, clarity_boost=True):
 def cleanup_temp():
     try:
-        if os.path.exists(TEMP_DIR):
-            shutil.rmtree(TEMP_DIR)
-            os.makedirs(TEMP_DIR)
     except Exception:
         pass
 # ==========================================
-# 3. موتور تبدیل صدا (RVC Engine)
 # ==========================================
 def rvc_process_pipeline(
@@ -138,26 +117,28 @@ def rvc_process_pipeline(
     logs = []
     logs.append(log_message("🚀 شروع عملیات تبدیل..."))
-    if not audio_path: return None, "❌ فایل صوتی انتخاب نشده است."
-    if not model_file: return None, "❌ فایل مدل انتخاب نشده است."
     try:
         cleanup_temp()
         model_path = model_file.name
         index_path = index_file.name if index_file else None
-        # 1. پیش‌پردازش
         clean_audio, msg = preprocess_audio(audio_path)
         logs.append(log_message(msg))
-        # 2. لود مدل
         logs.append(log_message(f"📂 مدل: {os.path.basename(model_path)}"))
-        rvc = RVCInference(device="cpu") # اگر GPU دارید "cuda" بگذارید
         rvc.load_model(model_path)
         output_temp = os.path.join(TEMP_DIR, f"rvc_out_{int(time.time())}.wav")
-        # 3. تنظیم پارامترها (بهینه‌سازی شده برای کیفیت)
         kwargs = {
             "input_path": clean_audio,
             "output_path": output_temp,
@@ -172,49 +153,54 @@ def rvc_process_pipeline(
             "hop_length": int(hop_length)
         }
-        # بررسی پارامترهای معتبر تابع (برای جلوگیری از ارور نسخه‌های قدیمی)
         sig = inspect.signature(rvc.infer_file)
         valid_keys = sig.parameters.keys()
-        filtered_kwargs = {k: v for k, v in kwargs.items() if k in valid_keys or k == "pitch" or k == "method"}
-        # هندل کردن تغییر نام پارامترها در نسخه‌های مختلف
-        if "f0_up_key" in valid_keys and "pitch" in filtered_kwargs:
-            filtered_kwargs["f0_up_key"] = filtered_kwargs.pop("pitch")
-        if "f0_method" in valid_keys and "method" in filtered_kwargs:
-            filtered_kwargs["f0_method"] = filtered_kwargs.pop("method")
-        logs.append(log_message(f"⚙️ متد: {f0_method} | شفاف‌سازی: {'فعال' if enable_clarity else 'غیرفعال'}"))
-        # 4. اجرای تبدیل
         start_time = time.time()
-        rvc.infer_file(**filtered_kwargs)
-        # 5. پس‌پردازش (شفاف‌سازی)
         final_output = output_temp
-        if enable_clarity:
-            logs.append(log_message("✨ در حال اعمال فیلتر شفاف‌سازی و رفع تودماغی..."))
             final_output = post_process_audio(output_temp, clarity_boost=True)
         duration = time.time() - start_time
         logs.append(log_message(f"✅ تمام شد! ({duration:.2f}s)"))
-        return final_output, "
 ".join(logs)
     except Exception as e:
-        return None, f"❌ خطا: {traceback.format_exc()}"
 # ==========================================
-# 4. رابط کاربری (Gradio)
 # ==========================================
 custom_css = """
 #run_btn {background: linear-gradient(90deg, #FF5722 0%, #FF8A65 100%); color: white; border: none;}
-.gradio-container {font-family: 'Tahoma', sans-serif;}
 """
 with gr.Blocks(title="RVC Pro Persian", theme=gr.themes.Soft(), css=custom_css) as demo:
-    gr.Markdown("## 🎙️ RVC Pro: مبدل صدای حرفه‌ای (رفع گنگی و تودماغی)")
     with gr.Row():
         with gr.Column():
@@ -223,33 +209,23 @@ with gr.Blocks(title="RVC Pro Persian", theme=gr.themes.Soft(), css=custom_css)
                 model_input = gr.File(label="مدل (.pth)", file_types=[".pth"])
                 index_input = gr.File(label="ایندکس (.index)", file_types=[".index"])
-            # تمام الگوریتم‌ها
             algo_dropdown = gr.Dropdown(
                 choices=["rmvpe", "fcpe", "crepe", "harvest", "pm"],
                 value="rmvpe",
-                label="الگوریتم (RMVPE پیشنهاد می‌شود)",
-                info="RMVPE: بهترین کیفیت | PM: سریع | Harvest: برای نت‌های پایین"
             )
-            pitch_slider = gr.Slider(-24, 24, value=0, step=1, label="تغییر گام (Pitch)")
             btn_run = gr.Button("🚀 تبدیل صدا", elem_id="run_btn", variant="primary")
         with gr.Column():
-            with gr.Accordion("تنظیمات کیفیت (رفع نویز و خش)", open=True):
-                enable_clarity = gr.Checkbox(value=True, label="✨ فعال‌سازی شفاف‌کننده صدا (رفع تودماغی)")
-                with gr.Row():
-                    index_rate = gr.Slider(0, 1, value=0.4, step=0.05, label="تاثیر ایندکس", info="بیشتر = شبیه‌تر به مدل (اما شاید نویزی)")
-                    envelope_mix = gr.Slider(0, 1, value=0.25, step=0.05, label="میکس حجم (Volume Mix)", info="کمتر = شفاف‌تر (حجم مدل)")
-                with gr.Row():
-                    protect_val = gr.Slider(0, 0.5, value=0.33, step=0.01, label="محافظت (Protect)", info="0.33 استاندارد است")
-                    filter_radius = gr.Slider(0, 7, value=3, step=1, label="فیلتر نرم‌کننده", info="3 = متعادل")
-                with gr.Row():
-                    resample_sr = gr.Slider(0, 48000, value=0, step=1000, label="ری‌سمپل", info="0 = بدون تغییر (پیشنهادی)")
-                    hop_len = gr.Slider(1, 512, value=128, step=1, label="Hop Length", info="128 استاندارد")
             output_audio = gr.Audio(label="خروجی نهایی", type="filepath")
             logs = gr.Textbox(label="گزارش", lines=5)

 import soundfile as sf
 import librosa
 import gradio as gr
+import scipy.signal as signal
 from datetime import datetime
 # ==========================================
+# 1. تنظیمات اولیه
 # ==========================================
 print(">>> در حال راه‌اندازی سیستم RVC Pro Max...")
     print("✅ کتابخانه‌های RVC با موفقیت بارگذاری شدند.")
 except ImportError as e:
     print(f"❌ خطای بحرانی در ایمپورت: {e}")
     sys.exit(1)
 # تنظیم مسیر FFmpeg
     static_ffmpeg.add_paths()
     ffmpeg_exe = imageio_ffmpeg.get_ffmpeg_exe()
     os.environ["PATH"] += os.pathsep + os.path.dirname(ffmpeg_exe)
 except Exception as e:
     print(f"⚠️ هشدار FFmpeg: {e}")
 os.environ["TMPDIR"] = TEMP_DIR
 # ==========================================
+# 2. توابع پردازش صدا (DSP)
 # ==========================================
 def log_message(message):
     return f"[{timestamp}] {message}"
 def apply_clarity_eq(y, sr):
+    """اعمال EQ برای شفاف‌سازی و رفع تودماغی"""
     try:
+        # 1. Low-Cut (حذف نویز زیر 60 هرتز)
         sos_hp = signal.butter(4, 60, 'hp', fs=sr, output='sos')
         y = signal.sosfilt(sos_hp, y)
+        # 2. کاهش فرکانس‌های تودماغی (حدود 1000 هرتز)
+        # فیلتر Band-stop ملایم
         sos_mid = signal.butter(2, [800, 1200], 'bandstop', fs=sr, output='sos')
         y_filtered = signal.sosfilt(sos_mid, y)
+        # ترکیب 30 درصد فیلتر شده با 70 درصد اصلی
+        y = (y * 0.7) + (y_filtered * 0.3)
+        # 3. High Boost (شفافیت)
         sos_high = signal.butter(2, 5000, 'hp', fs=sr, output='sos')
         y_high = signal.sosfilt(sos_high, y)
+        y = y + (y_high * 0.15)
         return y
     except Exception as e:
         y, sr = librosa.load(input_path, sr=None)
         if y.ndim > 1:
             y = librosa.to_mono(y)
         y = librosa.util.normalize(y)
         processed_path = os.path.join(TEMP_DIR, "preprocessed.wav")
         sf.write(processed_path, y, sr)
         return processed_path, f"✅ صدا پیش‌پردازش شد (SR: {sr}Hz)"
     except Exception as e:
+        return input_path, f"⚠️ خطا در پیش‌پردازش: {e}"
 def post_process_audio(input_path, clarity_boost=True):
     try:
         y, sr = librosa.load(input_path, sr=None)
         if clarity_boost:
             y = apply_clarity_eq(y, sr)
         y = librosa.util.normalize(y) * 0.95
         output_path = input_path.replace(".wav", "_final.wav")
         sf.write(output_path, y, sr)
         return output_path
 def cleanup_temp():
     try:
+        for f in os.listdir(TEMP_DIR):
+            os.remove(os.path.join(TEMP_DIR, f))
     except Exception:
         pass
 # ==========================================
+# 3. موتور تبدیل (اصلاح شده)
 # ==========================================
 def rvc_process_pipeline(
     logs = []
     logs.append(log_message("🚀 شروع عملیات تبدیل..."))
+    if not audio_path:
+        return None, "❌ فایل صوتی انتخاب نشده است."
+    if not model_file:
+        return None, "❌ فایل مدل انتخاب نشده است."
     try:
         cleanup_temp()
         model_path = model_file.name
         index_path = index_file.name if index_file else None
+        # پیش‌پردازش
         clean_audio, msg = preprocess_audio(audio_path)
         logs.append(log_message(msg))
+        # بارگذاری مدل
         logs.append(log_message(f"📂 مدل: {os.path.basename(model_path)}"))
+        rvc = RVCInference(device="cpu")
         rvc.load_model(model_path)
         output_temp = os.path.join(TEMP_DIR, f"rvc_out_{int(time.time())}.wav")
+        # پارامترها
         kwargs = {
             "input_path": clean_audio,
             "output_path": output_temp,
             "hop_length": int(hop_length)
         }
+        # فیلتر کردن پارامترهای نامعتبر برای جلوگیری از خطای نسخه
         sig = inspect.signature(rvc.infer_file)
         valid_keys = sig.parameters.keys()
+        final_kwargs = {}
+        for k, v in kwargs.items():
+            if k in valid_keys:
+                final_kwargs[k] = v
+            # نگاشت نام‌های قدیمی به جدید
+            elif k == "pitch" and "f0_up_key" in valid_keys:
+                final_kwargs["f0_up_key"] = v
+            elif k == "method" and "f0_method" in valid_keys:
+                final_kwargs["f0_method"] = v
+        logs.append(log_message(f"⚙️ متد: {f0_method}"))
         start_time = time.time()
+        rvc.infer_file(**final_kwargs)
+        # پس‌پردازش
         final_output = output_temp
+        if enable_clarity and os.path.exists(output_temp):
+            logs.append(log_message("✨ اعمال فیلتر شفاف‌سازی..."))
             final_output = post_process_audio(output_temp, clarity_boost=True)
         duration = time.time() - start_time
         logs.append(log_message(f"✅ تمام شد! ({duration:.2f}s)"))
+        # اینجا خطایی که داشتید رفع شده است:
+        log_text = "\n".join(logs)
+        return final_output, log_text
     except Exception as e:
+        err_msg = f"❌ خطا: {traceback.format_exc()}"
+        print(err_msg)
+        return None, err_msg
 # ==========================================
+# 4. رابط کاربری
 # ==========================================
 custom_css = """
 #run_btn {background: linear-gradient(90deg, #FF5722 0%, #FF8A65 100%); color: white; border: none;}
 """
 with gr.Blocks(title="RVC Pro Persian", theme=gr.themes.Soft(), css=custom_css) as demo:
+    gr.Markdown("## 🎙️ RVC Pro: مبدل صدای حرفه‌ای (اصلاح شده)")
     with gr.Row():
         with gr.Column():
                 model_input = gr.File(label="مدل (.pth)", file_types=[".pth"])
                 index_input = gr.File(label="ایندکس (.index)", file_types=[".index"])
             algo_dropdown = gr.Dropdown(
                 choices=["rmvpe", "fcpe", "crepe", "harvest", "pm"],
                 value="rmvpe",
+                label="الگوریتم"
             )
+            pitch_slider = gr.Slider(-24, 24, value=0, step=1, label="تغییر گام")
             btn_run = gr.Button("🚀 تبدیل صدا", elem_id="run_btn", variant="primary")
         with gr.Column():
+            with gr.Accordion("تنظیمات کیفیت", open=True):
+                enable_clarity = gr.Checkbox(value=True, label="رفع تودماغی (Clarity)")
+                index_rate = gr.Slider(0, 1, value=0.4, step=0.05, label="تاثیر ایندکس")
+                envelope_mix = gr.Slider(0, 1, value=0.25, step=0.05, label="Volume Mix")
+                protect_val = gr.Slider(0, 0.5, value=0.33, step=0.01, label="Protect")
+                filter_radius = gr.Slider(0, 7, value=3, step=1, label="Filter Radius")
+                resample_sr = gr.Slider(0, 48000, value=0, step=1000, label="Resample SR")
+                hop_len = gr.Slider(1, 512, value=128, step=1, label="Hop Length")
             output_audio = gr.Audio(label="خروجی نهایی", type="filepath")
             logs = gr.Textbox(label="گزارش", lines=5)