Spaces:

Hamed744
/

Ttspro

Paused

App Files Files Community

Hamed744 committed on Jul 10, 2025

Commit

4a4b4c1

verified ·

1 Parent(s): 2f4845f

Update app.py

Browse files

Files changed (1) hide show

app.py +52 -33

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# app.py - نسخه کامل و نهایی برای تمام اسپیس‌های Hugging Face
 import os
 import sys
@@ -15,8 +15,6 @@ from fastapi import FastAPI, HTTPException
 from pydantic import BaseModel
 from google import genai
 from google.genai import types
-# اضافه کردن uvicorn برای اجرا از داخل اسکریپت
 import uvicorn
 try:
@@ -25,10 +23,12 @@ try:
 except ImportError:
     PYDUB_AVAILABLE = False
-# --- پیکربندی لاگینگ ---
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s', datefmt='%Y-%m-%d %H:%M:%S')
-# --- START: تعریف تمام توابع کمکی ---
 # --- منطق مدیریت API Key ---
 ALL_API_KEYS: list[str] = []
@@ -42,14 +42,40 @@ def _init_api_keys():
         ALL_API_KEYS = [key.strip() for key in all_keys_string.split(',') if key.strip()]
     logging.info(f"✅ تعداد {len(ALL_API_KEYS)} کلید API جیمینای بارگذاری شد.")
     if not ALL_API_KEYS:
-        logging.warning("⛔️ هشدار: هیچ Secret با نام ALL_GEMINI_API_KEYS یافت نشد! برنامه بدون کلید API کار نخواهد کرد.")
 # --- ثابت‌ها ---
 FIXED_MODEL_NAME = "gemini-2.5-flash-preview-tts"
 DEFAULT_MAX_CHUNK_SIZE = 3800
 DEFAULT_SLEEP_BETWEEN_REQUESTS = 8
-# --- توابع کمکی فایل و صدا ---
 def save_binary_file(file_name, data):
     try:
         with open(file_name, "wb") as f: f.write(data)
@@ -57,7 +83,6 @@ def save_binary_file(file_name, data):
     except Exception as e:
         logging.error(f"❌ خطا در ذخیره فایل {file_name}: {e}")
         return None
 def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     parameters = parse_audio_mime_type(mime_type)
     bits_per_sample, rate = parameters["bits_per_sample"], parameters["rate"]
@@ -66,7 +91,6 @@ def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     byte_rate, chunk_size = rate * block_align, 36 + data_size
     header = struct.pack("<4sI4s4sIHHIIHH4sI", b"RIFF", chunk_size, b"WAVE", b"fmt ", 16, 1, num_channels, rate, byte_rate, block_align, bits_per_sample, b"data", data_size)
     return header + audio_data
 def parse_audio_mime_type(mime_type: str) -> dict[str, int]:
     bits, rate = 16, 24000
     for param in mime_type.split(";"):
@@ -78,7 +102,6 @@ def parse_audio_mime_type(mime_type: str) -> dict[str, int]:
             try: bits = int(param.split("L", 1)[1])
             except: pass
     return {"bits_per_sample": bits, "rate": rate}
 def smart_text_split(text, max_size=3800):
     if len(text) <= max_size: return [text]
     chunks, current_chunk = [], ""
@@ -95,7 +118,6 @@ def smart_text_split(text, max_size=3800):
     if current_chunk: chunks.append(current_chunk.strip())
     final_chunks = [c for c in chunks if c]
     return final_chunks
 def merge_audio_files_func(file_paths, output_path):
     if not PYDUB_AVAILABLE: logging.warning("⚠️ pydub برای ادغام در دسترس نیست."); return False
     try:
@@ -106,39 +128,45 @@ def merge_audio_files_func(file_paths, output_path):
         combined.export(output_path, format="wav")
         return True
     except Exception as e: logging.error(f"❌ خطا در ادغام فایل‌های صوتی: {e}"); return False
-def get_next_api_key():
-    global NEXT_KEY_INDEX, ALL_API_KEYS, KEY_LOCK
-    with KEY_LOCK:
-        if not ALL_API_KEYS: return None, None
-        key_to_use = ALL_API_KEYS[NEXT_KEY_INDEX % len(ALL_API_KEYS)]
-        key_display_index = (NEXT_KEY_INDEX % len(ALL_API_KEYS)) + 1
-        NEXT_KEY_INDEX += 1
-        return key_to_use, key_display_index
-# --- منطق اصلی تولید صدا ---
 def generate_audio_chunk_with_retry(chunk_text, prompt_text, voice, temp, session_id):
     if not ALL_API_KEYS: raise Exception("هیچ کلید API برای پردازش در دسترس نیست.")
     for _ in range(len(ALL_API_KEYS)):
-        selected_api_key, key_idx_display = get_next_api_key()
-        if not selected_api_key: break
         logging.info(f"[{session_id}] ⚙️ تلاش برای تولید قطعه با کلید API شماره {key_idx_display}")
         try:
-            client = genai.Client(api_key=selected_api_key)
             final_text = f'"{prompt_text}"\n{chunk_text}' if prompt_text and prompt_text.strip() else chunk_text
             contents = [types.Content(role="user", parts=[types.Part.from_text(text=final_text)])]
             config = types.GenerateContentConfig(temperature=temp, response_modalities=["audio"],
                 speech_config=types.SpeechConfig(voice_config=types.VoiceConfig(
                     prebuilt_voice_config=types.PrebuiltVoiceConfig(voice_name=voice))))
             response = client.models.generate_content(model=FIXED_MODEL_NAME, contents=contents, config=config)
             if response.candidates and response.candidates[0].content and response.candidates[0].content.parts and response.candidates[0].content.parts[0].inline_data:
                 logging.info(f"[{session_id}] ✅ قطعه با موفقیت توسط کلید شماره {key_idx_display} تولید شد.")
                 return response.candidates[0].content.parts[0].inline_data
         except Exception as e:
             logging.error(f"[{session_id}] ❌ خطا در تولید قطعه با کلید شماره {key_idx_display}: {e}.")
     return None
 def core_generate_audio(text_input, prompt_input, selected_voice, temperature_val, session_id):
     logging.info(f"[{session_id}] 🚀 شروع فرآیند تولید صدا.")
     temp_dir = f"temp_{session_id}"
     os.makedirs(temp_dir, exist_ok=True)
@@ -179,9 +207,6 @@ def core_generate_audio(text_input, prompt_input, selected_voice, temperature_va
         if os.path.exists(temp_dir):
             shutil.rmtree(temp_dir)
-# --- END: تعریف تمام توابع کمکی ---
 # --- اجرای کدهای اولیه برنامه ---
 _init_api_keys()
@@ -221,12 +246,6 @@ def health_check():
 logging.info("✅✅✅ Application logic initialized successfully. Starting Uvicorn server...")
-# --- START: بخش جدید برای اجرای سرور ---
 if __name__ == "__main__":
-    # پورت را از متغیرهای محیطی هاگینگ فیس یا به صورت پیش‌فرض 7860 بخوان
     port = int(os.environ.get("PORT", 7860))
-    # اجرای سرور Uvicorn از داخل کد پایتون
-    # reload=False برای محیط production مهم است
-    uvicorn.run(app, host="0.0.0.0", port=port, reload=False)
-# --- END: بخش جدید برای اجرای سرور ---

+# app.py - نسخه کامل و بهینه‌سازی شده برای پایداری بالا
 import os
 import sys
 from pydantic import BaseModel
 from google import genai
 from google.genai import types
 import uvicorn
 try:
 except ImportError:
     PYDUB_AVAILABLE = False
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s', datefmt='%Y-%m-%d %H:%M:%S')
+# --- START: new section for efficient client management ---
+GEMINI_CLIENTS_CACHE = {} # dictionary used to cache clients, keyed by API key
+CLIENT_CACHE_LOCK = threading.Lock() # lock for safe access to the cache
+# --- END: new section ---
 # --- منطق مدیریت API Key ---
 ALL_API_KEYS: list[str] = []
         ALL_API_KEYS = [key.strip() for key in all_keys_string.split(',') if key.strip()]
     logging.info(f"✅ تعداد {len(ALL_API_KEYS)} کلید API جیمینای بارگذاری شد.")
     if not ALL_API_KEYS:
+        logging.warning("⛔️ هشدار: هیچ Secret با نام ALL_GEMINI_API_KEYS یافت نشد!")
+def get_next_api_key_and_client():
+    """
+    Pick the next API key in round-robin order and return it with its client.
+
+    The client is taken from GEMINI_CLIENTS_CACHE when one already exists for
+    the selected key; otherwise a new genai.Client is created and cached.
+
+    Returns:
+        A tuple (api_key, client, display_index), where display_index is the
+        1-based position of the key in ALL_API_KEYS. When ALL_API_KEYS is
+        empty the tuple is (None, None, -1).
+    """
+    # NEXT_KEY_INDEX is rebound below, so it must be declared global here;
+    # without the declaration Python treats it as a local and the first read
+    # raises UnboundLocalError.
+    global NEXT_KEY_INDEX
+    with KEY_LOCK:
+        if not ALL_API_KEYS:
+            return None, None, -1
+        current_index = NEXT_KEY_INDEX % len(ALL_API_KEYS)
+        key_to_use = ALL_API_KEYS[current_index]
+        key_display_index = current_index + 1
+        NEXT_KEY_INDEX += 1
+    # Now that a key is selected, fetch its client from the cache.
+    with CLIENT_CACHE_LOCK:
+        if key_to_use in GEMINI_CLIENTS_CACHE:
+            # A cached client exists for this key: reuse it.
+            client = GEMINI_CLIENTS_CACHE[key_to_use]
+        else:
+            # No cached client yet: build one and store it for later calls.
+            logging.info(f"Creating new Gemini client for key ending in ...{key_to_use[-4:]}")
+            client = genai.Client(api_key=key_to_use)
+            GEMINI_CLIENTS_CACHE[key_to_use] = client
+    return key_to_use, client, key_display_index
 # --- ثابت‌ها ---
 FIXED_MODEL_NAME = "gemini-2.5-flash-preview-tts"
 DEFAULT_MAX_CHUNK_SIZE = 3800
 DEFAULT_SLEEP_BETWEEN_REQUESTS = 8
+# ... (توابع کمکی دیگر مثل save_binary_file, convert_to_wav و ... بدون تغییر اینجا قرار می‌گیرند) ...
 def save_binary_file(file_name, data):
     try:
         with open(file_name, "wb") as f: f.write(data)
     except Exception as e:
         logging.error(f"❌ خطا در ذخیره فایل {file_name}: {e}")
         return None
 def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     parameters = parse_audio_mime_type(mime_type)
     bits_per_sample, rate = parameters["bits_per_sample"], parameters["rate"]
     byte_rate, chunk_size = rate * block_align, 36 + data_size
     header = struct.pack("<4sI4s4sIHHIIHH4sI", b"RIFF", chunk_size, b"WAVE", b"fmt ", 16, 1, num_channels, rate, byte_rate, block_align, bits_per_sample, b"data", data_size)
     return header + audio_data
 def parse_audio_mime_type(mime_type: str) -> dict[str, int]:
     bits, rate = 16, 24000
     for param in mime_type.split(";"):
             try: bits = int(param.split("L", 1)[1])
             except: pass
     return {"bits_per_sample": bits, "rate": rate}
 def smart_text_split(text, max_size=3800):
     if len(text) <= max_size: return [text]
     chunks, current_chunk = [], ""
     if current_chunk: chunks.append(current_chunk.strip())
     final_chunks = [c for c in chunks if c]
     return final_chunks
 def merge_audio_files_func(file_paths, output_path):
     if not PYDUB_AVAILABLE: logging.warning("⚠️ pydub برای ادغام در دسترس نیست."); return False
     try:
         combined.export(output_path, format="wav")
         return True
     except Exception as e: logging.error(f"❌ خطا در ادغام فایل‌های صوتی: {e}"); return False
+# ... (پایان توابع کمکی) ...
+# --- منطق اصلی تولید صدا (با استفاده از Client کش شده) ---
 def generate_audio_chunk_with_retry(chunk_text, prompt_text, voice, temp, session_id):
+    """
+    Generate audio for one text chunk, trying a different API key per attempt.
+
+    Makes at most len(ALL_API_KEYS) attempts. Each attempt obtains a key and
+    its client from get_next_api_key_and_client() and calls generate_content
+    on FIXED_MODEL_NAME with the requested voice and temperature. When
+    prompt_text is non-blank it is placed in double quotes on its own line
+    ahead of chunk_text.
+
+    Returns:
+        The inline_data of the first part of the first response candidate, or
+        None when no attempt produced audio.
+
+    Raises:
+        Exception: if ALL_API_KEYS is empty.
+    """
     if not ALL_API_KEYS: raise Exception("هیچ کلید API برای پردازش در دسترس نیست.")
     for _ in range(len(ALL_API_KEYS)):
+        # Main change: fetch the key and its client together.
+        selected_api_key, client, key_idx_display = get_next_api_key_and_client()
+        if not client:
+            break
         logging.info(f"[{session_id}] ⚙️ تلاش برای تولید قطعه با کلید API شماره {key_idx_display}")
         try:
+            # No need to build a new client here anymore.
             final_text = f'"{prompt_text}"\n{chunk_text}' if prompt_text and prompt_text.strip() else chunk_text
             contents = [types.Content(role="user", parts=[types.Part.from_text(text=final_text)])]
             config = types.GenerateContentConfig(temperature=temp, response_modalities=["audio"],
                 speech_config=types.SpeechConfig(voice_config=types.VoiceConfig(
                     prebuilt_voice_config=types.PrebuiltVoiceConfig(voice_name=voice))))
             response = client.models.generate_content(model=FIXED_MODEL_NAME, contents=contents, config=config)
             if response.candidates and response.candidates[0].content and response.candidates[0].content.parts and response.candidates[0].content.parts[0].inline_data:
                 logging.info(f"[{session_id}] ✅ قطعه با موفقیت توسط کلید شماره {key_idx_display} تولید شد.")
                 return response.candidates[0].content.parts[0].inline_data
         except Exception as e:
             logging.error(f"[{session_id}] ❌ خطا در تولید قطعه با کلید شماره {key_idx_display}: {e}.")
+            # If the error is authentication-related, drop the client from the cache so it is rebuilt next time.
+            if "authentication" in str(e).lower():
+                with CLIENT_CACHE_LOCK:
+                    if selected_api_key in GEMINI_CLIENTS_CACHE:
+                        del GEMINI_CLIENTS_CACHE[selected_api_key]
+                        logging.warning(f"Client for key ...{selected_api_key[-4:]} removed from cache due to auth error.")
     return None
 def core_generate_audio(text_input, prompt_input, selected_voice, temperature_val, session_id):
+    # این تابع بدون تغییر باقی می‌ماند
     logging.info(f"[{session_id}] 🚀 شروع فرآیند تولید صدا.")
     temp_dir = f"temp_{session_id}"
     os.makedirs(temp_dir, exist_ok=True)
         if os.path.exists(temp_dir):
             shutil.rmtree(temp_dir)
 # --- اجرای کدهای اولیه برنامه ---
 _init_api_keys()
 logging.info("✅✅✅ Application logic initialized successfully. Starting Uvicorn server...")
 if __name__ == "__main__":
+    # Read the port from the PORT environment variable, defaulting to 7860.
     port = int(os.environ.get("PORT", 7860))
+    # Start the Uvicorn server from inside the script, with auto-reload disabled.
+    uvicorn.run(app, host="0.0.0.0", port=port, reload=False)