Spaces:

Opera8
/

Podgen2

Paused

App Files Files Community

Opera8 committed on May 11

Commit

77e328d

verified ·

1 Parent(s): 53b65bd

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -20

app.py CHANGED Viewed

@@ -115,11 +115,11 @@ def get_user_ip():
         return request.headers.getlist("X-Forwarded-For")[0].split(',')[0].strip()
     return request.remote_addr
-# --- TTS HELPER FUNCTIONS (تمیزکننده و سازنده پرقدرت) ---
 def call_worker(index, chunk_payload):
     raw_text = chunk_payload.get("text", "")
-    # 🔴 پاکسازی متن از تمام کاراکترهای سمی (مارک‌داون، براکت و ...)
     clean_text = re.sub(r'[*_`~#]', '', raw_text)
     clean_text = re.sub(r'\[.*?\]|\(.*?\)', '', clean_text)
     clean_text = clean_text.strip()
@@ -142,8 +142,7 @@ def call_worker(index, chunk_payload):
         "fallback_to_live": True
     }
-    # تلاش مستمر و بدون جا انداختن حتی یک کلمه
-    max_attempts = 50
     for attempt in range(max_attempts):
         workers = list(WORKER_URLS)
@@ -172,8 +171,7 @@ def call_worker(index, chunk_payload):
         logging.warning(f"🔄 [قطعه {index+1}] کارگرها شلوغ/خطا دادند. استراحت به مدت {sleep_time:.1f} ثانیه...")
         time.sleep(sleep_time)
-    # اگر بعد از 50 بار ساخته نشد، ارور صادر میکنه تا پادکست ناقص نمونه
-    raise ValueError(f"قطعه {index+1} پس از 50 بار تلاش ساخته نشد.")
 # --- AI PODCAST SCRIPT LOGIC (Cohere Labs Space) ---
 def generate_podcast_in_background(task_id, system_prompt, safety_settings):
@@ -246,30 +244,30 @@ def generate_podcast_in_background(task_id, system_prompt, safety_settings):
     except Exception as e:
         with tasks_lock: tasks[task_id].update({'status': 'failed', 'error': str(e)})
-# --- FULL AUTO PODCAST LOGIC (پردازش دسته‌ای 7تایی) ---
 def generate_full_podcast_audio_background(task_id, prompt, speakers):
     try:
         logging.info(f"🚀 [پروژه {task_id}] عملیات ساخت پادکست آغاز شد.")
         with tasks_lock:
             tasks[task_id] = {'status': 'writing_script', 'progress': 'در حال نگارش سناریو...'}
         spk_text = "\n".join([f"- {s['id']}: {s['name']}" for s in speakers])
-        # 🔴 پرامپت دقیقاً منطبق با سایت شد + دستور اکید برای نوشتن فقط به زبان فارسی تا کارگر ارور نده
         system_prompt = f"""Act as a Professional Podcast Producer.
 Topic: "{prompt}"
 Speakers Available:
 {spk_text}
-CRITICAL INSTRUCTION: You must create a VERY LONG, in-depth, and highly detailed podcast script.
-- Do NOT write a short summary.
-- The conversation must deeply explore the topic. Make it a very long and detailed conversation, as long as necessary to fully cover the topic.
-- Make the dialogue engaging and informative.
-- 🔴 IMPORTANT: Write the ENTIRE script ONLY in Persian (Farsi) language. Do NOT use English characters.
 Output ONLY valid JSON.
-Format: {{"selected_speakers": ["id1", "id2"], "script": [{{"speaker_id": "id1", "dialogue": "..."}}]}}
-Dialogue rules: No stage directions like [laugh], (sigh). Just spoken words."""
         AYA_SPACE_URL = "https://coherelabs-aya-expanse.hf.space/gradio_api"
         MAX_ATTEMPTS = 50
@@ -320,7 +318,6 @@ Dialogue rules: No stage directions like [laugh], (sigh). Just spoken words."""
         for t in data["script"]:
             if "dialogue" in t: t["dialogue"] = re.sub(r'\[.*?\]|\(.*?\)', '', t["dialogue"]).strip()
-        # فقط نوبت‌هایی که متن دارن رو پردازش می‌کنیم
         script_turns = [t for t in data.get("script", []) if str(t.get("dialogue", "")).strip()]
         total_turns = len(script_turns)
@@ -333,15 +330,28 @@ Dialogue rules: No stage directions like [laugh], (sigh). Just spoken words."""
         completed_count = 0
         def process_single_chunk(index, turn_data):
-            speaker_id = turn_data.get("speaker_id")
             dialogue = turn_data.get("dialogue")
-            payload = {"text": dialogue, "speaker": speaker_id, "temperature": 0.9, "is_custom": False}
             idx, audio_seg = call_worker(index, payload)
             if audio_seg is None:
                 raise ValueError(f"خطا در تولید صدای نوبت {index+1}")
             return idx, audio_seg
-        # 🌟 استراتژی طلایی دسته‌بندی (7 تا 7 تا) که پیشنهاد خودت بود 🌟
         batch_size = 7
         batches = [script_turns[i:i + batch_size] for i in range(0, total_turns, batch_size)]
@@ -502,7 +512,7 @@ def create_full_podcast():
         safety = [{"category": c, "threshold": "BLOCK_NONE"} for c in ["HARM_CATEGORY_HARASSMENT", "HARM_CATEGORY_HATE_SPEECH", "HARM_CATEGORY_SEXUALLY_EXPLICIT", "HARM_CATEGORY_DANGEROUS_CONTENT"]]
         spk_text = "\n".join([f"- {s['id']}: {s['name']}" for s in speakers])
-        sys_prompt = f"""Act as a Professional Podcast Producer.\nTopic: "{prompt}"\nSpeakers Available:\n{spk_text}\nCRITICAL INSTRUCTION: You must create a VERY LONG, in-depth, and highly detailed podcast script.\n- Do NOT write a short summary.\n- The conversation must deeply explore the topic.\n- Make the dialogue engaging and informative.\n- 🔴 IMPORTANT: Write the ENTIRE script ONLY in Persian (Farsi) language. Do NOT use English characters.\n\nOutput ONLY valid JSON.\nFormat: {{"selected_speakers": ["id1", "id2"], "script": [{{"speaker_id": "id1", "dialogue": "..."}}]}}\nDialogue rules: No stage directions like [laugh], (sigh). Just spoken words."""
         threading.Thread(target=generate_podcast_in_background, args=(task_id, sys_prompt, safety)).start()
         return jsonify({"task_id": task_id}), 202

         return request.headers.getlist("X-Forwarded-For")[0].split(',')[0].strip()
     return request.remote_addr
+# --- TTS HELPER FUNCTIONS ---
 def call_worker(index, chunk_payload):
     raw_text = chunk_payload.get("text", "")
+    # پاکسازی متن از براکت‌ها و کاراکترهای مخرب
     clean_text = re.sub(r'[*_`~#]', '', raw_text)
     clean_text = re.sub(r'\[.*?\]|\(.*?\)', '', clean_text)
     clean_text = clean_text.strip()
         "fallback_to_live": True
     }
+    max_attempts = 40
     for attempt in range(max_attempts):
         workers = list(WORKER_URLS)
         logging.warning(f"🔄 [قطعه {index+1}] کارگرها شلوغ/خطا دادند. استراحت به مدت {sleep_time:.1f} ثانیه...")
         time.sleep(sleep_time)
+    raise ValueError(f"قطعه {index+1} پس از 40 بار تلاش ساخته نشد.")
 # --- AI PODCAST SCRIPT LOGIC (Cohere Labs Space) ---
 def generate_podcast_in_background(task_id, system_prompt, safety_settings):
     except Exception as e:
         with tasks_lock: tasks[task_id].update({'status': 'failed', 'error': str(e)})
+# --- FULL AUTO PODCAST LOGIC ---
 def generate_full_podcast_audio_background(task_id, prompt, speakers):
     try:
         logging.info(f"🚀 [پروژه {task_id}] عملیات ساخت پادکست آغاز شد.")
         with tasks_lock:
             tasks[task_id] = {'status': 'writing_script', 'progress': 'در حال نگارش سناریو...'}
+        valid_speaker_ids = [str(s['id']).strip() for s in speakers]
+        default_speaker_id = valid_speaker_ids[0] if valid_speaker_ids else "Charon"
         spk_text = "\n".join([f"- {s['id']}: {s['name']}" for s in speakers])
         system_prompt = f"""Act as a Professional Podcast Producer.
 Topic: "{prompt}"
 Speakers Available:
 {spk_text}
+CRITICAL INSTRUCTIONS:
+1. Create a VERY LONG, in-depth, and highly detailed podcast script.
+2. STRICT RULE: Keep EVERY SINGLE dialogue line SHORT. If a speaker has a lot to say, BREAK their speech into multiple separate, consecutive turns for that SAME speaker.
+3. NO stage directions, NO emojis, NO brackets like [laugh] or (sigh). Plain spoken text ONLY.
 Output ONLY valid JSON.
+Format: {{"selected_speakers": ["id1", "id2"], "script": [{{"speaker_id": "id1", "dialogue": "..."}}]}}"""
         AYA_SPACE_URL = "https://coherelabs-aya-expanse.hf.space/gradio_api"
         MAX_ATTEMPTS = 50
         for t in data["script"]:
             if "dialogue" in t: t["dialogue"] = re.sub(r'\[.*?\]|\(.*?\)', '', t["dialogue"]).strip()
         script_turns = [t for t in data.get("script", []) if str(t.get("dialogue", "")).strip()]
         total_turns = len(script_turns)
         completed_count = 0
         def process_single_chunk(index, turn_data):
+            # 🔴 سیستم هوشمند جایگزینی گوینده (شبیه‌سازی کامل رفتار سایت)
+            raw_speaker_id = str(turn_data.get("speaker_id", "")).strip()
+            final_speaker_id = raw_speaker_id
+            if final_speaker_id not in valid_speaker_ids:
+                found = False
+                for v_id in valid_speaker_ids:
+                    if final_speaker_id.lower() == v_id.lower():
+                        final_speaker_id = v_id
+                        found = True
+                        break
+                if not found:
+                    logging.warning(f"⚠️ آیدی گوینده نامعتبر '{raw_speaker_id}' تشخیص داده شد. جایگزین شد با '{default_speaker_id}'.")
+                    final_speaker_id = default_speaker_id
             dialogue = turn_data.get("dialogue")
+            payload = {"text": dialogue, "speaker": final_speaker_id, "temperature": 0.9, "is_custom": False}
             idx, audio_seg = call_worker(index, payload)
             if audio_seg is None:
                 raise ValueError(f"خطا در تولید صدای نوبت {index+1}")
             return idx, audio_seg
         batch_size = 7
         batches = [script_turns[i:i + batch_size] for i in range(0, total_turns, batch_size)]
         safety = [{"category": c, "threshold": "BLOCK_NONE"} for c in ["HARM_CATEGORY_HARASSMENT", "HARM_CATEGORY_HATE_SPEECH", "HARM_CATEGORY_SEXUALLY_EXPLICIT", "HARM_CATEGORY_DANGEROUS_CONTENT"]]
         spk_text = "\n".join([f"- {s['id']}: {s['name']}" for s in speakers])
+        sys_prompt = f"""Act as a Professional Podcast Producer.\nTopic: "{prompt}"\nSpeakers Available:\n{spk_text}\nCRITICAL INSTRUCTIONS:\n1. Create a VERY LONG, in-depth podcast script.\n2. Keep EVERY dialogue line SHORT. Break long speeches into multiple consecutive turns for the same speaker.\n3. NO stage directions, NO emojis, NO brackets. Plain text ONLY.\n\nOutput ONLY valid JSON.\nFormat: {{"selected_speakers": ["id1", "id2"], "script": [{{"speaker_id": "id1", "dialogue": "..."}}]}}"""
         threading.Thread(target=generate_podcast_in_background, args=(task_id, sys_prompt, safety)).start()
         return jsonify({"task_id": task_id}), 202