Spaces:

pbichpur
/

NotebookLMClone

Running

App Files Files Community

github-actions[bot] committed 18 days ago

Commit

ea7dc28

1 Parent(s): 62f0a86

Sync from GitHub 568a6a97b4e0075c2edef972568daa49f4f256c0

Browse files

Files changed (3) hide show

frontend/app.py +20 -0
src/artifacts/podcast_generator.py +23 -0
src/artifacts/tts_adapter.py +31 -3

frontend/app.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from __future__ import annotations
 import os
 from typing import Any
 import requests
@@ -693,6 +694,12 @@ elif page == "Notebooks":
                     if ok and isinstance(artifact_result, list):
                         artifacts = artifact_result
                         if artifacts:
                             st.dataframe(artifacts, use_container_width=True)
                             artifact_options = {
                                 f"{a['id']} - {a.get('type', 'unknown')} - {a.get('status', '')}": a
@@ -756,6 +763,19 @@ elif page == "Notebooks":
                                     st.info(f"Podcast status: {artifact_status}")
                             else:
                                 st.info("Select an artifact to preview.")
                         else:
                             st.info("No artifacts generated yet.")
                     else:

 from __future__ import annotations
 import os
+import time
 from typing import Any
 import requests
                     if ok and isinstance(artifact_result, list):
                         artifacts = artifact_result
                         if artifacts:
+                            auto_refresh_key = f"auto_refresh_artifacts_{selected_notebook_id}"
+                            auto_refresh = st.checkbox(
+                                "Auto-refresh while artifacts are processing",
+                                value=bool(st.session_state.get(auto_refresh_key, True)),
+                                key=auto_refresh_key,
+                            )
                             st.dataframe(artifacts, use_container_width=True)
                             artifact_options = {
                                 f"{a['id']} - {a.get('type', 'unknown')} - {a.get('status', '')}": a
                                     st.info(f"Podcast status: {artifact_status}")
                             else:
                                 st.info("Select an artifact to preview.")
+                            in_flight = sum(
+                                1
+                                for a in artifacts
+                                if str(a.get("status", "")).lower() in {"pending", "processing"}
+                            )
+                            if auto_refresh and in_flight > 0:
+                                st.caption(
+                                    f"{in_flight} artifact(s) still processing. "
+                                    "Refreshing in 4 seconds..."
+                                )
+                                time.sleep(4)
+                                st.rerun()
                         else:
                             st.info("No artifacts generated yet.")
                     else:

src/artifacts/podcast_generator.py CHANGED Viewed

@@ -426,6 +426,26 @@ IMPORTANT:
 - Make it sound like a real conversation, not a lecture
 """
     def _synthesize_segments(
         self,
         script: List[Dict[str, str]],
@@ -477,6 +497,9 @@ IMPORTANT:
                 )
                 self._last_tts_errors.append(error_detail)
                 print(f"  ⚠️  Failed {error_detail}")
                 continue
         return audio_files

 - Make it sound like a real conversation, not a lecture
 """
+    @staticmethod
+    def _is_fatal_tts_error(exc: Exception) -> bool:
+        """
+        Detect provider/configuration errors where retrying further segments is pointless.
+
+        The check is a plain substring match on the exception's message, so it
+        depends on the provider's error wording rather than on exception types.
+
+        Args:
+            exc: The exception raised while synthesizing a segment.
+
+        Returns:
+            True if the lowercased, whitespace-normalized message contains any
+            of the fatal markers listed below; False otherwise.
+        """
+        # Lowercase and collapse every whitespace run to a single space so that
+        # multi-word markers (e.g. "status_code: 401") match regardless of
+        # casing or line breaks in the original message.
+        text = " ".join(str(exc).lower().split())
+        # Markers are matched as substrings, so short ones such as "quota" or
+        # "authentication" match any message that merely contains the word.
+        fatal_markers = [
+            "voice_not_found",
+            "no compatible elevenlabs synthesis method found",
+            "invalid_api_key",
+            "unauthorized",
+            "authentication",
+            "forbidden",
+            "insufficient_credits",
+            "quota",
+            "status_code: 401",
+            "status_code: 403",
+        ]
+        return any(marker in text for marker in fatal_markers)
     def _synthesize_segments(
         self,
         script: List[Dict[str, str]],
                 )
                 self._last_tts_errors.append(error_detail)
                 print(f"  ⚠️  Failed {error_detail}")
+                if self._is_fatal_tts_error(e):
+                    print("  ⛔ Fatal TTS configuration/provider error detected. Stopping remaining segments.")
+                    break
                 continue
         return audio_files

src/artifacts/tts_adapter.py CHANGED Viewed

@@ -12,6 +12,20 @@ load_dotenv()
 # TTS Provider type
 TTSProvider = Literal["openai", "elevenlabs", "edge"]
 class TTSAdapter(ABC):
     """Base class for TTS providers."""
@@ -76,13 +90,27 @@ class ElevenLabsTTS(TTSAdapter):
     def _load_voice_aliases(self) -> dict[str, str]:
         """Best-effort map of configured voice names to voice IDs."""
         try:
-            response = self.client.voices.get_all()
             voices = getattr(response, "voices", response)
         except Exception:
-            return {}
-        aliases: dict[str, str] = {}
         for voice in voices or []:
             if isinstance(voice, dict):
                 name = voice.get("name")

 # TTS Provider type
 TTSProvider = Literal["openai", "elevenlabs", "edge"]
+# Common ElevenLabs preset voice name -> voice_id mapping.
+# This allows env values like "Rachel"/"Antoni" to work with SDK methods that require voice_id.
+# Keys are stored lowercase. NOTE(review): lookups presumably lowercase the
+# configured name before consulting this table -- confirm at the call site.
+# `_load_voice_aliases` copies this dict as its starting alias map.
+ELEVENLABS_PRESET_VOICE_IDS: dict[str, str] = {
+    "rachel": "21m00Tcm4TlvDq8ikWAM",
+    "domi": "AZnzlk1XvdvUeBnXmlld",
+    "bella": "EXAVITQu4vr4xnSDxMaL",
+    "antoni": "ErXwobaYiN019PkySvjV",
+    "elli": "MF3mGyEYCl7XYWbV9V6O",
+    "josh": "TxGEqnHWrfWFTfGW9XjX",
+    "arnold": "VR6AewLTigWG4xSOukaG",
+    "adam": "pNInz6obpgDQGcFmaJgB",
+    "sam": "yoZ06aMxZJJ28mfd3POQ",
+}
 class TTSAdapter(ABC):
     """Base class for TTS providers."""
     def _load_voice_aliases(self) -> dict[str, str]:
         """Best-effort map of configured voice names to voice IDs."""
+        aliases: dict[str, str] = dict(ELEVENLABS_PRESET_VOICE_IDS)
+        # First try the latest SDK shape.
         try:
+            voices_api = getattr(self.client, "voices", None)
+            if voices_api is None:
+                return aliases
+            if hasattr(voices_api, "get_all"):
+                response = voices_api.get_all()
+            elif hasattr(voices_api, "search"):
+                response = voices_api.search()
+            elif hasattr(voices_api, "list"):
+                response = voices_api.list()
+            else:
+                return aliases
             voices = getattr(response, "voices", response)
         except Exception:
+            return aliases
         for voice in voices or []:
             if isinstance(voice, dict):
                 name = voice.get("name")