Spaces:

gnosticdev
/

Podcastking2

Sleeping

App Files Community

gnosticdev committed on Jun 20, 2025

Commit

bf07215

verified ·

1 Parent(s): de6323e

Update conver.py

Browse files

Files changed (1) hide show

conver.py +19 -22

conver.py CHANGED Viewed

@@ -10,7 +10,6 @@ import tempfile
 from pydub import AudioSegment
 import base64
 from pathlib import Path
-import shutil  # Importamos shutil para manejo de directorios
 @dataclass
 class ConversationConfig:
@@ -41,7 +40,6 @@ class URLToAudioConverter:
             raise ValueError("Input text cannot be empty")
         try:
-            # Prompt mejorado para obtener JSON consistente
             prompt = (
                 f"{text}\nConvert the provided text into a short informative podcast conversation "
                 f"between two experts. Return ONLY a JSON object with the following structure:\n"
@@ -51,14 +49,12 @@ class URLToAudioConverter:
             chat_completion = self.llm_client.chat.completions.create(
                 messages=[{"role": "user", "content": prompt}],
                 model=self.config.model_name,
-                response_format={"type": "json_object"}  # Fuerza formato JSON
             )
-            # Extracción robusta de JSON
             response_content = chat_completion.choices[0].message.content
             json_str = response_content.strip()
-            # Limpieza de texto alrededor del JSON
             if not json_str.startswith('{'):
                 start = json_str.find('{')
                 if start != -1:
@@ -71,7 +67,6 @@ class URLToAudioConverter:
             return json.loads(json_str)
         except Exception as e:
-            # Debug: Imprime la respuesta del modelo para diagnóstico
             print(f"Error en extract_conversation: {str(e)}")
             print(f"Respuesta del modelo: {response_content}")
             raise RuntimeError(f"Failed to extract conversation: {str(e)}")
@@ -131,24 +126,13 @@ class URLToAudioConverter:
             combined.export(output_file, format="mp3")
-            # Limpieza mejorada y robusta
             dir_path = os.path.dirname(filenames[0])
-            # Eliminar todos los archivos en el directorio
             for file in os.listdir(dir_path):
                 file_path = os.path.join(dir_path, file)
                 if os.path.isfile(file_path):
-                    try:
-                        os.remove(file_path)
-                    except Exception as e:
-                        print(f"Warning: Could not remove file {file_path}: {str(e)}")
-            # Intentar eliminar el directorio (no crítico si falla)
-            try:
-                os.rmdir(dir_path)
-            except OSError as e:
-                print(f"Info: Could not remove directory {dir_path}: {str(e)}")
-                # No es crítico, el espacio puede continuar
         except Exception as e:
             raise RuntimeError(f"Failed to combine audio files: {e}")
@@ -174,7 +158,7 @@ class URLToAudioConverter:
         return final_output, conversation_text
     async def text_to_audio(self, text: str, voice_1: str, voice_2: str) -> Tuple[str, str]:
-        """Método para procesar texto directo"""
         conversation_json = self.extract_conversation(text)
         conversation_text = "\n".join(
             f"{turn['speaker']}: {turn['text']}" for turn in conversation_json["conversation"]
@@ -184,4 +168,17 @@ class URLToAudioConverter:
         )
         final_output = os.path.join(folder_name, "combined_output.mp3")
         self.combine_audio_files(audio_files, final_output)
-        return final_output, conversation_text

 from pydub import AudioSegment
 import base64
 from pathlib import Path
 @dataclass
 class ConversationConfig:
             raise ValueError("Input text cannot be empty")
         try:
             prompt = (
                 f"{text}\nConvert the provided text into a short informative podcast conversation "
                 f"between two experts. Return ONLY a JSON object with the following structure:\n"
             chat_completion = self.llm_client.chat.completions.create(
                 messages=[{"role": "user", "content": prompt}],
                 model=self.config.model_name,
+                response_format={"type": "json_object"}
             )
             response_content = chat_completion.choices[0].message.content
             json_str = response_content.strip()
             if not json_str.startswith('{'):
                 start = json_str.find('{')
                 if start != -1:
             return json.loads(json_str)
         except Exception as e:
             print(f"Error en extract_conversation: {str(e)}")
             print(f"Respuesta del modelo: {response_content}")
             raise RuntimeError(f"Failed to extract conversation: {str(e)}")
             combined.export(output_file, format="mp3")
+            # Limpieza
             dir_path = os.path.dirname(filenames[0])
             for file in os.listdir(dir_path):
                 file_path = os.path.join(dir_path, file)
                 if os.path.isfile(file_path):
+                    os.remove(file_path)
+            os.rmdir(dir_path)
         except Exception as e:
             raise RuntimeError(f"Failed to combine audio files: {e}")
         return final_output, conversation_text
     async def text_to_audio(self, text: str, voice_1: str, voice_2: str) -> Tuple[str, str]:
+        """Procesamiento normal con LLM"""
         conversation_json = self.extract_conversation(text)
         conversation_text = "\n".join(
             f"{turn['speaker']}: {turn['text']}" for turn in conversation_json["conversation"]
         )
         final_output = os.path.join(folder_name, "combined_output.mp3")
         self.combine_audio_files(audio_files, final_output)
+        return final_output, conversation_text
+    async def raw_text_to_audio(self, text: str, voice_1: str, voice_2: str) -> Tuple[str, str]:
+        """NUEVO: Modo sin LLM (texto directo)"""
+        conversation = {
+            "conversation": [
+                {"speaker": "Host", "text": text},
+                {"speaker": "Co-host", "text": "(Continuación del tema)"}
+            ]
+        }
+        audio_files, folder_name = await self.text_to_speech(conversation, voice_1, voice_2)
+        output_file = os.path.join(folder_name, "raw_podcast.mp3")
+        self.combine_audio_files(audio_files, output_file)
+        return text, output_file