Spaces:

Emeritus-21
/

research-podquery

Runtime error

App Files Files Community

Emeritus-21 commited on Nov 29, 2025

Commit

198f8e5

verified ·

1 Parent(s): 1a78858

Update app.py

Browse files

Files changed (1) hide show

app.py +64 -79

app.py CHANGED Viewed

@@ -6,18 +6,17 @@ import json
 from pypdf import PdfReader
 from dotenv import load_dotenv
-# 1. Load Keys
 load_dotenv()
 GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
 ELEVEN_API_KEY = os.getenv("ELEVEN_API_KEY")
-# 2. Configure APIs
 if GEMINI_API_KEY:
     genai.configure(api_key=GEMINI_API_KEY)
 if ELEVEN_API_KEY:
     client = ElevenLabs(api_key=ELEVEN_API_KEY)
-# 3. State Management
 class PodcastState:
     def __init__(self):
         self.script = []
@@ -27,35 +26,31 @@ class PodcastState:
 state = PodcastState()
-# =========================
-# PDF TEXT EXTRACTION
-# =========================
-def extract_text_from_pdf(pdf):
     try:
-        reader = PdfReader(pdf)
         text = ""
         for page in reader.pages[:5]:
-            text += page.extract_text() + "\n"
         return text
     except Exception as e:
         return f"Error reading PDF: {e}"
-# =========================
-# SCRIPT GENERATION
-# =========================
 def generate_script(pdf_file, persona_style):
     if not pdf_file:
-        return "⚠️ Upload a PDF first.", None
     if not GEMINI_API_KEY or not ELEVEN_API_KEY:
-        return "⚠️ Missing API Keys in HF Secrets.", None
     pdf_text = extract_text_from_pdf(pdf_file)
     state.full_text = pdf_text
     state.persona = persona_style
-    model = genai.GenerativeModel("gemini-2.0-flash")
     prompts = {
         "Serious Academic": "Two professors discussing the paper. Tone: Intellectual.",
         "Gossip Columnist": "Two gossip hosts reacting dramatically.",
@@ -67,8 +62,8 @@ def generate_script(pdf_file, persona_style):
     Based on the paper:
     "{pdf_text[:4000]}..."
-    Generate a 4-line dialogue script.
-    RETURN JSON ONLY:
     [
         {{"speaker":"Host A","text":"..."}},
         {{"speaker":"Host B","text":"..."}}
@@ -76,25 +71,23 @@ def generate_script(pdf_file, persona_style):
     """
     try:
         response = model.generate_content(system_prompt)
         clean_json = response.text.replace("```json", "").replace("```", "").strip()
         script = json.loads(clean_json)
         state.script = script
         state.current_index = 0
-        return "✅ Script ready.", script
     except Exception as e:
-        return f"Error: {e}", None
-# =========================
-# PLAY NEXT LINE
-# =========================
 def play_next_chunk():
     if state.current_index >= len(state.script):
-        return None, "🎉 Podcast complete."
     line = state.script[state.current_index]
-    voice_id = "nPczCjz82tPNOwVbpGE2"  # Default male
     if state.persona == "Gossip Columnist" and line["speaker"] == "Host B":
         voice_id = "21m00Tcm4TlvDq8ikWAM"
@@ -112,74 +105,66 @@ def play_next_chunk():
         state.current_index += 1
         return save_path, f"{line['speaker']}: {line['text']}"
     except Exception as e:
         return None, f"Audio error: {e}"
-# =========================
-# INTERRUPT + QUESTION
-# =========================
 def interrupt_and_ask(question):
     if not state.full_text:
-        return None, "Upload PDF first."
     model = genai.GenerativeModel("gemini-2.0-flash")
     prompt = f"""
     Persona: {state.persona}
     Context: {state.full_text[:1000]}
-    User asked: {question}
-    Respond briefly, then say:
-    "Anyway, back to the paper..."
     """
-    response = model.generate_content(prompt)
-    answer = response.text
-    audio_stream = client.generate(
-        text=answer,
-        voice="nPczCjz82tPNOwVbpGE2",
-        model="eleven_monolingual_v1"
-    )
-    save_path = "interrupt.mp3"
-    with open(save_path, "wb") as f:
-        for chunk in audio_stream:
-            f.write(chunk)
-    return save_path, answer
-# =========================
-# GRADIO 6 UI
-# =========================
-with gr.App() as app:
     gr.Markdown("# 🎧 PodQuery — Research Paper Podcast Generator")
-    pdf_input = gr.File(label="Upload PDF", file_types=[".pdf"])
-    persona = gr.Dropdown(
-        ["Serious Academic", "Gossip Columnist"],
-        value="Serious Academic",
-        label="Persona Style"
-    )
-    btn_gen = gr.Button("Generate Podcast Script")
-    status = gr.Textbox(label="Status")
-    script_display = gr.JSON(label="Generated Script")
-    player = gr.Audio(label="Audio Output", autoplay=True)
-    transcript = gr.Textbox(label="Transcript")
-    btn_play = gr.Button("▶️ Play Next Line")
-    q_input = gr.Textbox(label="Ask a Question (Interrupt)")
-    btn_interrupt = gr.Button("✋ Interrupt Podcast")
     # Bind events
-    btn_gen.subscribe(generate_script, [pdf_input, persona], [status, script_display])
-    btn_play.subscribe(play_next_chunk, [], [player, transcript])
-    btn_interrupt.subscribe(interrupt_and_ask, [q_input], [player, transcript])
-# ❗ DO NOT CALL app.launch()
-# Hugging Face Spaces auto-launches Gradio 6 apps.

 from pypdf import PdfReader
 from dotenv import load_dotenv
+# 1️⃣ Load API Keys
 load_dotenv()
 GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
 ELEVEN_API_KEY = os.getenv("ELEVEN_API_KEY")
 if GEMINI_API_KEY:
     genai.configure(api_key=GEMINI_API_KEY)
 if ELEVEN_API_KEY:
     client = ElevenLabs(api_key=ELEVEN_API_KEY)
+# 2️⃣ Podcast State
 class PodcastState:
     def __init__(self):
         self.script = []
 state = PodcastState()
+# 3️⃣ PDF Extraction
+def extract_text_from_pdf(pdf_file):
     try:
+        reader = PdfReader(pdf_file)
         text = ""
         for page in reader.pages[:5]:
+            page_text = page.extract_text()
+            if page_text:
+                text += page_text + "\n"
         return text
     except Exception as e:
         return f"Error reading PDF: {e}"
+# 4️⃣ Generate Script
 def generate_script(pdf_file, persona_style):
     if not pdf_file:
+        return "⚠️ Upload PDF first.", {}
     if not GEMINI_API_KEY or not ELEVEN_API_KEY:
+        return "⚠️ API Keys missing in HF Secrets!", {}
     pdf_text = extract_text_from_pdf(pdf_file)
     state.full_text = pdf_text
     state.persona = persona_style
     prompts = {
         "Serious Academic": "Two professors discussing the paper. Tone: Intellectual.",
         "Gossip Columnist": "Two gossip hosts reacting dramatically.",
     Based on the paper:
     "{pdf_text[:4000]}..."
+    Generate a short 4-turn dialogue script.
+    Return JSON ONLY:
     [
         {{"speaker":"Host A","text":"..."}},
         {{"speaker":"Host B","text":"..."}}
     """
     try:
+        model = genai.GenerativeModel("gemini-2.0-flash")
         response = model.generate_content(system_prompt)
         clean_json = response.text.replace("```json", "").replace("```", "").strip()
         script = json.loads(clean_json)
         state.script = script
         state.current_index = 0
+        return "✅ Script ready!", script
     except Exception as e:
+        return f"Error generating script: {e}", {}
+# 5️⃣ Play next line
 def play_next_chunk():
     if state.current_index >= len(state.script):
+        return None, "🎉 Podcast finished."
     line = state.script[state.current_index]
+    voice_id = "nPczCjz82tPNOwVbpGE2"
     if state.persona == "Gossip Columnist" and line["speaker"] == "Host B":
         voice_id = "21m00Tcm4TlvDq8ikWAM"
         state.current_index += 1
         return save_path, f"{line['speaker']}: {line['text']}"
     except Exception as e:
         return None, f"Audio error: {e}"
+# 6️⃣ Interrupt & Ask
 def interrupt_and_ask(question):
     if not state.full_text:
+        return None, "Upload a PDF first."
     model = genai.GenerativeModel("gemini-2.0-flash")
     prompt = f"""
     Persona: {state.persona}
     Context: {state.full_text[:1000]}
+    User Question: {question}
+    Answer briefly, then say "Anyway, back to the paper..."
     """
+    try:
+        response = model.generate_content(prompt)
+        answer = response.text
+        audio_stream = client.generate(
+            text=answer,
+            voice="nPczCjz82tPNOwVbpGE2",
+            model="eleven_monolingual_v1"
+        )
+        save_path = "interrupt.mp3"
+        with open(save_path, "wb") as f:
+            for chunk in audio_stream:
+                f.write(chunk)
+        return save_path, answer
+    except Exception as e:
+        return None, f"Error: {e}"
+# 7️⃣ Build Gradio 5.7 UI
+with gr.Blocks() as demo:
     gr.Markdown("# 🎧 PodQuery — Research Paper Podcast Generator")
+    with gr.Row():
+        with gr.Column():
+            pdf_input = gr.File(label="Upload PDF", file_types=[".pdf"])
+            persona = gr.Dropdown(
+                ["Serious Academic", "Gossip Columnist"],
+                value="Serious Academic",
+                label="Persona Style"
+            )
+            btn_gen = gr.Button("Generate Podcast Script")
+            status = gr.Textbox(label="Status")
+            script_display = gr.JSON(label="Generated Script")
+        with gr.Column():
+            player = gr.Audio(label="Audio Output", autoplay=True)
+            transcript = gr.Textbox(label="Transcript")
+            btn_play = gr.Button("▶️ Play Next Line")
+            q_input = gr.Textbox(label="Ask a Question")
+            btn_interrupt = gr.Button("✋ Interrupt Podcast")
     # Bind events
+    btn_gen.click(generate_script, [pdf_input, persona], [status, script_display])
+    btn_play.click(play_next_chunk, [], [player, transcript])
+    btn_interrupt.click(interrupt_and_ask, [q_input], [player, transcript])
+# 8️⃣ Launch
+if __name__ == "__main__":
+    demo.launch()