Spaces:

tbdavid2019
/

PDF2podcast-1-script

Sleeping

App Files Files Community

tbdavid2019 committed on Oct 2, 2025

Commit

62f78a2

1 Parent(s): b199afe

feat: 增加可調整的最大輸出 token 限制，並新增摘要生成功能及相關模板

Browse files

Files changed (3) hide show

__pycache__/app.cpython-311.pyc +0 -0
app.py +142 -4
prompts.py +45 -7

__pycache__/app.cpython-311.pyc CHANGED Viewed

Binary files a/__pycache__/app.cpython-311.pyc and b/__pycache__/app.cpython-311.pyc differ

app.py CHANGED Viewed

@@ -72,6 +72,7 @@ def generate_dialogue_via_requests(
     user_feedback: str = None,
     num_parts: int = 3,
     max_input_length: int = 1000000,
     progress_callback=None,
     template_type: str = "podcast"
 ) -> str:
@@ -115,7 +116,7 @@ def generate_dialogue_via_requests(
     max_retries = 5
     retry_delay = 5
-    # 使用 Gemini Flash 2.5 的最大輸出 token 限制
     payload = {
         "model": model,
         "messages": [
@@ -125,7 +126,7 @@ def generate_dialogue_via_requests(
             }
         ],
         "temperature": 0.7,
-        "max_tokens": 65536,  # Gemini Flash 2.5 最大輸出 token 數
         "stream": False  # 先不用流式，確保穩定性
     }
@@ -222,6 +223,73 @@ def generate_dialogue_via_requests(
     return "生成失敗"
 def _generate_in_batches(pdf_text, base_prompt, headers, url, model, num_parts, progress_callback, max_retries, retry_delay):
     """
     分批生成的備用機制，只在單次生成被截斷時使用
@@ -377,6 +445,7 @@ def validate_and_generate_script(
     user_feedback,
     num_parts=3,
     max_input_length=1000000,
     progress_callback=None
 ):
     """驗證輸入並生成腳本"""
@@ -498,6 +567,7 @@ def validate_and_generate_script(
             user_feedback=user_feedback,
             num_parts=num_parts,
             max_input_length=max_input_length,
             progress_callback=progress_callback,
             template_type="podcast"
         )
@@ -628,6 +698,16 @@ with gr.Blocks(title="Script Generator", css="""
                 info="調整模型可處理的最大輸入文本長度（字符數）"
             )
         with gr.Column(scale=1):
             # 輸出區
@@ -635,10 +715,30 @@ with gr.Blocks(title="Script Generator", css="""
             output_text = gr.Textbox(
                 label="生成的腳本 | Generated Script",
-                lines=30,
                 show_copy_button=True
             )
             error_output = gr.Markdown(
                 visible=False,
                 elem_classes=["error"]
@@ -697,6 +797,30 @@ with gr.Blocks(title="Script Generator", css="""
         logger.info("腳本生成成功")
         return script, gr.update(visible=False)
     generate_button.click(
         fn=handle_script_generation,
         inputs=[
@@ -712,10 +836,24 @@ with gr.Blocks(title="Script Generator", css="""
             gr.Textbox(value=""),  # edited_transcript
             custom_prompt,  # user_feedback
             num_parts_slider,  # 添加滑動條參數
-            max_input_length_slider  # 添加最大輸入文本長度參數
         ],
         outputs=[output_text, error_output]
     )
 if __name__ == "__main__":

     user_feedback: str = None,
     num_parts: int = 3,
     max_input_length: int = 1000000,
+    max_output_tokens: int = 65536,
     progress_callback=None,
     template_type: str = "podcast"
 ) -> str:
     max_retries = 5
     retry_delay = 5
+    # 使用可調整的輸出 token 限制
     payload = {
         "model": model,
         "messages": [
             }
         ],
         "temperature": 0.7,
+        "max_tokens": max_output_tokens,  # 可調整的輸出 token 數
         "stream": False  # 先不用流式，確保穩定性
     }
     return "生成失敗"
+def generate_summary(
+    script_content: str,
+    summary_type: str,
+    model: str,
+    llm_api_key: str,
+    api_base: str,
+    max_output_tokens: int = 4096,
+    progress_callback=None
+) -> str:
+    """
+    為生成的腳本創建摘要
+    """
+    if not script_content or not script_content.strip():
+        return "錯誤：請先生成腳本內容"
+    logger.info(f"開始生成摘要，類型: {summary_type}")
+    # 從 prompts 模組獲取摘要模板
+    try:
+        summary_template = get_template(summary_type)["dialog"]
+        prompt = summary_template.format(content=script_content)
+    except KeyError:
+        return f"錯誤：未找到摘要模板 '{summary_type}'"
+    headers = {
+        "Authorization": f"Bearer {llm_api_key}",
+        "Content-Type": "application/json"
+    }
+    base_url = api_base.rstrip("/")
+    url = f"{base_url}/chat/completions"
+    payload = {
+        "model": model,
+        "messages": [
+            {
+                "role": "user",
+                "content": prompt
+            }
+        ],
+        "temperature": 0.7,
+        "max_tokens": max_output_tokens
+    }
+    if progress_callback:
+        progress_callback(f"正在生成{summary_type}摘要...")
+    try:
+        response = requests.post(url, headers=headers, json=payload)
+        response.raise_for_status()
+        result = response.json()
+        summary = result['choices'][0]['message']['content']
+        logger.info(f"摘要生成完成，長度: {len(summary)} 字符")
+        if progress_callback:
+            progress_callback(f"摘要生成完成！")
+        return summary
+    except requests.exceptions.RequestException as e:
+        error_msg = f"摘要生成失敗: {str(e)}"
+        logger.error(error_msg)
+        if progress_callback:
+            progress_callback(error_msg)
+        return error_msg
 def _generate_in_batches(pdf_text, base_prompt, headers, url, model, num_parts, progress_callback, max_retries, retry_delay):
     """
     分批生成的備用機制，只在單次生成被截斷時使用
     user_feedback,
     num_parts=3,
     max_input_length=1000000,
+    max_output_tokens=65536,
     progress_callback=None
 ):
     """驗證輸入並生成腳本"""
             user_feedback=user_feedback,
             num_parts=num_parts,
             max_input_length=max_input_length,
+            max_output_tokens=max_output_tokens,
             progress_callback=progress_callback,
             template_type="podcast"
         )
                 info="調整模型可處理的最大輸入文本長度（字符數）"
             )
+            # 添加最大輸出 token 數的滑動條
+            max_output_tokens_slider = gr.Slider(
+                minimum=1024,
+                maximum=131072,
+                value=65536,
+                step=1024,
+                label="最大輸出 Token 數 | Max Output Tokens",
+                info="調整模型最大輸出 token 數。Gemini Flash 2.5: 65536, GPT-4: 4096, Claude: 8192"
+            )
         with gr.Column(scale=1):
             # 輸出區
             output_text = gr.Textbox(
                 label="生成的腳本 | Generated Script",
+                lines=20,
                 show_copy_button=True
             )
+            # 摘要生成區域
+            gr.Markdown("### 📝 Podcast 摘要生成 | Summary Generation")
+            with gr.Row():
+                summary_type_dropdown = gr.Dropdown(
+                    label="摘要類型 | Summary Type",
+                    choices=["blog-summary", "intro-summary"],
+                    value="intro-summary",
+                    interactive=True
+                )
+                generate_summary_button = gr.Button("生成摘要 | Generate Summary", size="sm")
+            summary_output = gr.Textbox(
+                label="生成的摘要 | Generated Summary",
+                lines=10,
+                show_copy_button=True,
+                placeholder="請先生成腳本，然後點擊「生成摘要」按鈕"
+            )
             error_output = gr.Markdown(
                 visible=False,
                 elem_classes=["error"]
         logger.info("腳本生成成功")
         return script, gr.update(visible=False)
+    def handle_summary_generation(script_content, summary_type, api_key_val, model_val, api_base_val, max_tokens_val):
+        if not script_content or not script_content.strip():
+            return "錯誤：請先生成腳本內容"
+        if not api_key_val or not model_val:
+            return "錯誤：請確保已設定 API 金鑰和模型"
+        logger.info(f"開始生成摘要，類型: {summary_type}")
+        def progress_callback(msg):
+            pass  # 簡化版本，不顯示進度
+        summary = generate_summary(
+            script_content=script_content,
+            summary_type=summary_type,
+            model=model_val,
+            llm_api_key=api_key_val,
+            api_base=api_base_val,
+            max_output_tokens=max_tokens_val // 2,  # 摘要使用較少的 tokens
+            progress_callback=progress_callback
+        )
+        return summary
     generate_button.click(
         fn=handle_script_generation,
         inputs=[
             gr.Textbox(value=""),  # edited_transcript
             custom_prompt,  # user_feedback
             num_parts_slider,  # 添加滑動條參數
+            max_input_length_slider,  # 添加最大輸入文本長度參數
+            max_output_tokens_slider  # 添加最大輸出 token 數參數
         ],
         outputs=[output_text, error_output]
     )
+    generate_summary_button.click(
+        fn=handle_summary_generation,
+        inputs=[
+            output_text,  # 腳本內容
+            summary_type_dropdown,  # 摘要類型
+            api_key,  # API 金鑰
+            model_dropdown,  # 模型
+            api_base,  # API 基礎 URL
+            max_output_tokens_slider  # 最大輸出 tokens
+        ],
+        outputs=[summary_output]
+    )
 if __name__ == "__main__":

prompts.py CHANGED Viewed

@@ -117,18 +117,56 @@ PROMPTS = {
 {content}""",
-    "short summary": """你是專業的內容摘要專家，專門創作簡潔摘要。
 【任務目標】
-- 提取文件的最核心要點
-- 保持簡潔明瞭
-- 目標長度約 250 字
-【輸出格式】
 - **必須使用繁體中文**
-- 重點突出，語言精煉
-請將以下內容整理成簡短摘要：
 {content}"""
 }

 {content}""",
+    "short summary": """你是 David888 Podcast 的內容編輯，專門創作簡潔摘要。
 【任務目標】
+- 為播客內容生成簡潔明瞭的摘要
+- 提取核心觀點和重要資訊
+- 適合社群媒體分享或節目介紹
+【輸出要求】
 - **必須使用繁體中文**
+- 約 256 字的簡潔摘要
+- 直接輸出內容，不使用 Markdown 格式
+請為以下內容生成簡潔摘要：
+{content}""",
+    # 新增的摘要模板
+    "blog-summary": """你是 David888 Podcast 中文博客的編輯，將播客內容改寫成適合搜索引擎收錄的博客文章。
+【工作目標】
+- 使用簡潔明了的語言將播客對話整理為一篇完整的博客文章
+- 開場白使用一句話介紹播客內容，博客名稱是 David888 Podcast
+- 保留核心討論內容，但不要提及「對話」或「播客」等詞彙
+- 確保博客內容生動有趣，具有可讀性
+【輸出要求】
+- **必須使用繁體中文撰寫**，專業術語可保留英文
+- 直接返回 Markdown 格式的正文內容，不要使用 ```markdown 包裹
+- 不要返回前言，直接返回正文內容
+- 文章結構清晰，使用二級標題、三級標題 (如"## 標題"、"### 子標題")
+- 與分段正文形式呈現核心內容
+請將以下播客內容轉換成博客文章：
+{content}""",
+    "intro-summary": """你是 David888 Podcast 中文播客的編輯，為播客文字稿生成極簡摘要。
+【工作目標】
+- **必須使用繁體中文**給播客文字稿生成極簡摘要
+- 提取最核心的討論重點和見解
+- 適合作為節目介紹或平台描述
+【輸出要求】
+- 輸出純文本內容，不要使用 Markdown 格式
+- 只需要返回摘要內容，其他內容都不需要
+- 摘要內容不要超過 200 字
+- 簡潔有力，突出重點
+請為以下播客內容生成極簡摘要：
 {content}"""
 }