Spaces:

hazelhh
/

Linebotpic

Runtime error

App Files Files Community

hazelhh commited on Sep 19, 2025

Commit

6578989

verified ·

1 Parent(s): 6c8ae75

Update main.py

Browse files

Files changed (1) hide show

main.py +114 -94

main.py CHANGED Viewed

@@ -1,11 +1,19 @@
 import os
 import io
 from collections import defaultdict
-from fastapi.middleware.cors import CORSMiddleware
 from fastapi import FastAPI, Request, Header, BackgroundTasks, HTTPException
 from fastapi.staticfiles import StaticFiles
 from google import genai
 from google.genai import types
 from linebot import LineBotApi, WebhookHandler
 from linebot.exceptions import InvalidSignatureError
 from linebot.models import (
@@ -15,8 +23,6 @@ from linebot.models import (
     ImageSendMessage,
     ImageMessage,
 )
-import PIL.Image
-import uvicorn
 # LangChain 相關匯入
 from langchain_core.prompts import ChatPromptTemplate
@@ -26,22 +32,38 @@ from langchain.agents import AgentExecutor, create_tool_calling_agent
 # ==========================
-#  環境設定與工具函式
 # ==========================
-# 設置 Google AI API 金鑰
-google_api = os.environ["GOOGLE_API_KEY"]
-genai_client = genai.Client(api_key=google_api)
-# 設置 Line Bot 的 API 金鑰和秘密金鑰
-line_bot_api = LineBotApi(os.environ["CHANNEL_ACCESS_TOKEN"])
-line_handler = WebhookHandler(os.environ["CHANNEL_SECRET"])
-# 使用字典模擬用戶訊息歷史存儲
-user_message_history = defaultdict(list)
 # 建立 FastAPI 應用程式
 app = FastAPI()
 app.mount("/static", StaticFiles(directory="static"), name="static")
 # 設定 CORS
@@ -53,12 +75,13 @@ app.add_middleware(
     allow_headers=["*"],
 )
-def get_image_url_from_line(message_id):
     """
     從 Line 訊息 ID 獲取圖片內容並儲存到暫存檔案。
     """
     try:
         message_content = line_bot_api.get_message_content(message_id)
         file_path = f"/tmp/{message_id}.png"
         with open(file_path, "wb") as f:
             for chunk in message_content.iter_content():
@@ -66,25 +89,9 @@ def get_image_url_from_line(message_id):
         print(f"✅ 圖片成功儲存到：{file_path}")
         return file_path
     except Exception as e:
-        print(f"❌ 圖片取得失敗：{e}")
         return None
-def store_user_message(user_id, message_type, message_content):
-    """
-    儲存用戶的訊息。
-    """
-    user_message_history[user_id].append(
-        {"type": message_type, "content": message_content}
-    )
-def get_previous_message(user_id):
-    """
-    獲取用戶的上一則訊息。
-    """
-    if user_id in user_message_history and len(user_message_history[user_id]) > 0:
-        return user_message_history[user_id][-1]
-    return {"type": "text", "content": "No message!"}
 # ==========================
 #  LangChain 工具定義
@@ -99,33 +106,37 @@ def generate_and_upload_image(prompt: str) -> str:
         prompt: 用於生成圖片的文字提示。
     Returns:
-        回傳生成圖片的 URL。
     """
     try:
-        response = genai_client.models.generate_content(
-            model="gemini-2.0-flash-preview-image-generation",
             contents=prompt,
-            config=types.GenerateContentConfig(response_modalities=['Text', 'Image'])
         )
         image_binary = None
         for part in response.candidates[0].content.parts:
-            if part.inline_data is not None:
                 image_binary = part.inline_data.data
                 break
         if image_binary:
             image = PIL.Image.open(io.BytesIO(image_binary))
             # 隨機生成一個檔案名以避免衝突
-            file_name = f"static/{os.urandom(16).hex()}.png"
-            image.save(file_name, format="PNG")
-            image_url = os.path.join(os.getenv("HF_SPACE"), file_name)
-            return image_url
-        return "圖片生成失敗。"
     except Exception as e:
-        return f"圖片生成與上傳失敗: {e}"
 @tool
 def analyze_image_with_text(image_path: str, user_text: str) -> str:
@@ -144,19 +155,15 @@ def analyze_image_with_text(image_path: str, user_text: str) -> str:
             return "圖片路徑無效，無法進行分析。"
         img_user = PIL.Image.open(image_path)
-        response = genai_client.models.generate_content(
-                    model="gemini-2.5-flash",
-                    contents=[img_user, user_text]
-        )
-        if (response.text != None):
-            out = response.text
         else:
-            out = "Gemini沒答案!請換個說法！"
     except Exception as e:
-        # 處理錯誤
-        out = f"Gemini執行出錯: {e}"
-    return out
 # ==========================
@@ -167,18 +174,22 @@ def analyze_image_with_text(image_path: str, user_text: str) -> str:
 tools = [generate_and_upload_image, analyze_image_with_text]
 # 建立 LLM 模型實例
-llm = ChatGoogleGenerativeAI(google_api_key=google_api, model="gemini-2.5-flash", temperature=0.2)
 # 建立提示模板
-prompt_template = ChatPromptTemplate([
-    ("system", "你是一個強大的圖像生成與問答助理，可以根據用戶的請求使用提供的工具。當你執行 generate_and_upload_image 工具\
-    成功後會獲得一個 URL，然後你回答的 output 要包含有這個 URL 的完整資訊。如果工具有產生錯誤訊息請解讀並回應。"),
     ("user", "{input}"),
     ("placeholder", "{agent_scratchpad}"),
 ])
 # 建立代理人
-agent = create_tool_calling_agent(llm, tools, prompt_template)
 agent_executor = AgentExecutor(agent=agent, tools=tools, verbose=True)
 # ==========================
@@ -187,16 +198,17 @@ agent_executor = AgentExecutor(agent=agent, tools=tools, verbose=True)
 @app.get("/")
 def root():
-    return {"title": "Line Bot"}
 @app.post("/webhook")
 async def webhook(
     request: Request,
     background_tasks: BackgroundTasks,
-    x_line_signature=Header(None),
 ):
     body = await request.body()
     try:
         background_tasks.add_task(
             line_handler.handle, body.decode("utf-8"), x_line_signature
         )
@@ -207,56 +219,64 @@ async def webhook(
 @line_handler.add(MessageEvent, message=(ImageMessage, TextMessage))
 def handle_message(event):
     user_id = event.source.user_id
-    # 處理圖片上傳
-    if event.message.type == "image":
-        image_path = get_image_url_from_line(event.message.id)
         if image_path:
-            store_user_message(user_id, "image", image_path)
-            line_bot_api.reply_message(
-                event.reply_token, TextSendMessage(text="圖片已接收成功囉，幫我輸入你想詢問的問題喔~")
-            )
         else:
             line_bot_api.reply_message(
-                event.reply_token, TextSendMessage(text="沒有接收到圖片~")
             )
-    # 處理文字訊息
-    elif event.message.type == "text":
         user_text = event.message.text
-        previous_message = get_previous_message(user_id)
-        print(previous_message)
-        # 根據上一則訊息類型，動態傳遞給代理人
-        if previous_message["type"] == "image":
-            image_path = previous_message["content"]
-            agent_input = {
-                "input": f"請根據這張圖片回答問題。圖片的路徑是 {image_path}，我的問題是：{user_text}"
-            }
-            # 清除上一則圖片訊息，避免重複觸發
-            user_message_history[user_id].pop()
-        else:
-            agent_input = {"input": user_text}
         try:
             # 運行代理人
             response = agent_executor.invoke(agent_input)
-            out = response["output"]
-            if 'https' in out:
-                img_tmp = 'https'+out.split('https')[1]
-                image_url = img_tmp.split('png')[0]+'png'
                 line_bot_api.push_message(
                     event.source.user_id,
                     [
-                        TextSendMessage(text="✨ 這是我為你生成的圖片喔～"),
                         ImageSendMessage(original_content_url=image_url, preview_image_url=image_url)
                     ]
                 )
             else:
-                line_bot_api.reply_message(event.reply_token, TextSendMessage(text=out))
         except Exception as e:
             print(f"代理人執行出錯: {e}")
-            out = f"代理人執行出錯!錯誤訊息：{e}"
-            line_bot_api.reply_message(event.reply_token, TextSendMessage(text=out))
 if __name__ == "__main__":
-    uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=True)

 import os
 import io
+import re
 from collections import defaultdict
+import PIL.Image
+import uvicorn
+import requests
+from pydantic_settings import BaseSettings
 from fastapi import FastAPI, Request, Header, BackgroundTasks, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
 from fastapi.staticfiles import StaticFiles
 from google import genai
 from google.genai import types
 from linebot import LineBotApi, WebhookHandler
 from linebot.exceptions import InvalidSignatureError
 from linebot.models import (
     ImageSendMessage,
     ImageMessage,
 )
 # LangChain 相關匯入
 from langchain_core.prompts import ChatPromptTemplate
 # ==========================
+#  環境變數與設定管理
 # ==========================
+class Settings(BaseSettings):
+    """使用 Pydantic 管理環境變數"""
+    google_api_key: str
+    channel_access_token: str
+    channel_secret: str
+    base_url: str  # 應用程式的公開網址，例如 ngrok 或 Hugging Face Space 的 URL
+    class Config:
+        env_file = ".env"
+# 載入設定
+settings = Settings()
+# ==========================
+#  API 客戶端與工具函式初始化
+# ==========================
+# 設置 Google AI API 金鑰
+genai.configure(api_key=settings.google_api_key)
+# 設置 Line Bot API
+line_bot_api = LineBotApi(settings.channel_access_token)
+line_handler = WebhookHandler(settings.channel_secret)
 # 建立 FastAPI 應用程式
 app = FastAPI()
+# 確保靜態檔案目錄存在
+os.makedirs("static", exist_ok=True)
 app.mount("/static", StaticFiles(directory="static"), name="static")
 # 設定 CORS
     allow_headers=["*"],
 )
+def get_image_from_line(message_id: str) -> str | None:
     """
     從 Line 訊息 ID 獲取圖片內容並儲存到暫存檔案。
     """
     try:
         message_content = line_bot_api.get_message_content(message_id)
+        # 使用 /tmp 目錄儲存暫存檔案，適合多數雲端環境
         file_path = f"/tmp/{message_id}.png"
         with open(file_path, "wb") as f:
             for chunk in message_content.iter_content():
         print(f"✅ 圖片成功儲存到：{file_path}")
         return file_path
     except Exception as e:
+        print(f"❌ 從 Line 取得圖片失敗：{e}")
         return None
 # ==========================
 #  LangChain 工具定義
         prompt: 用於生成圖片的文字提示。
     Returns:
+        回傳生成圖片的公開 URL。
     """
     try:
+        # 使用 gemini-2.5-flash-image-preview 模型進行圖片生成
+        model = genai.GenerativeModel('gemini-2.5-flash-image-preview')
+        response = model.generate_content(
             contents=prompt,
+            generation_config=types.GenerationConfig(response_modalities=['IMAGE'])
         )
         image_binary = None
         for part in response.candidates[0].content.parts:
+            if part.inline_data and part.inline_data.data:
                 image_binary = part.inline_data.data
                 break
         if image_binary:
             image = PIL.Image.open(io.BytesIO(image_binary))
             # 隨機生成一個檔案名以避免衝突
+            file_name = f"{os.urandom(16).hex()}.png"
+            file_path = os.path.join("static", file_name)
+            image.save(file_path, format="PNG")
+            # 使用環境變數中的 BASE_URL 來建立完整的公開網址
+            image_url = f"{settings.base_url}/{file_path}"
+            print(f"✅ 圖片生成成功，URL: {image_url}")
+            return f"圖片生成成功，請查看此 URL: {image_url}"
+        return "圖片生成失敗，未收到有效的圖片資料。"
     except Exception as e:
+        return f"圖片生成與上傳過程中發生錯誤: {e}"
 @tool
 def analyze_image_with_text(image_path: str, user_text: str) -> str:
             return "圖片路徑無效，無法進行分析。"
         img_user = PIL.Image.open(image_path)
+        model = genai.GenerativeModel("gemini-1.5-flash") # 使用 gemini 1.5 flash 模型
+        response = model.generate_content([img_user, user_text])
+        if response.text:
+            return response.text
         else:
+            return "Gemini 沒有給出答案，請嘗試換個方式提問！"
     except Exception as e:
+        return f"圖片分析過程中發生錯誤: {e}"
 # ==========================
 tools = [generate_and_upload_image, analyze_image_with_text]
 # 建立 LLM 模型實例
+llm = ChatGoogleGenerativeAI(model="gemini-1.5-flash", temperature=0.3)
 # 建立提示模板
+prompt = ChatPromptTemplate.from_messages([
+    ("system", """你是一個強大的圖像生成與問答助理。
+- 當用戶的指令明顯是要生成圖片時 (例如：'畫一張...'、'生成...'、'幫我做一張圖...')，請使用 `generate_and_upload_image` 工具。
+- 當用戶的指令包含圖片路徑 (image_path) 和問題時，請使用 `analyze_image_with_text` 工具。
+- 成功執行 `generate_and_upload_image` 工具後，你會獲得一個 URL，你的最終回答必須包含這個 URL。
+- 如果工具執行過程中產生任何錯誤訊息，請以友善的方式解讀並回應給用戶。"""),
     ("user", "{input}"),
     ("placeholder", "{agent_scratchpad}"),
 ])
 # 建立代理人
+agent = create_tool_calling_agent(llm, tools, prompt)
 agent_executor = AgentExecutor(agent=agent, tools=tools, verbose=True)
 # ==========================
 @app.get("/")
 def root():
+    return {"message": "Line Bot is running!"}
 @app.post("/webhook")
 async def webhook(
     request: Request,
     background_tasks: BackgroundTasks,
+    x_line_signature: str = Header(None),
 ):
     body = await request.body()
     try:
+        # 使用背景任務處理 Webhook，避免 Line Server 超時
         background_tasks.add_task(
             line_handler.handle, body.decode("utf-8"), x_line_signature
         )
 @line_handler.add(MessageEvent, message=(ImageMessage, TextMessage))
 def handle_message(event):
     user_id = event.source.user_id
+    # 處理圖片上傳：使用者上傳圖片後直接進行分析
+    if isinstance(event.message, ImageMessage):
+        image_path = get_image_from_line(event.message.id)
         if image_path:
+            try:
+                # 組合給代理人的輸入，使用一個通用的問題來分析圖片
+                agent_input = {
+                    "input": f"這是一張使用者上傳的圖片，請詳細描述你看到了什麼。圖片的路徑是 '{image_path}'。"
+                }
+                # 運行代理人
+                response = agent_executor.invoke(agent_input)
+                output_text = response["output"]
+                # 回覆分析結果
+                line_bot_api.reply_message(event.reply_token, TextSendMessage(text=output_text))
+            except Exception as e:
+                print(f"代理人執行出錯: {e}")
+                error_message = f"圖片分析時發生錯誤，請稍後再試。\n錯誤訊息：{e}"
+                line_bot_api.reply_message(event.reply_token, TextSendMessage(text=error_message))
         else:
             line_bot_api.reply_message(
+                event.reply_token, TextSendMessage(text="❌ 圖片接收失敗，請再試一次。")
             )
+    # 處理文字訊息：主要用於生成圖片或一般問答
+    elif isinstance(event.message, TextMessage):
         user_text = event.message.text
+        agent_input = {"input": user_text}
         try:
             # 運行代理人
             response = agent_executor.invoke(agent_input)
+            output_text = response["output"]
+            # 使用正規表示法尋找 URL，更穩定
+            image_url_match = re.search(r'https?://\S+\.(?:png|jpg|jpeg|gif)', output_text, re.IGNORECASE)
+            if image_url_match:
+                image_url = image_url_match.group(0)
+                # 推送訊息，包含生成的圖片
                 line_bot_api.push_message(
                     event.source.user_id,
                     [
+                        TextSendMessage(text="✨ 這是我為您生成的圖片喔～"),
                         ImageSendMessage(original_content_url=image_url, preview_image_url=image_url)
                     ]
                 )
             else:
+                # 若無圖片 URL，則直接回覆文字
+                line_bot_api.reply_message(event.reply_token, TextSendMessage(text=output_text))
         except Exception as e:
             print(f"代理人執行出錯: {e}")
+            error_message = f"代理人執行時發生錯誤，請稍後再試。\n錯誤訊息：{e}"
+            line_bot_api.reply_message(event.reply_token, TextSendMessage(text=error_message))
 if __name__ == "__main__":
+    # 使用 settings 物件中的設定
+    uvicorn.run("main:app", host="0.0.0.0", port=7860, reload=True)