Spaces:

jerrychen428
/

Jerry_LLM_OCR

Sleeping

App Files Files Community

jerrychen428 committed on Sep 14, 2025

Commit

a3acdb5

verified ·

1 Parent(s): 013d633

Update app.py

Browse files

Files changed (1) hide show

app.py +59 -81

app.py CHANGED Viewed

@@ -6,12 +6,24 @@ import gradio as gr
 from google import genai
 import resend
 import html
 class GeminiImageAnalyzer:
     def __init__(self, gemini_api_key, resend_api_key):
         """初始化Gemini客戶端和Resend"""
         self.gemini_api_key = gemini_api_key
-        self.client = genai.Client(api_key=gemini_api_key)
         resend.api_key = resend_api_key
     def validate_image(self, image_path):
@@ -37,45 +49,40 @@ class GeminiImageAnalyzer:
                 mime_type = "image/jpeg"
             elif file_extension == '.png':
                 mime_type = "image/png"
             return encoded_string, mime_type
         except Exception as e:
             raise Exception(f"圖片編碼失敗: {str(e)}")
-    def analyze_image(self, image_path, prompt="請詳細描述這張圖片的內容，並提取圖片中的文字，使用繁體中文"):
         """使用Gemini API分析圖片"""
         try:
             # 驗證圖片
             self.validate_image(image_path)
             # 編碼圖片
             encoded_image, mime_type = self.encode_image(image_path)
             # 構建請求內容
-            contents = [
-                {
-                    "role": "user",
-                    "parts": [
-                        {"text": prompt},
-                        {
-                            "inline_data": {
-                                "mime_type": mime_type,
-                                "data": encoded_image
-                            }
-                        }
-                    ]
-                }
-            ]
             # 調用Gemini API
-            response = self.client.models.generate_content(
-                model="gemini-2.0-flash-exp",  # 使用支援視覺的模型
-                contents=contents
-            )
             return response.text
         except Exception as e:
             return f"分析失敗: {str(e)}"
     def send_analysis_email(self, analysis_result, recipient_email, subject="圖片分析結果"):
@@ -87,23 +94,29 @@ class GeminiImageAnalyzer:
             <head>
                 <meta charset="UTF-8">
                 <title>圖片分析結果</title>
             </head>
             <body>
-                <h2>圖片分析結果</h2>
-                <hr>
-                <div style="font-family: Arial, sans-serif; line-height: 1.6;">
                     <p><strong>分析時間：</strong>{datetime.now().strftime("%Y-%m-%d %H:%M:%S")}</p>
                     <h3>分析內容：</h3>
-                    <div style="background-color: #f5f5f5; padding: 15px; border-radius: 5px; border-left: 4px solid #007bff;">
                         {html.escape(analysis_result).replace('\n', '<br>')}
                     </div>
                 </div>
-                <br>
-                <p style="color: #666; font-size: 12px;">此郵件由Gemini圖片分析系統自動發送</p>
             </body>
             </html>
             """
             params = {
                 "from": "Acme <onboarding@resend.dev>",
                 "to": [recipient_email],
@@ -113,29 +126,26 @@ class GeminiImageAnalyzer:
             }
             email_response = resend.Emails.send(params)
             return f"郵件發送成功！郵件ID: {email_response.get('id', 'Unknown')}"
         except Exception as e:
             return f"郵件發送失敗: {str(e)}"
 def create_gradio_app():
-    # 從環境變量獲取API密鑰
-    GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
-    RESEND_API_KEY = os.getenv("RESEND_API_KEY")
-    # 檢查API密鑰是否存在
-    if not GEMINI_API_KEY:
-        raise ValueError("請在HuggingFace Spaces設定中添加 GEMINI_API_KEY 環境變量")
-    if not RESEND_API_KEY:
-        raise ValueError("請在HuggingFace Spaces設定中添加 RESEND_API_KEY 環境變量")
     # 創建分析器實例
-    analyzer = GeminiImageAnalyzer(GEMINI_API_KEY, RESEND_API_KEY)
-    def process_image_and_send_email(image, prompt, recipient_email, email_subject, send_email_flag):
         """處理圖片分析並可選發送郵件"""
         try:
-            if image is None:
                 return "請先上傳圖片", ""
             # 使用默認提示詞如果為空
@@ -143,7 +153,7 @@ def create_gradio_app():
                 prompt = "請詳細描述這張圖片的內容，並提取圖片中的文字，使用繁體中文"
             # 分析圖片
-            analysis_result = analyzer.analyze_image(image, prompt)
             email_status = ""
             if send_email_flag and recipient_email.strip():
@@ -166,28 +176,16 @@ def create_gradio_app():
             return f"處理失敗: {str(e)}", ""
     # 創建Gradio介面
-    with gr.Blocks(
-        title="Gemini 圖片分析與郵件發送系統",
-        theme=gr.themes.Soft(),
-        css="""
-        .gradio-container {
-            max-width: 1200px !important;
-        }
-        """
-    ) as app:
-        gr.Markdown(
-            "# 🔍 Gemini 圖片分析與郵件發送系統\n"
-            "上傳圖片進行AI分析，並可選擇將結果發送到指定郵箱\n"
-            "---"
-        )
         with gr.Row():
             with gr.Column(scale=1):
                 # 圖片上傳
                 image_input = gr.Image(
                     type="filepath",
-                    label="上傳圖片 (支援 JPG, PNG 格式)",
-                    height=300
                 )
                 # 提示詞輸入
@@ -254,7 +252,6 @@ def create_gradio_app():
             - 支援的圖片格式：JPG, JPEG, PNG
             - 分析結果會以繁體中文顯示
             - 郵件功能為可選，不影響圖片分析功能
-            - 本應用運行在 HuggingFace Spaces 上
             """)
         # 綁定事件
@@ -285,28 +282,9 @@ def create_gradio_app():
                     lambda x=example: x,
                     outputs=prompt_input
                 )
-        # 添加頁腳
-        gr.Markdown(
-            "---\n"
-            "💡 **提示**: 如果遇到API錯誤，請檢查環境變量設定是否正確\n"
-            "🔗 **技術**: 使用 Gemini 2.0 Flash 模型進行圖片分析"
-        )
     return app
-# HuggingFace Spaces 入口點
-if __name__ == "__main__":
-    try:
-        app = create_gradio_app()
-        app.launch()  # HuggingFace Spaces 會自動處理部署配置
-    except Exception as e:
-        print(f"應用啟動失敗: {e}")
-        # 創建一個錯誤頁面
-        error_app = gr.Interface(
-            fn=lambda: f"配置錯誤: {str(e)}\n\n請檢查以下設定:\n1. GEMINI_API_KEY 環境變量\n2. RESEND_API_KEY 環境變量",
-            inputs=[],
-            outputs=gr.Textbox(label="錯誤信息"),
-            title="配置錯誤"
-        )
-        error_app.launch()

 from google import genai
 import resend
 import html
+import logging
+# Set the root log level to INFO so detailed messages from Gradio and the underlying libraries are visible.
+logging.basicConfig(level=logging.INFO)
 class GeminiImageAnalyzer:
     def __init__(self, gemini_api_key, resend_api_key):
         """Validate both API keys, set up the Gemini model handle, and configure Resend.

         Args:
             gemini_api_key: Key used for the Gemini SDK; also stored on the instance.
             resend_api_key: Key assigned to the module-level ``resend.api_key``.

         Raises:
             ValueError: If either key is missing or empty.
         """
+        if not gemini_api_key:
+            raise ValueError("未找到 Gemini API 金鑰。請將其設置為環境變數。")
+        if not resend_api_key:
+            raise ValueError("未找到 Resend API 金鑰。請將其設置為環境變數。")
         self.gemini_api_key = gemini_api_key
+        # Initialise the Gemini client with the supplied key.
+        # NOTE(review): `configure` and `GenerativeModel` look like the legacy
+        # `google.generativeai` API, while the import visible in this file is
+        # `from google import genai` -- confirm these attributes exist on that
+        # module, otherwise construction fails before the app can start.
+        genai.configure(api_key=gemini_api_key)
+        self.client = genai.GenerativeModel(model_name="gemini-1.5-flash")
+        # Initialise Resend with the supplied key (module-level setting).
         resend.api_key = resend_api_key
     def validate_image(self, image_path):
                 mime_type = "image/jpeg"
             elif file_extension == '.png':
                 mime_type = "image/png"
+            else:
+                mime_type = "application/octet-stream" # 預設類型
             return encoded_string, mime_type
         except Exception as e:
             raise Exception(f"圖片編碼失敗: {str(e)}")
+    def analyze_image(self, image_path, prompt):
         """Analyze an image with the Gemini API and return the response text.

         Args:
             image_path: Path of the image file to validate, encode, and send.
             prompt: Text instruction sent alongside the image.

         Returns:
             ``response.text`` on success. On any exception the error is logged
             and a string starting with "分析失敗: " is returned instead of raising.
         """
         try:
             # Validate the image.
             self.validate_image(image_path)
+            logging.info(f"成功驗證圖片: {image_path}")
             # Encode the image.
             encoded_image, mime_type = self.encode_image(image_path)
+            logging.info(f"圖片成功編碼為 {mime_type}")
             # Build the request contents.
             # NOTE(review): encode_image presumably returns base64 text, which is
             # decoded straight back to raw bytes here -- confirm the round trip is needed.
+            image_part = {
+                "mime_type": mime_type,
+                "data": base64.b64decode(encoded_image)
+            }
+            contents = [prompt, image_part]
             # Call the Gemini API.
             # NOTE(review): this call shape depends on what __init__ stores in
             # self.client -- verify it matches the SDK actually imported by the file.
+            response = self.client.generate_content(contents)
+            logging.info("成功調用 Gemini API")
             return response.text
         except Exception as e:
             # Failures are reported to the caller as text, not as an exception.
+            logging.error(f"分析失敗: {str(e)}")
             return f"分析失敗: {str(e)}"
     def send_analysis_email(self, analysis_result, recipient_email, subject="圖片分析結果"):
             <head>
                 <meta charset="UTF-8">
                 <title>圖片分析結果</title>
+                <style>
+                    body {{ font-family: Arial, sans-serif; line-height: 1.6; color: #333; }}
+                    .container {{ max-width: 600px; margin: 20px auto; padding: 20px; border: 1px solid #ddd; border-radius: 8px; }}
+                    h2 {{ color: #0056b3; }}
+                    .info-box {{ background-color: #f0f8ff; padding: 15px; border-radius: 5px; border-left: 4px solid #007bff; }}
+                    .footer {{ margin-top: 20px; font-size: 12px; color: #777; }}
+                </style>
             </head>
             <body>
+                <div class="container">
+                    <h2>圖片分析結果</h2>
+                    <hr>
                     <p><strong>分析時間：</strong>{datetime.now().strftime("%Y-%m-%d %H:%M:%S")}</p>
                     <h3>分析內容：</h3>
+                    <div class="info-box">
                         {html.escape(analysis_result).replace('\n', '<br>')}
                     </div>
+                    <p class="footer">此郵件由Gemini圖片分析系統自動發送</p>
                 </div>
             </body>
             </html>
             """
             params = {
                 "from": "Acme <onboarding@resend.dev>",
                 "to": [recipient_email],
             }
             email_response = resend.Emails.send(params)
+            logging.info(f"郵件發送成功！郵件ID: {email_response.get('id', 'Unknown')}")
             return f"郵件發送成功！郵件ID: {email_response.get('id', 'Unknown')}"
         except Exception as e:
+            logging.error(f"郵件發送失敗: {str(e)}")
             return f"郵件發送失敗: {str(e)}"
 def create_gradio_app():
+    """創建 Gradio 應用介面"""
+    # 從環境變數中讀取 API 密鑰
+    gemini_api_key = os.getenv("GEMINI_API_KEY")
+    resend_api_key = os.getenv("RESEND_API_KEY")
     # 創建分析器實例
+    analyzer = GeminiImageAnalyzer(gemini_api_key, resend_api_key)
+    def process_image_and_send_email(image_file, prompt, recipient_email, email_subject, send_email_flag):
         """處理圖片分析並可選發送郵件"""
         try:
+            if image_file is None:
                 return "請先上傳圖片", ""
             # 使用默認提示詞如果為空
                 prompt = "請詳細描述這張圖片的內容，並提取圖片中的文字，使用繁體中文"
             # 分析圖片
+            analysis_result = analyzer.analyze_image(image_file, prompt)
             email_status = ""
             if send_email_flag and recipient_email.strip():
             return f"處理失敗: {str(e)}", ""
     # 創建Gradio介面
+    with gr.Blocks(title="Gemini 圖片分析與郵件發送系統") as app:
+        gr.Markdown("# 🔍 Gemini 圖片分析與郵件發送系統")
+        gr.Markdown("上傳圖片進行AI分析，並可選擇將結果發送到指定郵箱")
         with gr.Row():
             with gr.Column(scale=1):
                 # 圖片上傳
                 image_input = gr.Image(
                     type="filepath",
+                    label="上傳圖片 (支援 JPG, PNG 格式)"
                 )
                 # 提示詞輸入
             - 支援的圖片格式：JPG, JPEG, PNG
             - 分析結果會以繁體中文顯示
             - 郵件功能為可選，不影響圖片分析功能
             """)
         # 綁定事件
                     lambda x=example: x,
                     outputs=prompt_input
                 )
     return app
+# 在 Hugging Face Spaces 上，應用會自動被 `app.py` 啟動，
+# 所以我們只需將主函數的啟動邏輯放在檔案的頂層。
+app = create_gradio_app()