Spaces:

MichaelChou0806
/

LINE_audio_transcript

Sleeping

App Files Files Community

MichaelChou0806 committed on Oct 8, 2025

Commit

d339fc0

verified ·

1 Parent(s): 7ecf1a3

Update app.py

Browse files

Files changed (1) hide show

app.py +130 -95

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ from fastapi.responses import JSONResponse
 from fastapi.middleware.cors import CORSMiddleware
 # ====== 基本設定 ======
-PASSWORD = os.getenv("APP_PASSWORD")  # 從環境變數讀取，不設預設值
 if not PASSWORD:
     raise ValueError("APP_PASSWORD environment variable is not set!")
@@ -43,11 +43,10 @@ def _extract_effective_path(file_obj) -> str:
     print(f"[DEBUG] 檔案物件類型: {type(file_obj)}")
     print(f"[DEBUG] 檔案物件內容: {file_obj}")
-    # 處理 None
     if file_obj is None:
         raise FileNotFoundError("File object is None")
-    # 如果是字串路徑
     if isinstance(file_obj, str):
         s = file_obj.strip().strip('"')
         print(f"[DEBUG] 字串路徑: {s}")
@@ -56,44 +55,44 @@ def _extract_effective_path(file_obj) -> str:
         if os.path.isfile(s):
             return s
-    # 如果是字典
     if isinstance(file_obj, dict):
         print(f"[DEBUG] 字典 keys: {list(file_obj.keys())}")
-        # 嘗試 data URL
         data = file_obj.get("data")
         if isinstance(data, str) and data.startswith("data:"):
             return _dataurl_to_file(data, file_obj.get("orig_name"))
-        # 嘗試 path
         for key in ["path", "name", "file", "filepath"]:
             p = file_obj.get(key)
             if p and isinstance(p, str):
                 p = p.strip().strip('"')
                 if os.path.isfile(p):
-                    print(f"[DEBUG] 找到有效路徑 (key={key}): {p}")
                     return p
-    # 如果是物件，嘗試獲取屬性
     for attr in ["name", "path", "file", "filepath"]:
         if hasattr(file_obj, attr):
             p = getattr(file_obj, attr, None)
             if p and isinstance(p, str):
                 p = p.strip().strip('"')
                 if os.path.isfile(p):
-                    print(f"[DEBUG] 找到有效路徑 (attr={attr}): {p}")
                     return p
-    # 最後嘗試：直接當作路徑字串
     try:
         path_str = str(file_obj).strip().strip('"')
         if os.path.isfile(path_str):
-            print(f"[DEBUG] 直接轉換為路徑: {path_str}")
             return path_str
     except:
         pass
-    raise FileNotFoundError(f"Cannot parse uploaded file: {type(file_obj)} - {file_obj}")
 def split_audio(path):
     """將音訊檔案分割成多個小於 25MB 的片段"""
@@ -119,7 +118,7 @@ def transcribe_core(path, model="whisper-1"):
     start_time = time.time()
-    # 處理 MP4 格式
     if path.lower().endswith(".mp4"):
         fixed = path[:-4] + ".m4a"
         try:
@@ -164,15 +163,15 @@ def transcribe_core(path, model="whisper-1"):
     summary = summ.choices[0].message.content.strip()
     total_time = time.time() - start_time
-    print(f"[transcribe_core] ✅ 全部完成! 總耗時: {total_time:.1f}秒\n")
     return trad, summary
 # ====== Gradio UI 函式 ======
 def transcribe_web(password, audio_file):
-    """網頁版轉錄處理 - 必須返回三個值"""
     print(f"\n{'='*60}")
-    print(f"🌐 [WEB] 收到網頁請求")
     print(f"密碼: {'已提供' if password else '未提供'}")
     print(f"檔案: {audio_file}")
     print(f"{'='*60}")
@@ -183,35 +182,35 @@ def transcribe_web(password, audio_file):
         return "❌ Please enter password", "", ""
     if password.strip() != PASSWORD:
-        print(f"[WEB] ❌ 密碼錯誤: '{password}' != '{PASSWORD}'")
         return "❌ Incorrect password", "", ""
     # 檢查檔案
     if not audio_file:
         print("[WEB] ❌ 未上傳檔案")
-        return "⚠️ Please upload an audio file", "", ""
     try:
         # 處理檔案
-        print(f"[WEB] 開始處理檔案...")
         path = _extract_effective_path(audio_file)
-        print(f"[WEB] ✅ 檔案路徑: {path}")
         # 轉錄
         print(f"[WEB] 開始轉錄...")
         text, summary = transcribe_core(path)
-        # 統計資訊
         char_count = len(text)
-        status = f"✅ Completed! ({char_count} characters)"
-        print(f"[WEB] ✅ 轉錄成功\n")
         return status, text, summary
     except Exception as e:
         import traceback
         error_msg = traceback.format_exc()
-        print(f"❌ [WEB] 發生錯誤:\n{error_msg}\n")
         return f"❌ Error: {str(e)}", "", ""
 # ====== FastAPI 應用 ======
@@ -231,7 +230,7 @@ async def api_transcribe(request: Request):
     try:
         body = await request.json()
         print(f"\n{'='*60}")
-        print(f"📱 [API] 收到 API 請求")
         print(f"{'='*60}")
         # 驗證密碼
@@ -243,7 +242,7 @@ async def api_transcribe(request: Request):
                 content={"status": "error", "error": "Password incorrect"}
             )
-        # 檢查檔案資料
         file_data = body.get("file_data", "")
         file_name = body.get("file_name", "recording.m4a")
@@ -251,13 +250,13 @@ async def api_transcribe(request: Request):
             print(f"[API] ❌ 檔案格式錯誤")
             return JSONResponse(
                 status_code=400,
-                content={"status": "error", "error": "Invalid file data format"}
             )
         # 處理檔案
         file_dict = {"data": file_data, "orig_name": file_name}
         path = _extract_effective_path(file_dict)
-        print(f"[API] ✅ 檔案解析成功: {path}")
         # 轉錄
         text, summary = transcribe_core(path)
@@ -268,86 +267,123 @@ async def api_transcribe(request: Request):
             "summary": summary
         }
-        print(f"[API] ✅ 轉錄成功\n")
         return JSONResponse(content=result)
     except Exception as e:
         import traceback
         error_trace = traceback.format_exc()
-        print(f"❌ [API] 發生錯誤:\n{error_trace}\n")
         return JSONResponse(
             status_code=500,
             content={"status": "error", "error": str(e)}
         )
 # ====== Gradio 介面 ======
-with gr.Blocks(title="Audio Transcription", theme=gr.themes.Soft()) as demo:
-    gr.Markdown("""
-    # 🎧 Audio Transcription Service
-    ### AI-Powered Speech-to-Text with Summarization
-    """)
-    with gr.Row():
-        with gr.Column(scale=1):
-            gr.Markdown("### 📤 Upload")
-            password_input = gr.Textbox(
-                label="Password",
-                type="password",
-                placeholder="Enter password",
-                max_lines=1
-            )
-            audio_input = gr.File(
-                label="Audio File",
-                file_types=["audio/*", ".mp3", ".m4a", ".wav", ".ogg", ".webm", ".mp4"],
-                file_count="single",
-                type="filepath"
-            )
-            submit_btn = gr.Button(
-                "🚀 Start Transcription",
-                variant="primary",
-                size="lg"
-            )
-            gr.Markdown("""
-            **Supported formats:**
-            MP3, M4A, WAV, OGG, WEBM, MP4
-            **Processing:**
-            Automatic chunking for large files
-            """)
-        with gr.Column(scale=2):
-            gr.Markdown("### 📊 Results")
-            status_output = gr.Textbox(
-                label="Status",
-                interactive=False,
-                lines=1,
-                max_lines=2
-            )
-            transcription_output = gr.Textbox(
-                label="Transcription",
-                lines=12,
-                interactive=True,
-                show_copy_button=True
-            )
-            summary_output = gr.Textbox(
-                label="Summary",
-                lines=6,
-                interactive=True,
-                show_copy_button=True
-            )
-    gr.Markdown("---")
     gr.Markdown("""
-    ## 📱 API Integration
     **Endpoint:** `POST /api/transcribe`
@@ -370,12 +406,11 @@ with gr.Blocks(title="Audio Transcription", theme=gr.themes.Soft()) as demo:
     ```
     """)
-    # 事件綁定 - 這是關鍵！
     submit_btn.click(
         fn=transcribe_web,
         inputs=[password_input, audio_input],
-        outputs=[status_output, transcription_output, summary_output],
-        api_name="transcribe"
     )
 # ====== 掛載到 FastAPI ======

 from fastapi.middleware.cors import CORSMiddleware
 # ====== 基本設定 ======
+PASSWORD = os.getenv("APP_PASSWORD")
 if not PASSWORD:
     raise ValueError("APP_PASSWORD environment variable is not set!")
     print(f"[DEBUG] 檔案物件類型: {type(file_obj)}")
     print(f"[DEBUG] 檔案物件內容: {file_obj}")
     if file_obj is None:
         raise FileNotFoundError("File object is None")
+    # 字串路徑
     if isinstance(file_obj, str):
         s = file_obj.strip().strip('"')
         print(f"[DEBUG] 字串路徑: {s}")
         if os.path.isfile(s):
             return s
+    # 字典格式
     if isinstance(file_obj, dict):
         print(f"[DEBUG] 字典 keys: {list(file_obj.keys())}")
+        # data URL
         data = file_obj.get("data")
         if isinstance(data, str) and data.startswith("data:"):
             return _dataurl_to_file(data, file_obj.get("orig_name"))
+        # 路徑
         for key in ["path", "name", "file", "filepath"]:
             p = file_obj.get(key)
             if p and isinstance(p, str):
                 p = p.strip().strip('"')
                 if os.path.isfile(p):
+                    print(f"[DEBUG] 找到路徑 (key={key}): {p}")
                     return p
+    # 物件屬性
     for attr in ["name", "path", "file", "filepath"]:
         if hasattr(file_obj, attr):
             p = getattr(file_obj, attr, None)
             if p and isinstance(p, str):
                 p = p.strip().strip('"')
                 if os.path.isfile(p):
+                    print(f"[DEBUG] 找到路徑 (attr={attr}): {p}")
                     return p
+    # 直接轉換
     try:
         path_str = str(file_obj).strip().strip('"')
         if os.path.isfile(path_str):
+            print(f"[DEBUG] 直接路徑: {path_str}")
             return path_str
     except:
         pass
+    raise FileNotFoundError(f"Cannot parse file: {type(file_obj)} - {file_obj}")
 def split_audio(path):
     """將音訊檔案分割成多個小於 25MB 的片段"""
     start_time = time.time()
+    # 處理 MP4
     if path.lower().endswith(".mp4"):
         fixed = path[:-4] + ".m4a"
         try:
     summary = summ.choices[0].message.content.strip()
     total_time = time.time() - start_time
+    print(f"[transcribe_core] ✅ 完成! 耗時: {total_time:.1f}秒\n")
     return trad, summary
 # ====== Gradio UI 函式 ======
 def transcribe_web(password, audio_file):
+    """網頁版轉錄處理"""
     print(f"\n{'='*60}")
+    print(f"🌐 [WEB] 收到請求")
     print(f"密碼: {'已提供' if password else '未提供'}")
     print(f"檔案: {audio_file}")
     print(f"{'='*60}")
         return "❌ Please enter password", "", ""
     if password.strip() != PASSWORD:
+        print(f"[WEB] ❌ 密碼錯誤")
         return "❌ Incorrect password", "", ""
     # 檢查檔案
     if not audio_file:
         print("[WEB] ❌ 未上傳檔案")
+        return "⚠️ Please upload audio file", "", ""
     try:
         # 處理檔案
+        print(f"[WEB] 處理檔案...")
         path = _extract_effective_path(audio_file)
+        print(f"[WEB] ✅ 檔案: {path}")
         # 轉錄
         print(f"[WEB] 開始轉錄...")
         text, summary = transcribe_core(path)
+        # 統計
         char_count = len(text)
+        status = f"✅ Completed! ({char_count} chars)"
+        print(f"[WEB] ✅ 成功\n")
         return status, text, summary
     except Exception as e:
         import traceback
         error_msg = traceback.format_exc()
+        print(f"❌ [WEB] 錯誤:\n{error_msg}\n")
         return f"❌ Error: {str(e)}", "", ""
 # ====== FastAPI 應用 ======
     try:
         body = await request.json()
         print(f"\n{'='*60}")
+        print(f"📱 [API] 收到請求")
         print(f"{'='*60}")
         # 驗證密碼
                 content={"status": "error", "error": "Password incorrect"}
             )
+        # 檢查檔案
         file_data = body.get("file_data", "")
         file_name = body.get("file_name", "recording.m4a")
             print(f"[API] ❌ 檔案格式錯誤")
             return JSONResponse(
                 status_code=400,
+                content={"status": "error", "error": "Invalid file format"}
             )
         # 處理檔案
         file_dict = {"data": file_data, "orig_name": file_name}
         path = _extract_effective_path(file_dict)
+        print(f"[API] ✅ 檔案: {path}")
         # 轉錄
         text, summary = transcribe_core(path)
             "summary": summary
         }
+        print(f"[API] ✅ 成功\n")
         return JSONResponse(content=result)
     except Exception as e:
         import traceback
         error_trace = traceback.format_exc()
+        print(f"❌ [API] 錯誤:\n{error_trace}\n")
         return JSONResponse(
             status_code=500,
             content={"status": "error", "error": str(e)}
         )
+# ====== 手機優化 CSS ======
+mobile_css = """
+/* 基本響應式 */
+.gradio-container {
+    max-width: 100% !important;
+    padding: 0.5rem !important;
+}
+/* 手機優化 */
+@media (max-width: 768px) {
+    .gradio-container {
+        padding: 0.25rem !important;
+    }
+    /* 標題縮小 */
+    h1 {
+        font-size: 1.5rem !important;
+    }
+    h3 {
+        font-size: 1.1rem !important;
+    }
+    /* 按鈕加大點擊區域 */
+    button {
+        min-height: 44px !important;
+        font-size: 1rem !important;
+    }
+    /* 輸入框 */
+    input, textarea {
+        font-size: 16px !important; /* 防止手機自動縮放 */
+    }
+    /* 行布局改為列布局 */
+    .row {
+        flex-direction: column !important;
+    }
+    .column {
+        width: 100% !important;
+        max-width: 100% !important;
+    }
+}
+/* 確保文字可選取和複製 */
+textarea {
+    user-select: text !important;
+    -webkit-user-select: text !important;
+}
+"""
 # ====== Gradio 介面 ======
+with gr.Blocks(
+    title="Audio Transcription",
+    theme=gr.themes.Soft(),
+    css=mobile_css
+) as demo:
+    gr.Markdown("# 🎧 Audio Transcription")
+    gr.Markdown("AI-Powered Speech-to-Text")
+    # 密碼輸入
+    password_input = gr.Textbox(
+        label="Password",
+        type="password",
+        placeholder="Enter password"
+    )
+    # 檔案上傳 - 使用最基本的 File 組件
+    audio_input = gr.File(
+        label="Audio File (MP3, M4A, WAV, etc.)",
+        type="filepath"
+    )
+    # 提交按鈕
+    submit_btn = gr.Button(
+        "🚀 Start Transcription",
+        variant="primary",
+        size="lg"
+    )
+    # 狀態顯示
+    status_output = gr.Textbox(
+        label="Status",
+        interactive=False
+    )
+    # 轉錄結果
+    transcription_output = gr.Textbox(
+        label="Transcription",
+        lines=10,
+        max_lines=20
+    )
+    # 摘要
+    summary_output = gr.Textbox(
+        label="Summary",
+        lines=5,
+        max_lines=10
+    )
+    gr.Markdown("---")
     gr.Markdown("""
+    ### 📱 API Integration
     **Endpoint:** `POST /api/transcribe`
     ```
     """)
+    # 事件綁定
     submit_btn.click(
         fn=transcribe_web,
         inputs=[password_input, audio_input],
+        outputs=[status_output, transcription_output, summary_output]
     )
 # ====== 掛載到 FastAPI ======