Spaces:

MichaelChou0806
/

LINE_audio_transcript

Sleeping

App Files Files Community

MichaelChou0806 committed on Oct 8, 2025

Commit

6c57120

verified ·

1 Parent(s): bc06406

Update app.py

Browse files

Files changed (1) hide show

app.py +323 -212

app.py CHANGED Viewed

@@ -14,7 +14,7 @@ client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
 print("===== 🚀 啟動中 =====")
 print(f"APP_PASSWORD: {'✅ 已載入' if PASSWORD else '❌ 未載入'}")
-# ====== 工具:把 data:URL 轉成臨時檔 ======
 MIME_EXT = {
     "audio/mp4": "m4a", "audio/m4a": "m4a", "audio/aac": "aac",
     "audio/mpeg": "mp3", "audio/wav": "wav", "audio/x-wav": "wav",
@@ -24,41 +24,31 @@ MIME_EXT = {
 def _dataurl_to_file(data_url: str, orig_name: str | None = None) -> str:
     """將 data URL 轉換為本地檔案"""
-    print(f"  → [_dataurl_to_file] 開始處理 data URL...")
     try:
         header, b64 = data_url.split(",", 1)
     except ValueError:
-        raise ValueError("data URL format error")
     mime = header.split(";")[0].split(":", 1)[-1].strip()
     ext = MIME_EXT.get(mime) or (mimetypes.guess_extension(mime) or "m4a").lstrip(".")
     fname = orig_name if (orig_name and "." in orig_name) else f"upload_{uuid.uuid4().hex}.{ext}"
-    print(f"  → [_dataurl_to_file] 檔名: {fname}, Base64長度: {len(b64)}")
     with open(fname, "wb") as f:
         f.write(base64.b64decode(b64))
-    file_size = os.path.getsize(fname)
-    print(f"  → [_dataurl_to_file] ✅ 檔案已建立, 大小: {file_size} bytes")
     return fname
 def _extract_effective_path(file_obj) -> str:
     """從各種格式中提取有效檔案路徑"""
-    print(f"[_extract_effective_path] 收到類型: {type(file_obj)}")
     # 字串模式
     if isinstance(file_obj, str):
         s = file_obj.strip().strip('"')
         if s.startswith("data:"):
-            print(f"  → 偵測到 data URL")
             return _dataurl_to_file(s, None)
         if os.path.isfile(s):
-            print(f"  → 找到檔案路徑: {s}")
             return s
     # 字典模式
     if isinstance(file_obj, dict):
-        print(f"  → 字典模式, Keys: {list(file_obj.keys())}")
         data = file_obj.get("data")
         if isinstance(data, str) and data.startswith("data:"):
-            print(f"  → 找到 data URL")
             return _dataurl_to_file(data, file_obj.get("orig_name"))
         p = str(file_obj.get("path") or "").strip().strip('"')
         if p and os.path.isfile(p):
@@ -74,19 +64,15 @@ def _extract_effective_path(file_obj) -> str:
     raise FileNotFoundError("Cannot parse uploaded file")
-# ====== 分段處理 ======
 def split_audio(path):
     """將音訊檔案分割成多個小於 25MB 的片段"""
     size = os.path.getsize(path)
-    print(f"[split_audio] 檔案大小: {size} bytes ({size/1024/1024:.2f} MB)")
     if size <= MAX_SIZE:
-        print(f"[split_audio] 不需分割")
         return [path]
-    print(f"[split_audio] 開始分割...")
     audio = AudioSegment.from_file(path)
     n = int(size / MAX_SIZE) + 1
     chunk_ms = len(audio) / n
-    print(f"[split_audio] 分割成 {n} 個片段")
     parts = []
     for i in range(n):
         fn = f"chunk_{i+1}.wav"
@@ -94,7 +80,6 @@ def split_audio(path):
         parts.append(fn)
     return parts
-# ====== 轉錄核心 ======
 def transcribe_core(path, model="whisper-1"):
     """使用 Whisper 進行語音轉錄，並使用 GPT 進行繁簡轉換和摘要"""
     print(f"\n{'='*60}")
@@ -112,9 +97,8 @@ def transcribe_core(path, model="whisper-1"):
         except:
             pass
-    # 分割音訊
     chunks = split_audio(path)
-    print(f"\n[transcribe_core] === Whisper 轉錄 ({len(chunks)} 片段) ===")
     raw = []
     for i, c in enumerate(chunks, 1):
         print(f"[transcribe_core] 轉錄片段 {i}/{len(chunks)}")
@@ -123,13 +107,10 @@ def transcribe_core(path, model="whisper-1"):
                 model=model, file=af, response_format="text"
             )
             raw.append(txt)
-        print(f"[transcribe_core] ✅ 片段 {i} 完成")
     raw_txt = "\n".join(raw)
-    print(f"[transcribe_core] 原始轉錄: {len(raw_txt)} 字元")
     # 簡轉繁
-    print(f"\n[transcribe_core] === 簡轉繁 ===")
     conv = client.chat.completions.create(
         model="gpt-4o-mini",
         messages=[
@@ -139,10 +120,8 @@ def transcribe_core(path, model="whisper-1"):
         temperature=0.0
     )
     trad = conv.choices[0].message.content.strip()
-    print(f"[transcribe_core] ✅ 繁體轉換完成: {len(trad)} 字元")
     # AI 摘要
-    print(f"\n[transcribe_core] === AI 摘要 ===")
     summ = client.chat.completions.create(
         model="gpt-4o-mini",
         messages=[
@@ -154,33 +133,47 @@ def transcribe_core(path, model="whisper-1"):
     summary = summ.choices[0].message.content.strip()
     total_time = time.time() - start_time
-    print(f"\n{'='*60}")
-    print(f"[transcribe_core] ✅✅✅ 全部完成! 總耗時: {total_time:.1f}秒")
-    print(f"{'='*60}\n")
     return trad, summary
 # ====== Gradio UI 函式 ======
-def transcribe_ui(password, file):
-    """網頁界面的轉錄處理函式"""
-    print(f"\n🌐 [UI] 網頁版請求")
     if not password or password.strip() != PASSWORD:
-        return "❌ Password incorrect", "", ""
-    if not file:
-        return "⚠️ No file uploaded", "", ""
     try:
-        path = _extract_effective_path(file)
         text, summary = transcribe_core(path)
-        return "✅ Transcription completed", text, summary
     except Exception as e:
         import traceback
-        print(f"❌ [UI] 錯誤:\n{traceback.format_exc()}")
-        return f"❌ Error: {e}", "", ""
-# ====== 建立 FastAPI 應用 ======
 fastapi_app = FastAPI()
-# CORS 設定
 fastapi_app.add_middleware(
     CORSMiddleware,
     allow_origins=["*"],
@@ -189,51 +182,37 @@ fastapi_app.add_middleware(
     allow_headers=["*"],
 )
-# ====== 完全同步的 API 端點 ======
 @fastapi_app.post("/api/transcribe")
-async def api_transcribe_sync(request: Request):
-    """
-    完全同步的 API 端點 - 直接返回結果,不用輪詢
-    請求格式:
-    {
-      "password": "chou",
-      "file_data": "data:audio/m4a;base64,...",
-      "file_name": "recording.m4a"
-    }
-    """
     try:
         body = await request.json()
-        print(f"\n{'📱'*30}")
-        print(f"🎯 [SYNC API] 收到同步 API 請求")
-        print(f"📦 Keys: {list(body.keys())}")
-        print(f"{'📱'*30}")
         password = body.get("password", "")
         if password.strip() != PASSWORD:
-            print(f"❌ [SYNC API] 密碼錯誤")
             return JSONResponse(
                 status_code=401,
                 content={"status": "error", "error": "Password incorrect"}
             )
         file_data = body.get("file_data", "")
         file_name = body.get("file_name", "recording.m4a")
         if not file_data or not file_data.startswith("data:"):
-            print(f"❌ [SYNC API] 檔案格式錯誤")
             return JSONResponse(
                 status_code=400,
                 content={"status": "error", "error": "Invalid file data format"}
             )
-        print(f"[SYNC API] 檔案長度: {len(file_data)}, 檔名: {file_name}")
-        # 直接處理,同步執行
         file_dict = {"data": file_data, "orig_name": file_name}
         path = _extract_effective_path(file_dict)
-        print(f"✅ [SYNC API] 檔案解析成功: {path}")
         text, summary = transcribe_core(path)
         result = {
@@ -242,234 +221,366 @@ async def api_transcribe_sync(request: Request):
             "summary": summary
         }
-        print(f"\n{'✅'*30}")
-        print(f"✅✅✅ [SYNC API] 完成! 返回結果")
-        print(json.dumps(result, ensure_ascii=False, indent=2))
-        print(f"{'✅'*30}\n")
         return JSONResponse(content=result)
     except Exception as e:
         import traceback
         error_trace = traceback.format_exc()
-        print(f"\n{'❌'*30}")
-        print(f"❌ [SYNC API] 錯誤:\n{error_trace}")
-        print(f"{'❌'*30}\n")
         return JSONResponse(
             status_code=500,
             content={"status": "error", "error": str(e)}
         )
-# ====== 自定義 CSS ======
 custom_css = """
 .gradio-container {
-    max-width: 1200px !important;
-    margin: auto !important;
 }
-/* 主標題 */
-.main-header {
     text-align: center;
-    padding: 2.5rem 1rem;
     background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
-    border-radius: 12px;
-    margin-bottom: 2rem;
-    color: white;
 }
-.main-header h1 {
-    font-size: 2.2rem;
-    margin: 0 0 0.5rem 0;
     font-weight: 700;
 }
-.main-header p {
-    font-size: 1rem;
     margin: 0;
-    opacity: 0.95;
 }
-/* 按鈕 */
-.primary-btn {
     background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
     border: none !important;
     color: white !important;
     font-weight: 600 !important;
-    font-size: 1.05rem !important;
 }
-/* 文字框 */
-textarea {
-    font-size: 0.95rem !important;
     line-height: 1.6 !important;
 }
-/* 資訊卡片 */
-.info-box {
-    background: #f0f9ff;
-    border-left: 4px solid #3b82f6;
     padding: 1rem;
-    border-radius: 6px;
     margin: 1rem 0;
     font-size: 0.9rem;
 }
-/* 程式碼 */
-pre {
-    background: #1f2937 !important;
-    color: #f3f4f6 !important;
-    padding: 1rem !important;
-    border-radius: 6px !important;
-    font-size: 0.85rem !important;
 }
-code {
-    background: #e5e7eb !important;
-    color: #1f2937 !important;
-    padding: 0.2rem 0.4rem !important;
-    border-radius: 3px !important;
-    font-size: 0.9rem !important;
 }
 """
-# ====== 建立 Gradio 介面 ======
-with gr.Blocks(css=custom_css, theme=gr.themes.Soft(), title="Audio Transcription") as demo:
     # 標題
     gr.HTML("""
-        <div class="main-header">
             <h1>🎧 Audio Transcription Service</h1>
-            <p>AI-Powered Speech-to-Text with Summarization</p>
         </div>
     """)
-    with gr.Tabs():
-        # ====== Tab 1: Upload ======
-        with gr.Tab("🌐 Web Upload"):
-            with gr.Row():
-                with gr.Column(scale=1):
-                    pw = gr.Textbox(label="Password", type="password", placeholder="Enter password")
-                    audio_file = gr.File(label="Audio File", file_types=["audio", ".mp4"])
-                    submit_btn = gr.Button("🚀 Start Transcription", variant="primary", elem_classes="primary-btn")
-                    gr.HTML("""
-                        <div class="info-box">
-                            <strong>Supported:</strong> MP3, M4A, WAV, OGG, WEBM, MP4<br>
-                            <strong>Max Size:</strong> Auto-split for large files
-                        </div>
-                    """)
-                with gr.Column(scale=2):
-                    status = gr.Textbox(label="Status", interactive=False)
-                    transcription = gr.Textbox(label="Transcription", lines=12, show_copy_button=True)
-                    summary = gr.Textbox(label="Summary", lines=5, show_copy_button=True)
-            submit_btn.click(transcribe_ui, [pw, audio_file], [status, transcription, summary])
-        # ====== Tab 2: API ======
-        with gr.Tab("📱 API Documentation"):
-            gr.Markdown("""
-## API Endpoint
-**URL:** `/api/transcribe` (POST)
-**Type:** Synchronous - returns complete results in one request
-### Request Format
 ```json
 {
   "password": "your_password",
-  "file_data": "data:audio/m4a;base64,UklGR...",
   "file_name": "recording.m4a"
 }
 ```
-### Response Format
 ```json
 {
   "status": "success",
-  "transcription": "Full transcription text...",
-  "summary": "AI-generated summary..."
 }
 ```
----
-## iPhone Shortcuts Setup
-1. **Get File** → Audio recording
-2. **Base64 Encode** → File content
-3. **Text** → Create data URL:
-   ```
-   data:audio/m4a;base64,[Base64 Result]
-   ```
-4. **Dictionary** → Request body:
-   - `password`: `chou`
-   - `file_data`: [Text from step 3]
-   - `file_name`: `recording.m4a`
-5. **Get Contents of URL**:
-   - URL: `https://your-domain.com/api/transcribe`
-   - Method: `POST`
-   - Headers: `Content-Type: application/json`
-   - Body: [Dictionary], Type: `JSON`
-6. **Get Dictionary Value**:
-   - `transcription` → Full text
-   - `summary` → Summary
----
-## Testing with cURL
-```bash
-curl -X POST https://your-domain.com/api/transcribe \\
-  -H "Content-Type: application/json" \\
-  -d '{
-    "password": "chou",
-    "file_data": "data:audio/m4a;base64,AAAA...",
-    "file_name": "test.m4a"
-  }'
-```
----
-## Technical Details
-- **Transcription:** OpenAI Whisper (high accuracy)
-- **Summarization:** GPT-4o-mini
-- **Output:** Traditional Chinese (Taiwan)
-- **Processing:** Fully synchronous, no polling needed
-- **File Handling:** Auto-split for files > 25MB
----
-## Error Codes
-- `401` - Incorrect password
-- `400` - Invalid file format
-- `500` - Processing error
-For support, contact your administrator.
-            """)
     # 頁腳
     gr.HTML("""
-        <div style="text-align: center; margin-top: 2rem; padding: 1.5rem; background: #f9fafb; border-radius: 8px;">
-            <p style="color: #6b7280; font-size: 0.9rem; margin: 0;">
-                Audio Transcription Service v2.0 | Powered by OpenAI
-            </p>
         </div>
     """)
-# ====== 掛載 Gradio 到 FastAPI ======
 app = gr.mount_gradio_app(fastapi_app, demo, path="/")
 # ====== 啟動 ======
 if __name__ == "__main__":
     print("\n" + "="*60)
-    print("🚀 啟動 FastAPI + Gradio 應用")
-    print("📱 同步 API: /api/transcribe")
-    print("🌐 網頁介面: /")
     print("="*60 + "\n")
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)

 print("===== 🚀 啟動中 =====")
 print(f"APP_PASSWORD: {'✅ 已載入' if PASSWORD else '❌ 未載入'}")
+# ====== 工具函數 ======
 MIME_EXT = {
     "audio/mp4": "m4a", "audio/m4a": "m4a", "audio/aac": "aac",
     "audio/mpeg": "mp3", "audio/wav": "wav", "audio/x-wav": "wav",
 def _dataurl_to_file(data_url: str, orig_name: str | None = None) -> str:
     """將 data URL 轉換為本地檔案"""
     try:
         header, b64 = data_url.split(",", 1)
     except ValueError:
+        raise ValueError("Invalid data URL format")
     mime = header.split(";")[0].split(":", 1)[-1].strip()
     ext = MIME_EXT.get(mime) or (mimetypes.guess_extension(mime) or "m4a").lstrip(".")
     fname = orig_name if (orig_name and "." in orig_name) else f"upload_{uuid.uuid4().hex}.{ext}"
     with open(fname, "wb") as f:
         f.write(base64.b64decode(b64))
     return fname
 def _extract_effective_path(file_obj) -> str:
     """從各種格式中提取有效檔案路徑"""
     # 字串模式
     if isinstance(file_obj, str):
         s = file_obj.strip().strip('"')
         if s.startswith("data:"):
             return _dataurl_to_file(s, None)
         if os.path.isfile(s):
             return s
     # 字典模式
     if isinstance(file_obj, dict):
         data = file_obj.get("data")
         if isinstance(data, str) and data.startswith("data:"):
             return _dataurl_to_file(data, file_obj.get("orig_name"))
         p = str(file_obj.get("path") or "").strip().strip('"')
         if p and os.path.isfile(p):
     raise FileNotFoundError("Cannot parse uploaded file")
 def split_audio(path):
     """將音訊檔案分割成多個小於 25MB 的片段"""
     size = os.path.getsize(path)
     if size <= MAX_SIZE:
         return [path]
     audio = AudioSegment.from_file(path)
     n = int(size / MAX_SIZE) + 1
     chunk_ms = len(audio) / n
     parts = []
     for i in range(n):
         fn = f"chunk_{i+1}.wav"
         parts.append(fn)
     return parts
 def transcribe_core(path, model="whisper-1"):
     """使用 Whisper 進行語音轉錄，並使用 GPT 進行繁簡轉換和摘要"""
     print(f"\n{'='*60}")
         except:
             pass
+    # 分割並轉錄
     chunks = split_audio(path)
     raw = []
     for i, c in enumerate(chunks, 1):
         print(f"[transcribe_core] 轉錄片段 {i}/{len(chunks)}")
                 model=model, file=af, response_format="text"
             )
             raw.append(txt)
     raw_txt = "\n".join(raw)
     # 簡轉繁
     conv = client.chat.completions.create(
         model="gpt-4o-mini",
         messages=[
         temperature=0.0
     )
     trad = conv.choices[0].message.content.strip()
     # AI 摘要
     summ = client.chat.completions.create(
         model="gpt-4o-mini",
         messages=[
     summary = summ.choices[0].message.content.strip()
     total_time = time.time() - start_time
+    print(f"[transcribe_core] ✅ 全部完成! 總耗時: {total_time:.1f}秒\n")
     return trad, summary
 # ====== Gradio UI 函式 ======
def transcribe_web(password, audio_file):
    """Handle a transcription request submitted through the web UI.

    Returns a 3-tuple ``(status message, transcription, summary)``. The last
    two items are empty strings whenever the request is rejected or fails.
    """
    print("\n🌐 [WEB] 收到網頁請求")

    # Reject a missing or mismatching password before doing any work.
    password_ok = bool(password) and password.strip() == PASSWORD
    if not password_ok:
        return "❌ Incorrect password. Please try again.", "", ""

    # Nothing to transcribe without an upload.
    if not audio_file:
        return "⚠️ Please upload an audio file first.", "", ""

    try:
        # Resolve the upload to a local file path, then run the pipeline.
        source_path = _extract_effective_path(audio_file)
        print(f"[WEB] 檔案路徑: {source_path}")

        transcript, digest = transcribe_core(source_path)

        # Status line includes the transcript length in characters.
        message = (
            "✅ Transcription completed successfully!\n"
            f"📝 Total characters: {len(transcript)}"
        )
        print("[WEB] ✅ 成功完成")
        return message, transcript, digest
    except Exception as exc:
        import traceback

        # Full traceback goes to the log; the UI only sees the message.
        print(f"❌ [WEB] 錯誤:\n{traceback.format_exc()}")
        return f"❌ Error: {exc!s}", "", ""
+# ====== FastAPI 應用 ======
 fastapi_app = FastAPI()
 fastapi_app.add_middleware(
     CORSMiddleware,
     allow_origins=["*"],
     allow_headers=["*"],
 )
 @fastapi_app.post("/api/transcribe")
+async def api_transcribe(request: Request):
+    """API 端點 - 用於手機等外部調用"""
     try:
         body = await request.json()
+        print(f"\n📱 [API] 收到 API 請求")
+        # 驗證密碼
         password = body.get("password", "")
         if password.strip() != PASSWORD:
             return JSONResponse(
                 status_code=401,
                 content={"status": "error", "error": "Password incorrect"}
             )
+        # 檢查檔案資料
         file_data = body.get("file_data", "")
         file_name = body.get("file_name", "recording.m4a")
         if not file_data or not file_data.startswith("data:"):
             return JSONResponse(
                 status_code=400,
                 content={"status": "error", "error": "Invalid file data format"}
             )
+        # 處理檔案
         file_dict = {"data": file_data, "orig_name": file_name}
         path = _extract_effective_path(file_dict)
+        print(f"[API] 檔案解析成功: {path}")
+        # 轉錄
         text, summary = transcribe_core(path)
         result = {
             "summary": summary
         }
+        print(f"[API] ✅ 成功完成\n")
         return JSONResponse(content=result)
     except Exception as e:
         import traceback
         error_trace = traceback.format_exc()
+        print(f"❌ [API] 錯誤:\n{error_trace}\n")
         return JSONResponse(
             status_code=500,
             content={"status": "error", "error": str(e)}
         )
+# ====== 自定義樣式 ======
 custom_css = """
+/* 全局設定 */
+* {
+    font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
+}
 .gradio-container {
+    max-width: 1400px !important;
+    margin: 0 auto !important;
 }
+/* 主容器 */
+.main-container {
+    padding: 2rem;
+}
+/* 標題區 */
+.hero-section {
     text-align: center;
+    padding: 3rem 2rem;
     background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
+    border-radius: 16px;
+    margin-bottom: 3rem;
+    box-shadow: 0 8px 32px rgba(102, 126, 234, 0.3);
 }
+.hero-section h1 {
+    color: white;
+    font-size: 2.5rem;
     font-weight: 700;
+    margin: 0 0 0.5rem 0;
+    letter-spacing: -0.02em;
 }
+.hero-section p {
+    color: rgba(255, 255, 255, 0.9);
+    font-size: 1.15rem;
     margin: 0;
 }
+/* 卡片樣式 */
+.card {
+    background: white;
+    border-radius: 12px;
+    padding: 2rem;
+    box-shadow: 0 4px 16px rgba(0, 0, 0, 0.08);
+    margin-bottom: 1.5rem;
+}
+.card h2 {
+    font-size: 1.5rem;
+    font-weight: 600;
+    margin: 0 0 1.5rem 0;
+    color: #1f2937;
+}
+/* 輸入框樣式 */
+.input-group {
+    margin-bottom: 1.5rem;
+}
+.input-group label {
+    display: block;
+    font-weight: 600;
+    color: #374151;
+    margin-bottom: 0.5rem;
+    font-size: 0.95rem;
+}
+input[type="password"],
+textarea {
+    width: 100%;
+    padding: 0.75rem;
+    border: 2px solid #e5e7eb;
+    border-radius: 8px;
+    font-size: 0.95rem;
+    transition: all 0.2s;
+}
+input[type="password"]:focus,
+textarea:focus {
+    outline: none;
+    border-color: #667eea;
+    box-shadow: 0 0 0 3px rgba(102, 126, 234, 0.1);
+}
+/* 按鈕樣式 */
+button.primary-btn {
+    width: 100%;
+    padding: 1rem 2rem !important;
     background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
     border: none !important;
     color: white !important;
+    font-size: 1.1rem !important;
     font-weight: 600 !important;
+    border-radius: 10px !important;
+    cursor: pointer !important;
+    transition: all 0.3s !important;
+    box-shadow: 0 4px 12px rgba(102, 126, 234, 0.3) !important;
 }
+button.primary-btn:hover {
+    transform: translateY(-2px) !important;
+    box-shadow: 0 6px 20px rgba(102, 126, 234, 0.4) !important;
+}
+/* 檔案上傳區 */
+.file-upload-area {
+    border: 2px dashed #d1d5db;
+    border-radius: 12px;
+    padding: 2.5rem;
+    text-align: center;
+    background: #f9fafb;
+    transition: all 0.3s;
+    cursor: pointer;
+}
+.file-upload-area:hover {
+    border-color: #667eea;
+    background: #f0f4ff;
+}
+/* 狀態框 */
+.status-box {
+    padding: 1rem;
+    border-radius: 8px;
+    margin-bottom: 1rem;
+    font-size: 0.95rem;
+    line-height: 1.5;
+}
+.status-success {
+    background: #d1fae5;
+    border-left: 4px solid #10b981;
+    color: #065f46;
+}
+.status-error {
+    background: #fee2e2;
+    border-left: 4px solid #ef4444;
+    color: #991b1b;
+}
+.status-warning {
+    background: #fef3c7;
+    border-left: 4px solid #f59e0b;
+    color: #92400e;
+}
+/* 結果文字框 */
+textarea.result-text {
+    min-height: 200px !important;
+    font-family: "SF Mono", Monaco, monospace !important;
+    font-size: 0.9rem !important;
     line-height: 1.6 !important;
+    background: #f9fafb !important;
 }
+/* 資訊提示 */
+.info-banner {
+    background: #eff6ff;
+    border: 1px solid #bfdbfe;
+    border-radius: 8px;
     padding: 1rem;
     margin: 1rem 0;
     font-size: 0.9rem;
+    color: #1e40af;
 }
+/* 分隔線 */
+.divider {
+    height: 1px;
+    background: #e5e7eb;
+    margin: 2rem 0;
 }
+/* API 文檔區 */
+.api-section {
+    background: #f9fafb;
+    border-radius: 12px;
+    padding: 2rem;
+    margin-top: 2rem;
+}
+.api-section h3 {
+    font-size: 1.25rem;
+    font-weight: 600;
+    color: #1f2937;
+    margin: 0 0 1rem 0;
+}
+.api-endpoint {
+    background: #1f2937;
+    color: #f3f4f6;
+    padding: 1rem;
+    border-radius: 8px;
+    font-family: monospace;
+    font-size: 0.9rem;
+    margin: 1rem 0;
+}
+/* 響應式設計 */
+@media (max-width: 768px) {
+    .hero-section h1 {
+        font-size: 2rem;
+    }
+    .card {
+        padding: 1.5rem;
+    }
 }
 """
+# ====== Gradio 介面 ======
with gr.Blocks(css=custom_css, theme=gr.themes.Soft(), title="Audio Transcription Service") as demo:
    # Header banner: a single self-contained HTML fragment.
    gr.HTML("""
        <div class="hero-section">
            <h1>🎧 Audio Transcription Service</h1>
            <p>AI-Powered Speech Recognition & Summarization</p>
        </div>
    """)

    # Main upload area.
    # The "card" class is attached to a layout container rather than emitted as
    # an opening <div> in one gr.HTML and a closing </div> in another: each
    # gr.HTML renders inside its own wrapper element, so split tags cannot
    # enclose the components created between them.
    with gr.Column(elem_classes="card"):
        gr.Markdown("## 🎵 Upload & Transcribe")
        with gr.Row():
            # Left column: credentials, file picker and submit button.
            with gr.Column(scale=1):
                password_input = gr.Textbox(
                    label="🔐 Password",
                    type="password",
                    placeholder="Enter password",
                    elem_classes="input-group"
                )
                audio_input = gr.File(
                    label="📁 Audio File",
                    file_types=["audio", ".mp4"],
                    file_count="single",
                    elem_classes="file-upload-area"
                )
                gr.HTML("""
                <div class="info-banner">
                    <strong>💡 Supported formats:</strong> MP3, M4A, WAV, OGG, WEBM, MP4<br>
                    <strong>📦 File size:</strong> Automatic chunking for large files
                </div>
            """)
                submit_button = gr.Button(
                    "🚀 Start Transcription",
                    variant="primary",
                    elem_classes="primary-btn"
                )
            # Right column: status line, transcription and summary outputs.
            with gr.Column(scale=2):
                status_output = gr.Textbox(
                    label="📊 Status",
                    interactive=False,
                    lines=2,
                    elem_classes="status-box"
                )
                transcription_output = gr.Textbox(
                    label="📝 Transcription Result",
                    lines=15,
                    placeholder="Transcription will appear here...",
                    show_copy_button=True,
                    elem_classes="result-text"
                )
                summary_output = gr.Textbox(
                    label="💡 AI Summary",
                    lines=6,
                    placeholder="AI-generated summary will appear here...",
                    show_copy_button=True,
                    elem_classes="result-text"
                )

    # API documentation, wrapped in a real container for the same reason as
    # the card above.
    with gr.Column(elem_classes="api-section"):
        gr.Markdown("## 📱 API Integration")
        gr.Markdown("""
### For Mobile Apps & External Services
**Endpoint:** `POST /api/transcribe`
**Request Body (JSON):**
```json
{
  "password": "your_password",
  "file_data": "data:audio/m4a;base64,...",
  "file_name": "recording.m4a"
}
```
**Response:**
```json
{
  "status": "success",
  "transcription": "Full text...",
  "summary": "Summary..."
}
```
**Features:**
- ✅ Fully synchronous - returns complete results
- ✅ Automatic file chunking for large files
- ✅ Traditional Chinese output
- ✅ AI-powered summarization
**Use Cases:**
- iPhone Shortcuts automation
- Mobile app integration
- Webhook processing
- Batch transcription systems
    """)

    # Footer
    gr.HTML("""
        <div style="text-align: center; margin-top: 3rem; padding: 1.5rem; color: #6b7280; font-size: 0.9rem;">
            <p><strong>Audio Transcription Service</strong> v2.0</p>
            <p>Powered by OpenAI Whisper & GPT-4</p>
        </div>
    """)

    # Wire the submit button to the web handler.
    submit_button.click(
        fn=transcribe_web,
        inputs=[password_input, audio_input],
        outputs=[status_output, transcription_output, summary_output]
    )
+# ====== 掛載到 FastAPI ======
 app = gr.mount_gradio_app(fastapi_app, demo, path="/")
 # ====== 啟動 ======
 if __name__ == "__main__":
     # Print a short startup banner, then serve the combined FastAPI + Gradio
     # app with uvicorn on all interfaces, port 7860.
     rule = "=" * 60
     startup_lines = (
         "\n" + rule,
         "🚀 啟動服務",
         "🌐 網頁介面: http://0.0.0.0:7860",
         "📱 API 端點: http://0.0.0.0:7860/api/transcribe",
         rule + "\n",
     )
     for line in startup_lines:
         print(line)

     # Imported here, after the banner, exactly as the script did originally.
     import uvicorn

     uvicorn.run(app, host="0.0.0.0", port=7860)