Spaces:

MichaelChou0806
/

LINE_audio_transcript

Sleeping

App Files Files Community

MichaelChou0806 committed on Oct 8, 2025

Commit

cf686cb

verified ·

1 Parent(s): d634404

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -175

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ import shutil
 from pydub import AudioSegment
 from openai import OpenAI
 import gradio as gr
-from fastapi import FastAPI, File, UploadFile, Form, HTTPException
 # ======================================================
 # 🔐 設定區
@@ -17,58 +17,6 @@ print("===== 🚀 啟動中 =====")
 print(f"APP_PASSWORD: {'✅ 已載入' if PASSWORD else '❌ 未載入'}")
 print(f"目前密碼內容：{PASSWORD}")
-# ======================================================
-# ⚔️ 防暴力破解
-# ======================================================
-MAX_FAILED_IN_WINDOW = 10
-WINDOW_SECONDS = 24 * 3600
-LOCK_DURATION_SECONDS = 24 * 3600
-SHORT_BURST_LIMIT = 5
-SHORT_BURST_SECONDS = 60
-attempts = {}
-locked = {}
-def _now():
-    return int(time.time())
-def prune_old_attempts(sid):
-    cutoff = _now() - WINDOW_SECONDS
-    if sid in attempts:
-        attempts[sid] = [t for t in attempts[sid] if t >= cutoff]
-        if not attempts[sid]:
-            del attempts[sid]
-def check_lock(sid):
-    if sid in locked:
-        if _now() < locked[sid]:
-            remain = locked[sid] - _now()
-            return True, f"🔒 已被鎖定，請 {remain // 60} 分鐘後再試。"
-        else:
-            locked.pop(sid, None)
-            attempts.pop(sid, None)
-    prune_old_attempts(sid)
-    cnt = len(attempts.get(sid, []))
-    if cnt >= MAX_FAILED_IN_WINDOW:
-        locked[sid] = _now() + LOCK_DURATION_SECONDS
-        return True, f"🔒 嘗試過多，已鎖定 24 小時。"
-    return False, ""
-def record_failed_attempt(sid):
-    now = _now()
-    attempts.setdefault(sid, []).append(now)
-    prune_old_attempts(sid)
-    recent_cutoff = now - SHORT_BURST_SECONDS
-    recent = [t for t in attempts[sid] if t >= recent_cutoff]
-    if len(recent) >= SHORT_BURST_LIMIT:
-        locked[sid] = now + 300
-        return len(attempts[sid]), "⚠️ 多次快速嘗試，暫時鎖定5分鐘。"
-    return len(attempts[sid]), ""
-def clear_attempts(sid):
-    attempts.pop(sid, None)
-    locked.pop(sid, None)
 # ======================================================
 # 🎧 音訊轉錄核心
 # ======================================================
@@ -88,8 +36,7 @@ def split_audio_if_needed(path):
         files.append(fn)
     return files
-def transcribe_core(path, model):
-    # 1️⃣ 修正 LINE 語音 mp4 假副檔名
     if path and path.lower().endswith(".mp4"):
         fixed_path = path[:-4] + ".m4a"
         try:
@@ -97,9 +44,8 @@ def transcribe_core(path, model):
             path = fixed_path
             print("🔧 已自動修正 mp4 → m4a")
         except Exception as e:
-            print(f"⚠️ mp4→m4a 複製失敗：{e}，改用原檔嘗試")
-    # 2️⃣ Whisper 轉錄
     chunks = split_audio_if_needed(path)
     raw_parts = []
     for f in chunks:
@@ -112,7 +58,7 @@ def transcribe_core(path, model):
             raw_parts.append(res)
     full_raw = "\n".join(raw_parts)
-    # 3️⃣ 簡轉繁（不改寫內容）
     conv_prompt = (
         "請將以下內容完整轉換為「繁體中文（台灣用語）」：\n"
         "規則：1) 僅做簡→繁字形轉換；2) 不要意譯或改寫；3) 不要添加任何前後綴。\n"
@@ -128,11 +74,10 @@ def transcribe_core(path, model):
     )
     full_trad = trad_resp.choices[0].message.content.strip()
-    # 4️⃣ 生成繁體摘要（自動決定條列與否）
     sum_prompt = (
-        "請用台灣繁體中文撰寫摘要。"
-        "若內容資訊較多，可條列出重點；若內容簡短，請用一句話概述即可。"
-        "請勿添加前綴或評論，僅輸出摘要。\n\n" + full_trad
     )
     sum_resp = client.chat.completions.create(
         model="gpt-4o-mini",
@@ -143,126 +88,33 @@ def transcribe_core(path, model):
         temperature=0.2,
     )
     summ = sum_resp.choices[0].message.content.strip()
     return full_trad, summ
 # ======================================================
-# 🌐 FastAPI API（捷徑用）
 # ======================================================
-app = FastAPI(title="LINE Transcription API")
-@app.post("/api/transcribe")
-async def api_transcribe(
-    file: UploadFile = File(...),
-    token: str = Form(default=None)
-):
-    """供捷徑上傳音訊並取得 JSON"""
-    if token != PASSWORD:
-        raise HTTPException(status_code=403, detail="Invalid token")
-    temp = file.filename
-    with open(temp, "wb") as f:
-        f.write(await file.read())
-    text, summary = transcribe_core(temp, "whisper-1")
-    os.remove(temp)
-    return {"text": text, "summary": summary}
-@app.get("/health")
-def health():
-    """捷徑可 ping 這個確認服務運作中"""
-    return {"status": "ok", "time": int(time.time())}
-# ======================================================
-# 💬 Gradio 主介面
-# ======================================================
-def _normalize_upload_path(file_input):
-    if not file_input:
-        return None
-    if isinstance(file_input, str):
-        return file_input
-    if isinstance(file_input, list) and file_input:
-        return _normalize_upload_path(file_input[0])
-    path = getattr(file_input, "name", None)
-    if not path and isinstance(file_input, dict):
-        path = file_input.get("name") or file_input.get("path")
-    return path
-def transcribe_with_password(session_id, password, file_input, model_choice):
-    password = password.strip().replace(" ", "").replace("\u200b", "")
-    locked_flag, msg = check_lock(session_id)
-    if locked_flag:
-        return msg, "", ""
-    if password != PASSWORD:
-        cnt, msg2 = record_failed_attempt(session_id)
-        return msg2 or f"密碼錯誤（第 {cnt} 次）", "", ""
-    path = _normalize_upload_path(file_input)
-    if not path or not os.path.exists(path):
-        return "找不到上傳檔案，請重新選擇。", "", ""
-    clear_attempts(session_id)
-    full, summ = transcribe_core(path, model_choice)
-    return "✅ 轉錄完成", full, summ
-def ask_about_transcript(full_text, q):
-    if not full_text.strip():
-        return "⚠️ 尚未有轉錄內容"
-    if not q.strip():
-        return "請輸入問題"
-    prompt = f"以下是轉錄內容：\n{full_text}\n\n問題：{q}\n請用繁體中文回答。"
-    res = client.chat.completions.create(
-        model="gpt-4o-mini",
-        messages=[{"role":"user","content":prompt}],
-        temperature=0.6,
-    )
-    return res.choices[0].message.content.strip()
-# ======================================================
-# 🖥️ Gradio UI
-# ======================================================
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("## 🎧 語音轉錄與摘要工具（私人API勿轉傳｜支援 iPhone LINE .mp4）")
-    session_state = gr.State(value=None)
-    with gr.Row():
-        password_input = gr.Textbox(label="輸入密碼", placeholder="請輸入英文與數字（請切換成英文輸入法）", type="password", max_lines=1)
-        model_choice = gr.Dropdown(["whisper-1", "gpt-4o-mini-transcribe"], value="whisper-1", label="選擇模型")
-    file_input = gr.File(label="上傳音訊 / LINE 語音檔（支援 .m4a, .aac, .wav, .mp4）", file_count="single", file_types=["audio", ".mp4", ".m4a", ".aac", ".wav"])
-    transcribe_btn = gr.Button("開始轉錄與摘要 🚀")
-    status_box = gr.Textbox(label="狀態", interactive=False)
-    transcript_box = gr.Textbox(label="完整轉錄文字", lines=10)
-    copy_transcript = gr.Button("📋 複製轉錄文字")
-    summary_box = gr.Textbox(label="摘要結果", lines=10)
-    copy_summary = gr.Button("📋 複製摘要結果")
-    with gr.Accordion("💬 進一步問 AI", open=False):
-        user_q = gr.Textbox(label="輸入問題", lines=2)
-        ask_btn = gr.Button("詢問 AI 🤔")
-        ai_reply = gr.Textbox(label="AI 回覆", lines=6)
-        copy_reply = gr.Button("📋 複製 AI 回覆")
-    def init_session():
-        import uuid
-        return str(uuid.uuid4())
-    demo.load(init_session, None, session_state)
-    transcribe_btn.click(transcribe_with_password, [session_state, password_input, file_input, model_choice], [status_box, transcript_box, summary_box])
-    ask_btn.click(ask_about_transcript, [transcript_box, user_q], [ai_reply])
-    copy_js = """async (text) => {try {await navigator.clipboard.writeText(text); alert("✅ 已複製到剪貼簿！");} catch (e) {alert("❌ 複製失敗：" + e);}}"""
-    copy_transcript.click(fn=None, inputs=transcript_box, outputs=None, js=copy_js)
-    copy_summary.click(fn=None, inputs=summary_box, outputs=None, js=copy_js)
-    copy_reply.click(fn=None, inputs=ai_reply, outputs=None, js=copy_js)
 # ======================================================
-# 🚀 啟動（Hugging Face 最終穩定版）
 # ======================================================
-# ✅ Hugging Face 會自動搜尋變數 `app` 作為入口
-# 所以我們要在這裡重新指派回 FastAPI + Gradio 結合後的物件
-app = gr.mount_gradio_app(app, demo, path="/")
-# ✅ 不要在 Hugging Face 上手動啟動 uvicorn
-# 若你要在本機測試，再用 python app.py 啟動即可
 if __name__ == "__main__":
-    import uvicorn
-    print("🌐 本地測試模式啟動中：http://127.0.0.1:7860")
-    uvicorn.run(app, host="0.0.0.0", port=7860)

 from pydub import AudioSegment
 from openai import OpenAI
 import gradio as gr
+from fastapi import HTTPException
 # ======================================================
 # 🔐 設定區
 print(f"APP_PASSWORD: {'✅ 已載入' if PASSWORD else '❌ 未載入'}")
 print(f"目前密碼內容：{PASSWORD}")
 # ======================================================
 # 🎧 音訊轉錄核心
 # ======================================================
         files.append(fn)
     return files
+def transcribe_core(path, model="whisper-1"):
     if path and path.lower().endswith(".mp4"):
         fixed_path = path[:-4] + ".m4a"
         try:
             path = fixed_path
             print("🔧 已自動修正 mp4 → m4a")
         except Exception as e:
+            print(f"⚠️ mp4→m4a 轉檔失敗：{e}")
     chunks = split_audio_if_needed(path)
     raw_parts = []
     for f in chunks:
             raw_parts.append(res)
     full_raw = "\n".join(raw_parts)
+    # 簡轉繁
     conv_prompt = (
         "請將以下內容完整轉換為「繁體中文（台灣用語）」：\n"
         "規則：1) 僅做簡→繁字形轉換；2) 不要意譯或改寫；3) 不要添加任何前後綴。\n"
     )
     full_trad = trad_resp.choices[0].message.content.strip()
+    # 摘要
     sum_prompt = (
+        "請用台灣繁體中文撰寫摘要。若內容資訊多，可條列出重點；若內容簡短，請用一句話概述即可。\n\n"
+        + full_trad
     )
     sum_resp = client.chat.completions.create(
         model="gpt-4o-mini",
         temperature=0.2,
     )
     summ = sum_resp.choices[0].message.content.strip()
     return full_trad, summ
 # ======================================================
+# 💬 Gradio 介面
 # ======================================================
+def transcribe_with_password(password, file):
+    if password.strip() != PASSWORD:
+        raise HTTPException(status_code=403, detail="密碼錯誤 ❌")
+    if not file:
+        return "⚠️ 未選擇檔案", "", ""
+    text, summary = transcribe_core(file.name)
+    return "✅ 完成", text, summary
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("## 🎧 LINE 語音轉錄與摘要（支援 .m4a / .mp4）")
+    pw = gr.Textbox(label="輸入密碼", type="password")
+    f = gr.File(label="上傳音訊檔")
+    run = gr.Button("開始轉錄 🚀")
+    s = gr.Textbox(label="狀態", interactive=False)
+    t = gr.Textbox(label="轉錄結果", lines=10)
+    su = gr.Textbox(label="AI 摘要", lines=8)
+    run.click(transcribe_with_password, [pw, f], [s, t, su])
 # ======================================================
+# 🚀 啟動
 # ======================================================
 if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860)
+else:
+    demo.launch()