Spaces:

MichaelChou0806
/

LINE_audio_transcript

Sleeping

App Files Community

MichaelChou0806 committed on Oct 8, 2025

Commit

bcd946f

verified ·

1 Parent(s): 2c881ff

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -45

app.py CHANGED Viewed

@@ -1,23 +1,29 @@
 import os
 import time
 import shutil
-from pydub import AudioSegment
-from openai import OpenAI
 import gradio as gr
-from fastapi import FastAPI, File, UploadFile
 # ========================
-# 🔐 基本設定
 # ========================
-PASSWORD = os.getenv("APP_PASSWORD", "defaultpass")
-MAX_SIZE = 25 * 1024 * 1024
-client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
-# FastAPI App for捷徑 API
-app = FastAPI()
 # ========================
-# 🎧 音訊轉錄核心
 # ========================
 def split_audio_if_needed(path: str):
     size = os.path.getsize(path)
@@ -34,22 +40,11 @@ def split_audio_if_needed(path: str):
     return parts
 def transcribe_core(path: str, model: str = "whisper-1"):
-    if path.lower().endswith(".mp4"):
-        fixed = path[:-4] + ".m4a"
-        try:
-            shutil.copy(path, fixed)
-            path = fixed
-            print("🔧 已自動修正 mp4 → m4a")
-        except Exception as e:
-            print(f"⚠️ mp4→m4a 轉檔失敗：{e}")
     chunks = split_audio_if_needed(path)
     txts = []
     for f in chunks:
         with open(f, "rb") as af:
-            t = client.audio.transcriptions.create(
-                model=model, file=af, response_format="text"
-            )
             txts.append(t)
     full = "\n".join(txts)
     summ = client.chat.completions.create(
@@ -60,52 +55,52 @@ def transcribe_core(path: str, model: str = "whisper-1"):
     return full, summ
 # ========================
-# 🌐 FastAPI 端點（捷徑用）
 # ========================
 @app.post("/api/transcribe")
-async def api_transcribe(file: UploadFile = File(...)):
-    """供 iPhone 捷徑上傳音訊並取得 JSON"""
     temp = file.filename
     with open(temp, "wb") as f:
         f.write(await file.read())
     text, summary = transcribe_core(temp)
     os.remove(temp)
-    return {"text": text, "summary": summary}
-@app.get("/health")
-def health():
-    """捷徑可先 ping 這個確認服務運作中"""
-    return {"status": "ok", "time": int(time.time())}
 # ========================
-# 💬 Gradio 介面
 # ========================
-def transcribe_with_pw(password, file):
-    if password.strip() != PASSWORD:
         return "❌ 密碼錯誤", "", ""
     if not file:
-        return "⚠️ 未選擇檔案", "", ""
     text, summary = transcribe_core(file.name)
     return "✅ 完成", text, summary
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("## 🎧 LINE 語音轉錄與摘要工具（支援 .m4a / .mp4）")
     pw = gr.Textbox(label="輸入密碼", type="password")
     f = gr.File(label="上傳音訊檔 (.m4a/.mp3/.wav/.mp4)")
     run = gr.Button("開始轉錄 🚀")
     s = gr.Textbox(label="狀態", interactive=False)
     t = gr.Textbox(label="逐字稿", lines=10)
     su = gr.Textbox(label="摘要", lines=8)
-    run.click(transcribe_with_pw, [pw, f], [s, t, su])
-# ========================
-# 🚀 啟動（單一埠）
-# ========================
-# 讓 Gradio 介面掛載到 FastAPI
 gr.mount_gradio_app(app, demo, path="/")
-# Hugging Face 自動綁定 port=7860，不用手動設定
-if __name__ == "__main__":
-    import uvicorn
-    uvicorn.run(app, host="0.0.0.0", port=7860)

 import os
 import time
 import shutil
 import gradio as gr
+from fastapi import FastAPI, File, UploadFile, Form, HTTPException
+from openai import OpenAI
+from pydub import AudioSegment
+from fastapi.responses import JSONResponse
 # ========================
+# 🔐 環境變數 / Secret 修正
 # ========================
+# Hugging Face 有時不會正確傳入 Secret，所以做雙重保險：
+OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY") or os.getenv("OPENAI_API_KEY")
+APP_PASSWORD = os.environ.get("APP_PASSWORD") or os.getenv("APP_PASSWORD")
+print("===== 🚀 啟動中 =====")
+print(f"OPENAI_API_KEY: {'✅ 已載入' if OPENAI_API_KEY else '❌ 未載入'}")
+print(f"APP_PASSWORD: {'✅ 已載入' if APP_PASSWORD else '❌ 未載入'}")
+client = OpenAI(api_key=OPENAI_API_KEY)
+MAX_SIZE = 25 * 1024 * 1024
+app = FastAPI(title="LINE Audio Transcriber")
 # ========================
+# 🎧 核心轉錄函式
 # ========================
 def split_audio_if_needed(path: str):
     size = os.path.getsize(path)
     return parts
 def transcribe_core(path: str, model: str = "whisper-1"):
     chunks = split_audio_if_needed(path)
     txts = []
     for f in chunks:
         with open(f, "rb") as af:
+            t = client.audio.transcriptions.create(model=model, file=af, response_format="text")
             txts.append(t)
     full = "\n".join(txts)
     summ = client.chat.completions.create(
     return full, summ
 # ========================
+# 🌐 API 路由 (for 捷徑)
 # ========================
 @app.post("/api/transcribe")
+async def api_transcribe(
+    file: UploadFile = File(...),
+    token: str = Form(default=None)
+):
+    """捷徑可 POST 來呼叫語音轉錄"""
+    if APP_PASSWORD and token != APP_PASSWORD:
+        raise HTTPException(status_code=403, detail="Forbidden: invalid token")
     temp = file.filename
     with open(temp, "wb") as f:
         f.write(await file.read())
     text, summary = transcribe_core(temp)
     os.remove(temp)
+    return JSONResponse({"text": text, "summary": summary})
+@app.get("/ping")
+def ping():
+    return {"status": "ok", "key": bool(OPENAI_API_KEY), "pw": bool(APP_PASSWORD)}
 # ========================
+# 💬 Gradio 前端
 # ========================
+def gradio_ui(password, file):
+    if APP_PASSWORD and password.strip() != APP_PASSWORD:
         return "❌ 密碼錯誤", "", ""
     if not file:
+        return "⚠️ 未上傳音訊", "", ""
     text, summary = transcribe_core(file.name)
     return "✅ 完成", text, summary
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("## 🎧 LINE 語音轉錄與摘要工具")
     pw = gr.Textbox(label="輸入密碼", type="password")
     f = gr.File(label="上傳音訊檔 (.m4a/.mp3/.wav/.mp4)")
     run = gr.Button("開始轉錄 🚀")
     s = gr.Textbox(label="狀態", interactive=False)
     t = gr.Textbox(label="逐字稿", lines=10)
     su = gr.Textbox(label="摘要", lines=8)
+    run.click(gradio_ui, [pw, f], [s, t, su])
+# 掛上 Gradio
 gr.mount_gradio_app(app, demo, path="/")
+# ✅ Hugging Face Spaces 需要這行來啟動 FastAPI app
+application = app