Spaces:

MichaelChou0806
/

LINE_audio_transcript

Sleeping

App Files Files Community

MichaelChou0806 committed on Oct 8, 2025

Commit

c313f52

verified ·

1 Parent(s): 8fa55d3

Update app.py

Browse files

Files changed (1) hide show

app.py +55 -46

app.py CHANGED Viewed

@@ -4,26 +4,23 @@ import shutil
 from pydub import AudioSegment
 from openai import OpenAI
 import gradio as gr
-from fastapi import FastAPI, File, UploadFile, Form, HTTPException
-from fastapi.responses import JSONResponse
-# ======================================================
-# 🔐 基本設定（支援 Secrets）
-# ======================================================
-OPENAI_API_KEY = os.environ.get("OPENAI_API_KEY")
-APP_PASSWORD = os.environ.get("APP_PASSWORD")
-print("===== 🚀 啟動中 =====")
-print(f"OPENAI_API_KEY: {'✅ 已載入' if OPENAI_API_KEY else '❌ 未載入'}")
-print(f"APP_PASSWORD: {'✅ 已載入' if APP_PASSWORD else '❌ 未載入'}")
-print(APP_PASSWORD)
-client = OpenAI(api_key=OPENAI_API_KEY)
-MAX_SIZE = 25 * 1024 * 1024
-# ======================================================
-# 🎧 音訊處理核心
-# ======================================================
 def split_audio_if_needed(path: str):
     size = os.path.getsize(path)
     if size <= MAX_SIZE:
@@ -38,56 +35,62 @@ def split_audio_if_needed(path: str):
         parts.append(fn)
     return parts
 def transcribe_core(path: str, model: str = "whisper-1"):
     chunks = split_audio_if_needed(path)
     txts = []
     for f in chunks:
         with open(f, "rb") as af:
-            t = client.audio.transcriptions.create(model=model, file=af, response_format="text")
             txts.append(t)
     full = "\n".join(txts)
     summ = client.chat.completions.create(
         model="gpt-4o-mini",
         messages=[{"role": "user", "content": f"請用繁體中文摘要以下內容：\n{full}"}],
         temperature=0.4,
     ).choices[0].message.content.strip()
     return full, summ
-# ======================================================
-# 🌐 FastAPI 主要端點
-# ======================================================
-app = FastAPI(title="LINE Audio Transcriber")
-@app.get("/ping")
-def ping():
-    return {"status": "ok", "key": bool(OPENAI_API_KEY), "pw": bool(APP_PASSWORD)}
 @app.post("/api/transcribe")
-async def api_transcribe(
-    file: UploadFile = File(...),
-    token: str = Form(default=None)
-):
-    """捷徑上傳音訊"""
-    if APP_PASSWORD and token != APP_PASSWORD:
-        raise HTTPException(status_code=403, detail="Forbidden: invalid token")
     temp = file.filename
     with open(temp, "wb") as f:
         f.write(await file.read())
     text, summary = transcribe_core(temp)
     os.remove(temp)
-    return JSONResponse({"text": text, "summary": summary})
-# ======================================================
 # 💬 Gradio 介面
-# ======================================================
 def transcribe_with_pw(password, file):
-    if APP_PASSWORD and password.strip() != APP_PASSWORD:
         return "❌ 密碼錯誤", "", ""
     if not file:
-        return "⚠️ 未上傳音訊", "", ""
     text, summary = transcribe_core(file.name)
     return "✅ 完成", text, summary
@@ -99,10 +102,16 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     s = gr.Textbox(label="狀態", interactive=False)
     t = gr.Textbox(label="逐字稿", lines=10)
     su = gr.Textbox(label="摘要", lines=8)
     run.click(transcribe_with_pw, [pw, f], [s, t, su])
-# ======================================================
-# 🚀 關鍵啟動（讓 HF 正確偵測）
-# ======================================================
-from gradio.routes import mount_gradio_app
-application = mount_gradio_app(app, demo, path="/")

 from pydub import AudioSegment
 from openai import OpenAI
 import gradio as gr
+from fastapi import FastAPI, File, UploadFile
+# ========================
+# 🔐 Basic configuration
+# ========================
+# NOTE(review): when APP_PASSWORD is unset the UI falls back to the publicly
+# visible "defaultpass"; configure the secret in any real deployment.
+PASSWORD = os.getenv("APP_PASSWORD", "defaultpass")
+# 25 MiB; split_audio_if_needed() compares file sizes against this limit.
+MAX_SIZE = 25 * 1024 * 1024
+client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
+# Log only whether the password secret is configured -- never its value.
+print(f"APP_PASSWORD: {'✅ 已載入' if os.getenv('APP_PASSWORD') else '❌ 未載入'}")
+# FastAPI app serving the iPhone Shortcuts API
+app = FastAPI()
+# ========================
+# 🎧 音訊轉錄核心
+# ========================
 def split_audio_if_needed(path: str):
     size = os.path.getsize(path)
     if size <= MAX_SIZE:
         parts.append(fn)
     return parts
 def transcribe_core(path: str, model: str = "whisper-1"):
+    """Transcribe the audio file at *path* and summarise the transcript.
+
+    A file whose name ends in ``.mp4`` is first copied to a sibling ``.m4a``
+    path and that copy is transcribed instead; the copy is deleted again
+    before returning. Each chunk from ``split_audio_if_needed`` is sent to
+    the transcription API, the results are joined with newlines, and a
+    Traditional-Chinese summary is requested from ``gpt-4o-mini``.
+
+    Args:
+        path: Path of the audio file to transcribe.
+        model: Transcription model name passed to the OpenAI client.
+
+    Returns:
+        A ``(full_transcript, summary)`` tuple.
+    """
+    fixed = None
+    if path.lower().endswith(".mp4"):
+        candidate = path[:-4] + ".m4a"
+        try:
+            shutil.copy(path, candidate)
+        except OSError as e:
+            # Best effort: fall back to transcribing the original file.
+            print(f"⚠️ mp4→m4a 轉檔失敗：{e}")
+        else:
+            fixed = path = candidate
+            print("🔧 已自動修正 mp4 → m4a")
+    try:
+        chunks = split_audio_if_needed(path)
+        txts = []
+        for f in chunks:
+            with open(f, "rb") as af:
+                t = client.audio.transcriptions.create(
+                    model=model, file=af, response_format="text"
+                )
+                txts.append(t)
+        full = "\n".join(txts)
+        summ = client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=[{"role": "user", "content": f"請用繁體中文摘要以下內容：\n{full}"}],
+            temperature=0.4,
+        ).choices[0].message.content.strip()
+        return full, summ
+    finally:
+        # Remove the temporary .m4a copy so repeated calls do not leak files.
+        if fixed is not None and os.path.exists(fixed):
+            os.remove(fixed)
+# ========================
+# 🌐 FastAPI 端點（捷徑用）
+# ========================
 @app.post("/api/transcribe")
 async def api_transcribe(file: UploadFile = File(...)):
+    """Accept an audio upload from an iPhone Shortcut and return JSON.
+
+    The upload is written to a freshly created temporary file (keeping only
+    the extension of the client-supplied name), passed to
+    ``transcribe_core``, and the temporary file is removed afterwards even
+    when transcription raises.
+
+    Args:
+        file: The uploaded audio file.
+
+    Returns:
+        A dict with the keys ``text`` (transcript) and ``summary``.
+    """
+    # Local import keeps this block self-contained.
+    import tempfile
+    # NOTE(review): unlike the Gradio UI, this endpoint performs no password
+    # check -- confirm that unauthenticated access is intended.
+    # Never use the client-controlled filename as a path: take only its
+    # extension so traversal, overwrites, and name collisions are impossible.
+    suffix = os.path.splitext(os.path.basename(file.filename or ""))[1]
+    with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as f:
+        temp = f.name
         f.write(await file.read())
+    try:
+        text, summary = transcribe_core(temp)
+    finally:
+        os.remove(temp)
+    return {"text": text, "summary": summary}
+@app.get("/health")
+def health():
+    """Liveness probe that Shortcuts can ping to confirm the service is up.
+
+    Returns:
+        A dict with ``status`` set to ``"ok"`` and ``time`` set to the
+        current Unix timestamp truncated to whole seconds.
+    """
+    # Local import: no file-level ``import time`` is visible in this change,
+    # so importing here guarantees the name resolves.
+    import time
+    return {"status": "ok", "time": int(time.time())}
+# ========================
 # 💬 Gradio 介面
+# ========================
 def transcribe_with_pw(password, file):
+    """Gradio click handler: check the password, then transcribe the upload.
+
+    Args:
+        password: Text entered in the password box; ``None`` is treated as
+            an empty string.
+        file: The uploaded file object; its ``name`` attribute is passed to
+            ``transcribe_core`` as the path.
+
+    Returns:
+        A ``(status, transcript, summary)`` tuple; transcript and summary
+        are empty strings when the request is rejected.
+    """
+    # Local import keeps this block self-contained.
+    import hmac
+    # Compare as bytes in constant time; compare_digest rejects non-ASCII str.
+    supplied = (password or "").strip().encode("utf-8")
+    if not hmac.compare_digest(supplied, PASSWORD.encode("utf-8")):
         return "❌ 密碼錯誤", "", ""
     if not file:
+        return "⚠️ 未選擇檔案", "", ""
     text, summary = transcribe_core(file.name)
     return "✅ 完成", text, summary
     s = gr.Textbox(label="狀態", interactive=False)
     t = gr.Textbox(label="逐字稿", lines=10)
     su = gr.Textbox(label="摘要", lines=8)
     run.click(transcribe_with_pw, [pw, f], [s, t, su])
+# ========================
+# 🚀 Startup (single port)
+# ========================
+# Mount the Gradio UI onto the FastAPI app
+gr.mount_gradio_app(app, demo, path="/")
+# Hugging Face binds port=7860 automatically, no manual configuration needed
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=7860)