Spaces:

maylinejix
/

Transcript

Running

File size: 2,766 Bytes

import whisper
import tempfile
import os
from fastapi import FastAPI, UploadFile, File, Form
from fastapi.responses import JSONResponse, HTMLResponse
from fastapi.middleware.cors import CORSMiddleware
import uvicorn

app = FastAPI(title="Whisper Transcription API")

print("Loading Whisper model...")
model = whisper.load_model("base")
print("Model loaded.")

app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_methods=["*"],
    allow_headers=["*"],
)

@app.get("/", response_class=HTMLResponse)
async def root():
    return """
    <!DOCTYPE html>
    <html>
    <head>
        <title>Whisper Transcription API</title>
        <style>
            body { font-family: monospace; background: #0d0d0d; color: #e0e0e0; padding: 40px; }
            h1 { color: #7fff7f; }
            a { color: #7fbfff; }
            code { background: #1a1a1a; padding: 2px 6px; border-radius: 4px; }
        </style>
    </head>
    <body>
        <h1>🎙️ Whisper Transcription API</h1>
        <p>Status: <strong style="color:#7fff7f">Running</strong></p>
        <p>Endpoints:</p>
        <ul>
            <li><code>POST /transcribe</code> — Upload audio file, returns text</li>
            <li><code>GET /health</code> — Health check</li>
            <li><a href="/docs">📖 Swagger Docs</a></li>
        </ul>
        <p>Example curl:</p>
        <pre style="background:#1a1a1a;padding:16px;border-radius:8px;">
curl -X POST /transcribe \\
  -F "file=@audio.wav" \\
  -F "language=auto"
        </pre>
    </body>
    </html>
    """

@app.post("/transcribe")
async def transcribe(
    file: UploadFile = File(...),
    language: str = Form(default="auto")
):
    suffix = os.path.splitext(file.filename)[-1] if file.filename else ".wav"
    with tempfile.NamedTemporaryFile(suffix=suffix, delete=False) as tmp:
        content = await file.read()
        tmp.write(content)
        tmp_path = tmp.name

    try:
        lang = language if language != "auto" else None
        result = model.transcribe(tmp_path, language=lang)
        return JSONResponse({
            "text": result["text"].strip(),
            "language": result.get("language", "unknown"),
            "segments": [
                {
                    "start": round(s["start"], 2),
                    "end": round(s["end"], 2),
                    "text": s["text"].strip()
                }
                for s in result.get("segments", [])
            ]
        })
    except Exception as e:
        return JSONResponse({"error": str(e)}, status_code=500)
    finally:
        os.unlink(tmp_path)

@app.get("/health")
async def health():
    return {"status": "ok", "model": "whisper-base"}

if __name__ == "__main__":
    uvicorn.run(app, host="0.0.0.0", port=7860)