Spaces:

leekwoon
/

Whisper-FastAPI

Sleeping

dahyedahye committed on Sep 2, 2024

Commit

f8e3c2f

1 Parent(s): 0faa266

Add application file

Files changed (6) hide show

Dockerfile CHANGED Viewed

@@ -1,13 +1,35 @@
-FROM python:3.9
-RUN useradd -m -u 1000 user
-USER user
-ENV PATH="/home/user/.local/bin:$PATH"
-WORKDIR /app
-COPY --chown=user ./requirements.txt requirements.txt
-RUN pip install --no-cache-dir --upgrade -r requirements.txt
 COPY --chown=user . /app
 CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]

+FROM debian:bookworm-slim AS builder
+RUN apt-get update && \
+    apt-get install -y curl git python3 python3-pip python3-venv && \
+    rm -rf /var/lib/apt/lists/* /var/cache/apt/archives/* && \
+    mkdir -p /Whisper-WebUI
+WORKDIR /Whisper-WebUI
+COPY requirements.txt .
+RUN python3 -m venv venv && \
+    . venv/bin/activate && \
+    pip install --no-cache-dir -r requirements.txt
+FROM debian:bookworm-slim AS runtime
+RUN apt-get update && \
+    apt-get install -y curl ffmpeg python3 && \
+    rm -rf /var/lib/apt/lists/* /var/cache/apt/archives/*
+WORKDIR /Whisper-WebUI
+COPY . .
+COPY --from=builder /Whisper-WebUI/venv /Whisper-WebUI/venv
+VOLUME [ "/Whisper-WebUI/models" ]
+VOLUME [ "/Whisper-WebUI/outputs" ]
+ENV PATH="/Whisper-WebUI/venv/bin:$PATH"
+ENV LD_LIBRARY_PATH=/Whisper-WebUI/venv/lib64/python3.11/site-packages/nvidia/cublas/lib:/Whisper-WebUI/venv/lib64/python3.11/site-packages/nvidia/cudnn/lib
 COPY --chown=user . /app
 CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]

main.py CHANGED Viewed

@@ -1,10 +1,38 @@
-from fastapi import FastAPI
 app = FastAPI()
-@app.get("/hello")
-def hello():
     """
-    this test hello
     """
-    return {"hello": "you success deploy"}

+from fastapi import FastAPI, File, UploadFile
+from fastapi.responses import FileResponse
+import os
+import shutil
+from modules.whisper.whisper_factory import WhisperFactory
 app = FastAPI()
+# Initialize Whisper inference engine
+whisper_inf = WhisperFactory.create_whisper_inference(
+    whisper_type="faster-whisper",
+    whisper_model_dir=os.path.join("models", "Whisper"),
+    faster_whisper_model_dir=os.path.join("models", "Whisper", "faster-whisper"),
+    insanely_fast_whisper_model_dir=os.path.join("models", "Whisper", "insanely-fast-whisper"),
+    output_dir=os.path.join("outputs"),
+)
+@app.post("/upload-video/")
+async def upload_video(file: UploadFile = File(...)):
     """
+    Upload a video file and get the generated SRT file as a response.
     """
+    # Save the uploaded video file temporarily
+    input_video_path = os.path.join("temp", file.filename)
+    os.makedirs("temp", exist_ok=True)
+    with open(input_video_path, "wb") as buffer:
+        shutil.copyfileobj(file.file, buffer)
+    # Generate the subtitle file
+    output_srt_path = whisper_inf.transcribe_file(
+        input_video_path,
+        file_format="SRT",
+        add_timestamp=True
+    )
+    # Return the SRT file as a response
+    return FileResponse(path=output_srt_path, filename=os.path.basename(output_srt_path))

models/models will be saved here.txt ADDED Viewed

File without changes

outputs/outputs are saved here.txt ADDED Viewed

File without changes

outputs/translations/outputs for translation are saved here.txt ADDED Viewed

File without changes

requirements.txt CHANGED Viewed

@@ -1,2 +1,16 @@
 fastapi
 uvicorn

+# Remove the --extra-index-url line below if you're not using an Nvidia GPU.
+# If you are using one, update the URL to match your CUDA version (CUDA 12.1 is the minimum requirement):
+# For CUDA 12.1, use : https://download.pytorch.org/whl/cu121
+# For CUDA 12.4, use : https://download.pytorch.org/whl/cu124
+--extra-index-url https://download.pytorch.org/whl/cu124
+torch
+git+https://github.com/jhj0517/jhj0517-whisper.git
+faster-whisper==1.0.3
+transformers==4.42.3
+gradio==4.29.0
+pytubefix
+pyannote.audio==3.3.1
 fastapi
 uvicorn