File size: 5,065 Bytes
c564fad
b6093b0
0cb486a
c564fad
0cb486a
b6093b0
2b0ce36
23e5406
c564fad
0cb486a
228a3b1
0cb486a
 
c564fad
 
2b0ce36
0cb486a
228a3b1
0cb486a
 
 
228a3b1
0cb486a
228a3b1
78c135b
3fc2a44
228a3b1
 
0cb486a
 
3fc2a44
ab25f71
 
2a6a104
 
 
 
 
 
 
ab25f71
d0c0836
ab25f71
 
 
 
 
b6093b0
 
1aceee0
 
 
 
 
0cb486a
b6093b0
23e5406
0cb486a
b6093b0
 
 
c564fad
0cb486a
c564fad
 
0cb486a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c564fad
b6093b0
0cb486a
 
d63a8c1
0cb486a
b6093b0
3fc2a44
d0c0836
c564fad
8cdcb92
b6093b0
0cb486a
 
 
 
228a3b1
0cb486a
 
 
 
 
 
 
b6093b0
 
3fc2a44
 
25a7124
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
import shutil, os, logging, uvicorn, tempfile
from typing import Optional
from uuid import uuid4

from utils.transcriber import transcriber
from utils.process_video import process_video
from utils.zip_response import zip_response
from utils.read_html import read_html

from fastapi import FastAPI, UploadFile, HTTPException, Request, Form, Depends
from fastapi.staticfiles import StaticFiles
from fastapi.templating import Jinja2Templates
from fastapi.responses import HTMLResponse, Response, RedirectResponse
from fastapi.security import HTTPBasic
from pydantic import BaseModel, field_validator


## THIS IS A BREAKING CHANGE. SRT FILE INPUT DEPRECATED. WIP.
## DONE: separate transcriber from subtitler logic. WIP.
## DONE: improve loading spinner. WIP (with redirect)
## TODO: add transcription preview component + allow for interactive validation of transcription in-browser. WIP
## TODO: add word level highlighting option


app = FastAPI()
security = HTTPBasic()
static_dir = os.path.join(os.path.dirname(__file__), 'static')
app.mount("/static", StaticFiles(directory=static_dir), name="static")
templates = Jinja2Templates(directory=static_dir) 
temp_store = {}

class MP4Video(BaseModel):
    video_file: UploadFile
    
    @property
    def filename(self):
        return self.video_file.filename
    @property
    def file(self):
        return self.video_file.file

    @field_validator('video_file')
    def validate_video_file(cls, v):
        if not v.filename.endswith('.mp4'):
            raise HTTPException(status_code=500, detail='Invalid video file type. Please upload an MP4 file.')
        return v

@app.get("/")
async def root():
    html_content = f"""
    {read_html(os.path.join(os.getcwd(),"static/landing_page.html"))}
    """
    return HTMLResponse(content=html_content)

@app.get("/transcribe_video/")
async def get_form():
    html_content = f"""
    {read_html(os.path.join(os.getcwd(),"static/transcribe_video.html"))}
    """
    return HTMLResponse(content=html_content)

async def get_temp_dir():
    dir = tempfile.TemporaryDirectory(delete=False)
    try:
        yield dir.name
    except Exception as e:
        HTTPException(status_code=500, detail=str(e))

@app.post("/transcribe/")
async def transcribe_api(video_file: MP4Video = Depends(),
                         task: str = Form("transcribe"),
                         model_version: str = Form("deepdml/faster-whisper-large-v3-turbo-ct2"),
                         max_words_per_line: int = Form(6),
                         temp_dir: str = Depends(get_temp_dir)):
    try:
        video_path = os.path.join(temp_dir, video_file.filename)
        with open(video_path, 'wb') as f:
            shutil.copyfileobj(video_file.file, f)

        transcription = transcriber(video_path, max_words_per_line, task, model_version)

        uid = str(uuid4())
        temp_store[uid] = {"video_path": video_path, "transcription": transcription}
        return RedirectResponse(url=f"/process_settings/?uid={uid}", status_code=303)
    
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))

@app.get("/process_settings/")
async def process_settings(request: Request, uid: str):
    data = temp_store.get(uid)
    if not data:
        raise HTTPException(404, "Data not found")
    return templates.TemplateResponse("process_settings.html", {
        "request": request,
        "transcription": data["transcription"],
        "video_path": data["video_path"]
    })

@app.post("/process_video/")
async def process_video_api(video_path: str = Form(...),
                            srt_string: str = Form(...),
                            fontsize: Optional[int] = Form(42),
                            font: Optional[str] = Form("Helvetica"),
                            bg_color: Optional[str] = Form("#070a13b3"),
                            text_color: Optional[str] = Form("white"),
                            caption_mode: Optional[str] = Form("desktop"),
                            temp_dir: str = Depends(get_temp_dir)
                            ):
    try:
        output_path = process_video(video_path, srt_string, fontsize, font, bg_color, text_color, caption_mode)
        with open(os.path.join(temp_dir, f"{video_path.split('.')[0]}.srt"), 'w+') as temp_srt_file:
            logging.info("Processing the video...")
            temp_srt_file.write(srt_string)    
            logging.info("Zipping response...")
        with open(os.path.join(temp_dir, f"{video_path.split('.')[0]}.zip"), 'w+b') as temp_zip_file:
            zip_file = zip_response(temp_zip_file.name, [output_path, temp_srt_file.name])
            return Response(
                content = zip_file,
                media_type="application/zip",
                headers={"Content-Disposition": f"attachment; filename={os.path.basename(video_path).split('.')[0]}.zip"}
                )
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))
    
if __name__ == "__main__":
    uvicorn.run(app, host="0.0.0.0", port=8000)