Spaces:

AxleToe
/

whisper-subtitle-generator

Sleeping

App Files Community

Akhil committed on Aug 27, 2025

Commit

3e9f66f

1 Parent(s): 22f48d5

fix: better FastAPI2

Browse files

Files changed (6) hide show

.gitignore +2 -1
Dockerfile +3 -2
__pycache__/main.cpython-312.pyc +0 -0
__pycache__/main.cpython-313.pyc +0 -0
main.py +58 -30
test.py +3 -13

.gitignore CHANGED Viewed

@@ -1,4 +1,5 @@
 audio/*
 .venv
 .idea
-models/*

 audio/*
 .venv
 .idea
+models/*
+__pycache__

Dockerfile CHANGED Viewed

@@ -7,6 +7,7 @@ RUN apt-get update && \
 WORKDIR /app
 COPY requirements.txt .
-RUN pip3 install --no-cache-dir -r requirements.txt
-CMD ["tail", "-f", "/dev/null"]

 WORKDIR /app
 COPY requirements.txt .
+RUN pip3 install --no-cache-dir --upgrade -r requirements.txt
+CMD ["tail", "-f", "/dev/null"]
+CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]

__pycache__/main.cpython-312.pyc ADDED Viewed

Binary file (13.3 kB). View file

__pycache__/main.cpython-313.pyc ADDED Viewed

Binary file (14.4 kB). View file

main.py CHANGED Viewed

@@ -3,12 +3,27 @@ import time
 import os
 import yt_dlp
 import subprocess
 import logging
-from fastapi import FastAPI
 app = FastAPI()
 logging.basicConfig()
 logging.getLogger("faster_whisper").setLevel(logging.DEBUG)
@@ -69,7 +84,6 @@ def local_audio_file(DOWNLOAD_DIR, AUDIO_FILE):
     finally:
         return final_filepath
 def create_subtitle_chunks(segments, max_words=8, max_duration=5.0):
             subtitle_chunks = []
@@ -111,7 +125,6 @@ def create_subtitle_chunks(segments, max_words=8, max_duration=5.0):
             return subtitle_chunks
 def format_time(seconds):
     seconds -= 0.2
     hours = int(seconds // 3600)
@@ -121,7 +134,6 @@ def format_time(seconds):
     return f"{hours:02d}:{minutes:02d}:{int(seconds_remainder):02d},{milliseconds:03d}"
 def add_subtitles(media_path):
     base, ext = os.path.splitext(os.path.basename(media_path))
     dir_path = os.path.dirname(media_path)
@@ -168,25 +180,30 @@ def add_subtitles(media_path):
     except Exception as e:
         print(f"An error occurred: {e}")
-def main():
-    all_files = ["YOUTUBE VIDEO URL"]
-    all_files += os.listdir('audio')
-    for i, file in enumerate(all_files):
-       print(f"[{i+1}] - {file}")
-    DOWNLOAD_DIR = "audio"
-    output_template = os.path.join(DOWNLOAD_DIR, '%(title)s.%(ext)s')
-    file_idx = int(input('Enter file index: '))
-    if file_idx != 1:
-        input_file_path = all_files[file_idx-1];
-        AUDIO_FILE=os.path.join(DOWNLOAD_DIR, input_file_path)
-        final_filepath = local_audio_file(DOWNLOAD_DIR=DOWNLOAD_DIR, AUDIO_FILE=AUDIO_FILE)
     else:
-        YT_URL = input("Enter URL: ")
-        final_filepath = youtube_download_video(YT_URL, DOWNLOAD_DIR, output_template)
     if final_filepath and os.path.exists(final_filepath):
@@ -216,8 +233,8 @@ def main():
                 word_timestamps=True
             )
-            os.makedirs(DOWNLOAD_DIR, exist_ok=True)
-            transcript_filename = os.path.join(DOWNLOAD_DIR, f"{FILE_NAME_FOR_TXT}.srt")
             subtitle_chunks = create_subtitle_chunks(segments, max_words=12, max_duration=4.0)
@@ -243,10 +260,22 @@ def main():
             print(f"\nTranscription complete and saved to {transcript_filename}.")
             print(f"Processed in {processed_time:.2f} seconds")
-            add_subtitles(final_filepath)
         except Exception as e:
-            print(f"An error occurred during transcription: {e}")
         finally:
             if 'model' in locals():
@@ -258,7 +287,6 @@ def main():
             gc.collect()
     else:
-        print("Audio file acquisition failed (YouTube download or local file not found). Cannot proceed with transcription.")
-if __name__ == "__main__":
-    main()

 import os
 import yt_dlp
 import subprocess
+from typing import Optional
 import logging
+from fastapi import FastAPI, File, UploadFile, HTTPException, Form
+from fastapi.responses import FileResponse
+import os, time
+from fastapi.middleware.cors import CORSMiddleware
+from pathlib import Path
+import zipfile
+import tempfile
 app = FastAPI()
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["http://localhost:5173", "http://127.0.0.1:5173"],
+    allow_credentials=True,
+    allow_methods=["GET", "POST", "PUT", "DELETE", "OPTIONS"],
+    allow_headers=["*"],
+)
 logging.basicConfig()
 logging.getLogger("faster_whisper").setLevel(logging.DEBUG)
     finally:
         return final_filepath
 def create_subtitle_chunks(segments, max_words=8, max_duration=5.0):
             subtitle_chunks = []
             return subtitle_chunks
 def format_time(seconds):
     seconds -= 0.2
     hours = int(seconds // 3600)
     return f"{hours:02d}:{minutes:02d}:{int(seconds_remainder):02d},{milliseconds:03d}"
 def add_subtitles(media_path):
     base, ext = os.path.splitext(os.path.basename(media_path))
     dir_path = os.path.dirname(media_path)
     except Exception as e:
         print(f"An error occurred: {e}")
+@app.get('/test')
+async def test_endpoint():
+    return {"message": "FastAPI is working!"}
+@app.post('/generate-subtitles')
+async def generate_subtitles(
+        file: Optional[UploadFile] = File(None),
+        youtube_url: Optional[str] = Form(None)
+):
+    upload_dir = 'audio'
+    os.makedirs(upload_dir, exist_ok=True)
+    if file:
+        file_path = os.path.join(upload_dir, file.filename)
+        with open(file_path, "wb") as f:
+            f.write(await file.read())
+        final_filepath = file_path
+        print(f"Uploaded file saved to {final_filepath}")
+    elif youtube_url:
+        output_template = os.path.join(upload_dir, "%(title)s.%(ext)s")
+        final_filepath = youtube_download_video(youtube_url, upload_dir, output_template)
     else:
+        raise HTTPException(status_code=400, detail="You must provide either a file or youtube URL.")
     if final_filepath and os.path.exists(final_filepath):
                 word_timestamps=True
             )
+            os.makedirs(upload_dir, exist_ok=True)
+            transcript_filename = os.path.join(upload_dir, f"{FILE_NAME_FOR_TXT}.srt")
             subtitle_chunks = create_subtitle_chunks(segments, max_words=12, max_duration=4.0)
             print(f"\nTranscription complete and saved to {transcript_filename}.")
             print(f"Processed in {processed_time:.2f} seconds")
+            video_output = Path(final_filepath).resolve()
+            subtitle_output = Path(transcript_filename).resolve()
+            files_to_send = [video_output, subtitle_output]
+            with tempfile.NamedTemporaryFile(delete=False, suffix=".zip") as tmp:
+                with zipfile.ZipFile(tmp, "w", zipfile.ZIP_DEFLATED) as zf:
+                    for f in files_to_send:
+                        zf.write(f, arcname=f.name)
+                tmp_path = tmp.name
+            return FileResponse(tmp_path, media_type="application/zip", filename="subtitles.zip")
         except Exception as e:
+            raise HTTPException(status_code=400, detail=str(e))
         finally:
             if 'model' in locals():
             gc.collect()
     else:
+        raise HTTPException(status_code=400, detail="Failed to process the file.")

test.py CHANGED Viewed

@@ -1,14 +1,4 @@
-import os
-all_files = os.listdir('audio')
-for i, file in enumerate(all_files):
-    print(f"[{i}] - {file}")
-file_idx = int(input('Enter file index: '))
-input_file_path = all_files[file_idx];
-DOWNLOAD_DIR = "audio"
-AUDIO_FILE=os.path.join(DOWNLOAD_DIR, input_file_path)
-print(AUDIO_FILE)
-print(DOWNLOAD_DIR)

+from pathlib import Path
+file_path = r'audio\Never install locally [J0NuOlA2xDc].mp4'
+print(Path(file_path).resolve())