Spaces:

habulaj
/

subapi

Running

App Files Files Community

habulaj committed on Jan 28

Commit

fc9986c

verified ·

1 Parent(s): bf38176

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -5

app.py CHANGED Viewed

@@ -677,6 +677,8 @@ class GroqRequest(BaseModel):
     language: Optional[str] = None
     temperature: Optional[float] = 0.4
     has_bg_music: Optional[bool] = False # Default to False for speed/resources
 def groq_json_to_srt(data):
     """Converte resposta verbose_json do Whisper/Groq para SRT"""
@@ -706,9 +708,9 @@ def groq_json_to_srt(data):
     return srt_output
-from srt_utils import apply_netflix_style_filter, process_audio_for_transcription
-async def get_groq_srt_base(url: str, language: Optional[str] = None, temperature: Optional[float] = 0.4, has_bg_music: bool = False):
     """
     Helper para gerar SRT base usando Groq (dando suporte a filtro Netflix).
     Retorna (srt_filtered, srt_word_level, processed_audio_url)
@@ -748,7 +750,7 @@ async def get_groq_srt_base(url: str, language: Optional[str] = None, temperatur
         # 2. Pré-processar (Remover ruído, filtrar voz, etc)
         print(f"🔊 [Groq] Pré-processando áudio (has_bg_music={has_bg_music})...")
         # O process_audio cria um arquivo novo com .processed.mp3
-        processed_file_path = process_audio_for_transcription(filepath, has_bg_music=has_bg_music)
         # Se processou, o caminho mudou. Vamos ver.
         if processed_file_path != filepath:
@@ -845,9 +847,16 @@ async def generate_subtitle_groq(request: GroqRequest):
             url=request.url,
             language=request.language,
             temperature=request.temperature,
-            has_bg_music=request.has_bg_music
         )
         return JSONResponse(content={
             "srt": srt_filtered,
             "srt_word": srt_word
@@ -865,6 +874,8 @@ class GeminiSubtitleRequest(BaseModel):
     has_bg_music: Optional[bool] = False
     context: Optional[str] = "N/A"
     model: Optional[str] = "flash" # 'flash' or 'thinking'
 @app.post("/subtitle")
 async def generate_subtitle(request: GeminiSubtitleRequest):
@@ -886,7 +897,9 @@ async def generate_subtitle(request: GeminiSubtitleRequest):
             url=request.url,
             language="en",
             temperature=0.4,
-            has_bg_music=request.has_bg_music
         )
         # Converter URL /static/xyz.mp3 para path local
@@ -940,6 +953,17 @@ INSTRUÇÕES/CONTEXTO DO USUÁRIO: {processed_context}
         # Limpar markdown do SRT se houver
         cleaned_srt = clean_and_validate_srt(content)
         return JSONResponse(content={
             "srt": cleaned_srt,
             "original_srt": srt_filtered,

     language: Optional[str] = None
     temperature: Optional[float] = 0.4
     has_bg_music: Optional[bool] = False # Default to False for speed/resources
+    time_start: Optional[float] = None
+    time_end: Optional[float] = None
 def groq_json_to_srt(data):
     """Converte resposta verbose_json do Whisper/Groq para SRT"""
     return srt_output
+from srt_utils import apply_netflix_style_filter, process_audio_for_transcription, shift_srt_timestamps
+async def get_groq_srt_base(url: str, language: Optional[str] = None, temperature: Optional[float] = 0.4, has_bg_music: bool = False, time_start: float = None, time_end: float = None):
     """
     Helper para gerar SRT base usando Groq (dando suporte a filtro Netflix).
     Retorna (srt_filtered, srt_word_level, processed_audio_url)
         # 2. Pré-processar (Remover ruído, filtrar voz, etc)
         print(f"🔊 [Groq] Pré-processando áudio (has_bg_music={has_bg_music})...")
         # O process_audio cria um arquivo novo com .processed.mp3
+        processed_file_path = process_audio_for_transcription(filepath, has_bg_music=has_bg_music, time_start=time_start, time_end=time_end)
         # Se processou, o caminho mudou. Vamos ver.
         if processed_file_path != filepath:
             url=request.url,
             language=request.language,
             temperature=request.temperature,
+            has_bg_music=request.has_bg_music,
+            time_start=request.time_start,
+            time_end=request.time_end
         )
+        # Shift timestamps if needed
+        if request.time_start and request.time_start > 0:
+            srt_filtered = shift_srt_timestamps(srt_filtered, request.time_start)
+            srt_word = shift_srt_timestamps(srt_word, request.time_start)
         return JSONResponse(content={
             "srt": srt_filtered,
             "srt_word": srt_word
     has_bg_music: Optional[bool] = False
     context: Optional[str] = "N/A"
     model: Optional[str] = "flash" # 'flash' or 'thinking'
+    time_start: Optional[float] = None
+    time_end: Optional[float] = None
 @app.post("/subtitle")
 async def generate_subtitle(request: GeminiSubtitleRequest):
             url=request.url,
             language="en",
             temperature=0.4,
+            has_bg_music=request.has_bg_music,
+            time_start=request.time_start,
+            time_end=request.time_end
         )
         # Converter URL /static/xyz.mp3 para path local
         # Limpar markdown do SRT se houver
         cleaned_srt = clean_and_validate_srt(content)
+        # Shift final timestamps if needed
+        if request.time_start and request.time_start > 0:
+            cleaned_srt = shift_srt_timestamps(cleaned_srt, request.time_start)
+            # srt_filtered comes from get_groq_srt_base, which is 0-based,
+            # and it was not shifted before being sent to Gemini.
+            # Gemini therefore receives 0-based timestamps and returns 0-based ones,
+            # so cleaned_srt is the value that must be shifted here.
+            # Also shift srt_filtered (returned as original_srt) so the reference SRT
+            # uses the same timeline as the final result.
+            srt_filtered = shift_srt_timestamps(srt_filtered, request.time_start)
         return JSONResponse(content={
             "srt": cleaned_srt,
             "original_srt": srt_filtered,