Spaces:

habulaj
/

subapi

Running

habulaj committed 16 days ago

Commit

4aa5e54

verified ·

1 Parent(s): f2b004b

Update srt_utils.py

Files changed (1) hide show

srt_utils.py CHANGED Viewed

@@ -367,11 +367,21 @@ def process_audio_for_transcription(input_file: str) -> str:
                 ffmpeg_cmd = shutil.which("ffmpeg")
                 if ffmpeg_cmd:
-                     # Compress to mono mp3 16k
                      cmd_convert = [
                         ffmpeg_cmd, "-y",
                         "-i", vocals_path,
                         "-ac", "1", "-ar", "16000",
                         "-c:a", "libmp3lame", "-q:a", "2",
                         final_output
                      ]
@@ -391,4 +401,4 @@ def process_audio_for_transcription(input_file: str) -> str:
         traceback.print_exc()
     print("⚠️ Retornando arquivo original (fallback)")
-    return input_file

                 ffmpeg_cmd = shutil.which("ffmpeg")
                 if ffmpeg_cmd:
+                     # Compress to mono mp3 16k with aggressive voice enhancement
+                     # Filters include highpass, noise reduction, compression, EQ, and normalization
+                     filter_chain = (
+                        "highpass=f=100,"
+                        "afftdn=nr=10:nf=-50:tn=1,"
+                        "compand=attacks=0:points=-80/-90|-45/-25|-27/-9|0/-7:gain=5,"
+                        "equalizer=f=3000:width_type=h:width=1000:g=5,"
+                        "loudnorm"
+                     )
                      cmd_convert = [
                         ffmpeg_cmd, "-y",
                         "-i", vocals_path,
                         "-ac", "1", "-ar", "16000",
+                        "-af", filter_chain,
                         "-c:a", "libmp3lame", "-q:a", "2",
                         final_output
                      ]
         traceback.print_exc()
     print("⚠️ Retornando arquivo original (fallback)")
+    return input_file