Fast-Subtitle-Maker

Build error

App Files Files Community

Jose Manuel Perez committed on Sep 16, 2024

Commit

4e34fb8

unverified ·

1 Parent(s): 84c604a

Update app.py

Browse files

Files changed (1) hide show

app.py +95 -60

app.py CHANGED Viewed

@@ -308,12 +308,10 @@ def generate_subtitles(input_mode, input_file, link_input, prompt, language, aut
     segment_id_offset = 0
     if split_status == "split":
-        # Processing chunks when file is split
         srt_chunks = []
         video_chunks = []
         for i, chunk_path in enumerate(processed_path):
             try:
-                # Transcribe each chunk using the model
                 with open(chunk_path, "rb") as file:
                     transcription_json_response = client.audio.transcriptions.create(
                         file=(os.path.basename(chunk_path), file.read()),
@@ -325,7 +323,7 @@ def generate_subtitles(input_mode, input_file, link_input, prompt, language, aut
                     )
                 transcription_json = transcription_json_response.segments
-                # Adjust timestamps and IDs
                 for segment in transcription_json:
                     segment['start'] += total_duration
                     segment['end'] += total_duration
@@ -338,47 +336,73 @@ def generate_subtitles(input_mode, input_file, link_input, prompt, language, aut
                 temp_srt_path = f"{os.path.splitext(chunk_path)[0]}.srt"
                 with open(temp_srt_path, "w", encoding="utf-8") as temp_srt_file:
                     temp_srt_file.write(srt_content)
-                    temp_srt_file.write("\n")  # Newline at end for proper merging
                 srt_chunks.append(temp_srt_path)
-                # If the user requested video output with subtitles
                 if include_video and input_file_path.lower().endswith((".mp4", ".webm")):
-                    output_file_path = chunk_path.replace(os.path.splitext(chunk_path)[1], "_with_subs" + os.path.splitext(chunk_path)[1])
-                    # Handle font selection
-                    font_name, font_dir = None, None
-                    if font_selection == "Custom Font File" and font_file:
-                        font_name = os.path.splitext(os.path.basename(font_file.name))[0]
-                        font_dir = os.path.dirname(font_file.name)
-                    # FFmpeg command for adding subtitles with customization
-                    ffmpeg_command = [
-                        "ffmpeg",
-                        "-y",
-                        "-i",
-                        chunk_path,
-                        "-vf",
-                        f"subtitles={temp_srt_path}:fontsdir={font_dir if font_selection == 'Custom Font File' else ''}:force_style='Fontname={font_name if font_selection == 'Custom Font File' else 'Arial'},Fontsize={font_size},PrimaryColour=&H{font_color[1:]}&,OutlineColour=&H{outline_color[1:]}&,Outline={outline_thickness}'",
-                        "-preset", "fast",
-                        output_file_path,
-                    ]
-                    subprocess.run(ffmpeg_command, check=True)
-                    video_chunks.append(output_file_path)
             except groq.AuthenticationError as e:
                 handle_groq_error(e, model)
             except groq.RateLimitError as e:
                 handle_groq_error(e, model)
-        # Merge the chunks and return the results
         if video_chunks:
             merge_audio(video_chunks, 'merged_output_video.mp4')
-            return 'merged_output_video.mp4', None
         else:
-            return full_srt_content, None
-    else:
-        # Process single file (no splitting)
         try:
             with open(processed_path, "rb") as file:
                 transcription_json_response = client.audio.transcriptions.create(
@@ -390,37 +414,49 @@ def generate_subtitles(input_mode, input_file, link_input, prompt, language, aut
                     temperature=0.0,
                 )
             transcription_json = transcription_json_response.segments
             srt_content = json_to_srt(transcription_json)
             temp_srt_path = os.path.splitext(input_file_path)[0] + ".srt"
             with open(temp_srt_path, "w", encoding="utf-8") as temp_srt_file:
                 temp_srt_file.write(srt_content)
-            # If including the video with subtitles
             if include_video and input_file_path.lower().endswith((".mp4", ".webm")):
-                output_file_path = input_file_path.replace(
-                    os.path.splitext(input_file_path)[1], "_with_subs" + os.path.splitext(input_file_path)[1]
-                )
-                font_name, font_dir = None, None
-                if font_selection == "Custom Font File" and font_file:
-                    font_name = os.path.splitext(os.path.basename(font_file.name))[0]
-                    font_dir = os.path.dirname(font_file.name)
-                # Add subtitles using FFmpeg
-                ffmpeg_command = [
-                    "ffmpeg",
-                    "-y",
-                    "-i",
-                    input_file_path,
-                    "-vf",
-                    f"subtitles={temp_srt_path}:fontsdir={font_dir if font_selection == 'Custom Font File' else ''}:force_style='Fontname={font_name if font_selection == 'Custom Font File' else 'Arial'},Fontsize={font_size},PrimaryColour=&H{font_color[1:]}&,OutlineColour=&H{outline_color[1:]}&,Outline={outline_thickness}'",
-                    "-preset", "fast",
-                    output_file_path,
-                ]
-                subprocess.run(ffmpeg_command, check=True)
-                return temp_srt_path, output_file_path
             return temp_srt_path, None
         except groq.AuthenticationError as e:
             handle_groq_error(e, model)
@@ -430,7 +466,6 @@ def generate_subtitles(input_mode, input_file, link_input, prompt, language, aut
             raise gr.Error(f"Error creating SRT file: {e}")
 theme = gr.themes.Soft(
     primary_hue="indigo",
     secondary_hue="orange",

     segment_id_offset = 0
     if split_status == "split":
         srt_chunks = []
         video_chunks = []
         for i, chunk_path in enumerate(processed_path):
             try:
                 with open(chunk_path, "rb") as file:
                     transcription_json_response = client.audio.transcriptions.create(
                         file=(os.path.basename(chunk_path), file.read()),
                     )
                 transcription_json = transcription_json_response.segments
+                # Adjust timestamps and segment IDs
                 for segment in transcription_json:
                     segment['start'] += total_duration
                     segment['end'] += total_duration
                 temp_srt_path = f"{os.path.splitext(chunk_path)[0]}.srt"
                 with open(temp_srt_path, "w", encoding="utf-8") as temp_srt_file:
                     temp_srt_file.write(srt_content)
+                    temp_srt_file.write("\n") # add a new line at the end of the srt chunk file to fix format when merged
                 srt_chunks.append(temp_srt_path)
                 if include_video and input_file_path.lower().endswith((".mp4", ".webm")):
+                    try:
+                        output_file_path = chunk_path.replace(os.path.splitext(chunk_path)[1], "_with_subs" + os.path.splitext(chunk_path)[1])
+                        # Handle font selection
+                        if font_selection == "Custom Font File" and font_file:
+                            font_name = os.path.splitext(os.path.basename(font_file.name))[0]  # Get font filename without extension
+                            font_dir = os.path.dirname(font_file.name)  # Get font directory path
+                        elif font_selection == "Custom Font File" and not font_file:
+                            font_name = None  # Let FFmpeg use its default Arial
+                            font_dir = None  # No font directory
+                            gr.Warning(f"You want to use a Custom Font File, but uploaded none. Using the default Arial font.")
+                        elif font_selection == "Arial":
+                            font_name = None  # Let FFmpeg use its default Arial
+                            font_dir = None  # No font directory
+                        # FFmpeg command
+                        subprocess.run(
+                            [
+                                "ffmpeg",
+                                "-y",
+                                "-i",
+                                chunk_path,
+                                "-vf",
+                                f"subtitles={temp_srt_path}:fontsdir={font_dir}:force_style='Fontname={font_name},Fontsize={int(font_size)},PrimaryColour=&H{font_color[1:]}&,OutlineColour=&H{outline_color[1:]}&,BorderStyle={int(outline_thickness)},Outline=1'",
+                                "-preset", "fast",
+                                output_file_path,
+                            ],
+                            check=True,
+                        )
+                        video_chunks.append(output_file_path)
+                    except subprocess.CalledProcessError as e:
+                        raise gr.Error(f"Error during subtitle addition: {e}")
+                elif include_video and not input_file_path.lower().endswith((".mp4", ".webm")):
+                    gr.Warning(f"You have checked on the 'Include Video with Subtitles', but the input file {input_file_path} isn't a video (.mp4 or .webm). Returning only the SRT File.", duration=15)
             except groq.AuthenticationError as e:
                 handle_groq_error(e, model)
             except groq.RateLimitError as e:
                 handle_groq_error(e, model)
+                gr.Warning(f"API limit reached during chunk {i+1}. Returning processed chunks only.")
+                if srt_chunks and video_chunks:
+                    merge_audio(video_chunks, 'merged_output_video.mp4')
+                    with open('merged_output.srt', 'w', encoding="utf-8") as outfile:
+                        for chunk_srt in srt_chunks:
+                            with open(chunk_srt, 'r', encoding="utf-8") as infile:
+                                outfile.write(infile.read())
+                    return 'merged_output.srt', 'merged_output_video.mp4'
+                else:
+                    raise gr.Error("Subtitle generation failed due to API limits.")
+        # Merge SRT chunks
+        final_srt_path = os.path.splitext(input_file_path)[0] + "_final.srt"
+        with open(final_srt_path, 'w', encoding="utf-8") as outfile:
+            for chunk_srt in srt_chunks:
+                with open(chunk_srt, 'r', encoding="utf-8") as infile:
+                    outfile.write(infile.read())
+        # Merge video chunks
         if video_chunks:
             merge_audio(video_chunks, 'merged_output_video.mp4')
+            return final_srt_path, 'merged_output_video.mp4'
         else:
+            return final_srt_path, None
+    else:  # Single file processing (no splitting)
         try:
             with open(processed_path, "rb") as file:
                 transcription_json_response = client.audio.transcriptions.create(
                     temperature=0.0,
                 )
             transcription_json = transcription_json_response.segments
             srt_content = json_to_srt(transcription_json)
             temp_srt_path = os.path.splitext(input_file_path)[0] + ".srt"
             with open(temp_srt_path, "w", encoding="utf-8") as temp_srt_file:
                 temp_srt_file.write(srt_content)
             if include_video and input_file_path.lower().endswith((".mp4", ".webm")):
+                try:
+                    output_file_path = input_file_path.replace(
+                        os.path.splitext(input_file_path)[1], "_with_subs" + os.path.splitext(input_file_path)[1]
+                    )
+                    # Handle font selection
+                    if font_selection == "Custom Font File" and font_file:
+                        font_name = os.path.splitext(os.path.basename(font_file.name))[0]  # Get font filename without extension
+                        font_dir = os.path.dirname(font_file.name)  # Get font directory path
+                    elif font_selection == "Custom Font File" and not font_file:
+                        font_name = None  # Let FFmpeg use its default Arial
+                        font_dir = None  # No font directory
+                        gr.Warning(f"You want to use a Custom Font File, but uploaded none. Using the default Arial font.")
+                    elif font_selection == "Arial":
+                        font_name = None  # Let FFmpeg use its default Arial
+                        font_dir = None  # No font directory
+                    # FFmpeg command
+                    subprocess.run(
+                        [
+                            "ffmpeg",
+                            "-y",
+                            "-i",
+                            input_file_path,
+                            "-vf",
+                            f"subtitles={temp_srt_path}:fontsdir={font_dir}:force_style='FontName={font_name},Fontsize={int(font_size)},PrimaryColour=&H{font_color[1:]}&,OutlineColour=&H{outline_color[1:]}&,BorderStyle={int(outline_thickness)},Outline=1'",
+                            "-preset", "fast",
+                            output_file_path,
+                        ],
+                        check=True,
+                    )
+                    return temp_srt_path, output_file_path
+                except subprocess.CalledProcessError as e:
+                    raise gr.Error(f"Error during subtitle addition: {e}")
+            elif include_video and not input_file_path.lower().endswith((".mp4", ".webm")):
+                gr.Warning(f"You have checked on the 'Include Video with Subtitles', but the input file {input_file_path} isn't a video (.mp4 or .webm). Returning only the SRT File.", duration=15)
             return temp_srt_path, None
         except groq.AuthenticationError as e:
             handle_groq_error(e, model)
             raise gr.Error(f"Error creating SRT file: {e}")
 theme = gr.themes.Soft(
     primary_hue="indigo",
     secondary_hue="orange",