master-tts-pro-Copy

Sleeping

hivecorp committed on Nov 3, 2024

Commit

46d2980

verified ·

1 Parent(s): ae05d26

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -47,7 +47,7 @@ async def generate_accurate_srt(batch_text, batch_num, start_offset, pitch, rate
     audio_file = f"batch_{batch_num}_audio.wav"
     # Generate the audio using edge-tts
-    tts = edge_tts.Communicate(batch_text, voice, rate=rate, pitch=f"{pitch}Hz")
     await tts.save(audio_file)
     # Get the actual length of the audio file
@@ -116,9 +116,11 @@ async def batch_process_srt_and_audio(script_text, pitch, rate, voice, progress=
     return final_srt_path, final_audio_path
 # Gradio interface function
-async def process_script(script_text, pitch, rate, voice, _):
     formatted_rate = f"{'+' if rate > 0 else ''}{int(rate)}%"
-    srt_path, audio_path = await batch_process_srt_and_audio(script_text, pitch, formatted_rate, voice_options[voice])
     return srt_path, audio_path, audio_path
 # Gradio interface setup
@@ -170,14 +172,15 @@ app = gr.Interface(
         gr.Slider(label="Pitch Adjustment (Hz)", minimum=-100, maximum=100, step=1, value=1),
         gr.Slider(label="Rate Adjustment (%)", minimum=-100, maximum=100, step=1, value=1),
         gr.Dropdown(label="Select Voice", choices=list(voice_options.keys()), value="Andrew"),
-        gr.Button("Submit")  # Create a submit button with text "Submit"
     ],
     outputs=[
-        gr.File(label="Download SRT"),
-        gr.File(label="Download Audio"),
         gr.Audio(label="Audio Playback")
     ],
-    live=False  # Set live to False to prevent real-time updates
 )
 app.launch()

     audio_file = f"batch_{batch_num}_audio.wav"
     # Generate the audio using edge-tts
+    tts = edge_tts.Communicate(batch_text, voice, rate=rate, pitch=pitch)
     await tts.save(audio_file)
     # Get the actual length of the audio file
     return final_srt_path, final_audio_path
 # Gradio interface function
+async def process_script(script_text, pitch, rate, voice):
+    # Format pitch correctly for edge-tts
+    pitch_str = f"{pitch}Hz" if pitch != 0 else "0Hz"
     formatted_rate = f"{'+' if rate > 0 else ''}{int(rate)}%"
+    srt_path, audio_path = await batch_process_srt_and_audio(script_text, pitch_str, formatted_rate, voice_options[voice])
     return srt_path, audio_path, audio_path
 # Gradio interface setup
         gr.Slider(label="Pitch Adjustment (Hz)", minimum=-100, maximum=100, step=1, value=1),
         gr.Slider(label="Rate Adjustment (%)", minimum=-100, maximum=100, step=1, value=1),
         gr.Dropdown(label="Select Voice", choices=list(voice_options.keys()), value="Andrew"),
     ],
     outputs=[
+        gr.File(label="Download SRT File"),
+        gr.File(label="Download Audio File"),
         gr.Audio(label="Audio Playback")
     ],
+    title="Text-to-Speech with SRT Generation",
+    description="Convert your script into audio and generate subtitles.",
+    theme="compact",
 )
 app.launch()