Spaces:

Kurian07
/

Text-Speech-Project

Sleeping

App Files Files Community

Kurian07 committed on Nov 24, 2024

Commit

daeeb06

verified ·

1 Parent(s): 56774bb

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -9

app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import streamlit as st
-import fitz  # PyMuPDF for PDF text extraction
-from TTS.api import TTS  # Coqui TTS
 import os
 # Title of the app
@@ -27,21 +27,39 @@ if uploaded_file is not None:
     if text.strip() == "":
         st.warning("No text found in the PDF. Please upload a valid document.")
     else:
-        # Select TTS model
         st.subheader("Generate Speech")
         st.info("Using TTS single-speaker model: 'tts_models/en/ljspeech/tacotron2-DDC'")
         model_name = "tts_models/en/ljspeech/tacotron2-DDC"  # Single-speaker model
         tts = TTS(model_name)
-        # Specify output file
         audio_path = "output.wav"
         try:
-            # Generate speech
-            tts.tts_to_file(text=text, file_path=audio_path)  # Ensure no `speaker` for single-speaker models
             st.success("Speech generation complete!")
-            # Audio playback
             st.audio(audio_path, format="audio/wav", start_time=0)
             # Cleanup button

 import streamlit as st
+import fitz  # PyMuPDF
+from TTS.api import TTS
 import os
 # Title of the app
     if text.strip() == "":
         st.warning("No text found in the PDF. Please upload a valid document.")
     else:
+        # Text-to-Speech Conversion
         st.subheader("Generate Speech")
         st.info("Using TTS single-speaker model: 'tts_models/en/ljspeech/tacotron2-DDC'")
         model_name = "tts_models/en/ljspeech/tacotron2-DDC"  # Single-speaker model
         tts = TTS(model_name)
         audio_path = "output.wav"
+        # Split text into smaller chunks (e.g., 500 characters)
+        def split_text(text, max_length=500):
+            sentences = text.split(". ")
+            chunks = []
+            chunk = ""
+            for sentence in sentences:
+                if len(chunk) + len(sentence) < max_length:
+                    chunk += sentence + ". "
+                else:
+                    chunks.append(chunk.strip())
+                    chunk = sentence + ". "
+            if chunk:
+                chunks.append(chunk.strip())
+            return chunks
+        chunks = split_text(text)
+        # Generate audio for each chunk
         try:
+            with open(audio_path, "wb") as audio_file:
+                for i, chunk in enumerate(chunks):
+                    st.write(f"Processing chunk {i + 1} of {len(chunks)}...")
+                    audio_chunk = tts.tts(chunk)
+                    audio_file.write(audio_chunk)
             st.success("Speech generation complete!")
             st.audio(audio_path, format="audio/wav", start_time=0)
             # Cleanup button