Spaces:

pradeep4321
/

text2speech

Sleeping

App Files Community

pradeep4321 committed on May 19, 2025

Commit

36d7981

verified ·

1 Parent(s): ab8c1ea

Update src/app.py

Browse files

Files changed (1) hide show

src/app.py +41 -46

src/app.py CHANGED Viewed

@@ -1,21 +1,14 @@
 import os
-os.environ["HOME"] = "/tmp"  # Fix: Redirect .streamlit to a writable path
 import tempfile
-import pyttsx3
 from docx import Document
 from PyPDF2 import PdfReader
 import streamlit as st
 import base64
-from io import BytesIO
 def text_to_speech(text, output_file):
-    engine = pyttsx3.init()
-    engine.setProperty('rate', 150)
-    voices = engine.getProperty('voices')
-    engine.setProperty('voice', voices[1].id)
-    engine.save_to_file(text, output_file)
-    engine.runAndWait()
 def convert_docx_to_text(docx_file):
     doc = Document(docx_file)
@@ -28,55 +21,57 @@ def convert_pdf_to_text(pdf_file):
     text = ""
     pdf_reader = PdfReader(pdf_file)
     for page in pdf_reader.pages:
-        text += page.extract_text()
     return text
 def main():
     st.title("Text to Speech Converter")
     uploaded_file = st.file_uploader("Upload a text, docx, or pdf file", type=["txt", "docx", "pdf"])
     if uploaded_file:
         try:
-            # Save uploaded file content to a temporary file
-            temp_file = tempfile.NamedTemporaryFile(delete=False)
-            temp_file.write(uploaded_file.read())
-            temp_file.close()
-            file_extension = uploaded_file.name.split('.')[-1]
-            if file_extension.lower() == 'txt':
-                with open(temp_file.name, 'r', encoding='utf-8') as txt_file:
-                    text = txt_file.read()
-            elif file_extension.lower() == 'docx':
-                text = convert_docx_to_text(temp_file.name)
-            elif file_extension.lower() == 'pdf':
-                text = convert_pdf_to_text(temp_file.name)
             else:
                 st.error("Unsupported file format")
                 return
             with st.spinner("Converting text to speech..."):
-                output_audio_file = "output.mp3"
                 text_to_speech(text, output_audio_file)
-            st.audio(output_audio_file, format="audio/mp3", start_time=0)
-            # Provide a download link for the audio file
-            with open(output_audio_file, 'rb') as audio_file:
-                audio_bytes = audio_file.read()
-            st.markdown(get_binary_file_downloader_html(audio_bytes, output_audio_file), unsafe_allow_html=True)
-        except Exception as e:
-            st.error(f"An error occurred: {str(e)}")
-# Function to create a download link
-def get_binary_file_downloader_html(bin_file, file_label='File'):
-    with st.spinner("Preparing download link..."):
-        data = bin_file
-        b64 = base64.b64encode(data).decode()
-        href = f'<a href="data:application/octet-stream;base64,{b64}" download="{file_label}" target="_blank">Download {file_label}</a>'
-        return href
-if __name__ == '__main__':
     main()

 import os
 import tempfile
+from gtts import gTTS
 from docx import Document
 from PyPDF2 import PdfReader
 import streamlit as st
 import base64
 def text_to_speech(text, output_file):
+    tts = gTTS(text)
+    tts.save(output_file)
 def convert_docx_to_text(docx_file):
     doc = Document(docx_file)
     text = ""
     pdf_reader = PdfReader(pdf_file)
     for page in pdf_reader.pages:
+        page_text = page.extract_text()
+        if page_text:
+            text += page_text
     return text
+def get_binary_file_downloader_html(bin_file, file_label='File'):
+    data = bin_file
+    b64 = base64.b64encode(data).decode()
+    href = f'<a href="data:application/octet-stream;base64,{b64}" download="{file_label}" target="_blank">Download {file_label}</a>'
+    return href
 def main():
     st.title("Text to Speech Converter")
     uploaded_file = st.file_uploader("Upload a text, docx, or pdf file", type=["txt", "docx", "pdf"])
     if uploaded_file:
         try:
+            with tempfile.NamedTemporaryFile(delete=False, suffix='.' + uploaded_file.name.split('.')[-1]) as temp_file:
+                temp_file.write(uploaded_file.read())
+                temp_file_path = temp_file.name
+            file_extension = uploaded_file.name.split('.')[-1].lower()
+            if file_extension == 'txt':
+                with open(temp_file_path, 'r', encoding='utf-8') as f:
+                    text = f.read()
+            elif file_extension == 'docx':
+                text = convert_docx_to_text(temp_file_path)
+            elif file_extension == 'pdf':
+                text = convert_pdf_to_text(temp_file_path)
             else:
                 st.error("Unsupported file format")
                 return
+            if not text.strip():
+                st.warning("No text found in the file.")
+                return
             with st.spinner("Converting text to speech..."):
+                output_audio_file = os.path.join(tempfile.gettempdir(), "output.mp3")
                 text_to_speech(text, output_audio_file)
+            st.audio(output_audio_file, format="audio/mp3")
+            with open(output_audio_file, 'rb') as f:
+                audio_bytes = f.read()
+            st.markdown(get_binary_file_downloader_html(audio_bytes, "output.mp3"), unsafe_allow_html=True)
+        except Exception as e:
+            st.error(f"An error occurred: {e}")
+if __name__ == "__main__":
     main()