Spaces:

pradeep4321
/

text2speech

Sleeping

App Files Files Community

pradeep4321 committed on May 19, 2025

Commit

2b5b7f0

verified ·

1 Parent(s): ad487d7

Update src/app.py

Browse files

Files changed (1) hide show

src/app.py +25 -26

src/app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import os
-os.environ["STREAMLIT_CONFIG_DIR"] = "/src/.streamlit"
-os.makedirs("/src/.streamlit", exist_ok=True)
 import tempfile
 from gtts import gTTS
@@ -8,58 +8,57 @@ from docx import Document
 from PyPDF2 import PdfReader
 import streamlit as st
 import base64
def text_to_speech(text, output_file):
    """Synthesize ``text`` with gTTS and save the audio to ``output_file``.

    Args:
        text: The text to be spoken.
        output_file: Destination handed straight to ``gTTS.save``.
    """
    gTTS(text).save(output_file)
 def convert_docx_to_text(docx_file):
     """Return the text of every paragraph in ``docx_file``, one per line.

     Only ``paragraphs`` of the opened document is read; nothing else in
     the document is visited.
     """
     paragraphs = Document(docx_file).paragraphs
     return "\n".join(paragraph.text for paragraph in paragraphs)
 def convert_pdf_to_text(pdf_file):
     """Return the extracted text of each page of ``pdf_file``, newline-joined.

     A page whose ``extract_text()`` result is falsy contributes an empty
     string, so it shows up as a blank line in the result.
     """
     pages = PdfReader(pdf_file).pages
     return "\n".join(page.extract_text() or '' for page in pages)
def get_binary_file_downloader_html(bin_file, file_label='File'):
    """Build an HTML download link that embeds ``bin_file`` as a data URI.

    Args:
        bin_file: Bytes-like payload; it is base64-encoded into the link.
        file_label: Suggested download filename, also shown in the link text.

    Returns:
        The ``<a>`` element as a string.
    """
    import html  # local import keeps this block usable on its own

    b64 = base64.b64encode(bin_file).decode()
    # The label is placed in an attribute and in the element body, so a quote
    # or angle bracket in it would otherwise break (or inject) markup.
    safe_label = html.escape(str(file_label), quote=True)
    href = (
        f'<a href="data:application/octet-stream;base64,{b64}" '
        f'download="{safe_label}" target="_blank">Download {safe_label}</a>'
    )
    return href
 def main():
     """Streamlit page: upload a txt/docx/pdf file and play it back as speech.

     The upload is copied to a temporary file so the text extractors can open
     it by path, the extracted text is synthesized to a temporary MP3, and the
     audio is offered both as a player and as a download link. Both temporary
     files are removed before the function returns.
     """
     st.title("Text to Speech Converter")
     uploaded_file = st.file_uploader("Upload a text, docx, or pdf file", type=["txt", "docx", "pdf"])
     if not uploaded_file:
         return

     ext = uploaded_file.name.split('.')[-1].lower()
     tmp_path = None
     try:
         with tempfile.NamedTemporaryFile(delete=False, suffix='.' + uploaded_file.name.split('.')[-1]) as tmp:
             tmp_path = tmp.name
             tmp.write(uploaded_file.read())

         text = ""
         if ext == 'txt':
             with open(tmp_path, 'r', encoding='utf-8') as f:
                 text = f.read()
         elif ext == 'docx':
             text = convert_docx_to_text(tmp_path)
         elif ext == 'pdf':
             text = convert_pdf_to_text(tmp_path)
     finally:
         # delete=False means nothing else cleans this file up.
         if tmp_path is not None and os.path.exists(tmp_path):
             os.remove(tmp_path)

     if not text.strip():
         st.warning("No readable text found.")
         return

     # A unique path per run: a fixed "output.mp3" in the shared temp dir
     # would let concurrent sessions overwrite each other's audio.
     audio_fd, output_audio_path = tempfile.mkstemp(suffix=".mp3")
     os.close(audio_fd)
     try:
         text_to_speech(text, output_audio_path)
         with open(output_audio_path, 'rb') as audio_file:
             audio_bytes = audio_file.read()
     finally:
         os.remove(output_audio_path)

     # Play from the in-memory bytes, since the file on disk is already gone.
     st.audio(audio_bytes, format="audio/mp3")
     st.markdown(get_binary_file_downloader_html(audio_bytes, "output.mp3"), unsafe_allow_html=True)


 if __name__ == "__main__":
     main()

 import os
+os.environ["STREAMLIT_CONFIG_DIR"] = "/tmp/.streamlit"
+os.makedirs("/tmp/.streamlit", exist_ok=True)
 import tempfile
 from gtts import gTTS
 from PyPDF2 import PdfReader
 import streamlit as st
 import base64
+from io import BytesIO
def text_to_speech(text, lang="en"):
    """Synthesize ``text`` with gTTS and return the audio held in memory.

    Args:
        text: The text to be spoken.
        lang: Language code forwarded to gTTS. The default ``"en"`` is
            gTTS's own default, so one-argument calls behave as before.

    Returns:
        A ``BytesIO`` containing the audio, rewound to position 0 so the
        caller can read it from the start.
    """
    audio_buffer = BytesIO()
    gTTS(text, lang=lang).write_to_fp(audio_buffer)
    # write_to_fp leaves the cursor at the end of the written data.
    audio_buffer.seek(0)
    return audio_buffer
 def convert_docx_to_text(docx_file):
     """Join the text of each paragraph in ``docx_file`` with newlines.

     ``docx_file`` is passed unchanged to ``Document``; only the resulting
     document's ``paragraphs`` are read.
     """
     document = Document(docx_file)
     lines = (paragraph.text for paragraph in document.paragraphs)
     return "\n".join(lines)
 def convert_pdf_to_text(pdf_file):
     """Join the extracted text of each page in ``pdf_file`` with newlines.

     When a page's ``extract_text()`` returns a falsy value, an empty string
     is used for that page instead.
     """
     page_texts = (page.extract_text() or '' for page in PdfReader(pdf_file).pages)
     return "\n".join(page_texts)
def get_download_link(audio_data, filename="output.mp3"):
    """Build an HTML download link that embeds ``audio_data`` as a data URI.

    Args:
        audio_data: Bytes-like audio payload; it is base64-encoded into the
            link's ``href``.
        filename: Suggested download filename, also shown in the link text.

    Returns:
        The ``<a>`` element as a string.
    """
    import html  # local import keeps this block usable on its own

    b64 = base64.b64encode(audio_data).decode()
    # The filename is placed in an attribute and in the element body, so a
    # quote or angle bracket in it would otherwise break (or inject) markup.
    safe_name = html.escape(str(filename), quote=True)
    href = f'<a href="data:audio/mp3;base64,{b64}" download="{safe_name}">Download {safe_name}</a>'
    return href
 def main():
     """Streamlit page: upload a txt/docx/pdf file and play it back as speech.

     The upload is read directly from the in-memory file object, converted to
     text according to its extension, synthesized to MP3 bytes, and offered
     both as an audio player and as a download link.
     """
     st.title("Text to Speech Converter (No File Write)")
     uploaded_file = st.file_uploader("Upload a text, docx, or pdf file", type=["txt", "docx", "pdf"])
     if not uploaded_file:
         return

     ext = uploaded_file.name.split('.')[-1].lower()
     if ext == 'txt':
         try:
             # utf-8-sig reads plain UTF-8 too and drops a leading BOM, which
             # would otherwise be passed on as part of the text.
             text = uploaded_file.read().decode("utf-8-sig")
         except UnicodeDecodeError:
             # Report the problem in the page instead of an unhandled traceback.
             st.error("The text file is not valid UTF-8.")
             return
     elif ext == 'docx':
         text = convert_docx_to_text(uploaded_file)
     elif ext == 'pdf':
         text = convert_pdf_to_text(uploaded_file)
     else:
         st.error("Unsupported file format")
         return

     if not text.strip():
         st.warning("No readable text found.")
         return

     with st.spinner("Converting to speech..."):
         audio_buffer = text_to_speech(text)
         audio_bytes = audio_buffer.read()
     st.audio(audio_bytes, format="audio/mp3")
     st.markdown(get_download_link(audio_bytes), unsafe_allow_html=True)


 if __name__ == "__main__":
     main()