Spaces:

AzizWazir
/

PDF-Convertor

Sleeping

AzizWazir committed on Dec 29, 2024

Commit

09938bc

verified ·

1 Parent(s): d7b6485

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,31 +1,38 @@
 from docx import Document
-def extract_text_from_docx(file_path):
-    """Extracts all text from a .docx file"""
     try:
-        # Open the .docx file
-        doc = Document(file_path)
         # Extract text from each paragraph in the document
         text = ""
         for paragraph in doc.paragraphs:
             text += paragraph.text + '\n'
         return text
     except Exception as e:
-        print(f"Error processing the document: {e}")
         return None
 def main():
-    file_path = "your_document.docx"  # Replace with your actual file path
-    text = extract_text_from_docx(file_path)
-    if text:
-        print("Extracted Text:")
-        print(text)
-    else:
-        print("Failed to extract text.")
 if __name__ == "__main__":
     main()

+import streamlit as st
 from docx import Document
+import io
+def extract_text_from_docx(file):
+    """Extracts all text from an uploaded .docx file"""
     try:
+        # Open the uploaded .docx file
+        doc = Document(io.BytesIO(file.read()))
         # Extract text from each paragraph in the document
         text = ""
         for paragraph in doc.paragraphs:
             text += paragraph.text + '\n'
         return text
     except Exception as e:
+        st.error(f"Error processing the document: {e}")
         return None
 def main():
+    st.title("Extract Text from DOCX")
+    # File upload
+    uploaded_file = st.file_uploader("Choose a DOCX file", type=["docx"])
+    if uploaded_file is not None:
+        text = extract_text_from_docx(uploaded_file)
+        if text:
+            st.subheader("Extracted Text")
+            st.text(text)
+        else:
+            st.error("Failed to extract text.")
 if __name__ == "__main__":
     main()