Spaces:

the-carnage
/

docurizer

Sleeping

App Files Files Community

the-carnage committed on Dec 28, 2025

Commit

2a54e7f

1 Parent(s): b00aa55

Add text input and improved UI

Browse files

Files changed (1) hide show

app.py +69 -23

app.py CHANGED Viewed

@@ -7,8 +7,9 @@ import tempfile
 import os
 # Page config
-st.set_page_config(page_title="PDF & Image Summarizer", layout="centered")
-st.title("📄🖼 Document Summarizer")
 # Load summarization model
 @st.cache_resource
@@ -17,12 +18,6 @@ def load_model():
 summarizer = load_model()
-# File uploader
-uploaded_file = st.file_uploader(
-    "Upload PDF or Image",
-    type=["pdf", "png", "jpg", "jpeg"]
-)
 def extract_text_from_image(image):
     return pytesseract.image_to_string(image)
@@ -35,31 +30,82 @@ def extract_text_from_pdf(file_path):
                 text += page_text
     return text
-if uploaded_file:
-    # Save temp file
-    with tempfile.NamedTemporaryFile(delete=False) as tmp:
-        tmp.write(uploaded_file.read())
-        file_path = tmp.name
-    ext = os.path.splitext(uploaded_file.name)[1].lower()
-    if ext == ".pdf":
         text = extract_text_from_pdf(file_path)
-    else:
-        image = Image.open(file_path)
-        text = extract_text_from_image(image)
-    st.subheader("📃 Extracted Text (Preview)")
-    st.text_area("", text[:3000], height=200)
-    if st.button("Summarize"):
         with st.spinner("Summarizing..."):
             summary = summarizer(
-                text,
-                max_length=120,
                 min_length=40,
                 do_sample=False
             )[0]["summary_text"]
         st.subheader("📝 Summary")
         st.success(summary)

 import os
 # Page config
+st.set_page_config(page_title="Docurizzer - Document Summarizer", layout="centered")
+st.title("📄🖼 Docurizzer")
+st.markdown("*Extract and summarize text from documents, images, or paste your own text*")
 # Load summarization model
 @st.cache_resource
 summarizer = load_model()
 def extract_text_from_image(image):
     return pytesseract.image_to_string(image)
                 text += page_text
     return text
+# Input method selection
+input_method = st.radio(
+    "Choose input method:",
+    ["📝 Paste Text", "📄 Upload PDF", "🖼 Upload Image"],
+    horizontal=True
+)
+text = ""
+if input_method == "📝 Paste Text":
+    st.subheader("📝 Enter Your Text")
+    text = st.text_area(
+        "Paste or type your text here:",
+        height=250,
+        placeholder="Enter the text you want to summarize..."
+    )
+elif input_method == "📄 Upload PDF":
+    uploaded_file = st.file_uploader(
+        "Upload a PDF file",
+        type=["pdf"]
+    )
+    if uploaded_file:
+        with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as tmp:
+            tmp.write(uploaded_file.read())
+            file_path = tmp.name
         text = extract_text_from_pdf(file_path)
+        st.subheader("📃 Extracted Text (Preview)")
+        st.text_area("", text[:3000], height=200, disabled=True)
+elif input_method == "🖼 Upload Image":
+    uploaded_file = st.file_uploader(
+        "Upload an image (PNG, JPG, JPEG)",
+        type=["png", "jpg", "jpeg"]
+    )
+    if uploaded_file:
+        with tempfile.NamedTemporaryFile(delete=False) as tmp:
+            tmp.write(uploaded_file.read())
+            file_path = tmp.name
+        image = Image.open(file_path)
+        st.image(image, caption="Uploaded Image", use_container_width=True)
+        with st.spinner("Extracting text from image..."):
+            text = extract_text_from_image(image)
+        st.subheader("📃 Extracted Text (Preview)")
+        st.text_area("", text[:3000], height=200, disabled=True)
+# Summarize button
+if text.strip():
+    if st.button("🚀 Summarize", type="primary"):
         with st.spinner("Summarizing..."):
+            # Handle text length for T5 model
+            input_text = text[:4000] if len(text) > 4000 else text
             summary = summarizer(
+                input_text,
+                max_length=150,
                 min_length=40,
                 do_sample=False
             )[0]["summary_text"]
         st.subheader("📝 Summary")
         st.success(summary)
+        # Download button: offers the summary as a plain-text file (summary.txt)
+        st.download_button(
+            label="📋 Download Summary",
+            data=summary,
+            file_name="summary.txt",
+            mime="text/plain"
+        )
+else:
+    st.info("👆 Please provide some text using one of the methods above.")