PDF_Upload

Sleeping

App Files Community

Seth0330 committed on May 20, 2025

Commit

e3ce562

verified ·

1 Parent(s): cdae312

Update app.py

Browse files

Files changed (1) hide show

app.py +83 -83

app.py CHANGED Viewed

@@ -39,88 +39,7 @@ MODELS = {
     }
 }
-# Create tabs for different functionalities
-tab1, tab2 = st.tabs(["PDF Summarizer", "Invoice Extractor"])
-# PDF Summarizer Tab
-with tab1:
-    st.title("PDF to Bullet Point Summarizer 🗟 🔏")
-    # File uploader for the PDF
-    uploaded_file = st.file_uploader("Upload your PDF document", type="pdf", key="pdf_uploader")
-    # Slider for users to select the summarization extent
-    summary_scale = st.slider("Select the extent of summarization (%)", min_value=1, max_value=100, value=20, key="summary_scale")
-    # Submit button
-    submit_button = st.button("Generate Summary", key="summary_button")
-    # Check if the submit button is pressed
-    if submit_button and uploaded_file is not None:
-        with st.spinner('Processing...'):
-            # Read the PDF content
-            text = read_pdf(io.BytesIO(uploaded_file.getvalue()))
-            # Extract key phrases from the text
-            key_phrases = extract_key_phrases(text)
-            # Score sentences based on the key phrases
-            sentence_scores = score_sentences(text, key_phrases)
-            # Determine the number of bullet points based on the selected summarization scale
-            total_sentences = len(list(sentence_scores.keys()))
-            num_points = max(1, total_sentences * summary_scale // 100)
-            # Generate the bullet-point summary
-            summary = summarize_text(sentence_scores, num_points=num_points)
-            # Display the summary as bullet points
-            st.subheader("Here's the summary: ")
-            st.markdown(summary)
-# Invoice Extractor Tab
-with tab2:
-    st.title("📋 Invoice Extractor from PDF")
-    st.write("Upload an invoice PDF to extract key details")
-    # Model selection
-    model_choice = st.selectbox(
-        "Select AI Model",
-        list(MODELS.keys()),
-        index=0,
-        help="Choose which AI model to use for extraction",
-        key="model_choice"
-    )
-    # File uploader for the invoice PDF
-    invoice_pdf = st.file_uploader("Upload Invoice PDF", type="pdf", key="invoice_pdf_uploader")
-    if st.button("Extract Invoice Information", key="invoice_button") and invoice_pdf is not None:
-        with st.spinner('Reading PDF...'):
-            # Read the PDF content
-            invoice_text = read_pdf(io.BytesIO(invoice_pdf.getvalue()))
-        # Process in status container
-        with st.status("Processing...", expanded=True) as status:
-            st.write(f"🤖 Querying {model_choice} API...")
-            invoice_data = extract_invoice_info(model_choice, invoice_text)
-            if invoice_data:
-                status.update(label="✅ Extraction Complete!", state="complete")
-                display_invoice_data(model_choice, invoice_data)
-            else:
-                status.update(label="❌ Extraction Failed", state="error")
-                st.error("Failed to extract information. Try simplifying the text.")
-        # Debug information outside the status container
-        if invoice_data and "last_api_response" in st.session_state:
-            with st.expander("Debug Information"):
-                st.write("API Response:")
-                st.json(st.session_state.last_api_response)
-                st.write("Raw API Response:")
-                st.code(st.session_state.get("last_api_response_raw", "No response"))
-# Invoice Extractor Functions
 def get_api_key(model_choice):
     """Get the appropriate API key based on model choice"""
     api_key_env = MODELS[model_choice]["api_key_env"]
@@ -438,4 +357,85 @@ def extract_invoice_info(model_choice, text):
                     if field not in item:
                         item[field] = None if field != "quantity" else 0
-    return parsed_data

     }
 }
+# Define all invoice extraction functions first
 def get_api_key(model_choice):
     """Get the appropriate API key based on model choice"""
     api_key_env = MODELS[model_choice]["api_key_env"]
                     if field not in item:
                         item[field] = None if field != "quantity" else 0
+    return parsed_data
+# Create tabs for different functionalities
+tab1, tab2 = st.tabs(["PDF Summarizer", "Invoice Extractor"])
+# PDF Summarizer Tab
+with tab1:
+    st.title("PDF to Bullet Point Summarizer 🗟 🔏")
+    # File uploader for the PDF
+    uploaded_file = st.file_uploader("Upload your PDF document", type="pdf", key="pdf_uploader")
+    # Slider for users to select the summarization extent
+    summary_scale = st.slider("Select the extent of summarization (%)", min_value=1, max_value=100, value=20, key="summary_scale")
+    # Submit button
+    submit_button = st.button("Generate Summary", key="summary_button")
+    # Check if the submit button is pressed
+    if submit_button and uploaded_file is not None:
+        with st.spinner('Processing...'):
+            # Read the PDF content
+            text = read_pdf(io.BytesIO(uploaded_file.getvalue()))
+            # Extract key phrases from the text
+            key_phrases = extract_key_phrases(text)
+            # Score sentences based on the key phrases
+            sentence_scores = score_sentences(text, key_phrases)
+            # Determine the number of bullet points based on the selected summarization scale
+            total_sentences = len(list(sentence_scores.keys()))
+            num_points = max(1, total_sentences * summary_scale // 100)
+            # Generate the bullet-point summary
+            summary = summarize_text(sentence_scores, num_points=num_points)
+            # Display the summary as bullet points
+            st.subheader("Here's the summary: ")
+            st.markdown(summary)
+# Invoice Extractor Tab
+with tab2:
+    st.title("📋 Invoice Extractor from PDF")
+    st.write("Upload an invoice PDF to extract key details")
+    # Model selection
+    model_choice = st.selectbox(
+        "Select AI Model",
+        list(MODELS.keys()),
+        index=0,
+        help="Choose which AI model to use for extraction",
+        key="model_choice"
+    )
+    # File uploader for the invoice PDF
+    invoice_pdf = st.file_uploader("Upload Invoice PDF", type="pdf", key="invoice_pdf_uploader")
+    if st.button("Extract Invoice Information", key="invoice_button") and invoice_pdf is not None:
+        with st.spinner('Reading PDF...'):
+            # Read the PDF content
+            invoice_text = read_pdf(io.BytesIO(invoice_pdf.getvalue()))
+        # Process in status container
+        with st.status("Processing...", expanded=True) as status:
+            st.write(f"🤖 Querying {model_choice} API...")
+            invoice_data = extract_invoice_info(model_choice, invoice_text)
+            if invoice_data:
+                status.update(label="✅ Extraction Complete!", state="complete")
+                display_invoice_data(model_choice, invoice_data)
+            else:
+                status.update(label="❌ Extraction Failed", state="error")
+                st.error("Failed to extract information. Try simplifying the text.")
+        # Debug information outside the status container
+        if invoice_data and "last_api_response" in st.session_state:
+            with st.expander("Debug Information"):
+                st.write("API Response:")
+                st.json(st.session_state.last_api_response)
+                st.write("Raw API Response:")
+                st.code(st.session_state.get("last_api_response_raw", "No response"))