Spaces:

Marthee
/

NavigateToPage

Sleeping

App Files Community

Marthee committed on Dec 7, 2024

Commit

46886f1

verified ·

1 Parent(s): 1abd7ac

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -11

app.py CHANGED Viewed

@@ -5,12 +5,18 @@ import fitz  # PyMuPDF
 app = Flask(__name__)
-# Route to render the main page
 @app.route("/", methods=["GET", "POST"])
-def getInfotoMeasure(pagenum):
-    return render_template("gui.html", page=pagenum)
-# Function to highlight text in PDF
 def highlight_text_from_pdf(pdfshareablelinks, keyword):
     print('PDF Links:', pdfshareablelinks)
     for link in pdfshareablelinks:
@@ -21,11 +27,11 @@ def highlight_text_from_pdf(pdfshareablelinks, keyword):
             if 'dl=0' in link:
                 link = link.replace('dl=0', 'dl=1')
-            # Download the PDF content from the shareable link
             response = requests.get(link)
             if response.status_code == 200:
                 pdf_content = BytesIO(response.content)
-                print('Downloaded from shareable link.')
         if pdf_content is None:
             raise ValueError("No valid PDF content found.")
@@ -40,11 +46,11 @@ def highlight_text_from_pdf(pdfshareablelinks, keyword):
             if matched:
                 for word in matched:
                     page.add_highlight_annot(word)
-                pageNumTextFound = page_num + 1  # 1-indexed pages
         return pdf_document, pageNumTextFound
-# Route to serve PDF with a specified page
 @app.route('/view-pdf', methods=['GET'])
 def download_pdf():
     pdf_link = [
@@ -55,9 +61,7 @@ def download_pdf():
     # Call function to highlight text and get PDF page
     pdf_content, pageNumTextFound = highlight_text_from_pdf(pdf_link, keyword)
-    # Render the main GUI with the detected page number
-    getInfotoMeasure(pageNumTextFound)
     pdf_bytes = BytesIO()
     pdf_content.save(pdf_bytes)
     pdf_bytes.seek(0)

 app = Flask(__name__)
+# Route to render the main page with page number
 @app.route("/", methods=["GET", "POST"])
+def getInfotoMeasure():
+    # Call the function to highlight text and get the page number
+    pdf_link = ['https://www.dropbox.com/scl/fi/fjykwhhn9gu9t3kqrflxd/LA002-NOR-ZZ-ZZ-T-A-2403_Architectural-Specification-F10-Brick-and-Block-Walling_A4-_C01.pdf?rlkey=ek9i66i79m0hwp8z5yjs6rp5p&st=jh05a6qs&dl=0']
+    keyword = "To be read with preliminaries/ general conditions"
+    pdf_content, pageNumTextFound = highlight_text_from_pdf(pdf_link, keyword)
+    # Pass pageNumTextFound to the template for rendering
+    return render_template("gui.html", page=pageNumTextFound)
+# Function to highlight text in PDF and return the page number
 def highlight_text_from_pdf(pdfshareablelinks, keyword):
     print('PDF Links:', pdfshareablelinks)
     for link in pdfshareablelinks:
             if 'dl=0' in link:
                 link = link.replace('dl=0', 'dl=1')
+            # Download PDF content from the link
             response = requests.get(link)
             if response.status_code == 200:
                 pdf_content = BytesIO(response.content)
+                print('Downloaded PDF content.')
         if pdf_content is None:
             raise ValueError("No valid PDF content found.")
             if matched:
                 for word in matched:
                     page.add_highlight_annot(word)
+                pageNumTextFound = page_num + 1  # 1-indexed
         return pdf_document, pageNumTextFound
+# Flask route to serve the highlighted PDF
 @app.route('/view-pdf', methods=['GET'])
 def download_pdf():
     pdf_link = [
     # Call function to highlight text and get PDF page
     pdf_content, pageNumTextFound = highlight_text_from_pdf(pdf_link, keyword)
+    # Create a BytesIO object from the modified PDF content
     pdf_bytes = BytesIO()
     pdf_content.save(pdf_bytes)
     pdf_bytes.seek(0)