Spaces:

Marthee
/

NavigateToPage

Sleeping

App Files Community

Marthee committed on Dec 7, 2024

Commit

bd99369

verified ·

1 Parent(s): 46886f1

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -38

app.py CHANGED Viewed

@@ -1,37 +1,49 @@
-from flask import Flask, send_file, render_template, request
 import requests
 from io import BytesIO
 import fitz  # PyMuPDF
 app = Flask(__name__)
-# Route to render the main page with page number
 @app.route("/", methods=["GET", "POST"])
 def getInfotoMeasure():
-    # Call the function to highlight text and get the page number
-    pdf_link = ['https://www.dropbox.com/scl/fi/fjykwhhn9gu9t3kqrflxd/LA002-NOR-ZZ-ZZ-T-A-2403_Architectural-Specification-F10-Brick-and-Block-Walling_A4-_C01.pdf?rlkey=ek9i66i79m0hwp8z5yjs6rp5p&st=jh05a6qs&dl=0']
-    keyword = "To be read with preliminaries/ general conditions"
-    pdf_content, pageNumTextFound = highlight_text_from_pdf(pdf_link, keyword)
-    # Pass pageNumTextFound to the template for rendering
-    return render_template("gui.html", page=pageNumTextFound)
-# Function to highlight text in PDF and return the page number
-def highlight_text_from_pdf(pdfshareablelinks, keyword):
     print('PDF Links:', pdfshareablelinks)
     for link in pdfshareablelinks:
         pdf_content = None
         if link and ('http' in link or 'dropbox' in link):
-            # Modify Dropbox link for direct download
             if 'dl=0' in link:
                 link = link.replace('dl=0', 'dl=1')
-            # Download PDF content from the link
             response = requests.get(link)
             if response.status_code == 200:
                 pdf_content = BytesIO(response.content)
-                print('Downloaded PDF content.')
         if pdf_content is None:
             raise ValueError("No valid PDF content found.")
@@ -46,32 +58,9 @@ def highlight_text_from_pdf(pdfshareablelinks, keyword):
             if matched:
                 for word in matched:
                     page.add_highlight_annot(word)
-                pageNumTextFound = page_num + 1  # 1-indexed
         return pdf_document, pageNumTextFound
-# Flask route to serve the highlighted PDF
-@app.route('/view-pdf', methods=['GET'])
-def download_pdf():
-    pdf_link = [
-        'https://www.dropbox.com/scl/fi/fjykwhhn9gu9t3kqrflxd/LA002-NOR-ZZ-ZZ-T-A-2403_Architectural-Specification-F10-Brick-and-Block-Walling_A4-_C01.pdf?rlkey=ek9i66i79m0hwp8z5yjs6rp5p&st=jh05a6qs&dl=0'
-    ]
-    keyword = "To be read with preliminaries/ general conditions"
-    # Call function to highlight text and get PDF page
-    pdf_content, pageNumTextFound = highlight_text_from_pdf(pdf_link, keyword)
-    # Create a BytesIO object from the modified PDF content
-    pdf_bytes = BytesIO()
-    pdf_content.save(pdf_bytes)
-    pdf_bytes.seek(0)
-    return send_file(
-        pdf_bytes,
-        mimetype='application/pdf',
-        as_attachment=False,
-        download_name=f"highlighted_page_{pageNumTextFound}.pdf"
-    )
 if __name__ == '__main__':
     app.run(host='0.0.0.0', port=7860)

+from flask import Flask, send_file, render_template, request, session
 import requests
 from io import BytesIO
 import fitz  # PyMuPDF
 app = Flask(__name__)
+# Store the result in session to reuse it across routes
 @app.route("/", methods=["GET", "POST"])
 def getInfotoMeasure():
+    if 'pageNumTextFound' not in session:
+        pdf_link = ['https://www.dropbox.com/scl/fi/fjykwhhn9gu9t3kqrflxd/LA002-NOR-ZZ-ZZ-T-A-2403_Architectural-Specification-F10-Brick-and-Block-Walling_A4-_C01.pdf?rlkey=ek9i66i79m0hwp8z5yjs6rp5p&st=jh05a6qs&dl=0']
+        keyword = "To be read with preliminaries/ general conditions"
+        # Call the function once and store the result in session
+        pdf_content, pageNumTextFound = highlight_text_from_pdf(pdf_link, keyword)
+        session['pageNumTextFound'] = pageNumTextFound
+        session['pdf_content'] = pdf_content.getvalue()
+    return render_template("gui.html", page=session['pageNumTextFound'])
+@app.route('/view-pdf', methods=['GET'])
+def download_pdf():
+    if 'pdf_content' not in session:
+        return "PDF content not found in session.", 404
+    pdf_bytes = BytesIO(session['pdf_content'])
+    return send_file(
+        pdf_bytes,
+        mimetype='application/pdf',
+        as_attachment=False,
+        download_name=f"highlighted_page_{session['pageNumTextFound']}.pdf"
+    )
+def highlight_text_from_pdf(pdfshareablelinks, keyword):
     print('PDF Links:', pdfshareablelinks)
     for link in pdfshareablelinks:
         pdf_content = None
         if link and ('http' in link or 'dropbox' in link):
             if 'dl=0' in link:
                 link = link.replace('dl=0', 'dl=1')
             response = requests.get(link)
             if response.status_code == 200:
                 pdf_content = BytesIO(response.content)
         if pdf_content is None:
             raise ValueError("No valid PDF content found.")
             if matched:
                 for word in matched:
                     page.add_highlight_annot(word)
+                pageNumTextFound = page_num + 1
         return pdf_document, pageNumTextFound
 if __name__ == '__main__':
     app.run(host='0.0.0.0', port=7860)