InitialMarkups

Runtime error

App Files Files Community

Marthee committed on Jun 5, 2025

Commit

09f4b44

verified ·

1 Parent(s): a5d06df

Update InitialMarkups.py

Browse files

Files changed (1) hide show

InitialMarkups.py +48 -1

InitialMarkups.py CHANGED Viewed

@@ -6,7 +6,7 @@ Automatically generated by Colab.
 Original file is located at
     https://colab.research.google.com/drive/12XfVkmKmN3oVjHhLVE0_GgkftgArFEK2
 """
-baselink='https://find-initialmarkups.hf.space/view-pdf?'
@@ -898,6 +898,53 @@ def extract_section_under_header(pdf_path):
                                         current_bbox[page_num] = header_bbox
                                     last_y1s[page_num] = header_bbox[3]
                                     i += 2
                                     continue
                     if collecting:

 Original file is located at
     https://colab.research.google.com/drive/12XfVkmKmN3oVjHhLVE0_GgkftgArFEK2
 """
+baselink='https://findconsole-initialmarkups.hf.space/view-pdf?'
                                         current_bbox[page_num] = header_bbox
                                     last_y1s[page_num] = header_bbox[3]
+                                    x0, y0, x1, y1 = header_bbox
+                                    zoom = 200
+                                    left = int(x0)
+                                    top = int(y0)
+                                    zoom_str = f"{zoom},{left},{top}"
+                                    pageNumberFound = page_num + 1
+                                  # Build the query parameters
+                                    params = {
+                                        'pdfLink': pdf_path,  # Your PDF link
+                                        'keyword': heading_to_search,  # Your keyword (could be a string or list)
+                                    }
+                                    # URL encode each parameter
+                                    encoded_params = {key: urllib.parse.quote(value, safe='') for key, value in params.items()}
+                                    # Construct the final encoded link
+                                    encoded_link = '&'.join([f"{key}={value}" for key, value in encoded_params.items()])
+                                    # Correctly construct the final URL with page and zoom
+                                    final_url = f"{baselink}{encoded_link}#page={str(pageNumberFound)}&zoom={zoom_str}"
+                                    # Get current date and time
+                                    now = datetime.now()
+                                    # Format the output
+                                    formatted_time = now.strftime("%d/%m/%Y %I:%M:%S %p")
+                                    # Optionally, add the URL to a DataFrame
+                                    data_entry = {
+                                            "NBSLink": final_url,
+                                            "Subject": heading_to_search,
+                                            "Page": str(pageNumberFound),
+                                            "Author": "ADR",
+                                            "Creation Date": formatted_time,
+                                            "Layer": "Initial",
+                                            "Code": "to be added",
+                                            "head above 1":  paths[-2],
+                                            "head above 2":  paths[0]
+                                        }
+                                    data_list_JSON.append(data_entry)
+                                    # Convert list to JSON
+                                    json_output = json.dumps(data_list_JSON, indent=4)
+                                    print("Final URL:", final_url)
                                     i += 2
                                     continue
                     if collecting: