InitialMarkups

Runtime error

Marthee committed on Oct 22, 2025

Commit

2bf08bc

verified ·

1 Parent(s): 88906a0

Update InitialMarkups.py

Files changed (1) hide show

InitialMarkups.py CHANGED Viewed

@@ -36,7 +36,38 @@ def filteredJsons(pdf_path,filteredjsonsfromrawan):
 def get_regular_font_size_and_color(doc):
     font_sizes = []
     colors = []
@@ -1041,35 +1072,6 @@ def extract_section_under_header(pdf_path):
     return pdf_bytes.getvalue(), docHighlights , json_output
-def changepdflinks(data_list_JSON, pdflink):
-    # If the input is a JSON string, convert it to a Python list
-    if isinstance(data_list_JSON, str):
-        data_list_JSON = json.loads(data_list_JSON)
-    # Loop through all entries and update their NBSLink
-    for entry in data_list_JSON:
-        old_url = entry.get("NBSLink", "")
-        # Parse URL and query params
-        parsed = urllib.parse.urlparse(old_url)
-        query = urllib.parse.parse_qs(parsed.query)
-        # Replace only the 'pdfLink' parameter if present
-        if "pdfLink" in query:
-            query["pdfLink"] = [pdflink]
-            # Rebuild query string
-            new_query = urllib.parse.urlencode(query, doseq=True)
-            # Rebuild full URL with the same fragment (page/zoom)
-            new_url = f"{parsed.scheme}://{parsed.netloc}{parsed.path}?{new_query}"
-            if parsed.fragment:
-                new_url += f"#{parsed.fragment}"
-            # Update the entry
-            entry["NBSLink"] = new_url
-    return data_list_JSON

+def changepdflinks(data_list_JSON, pdflink):
+    """Point the ``pdfLink`` query parameter of every entry's ``NBSLink`` at *pdflink*.
+
+    Args:
+        data_list_JSON: A list of dict entries, or a JSON string that decodes
+            to such a list.
+        pdflink: The new value for the ``pdfLink`` query parameter. It is
+            URL-encoded when the query string is rebuilt.
+
+    Returns:
+        The list of entries (decoded from JSON if a string was passed). Entries
+        are updated in place; an entry whose ``NBSLink`` is missing, empty, or
+        has no ``pdfLink`` parameter is left untouched.
+    """
+    # If the input is a JSON string, convert it to a Python list
+    if isinstance(data_list_JSON, str):
+        data_list_JSON = json.loads(data_list_JSON)
+    for entry in data_list_JSON:
+        # "or ''" also covers an explicit None, which urlparse would otherwise
+        # turn into a bytes result.
+        old_url = entry.get("NBSLink") or ""
+        parsed = urllib.parse.urlparse(old_url)
+        # keep_blank_values=True so parameters such as "flag=" survive the
+        # parse/encode round trip instead of being silently dropped.
+        query = urllib.parse.parse_qs(parsed.query, keep_blank_values=True)
+        # Replace only the 'pdfLink' parameter if present
+        if "pdfLink" not in query:
+            continue
+        query["pdfLink"] = [pdflink]
+        new_query = urllib.parse.urlencode(query, doseq=True)
+        # Swap just the query component: scheme, host, path, ;params and the
+        # fragment (page/zoom) are carried over unchanged, and scheme-less
+        # links are not mangled into "://...".
+        entry["NBSLink"] = parsed._replace(query=new_query).geturl()
+    return data_list_JSON
 def get_regular_font_size_and_color(doc):
     font_sizes = []
     colors = []
     return pdf_bytes.getvalue(), docHighlights , json_output