Digitaljoint
/

ProofCheck

Yaz Hobooti committed on Sep 16, 2025

Commit

2874826

1 Parent(s): bae9f7f

Fix indentation error in find_misspell_boxes function

Files changed (1) hide show

pdf_comparator.py CHANGED Viewed

@@ -131,25 +131,25 @@ def find_misspell_boxes(img: Image.Image) -> List[Box]:
     try:
         spell = SpellChecker()
         data = pytesseract.image_to_data(img, output_type=pytesseract.Output.DICT)
-            except Exception:
-            return []
-        n = len(data.get("text", []))
     boxes: List[Box] = []
-        for i in range(n):
         text = data["text"][i]
         if not text:
-                continue
         token = normalize_token(text)
         if len(token) < 2:
-                    continue
         if token in spell:
-                    continue
         left  = data.get("left",  [0])[i]
         top   = data.get("top",   [0])[i]
         width = data.get("width", [0])[i]
         height= data.get("height",[0])[i]
         if width <= 0 or height <= 0:
-                    continue
         boxes.append(Box(top, left, top+height, left+width, width*height))
     return boxes

     try:
         spell = SpellChecker()
         data = pytesseract.image_to_data(img, output_type=pytesseract.Output.DICT)
+    except Exception:
+        return []
+    n = len(data.get("text", []))
     boxes: List[Box] = []
+    for i in range(n):
         text = data["text"][i]
         if not text:
+            continue
         token = normalize_token(text)
         if len(token) < 2:
+            continue
         if token in spell:
+            continue
         left  = data.get("left",  [0])[i]
         top   = data.get("top",   [0])[i]
         width = data.get("width", [0])[i]
         height= data.get("height",[0])[i]
         if width <= 0 or height <= 0:
+            continue
         boxes.append(Box(top, left, top+height, left+width, width*height))
     return boxes