Spaces:

lulavc
/

BubbleScribe

Runtime error

App Files Files Community

lulavc committed on Dec 10, 2025

Commit

e625573

verified ·

1 Parent(s): 37ef455

Fix bbox validation and strip GLM tokens

Browse files

Files changed (1) hide show

app.py +20 -2

app.py CHANGED Viewed

@@ -294,6 +294,9 @@ CRITICAL: Find at least 20-50 text regions. This image has many text elements. S
             # Append reasoning content if present
             result_text = result_text + "\n" + msg.reasoning_content if result_text else msg.reasoning_content
         print(f"📝 GLM Response length: {len(result_text)} chars")
         print(f"📝 GLM Response preview: {result_text[:500] if result_text else 'EMPTY'}...")
@@ -331,12 +334,22 @@ def create_text_mask(image: Image.Image, detections: list, padding: int = 12) ->
         bbox = det.get('bbox', [])
         if len(bbox) == 4:
             x1, y1, x2, y2 = [int(v) for v in bbox]
             # Larger padding for cleaner inpainting
             x1 = max(0, x1 - padding)
             y1 = max(0, y1 - padding)
             x2 = min(image.width, x2 + padding)
             y2 = min(image.height, y2 + padding)
-            draw.rectangle([x1, y1, x2, y2], fill=255)
     return mask
@@ -386,10 +399,15 @@ def add_translated_text(image: Image.Image, detections: list) -> Image.Image:
         if len(bbox) == 4 and translated:
             x1, y1, x2, y2 = [int(v) for v in bbox]
             box_width = x2 - x1
             box_height = y2 - y1
-            # Skip very small boxes
             if box_width < 20 or box_height < 10:
                 continue

             # Append reasoning content if present
             result_text = result_text + "\n" + msg.reasoning_content if result_text else msg.reasoning_content
+        # Strip GLM special tokens
+        result_text = result_text.replace('<|begin_of_box|>', '').replace('<|end_of_box|>', '')
         print(f"📝 GLM Response length: {len(result_text)} chars")
         print(f"📝 GLM Response preview: {result_text[:500] if result_text else 'EMPTY'}...")
         bbox = det.get('bbox', [])
         if len(bbox) == 4:
             x1, y1, x2, y2 = [int(v) for v in bbox]
+            # Ensure coordinates are valid (x2 > x1, y2 > y1)
+            if x2 < x1:
+                x1, x2 = x2, x1
+            if y2 < y1:
+                y1, y2 = y2, y1
+            # Skip invalid boxes
+            if x2 <= x1 or y2 <= y1:
+                continue
             # Larger padding for cleaner inpainting
             x1 = max(0, x1 - padding)
             y1 = max(0, y1 - padding)
             x2 = min(image.width, x2 + padding)
             y2 = min(image.height, y2 + padding)
+            # Final validation
+            if x2 > x1 and y2 > y1:
+                draw.rectangle([x1, y1, x2, y2], fill=255)
     return mask
         if len(bbox) == 4 and translated:
             x1, y1, x2, y2 = [int(v) for v in bbox]
+            # Ensure coordinates are valid
+            if x2 < x1:
+                x1, x2 = x2, x1
+            if y2 < y1:
+                y1, y2 = y2, y1
             box_width = x2 - x1
             box_height = y2 - y1
+            # Skip very small or invalid boxes
             if box_width < 20 or box_height < 10:
                 continue