Spaces:

iammraat
/

document

Running

App Files Files Community

iammraat committed on 11 days ago

Commit

583f78a

verified ·

1 Parent(s): 0cf77d7

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -18

app.py CHANGED Viewed

@@ -3,9 +3,6 @@ import cv2
 import numpy as np
 import os
 from huggingface_hub import snapshot_download
-# --- STRICT UPDATE: Use PPStructureV3 directly ---
-# Your logs confirmed this class exists in your installed version.
 from paddleocr import PPStructureV3
 # --- STEP 1: Download the Model ---
@@ -14,14 +11,16 @@ model_path = snapshot_download(repo_id="PaddlePaddle/PP-DocLayoutV3", allow_patt
 print(f"Model downloaded to: {model_path}")
 # --- STEP 2: Initialize V3 Engine ---
-# We instantiate PPStructureV3 directly.
 layout_engine = PPStructureV3(
     layout_model_dir=model_path,
     table=False,
     ocr=False,
-    show_log=True,
-    use_angle_cls=True,
-    enable_mkldnn=False # Keeps the crash fix while using the new model
 )
 def analyze_layout(input_image):
@@ -45,8 +44,9 @@ def analyze_layout(input_image):
     # Iterate through results
     for region in result:
-        # V3 Output format usually includes 'layout_bbox'
         if isinstance(region, dict):
             box = region.get('layout_bbox') or region.get('bbox')
             label = region.get('label', 'unknown')
         else:
@@ -55,17 +55,20 @@ def analyze_layout(input_image):
         if box is None: continue
         # Draw the box
-        x1, y1, x2, y2 = int(box[0]), int(box[1]), int(box[2]), int(box[3])
-        # Color coding
-        color = (0, 255, 0)
-        if label == 'title': color = (0, 0, 255)
-        elif label == 'figure': color = (255, 0, 0)
-        elif label == 'table': color = (255, 255, 0)
-        cv2.rectangle(viz_image, (x1, y1), (x2, y2), color, 3)
-        cv2.putText(viz_image, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.8, color, 2)
-        detections_text.append(f"Found {label} at {box}")
     return viz_image, "\n".join(detections_text)

 import numpy as np
 import os
 from huggingface_hub import snapshot_download
 from paddleocr import PPStructureV3
 # --- STEP 1: Download the Model ---
 print(f"Model downloaded to: {model_path}")
 # --- STEP 2: Initialize V3 Engine ---
 layout_engine = PPStructureV3(
     layout_model_dir=model_path,
     table=False,
     ocr=False,
+    # show_log=True,  <-- REMOVED (Caused the crash)
+    # In V3, 'use_angle_cls' is often renamed for documents:
+    use_doc_orientation_classify=True,
+    enable_mkldnn=False # Keeps the crash fix
 )
 def analyze_layout(input_image):
     # Iterate through results
     for region in result:
+        # V3 Output format usually includes 'layout_bbox' or 'bbox'
         if isinstance(region, dict):
+            # Try specific v3 keys first, fallback to generic
             box = region.get('layout_bbox') or region.get('bbox')
             label = region.get('label', 'unknown')
         else:
         if box is None: continue
         # Draw the box
+        try:
+            x1, y1, x2, y2 = int(box[0]), int(box[1]), int(box[2]), int(box[3])
+            # Color coding
+            color = (0, 255, 0) # Default Green
+            if label == 'title': color = (0, 0, 255) # Red
+            elif label == 'figure': color = (255, 0, 0) # Blue
+            elif label == 'table': color = (255, 255, 0) # Cyan
+            cv2.rectangle(viz_image, (x1, y1), (x2, y2), color, 3)
+            cv2.putText(viz_image, label, (x1, y1 - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.8, color, 2)
+            detections_text.append(f"Found {label} at {box}")
+        except Exception:
+            pass
     return viz_image, "\n".join(detections_text)