Spaces:

ssppkenny
/

doclayout

Runtime error

Sergey Mikhno committed on Jun 29, 2025

Commit

529ecd0

1 Parent(s): 9efba4e

model

Files changed (1) hide show

app/app.py CHANGED Viewed

@@ -3,6 +3,9 @@ from doclayout_yolo import YOLOv10
 from huggingface_hub import hf_hub_download
 import torch
 import spaces
 import os
 import json
@@ -19,6 +22,8 @@ app = Flask(__name__)
 app.secret_key = "super secret key"
 app.config['UPLOAD_FOLDER'] = UPLOAD_FOLDER
 def allowed_file(filename):
     """Report whether *filename* has an extension listed in ALLOWED_EXTENSIONS.

     A name containing no dot is rejected outright. Otherwise the text after
     the last dot is lower-cased and looked up in ALLOWED_EXTENSIONS.
     """
     if '.' not in filename:
         return False
     extension = filename.rsplit('.', 1)[1].lower()
     return extension in ALLOWED_EXTENSIONS
@@ -54,6 +59,16 @@ def doc_layout():
             blocknames = [names[int(n)] for n in det_res[0].boxes.cls]
             xyxy = [a.tolist() for a in det_res[0].boxes.xyxy]
             res = [{"coords": y, "type": x} for x, y in zip(blocknames, xyxy)]
             return json.dumps(res)
     return '''
     <!doctype html>

 from huggingface_hub import hf_hub_download
 import torch
 import spaces
+import cv2
+from doctr.io import DocumentFile
+from doctr.models import ocr_predictor
 import os
 import json
 app.secret_key = "super secret key"
 app.config['UPLOAD_FOLDER'] = UPLOAD_FOLDER
+doctr_model = ocr_predictor(pretrained=True)
 def allowed_file(filename):
     """Report whether *filename* has an extension listed in ALLOWED_EXTENSIONS.

     A name containing no dot is rejected outright. Otherwise the text after
     the last dot is lower-cased and looked up in ALLOWED_EXTENSIONS.
     """
     if '.' not in filename:
         return False
     extension = filename.rsplit('.', 1)[1].lower()
     return extension in ALLOWED_EXTENSIONS
             blocknames = [names[int(n)] for n in det_res[0].boxes.cls]
             xyxy = [a.tolist() for a in det_res[0].boxes.xyxy]
             res = [{"coords": y, "type": x} for x, y in zip(blocknames, xyxy)]
+            pimg = cv2.imread(filename, 0)
+            for r in res:
+                if r["type"] == "plain text":
+                    x, y, x1, y1 = r["coords"]
+                    x, y, x1, y1 = int(x), int(y), int(x1), int(y1)
+                    pbytes = pimg[y:y1,x:x1].tobytes()
+                    single_img_doc = DocumentFile.from_images(pbytes)
+                    result = doctr_model(single_img_doc)
+                    print(result)
             return json.dumps(res)
     return '''
     <!doctype html>