Spaces:

triflix
/

sortitout

Paused

App Files Files Community

triflix committed on Nov 20, 2025

Commit

6894202

verified ·

1 Parent(s): 5b41007

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -7

app.py CHANGED Viewed

@@ -79,9 +79,9 @@ async def ocr_endpoint(files: List[UploadFile] = File(...), max_pages: int | Non
     if len(files) > 15:
         raise HTTPException(status_code=400, detail="Maximum 15 files allowed.")
-    final_output = []
-    for file in files:
         filename = file.filename.lower()
         ext = filename.split(".")[-1]
@@ -91,17 +91,40 @@ async def ocr_endpoint(files: List[UploadFile] = File(...), max_pages: int | Non
         with open(temp_path, "wb") as f:
             f.write(await file.read())
         # PDF
         if filename.endswith(".pdf"):
             img_paths = pdf_to_images(temp_path, max_pages=max_pages)
-            for img_path in img_paths:
-                final_output.extend(extract_text(img_path))
-        # Images
         elif filename.endswith((".jpg", ".jpeg", ".png")):
-            final_output.extend(extract_text(temp_path))
         else:
             raise HTTPException(status_code=400, detail=f"Unsupported type: {filename}")
-    return JSONResponse({"results": final_output})

     if len(files) > 15:
         raise HTTPException(status_code=400, detail="Maximum 15 files allowed.")
+    structured_output = {"files": []}
+    for index, file in enumerate(files, start=1):
         filename = file.filename.lower()
         ext = filename.split(".")[-1]
         with open(temp_path, "wb") as f:
             f.write(await file.read())
+        file_record = {
+            "file_id": f"file_{index}",
+            "filename": filename,
+            "pages": []
+        }
+        # -------------------------------
         # PDF
+        # -------------------------------
         if filename.endswith(".pdf"):
             img_paths = pdf_to_images(temp_path, max_pages=max_pages)
+            for page_idx, img_path in enumerate(img_paths):
+                ocr_results = extract_text(img_path)
+                file_record["pages"].append({
+                    "page_index": page_idx,
+                    "results": ocr_results
+                })
+        # -------------------------------
+        # IMAGE
+        # -------------------------------
         elif filename.endswith((".jpg", ".jpeg", ".png")):
+            ocr_results = extract_text(temp_path)
+            file_record["pages"].append({
+                "page_index": 0,
+                "results": ocr_results
+            })
         else:
             raise HTTPException(status_code=400, detail=f"Unsupported type: {filename}")
+        structured_output["files"].append(file_record)
+    return JSONResponse(structured_output)