Spaces:

abhinavdread
/

paddleocr

Sleeping

abhinavvvvv committed 14 days ago

Commit

699048b

1 Parent(s): 69e7a6e

initial commit

Files changed (5) hide show

Dockerfile ADDED Viewed

+FROM python:3.10-slim
+WORKDIR /app
+RUN apt-get update && apt-get install -y \
+  libglib2.0-0 \
+  libsm6 \
+  libxext6 \
+  libxrender1 \
+  && rm -rf /var/lib/apt/lists/*
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+COPY app ./app
+EXPOSE 8000
+CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "8000", "--workers", "1"]

app/main.py ADDED Viewed

+from fastapi import FastAPI, UploadFile, File
+from app.ocr_engine import OCREngine
+from app.schemas import OCRResponse, OCRLine
+app = FastAPI(
+    title="Invoice OCR API",
+    version="1.0.0"
+)
+ocr_engine = OCREngine()
+@app.get("/")
+def health():
+    return {"status": "OCR API running"}
+@app.post("/ocr", response_model=OCRResponse)
+async def ocr_endpoint(file: UploadFile = File(...)):
+    image_bytes = await file.read()
+    lines = ocr_engine.extract_text(image_bytes)
+    return OCRResponse(
+        lines=[OCRLine(**line) for line in lines]
+    )

app/ocr_engine.py ADDED Viewed

+from paddleocr import PaddleOCR
+from PIL import Image
+import numpy as np
+import cv2
+class OCREngine:
+    def __init__(self):
+        self.ocr = PaddleOCR(
+            use_angle_cls=True,
+            lang='en',
+            use_gpu=False
+        )
+    def extract_text(self, image_bytes):
+        nparr = np.frombuffer(image_bytes, np.uint8)
+        img = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
+        result = self.ocr.ocr(img, cls=True)
+        lines = []
+        for line in result[0]:
+            text = line[1][0]
+            confidence = float(line[1][1])
+            lines.append({
+                "text": text,
+                "confidence": confidence
+            })
+        return lines

app/schemas.py ADDED Viewed

+from pydantic import BaseModel
+from typing import List
+class OCRLine(BaseModel):  # One OCR result entry: a text string plus its confidence.
+    text: str  # Recognized text for this entry.
+    confidence: float  # Confidence value the OCR engine reported for `text`.
+class OCRResponse(BaseModel):  # Response body returned by POST /ocr.
+    lines: List[OCRLine]  # Entries in the order the OCR engine produced them.

requirements.txt ADDED Viewed

+fastapi
+uvicorn[standard]
+paddleocr
+paddlepaddle==2.6.1
+python-multipart
+opencv-python-headless
+pillow