WalletSyncOCR

Sleeping

App Files Community

LogicGoInfotechSpaces committed on Nov 14, 2025

Commit

09328e0

verified ·

1 Parent(s): 223bd89

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -36

app.py CHANGED Viewed

@@ -1,9 +1,7 @@
 # app.py
-import io
 import uvicorn
 import numpy as np
 import cv2
-import re
 from fastapi import FastAPI, UploadFile, File, HTTPException
 from bson import ObjectId
 from motor.motor_asyncio import AsyncIOMotorClient, AsyncIOMotorGridFSBucket
@@ -19,16 +17,15 @@ MONGO_URI = (
 )
 DB_NAME = "ocr_fastapi"
-BUCKET_NAME = "fs"  # <-- FIXED (use default GridFS bucket)
 app = FastAPI()
-# MongoDB Init
 _client = AsyncIOMotorClient(MONGO_URI)
 _db = _client[DB_NAME]
 def gridfs():
-    # Always use default "fs" bucket (fs.files + fs.chunks)
     return AsyncIOMotorGridFSBucket(_db, bucket_name=BUCKET_NAME)
 ocr_engine = RapidOCR()
@@ -42,14 +39,11 @@ async def health():
 # --------------------------------------------------
 @app.post("/upload")
 async def upload_image(file: UploadFile = File(...)):
-    """
-    Uploads image to MongoDB GridFS
-    """
     try:
         data = await file.read()
         fs = gridfs()
-        # Upload to GridFS
         oid = await fs.upload_from_stream(
             file.filename,
             data,
@@ -58,9 +52,9 @@ async def upload_image(file: UploadFile = File(...)):
         print("📌 Uploaded ID:", oid)
-        # Debug: Confirm stored in fs.files
         stored = await _db[f"{BUCKET_NAME}.files"].count_documents({"_id": oid})
-        print("📦 Stored in DB:", stored)
         return {"image_id": str(oid)}
@@ -69,23 +63,20 @@ async def upload_image(file: UploadFile = File(...)):
 # --------------------------------------------------
 async def load_image_from_gridfs(image_id: str):
-    """
-    Loads the image bytes from GridFS bucket
-    """
     try:
         print("🔍 Fetching from GridFS:", image_id)
         oid = ObjectId(image_id)
         fs = gridfs()
-        # Debug: check existence
         file_exists = await _db[f"{BUCKET_NAME}.files"].count_documents({"_id": oid})
-        print("📂 Exists in fs.files:", file_exists)
         if file_exists == 0:
-            raise HTTPException(status_code=404, detail="Image not found in GridFS")
-        # Read file
         stream = await fs.open_download_stream(oid)
         data = await stream.read()
         await stream.close()
@@ -101,29 +92,27 @@ async def load_image_from_gridfs(image_id: str):
 # --------------------------------------------------
 @app.post("/generate/{image_id}")
 async def generate(image_id: str):
-    """
-    Reads image → performs OCR → returns extracted text
-    """
     raw_bytes = await load_image_from_gridfs(image_id)
-    # Decode image
     img_array = np.frombuffer(raw_bytes, np.uint8)
     img = cv2.imdecode(img_array, cv2.IMREAD_COLOR)
     if img is None:
         raise HTTPException(status_code=400, detail="Unable to decode image")
-    # Perform OCR
     result, times = ocr_engine(img)
     if not result:
         raise HTTPException(status_code=500, detail="OCR returned empty result")
-    # Extract plain text
     extracted = [text for box, text, score in result]
     full_text = "\n".join(extracted)
-    # Cache in memory for view endpoint
     OCR_RESULTS[image_id] = {
         "text": full_text,
         "details": result,
@@ -136,20 +125,11 @@ async def generate(image_id: str):
 @app.get("/view/{image_id}")
 async def view_details(image_id: str):
     """
-    Returns cached OCR result
     """
     if image_id not in OCR_RESULTS:
-        raise HTTPException(status_code=404, detail="No OCR result found for this ID")
     return OCR_RESULTS[image_id]
-@app.get("/debug/db")
-async def debug_db():
-    return {"db_name": _db.name, "collections": await _db.list_collection_names()}
-@app.get("/debug/test-write")
-async def test_write():
-    res = await _db["debug_test"].insert_one({"ping": "ok"})
-    return {"inserted_id": str(res.inserted_id)}
 # --------------------------------------------------
 if __name__ == "__main__":

 # app.py
 import uvicorn
 import numpy as np
 import cv2
 from fastapi import FastAPI, UploadFile, File, HTTPException
 from bson import ObjectId
 from motor.motor_asyncio import AsyncIOMotorClient, AsyncIOMotorGridFSBucket
 )
 DB_NAME = "ocr_fastapi"
+BUCKET_NAME = "ocr_images"   # ✔ USE THIS BUCKET
 app = FastAPI()
+# Init MongoDB & GridFS
 _client = AsyncIOMotorClient(MONGO_URI)
 _db = _client[DB_NAME]
 def gridfs():
     return AsyncIOMotorGridFSBucket(_db, bucket_name=BUCKET_NAME)
 ocr_engine = RapidOCR()
 # --------------------------------------------------
 @app.post("/upload")
 async def upload_image(file: UploadFile = File(...)):
     try:
         data = await file.read()
         fs = gridfs()
+        # Upload image bytes to GridFS
         oid = await fs.upload_from_stream(
             file.filename,
             data,
         print("📌 Uploaded ID:", oid)
+        # Debug: Confirm stored in ocr_images.files
         stored = await _db[f"{BUCKET_NAME}.files"].count_documents({"_id": oid})
+        print("📦 Stored in ocr_images.files:", stored)
         return {"image_id": str(oid)}
 # --------------------------------------------------
 async def load_image_from_gridfs(image_id: str):
     try:
         print("🔍 Fetching from GridFS:", image_id)
         oid = ObjectId(image_id)
         fs = gridfs()
+        # Check file existence
         file_exists = await _db[f"{BUCKET_NAME}.files"].count_documents({"_id": oid})
+        print("📂 Exists in ocr_images.files:", file_exists)
         if file_exists == 0:
+            raise HTTPException(status_code=404, detail="Image not found")
+        # Read file from GridFS
         stream = await fs.open_download_stream(oid)
         data = await stream.read()
         await stream.close()
 # --------------------------------------------------
 @app.post("/generate/{image_id}")
 async def generate(image_id: str):
+    # Load the image data
     raw_bytes = await load_image_from_gridfs(image_id)
+    # Decode into OpenCV format
     img_array = np.frombuffer(raw_bytes, np.uint8)
     img = cv2.imdecode(img_array, cv2.IMREAD_COLOR)
     if img is None:
         raise HTTPException(status_code=400, detail="Unable to decode image")
+    # Run OCR
     result, times = ocr_engine(img)
     if not result:
         raise HTTPException(status_code=500, detail="OCR returned empty result")
+    # Extract recognized text only
     extracted = [text for box, text, score in result]
     full_text = "\n".join(extracted)
+    # Cache OCR results for viewing
     OCR_RESULTS[image_id] = {
         "text": full_text,
         "details": result,
 @app.get("/view/{image_id}")
 async def view_details(image_id: str):
     """
+    Returns OCR results stored in memory.
     """
     if image_id not in OCR_RESULTS:
+        raise HTTPException(status_code=404, detail="No OCR result found")
     return OCR_RESULTS[image_id]
 # --------------------------------------------------
 if __name__ == "__main__":