OCR-FastAPI / app.py
msi
first commit
197a58a
raw
history blame
1.38 kB
from fastapi import FastAPI, UploadFile, File, HTTPException
from fastapi.responses import JSONResponse
from pydantic import BaseModel
from PIL import Image
import io
import os
import google.generativeai as genai
from fastapi.responses import FileResponse
from pdf_generator import create_receipt
genai.configure(api_key=os.environ.get("GOOGLE_API_KEY"))
app = FastAPI()
class OCRResponse(BaseModel):
extracted_text: str
@app.post("/ocr-image/", response_model=OCRResponse)
async def ocr_image(file: UploadFile = File(...)):
if not file.content_type.startswith("image/"):
raise HTTPException(status_code=400, detail="Uploaded file must be an image.")
try:
image_data = await file.read()
image = Image.open(io.BytesIO(image_data))
model = genai.GenerativeModel('gemini-2.0-flash')
prompt = "Extract and Identify all text from this image and generate a receipt without any additional information."
contents = [prompt, image]
response = model.generate_content(contents)
extracted_text = response.text
create_receipt(extracted_text, file_name="result/receipt.pdf")
return FileResponse(path="result/receipt.pdf", filename="receipt.pdf", media_type='application/pdf')
except Exception as e:
raise HTTPException(status_code=500, detail=f"OCR failed: {str(e)}")