ridoo14
/

object-detect

Model card Files Files and versions

object-detect / main.py

ridoo14's picture

Upload 6 files

4674250 verified about 1 year ago

history blame contribute delete

4.02 kB

	import io
	import base64
	import numpy as np
	import cv2
	from PIL import Image as PILImage
	from ultralytics import YOLO
	from fastapi import FastAPI, HTTPException
	from pydantic import BaseModel
	from typing import Optional
	from matplotlib import cm

	from fastapi.middleware.cors import CORSMiddleware

	# ASGI application object; the route handlers in this module register on it.
	app = FastAPI()

	# Fully permissive CORS policy: any origin, any HTTP method, any header.
	# NOTE(review): FastAPI's CORS documentation states that wildcard values
	# should not be combined with allow_credentials=True -- confirm whether
	# credentialed cross-origin requests are actually required here.
	app.add_middleware(
	    CORSMiddleware,
	    allow_headers=["*"],
	    allow_methods=["*"],
	    allow_origins=["*"],
	    allow_credentials=True,
	)

	class ImageRequest(BaseModel):
	    """JSON request body carrying the image to analyse."""

	    # The image file's bytes, encoded as a Base64 string.
	    image: str

	class ObjectDetectionSystem:
	    """Annotate Base64-encoded images with YOLO detections.

	    The YOLO weights are loaded once in the constructor. Each call to
	    ``detect_objects`` decodes an image, runs the model on a resized copy
	    and returns that copy with bounding boxes and labels drawn on it.
	    """

	    # Length, in pixels, that the longer image side is resized to.
	    _INPUT_SIZE = 640

	    def __init__(self, model_path='Model/yolov8l.pt'):
	        """Load the model and prepare one colormap entry per class id.

	        Args:
	            model_path: Weights file passed to ``YOLO``.
	        """
	        self.yolo_model = YOLO(model_path)
	        num_classes = len(self.yolo_model.names)
	        # ``cm.get_cmap`` was removed in Matplotlib 3.9, so prefer the
	        # colormap's own ``resampled`` method and only fall back to the old
	        # helper on releases that predate ``resampled``.
	        base_map = cm.tab20
	        if hasattr(base_map, "resampled"):
	            self.color_map = base_map.resampled(num_classes)
	        else:
	            self.color_map = cm.get_cmap("tab20", num_classes)

	    @staticmethod
	    def _strip_data_url(image_base64: str) -> str:
	        """Return the payload of a ``data:...;base64,`` URL, else the input unchanged."""
	        if image_base64.startswith("data:"):
	            _, separator, payload = image_base64.partition(",")
	            if separator:
	                return payload
	        return image_base64

	    @staticmethod
	    def _fit_size(width: int, height: int, target: int) -> tuple:
	        """Scale ``(width, height)`` so that the longer side equals *target*.

	        Each side is clamped to at least one pixel: with an extreme aspect
	        ratio the truncated short side would otherwise become 0, which
	        ``cv2.resize`` rejects.
	        """
	        scale = target / max(height, width)
	        return max(1, int(width * scale)), max(1, int(height * scale))

	    def detect_objects(self, image_base64: str, confidence_threshold: float = 0.5):
	        """Detect objects in an image and return the annotated image.

	        Args:
	            image_base64: Base64-encoded image file. A leading
	                ``data:<mime>;base64,`` prefix is accepted and stripped.
	            confidence_threshold: Only detections whose confidence is
	                strictly greater than this value are drawn.

	        Returns:
	            The resized image, with boxes and labels drawn, encoded as PNG
	            and returned as a Base64 string.

	        Raises:
	            HTTPException: Status 400 when the payload cannot be decoded
	                into an image; status 500 for any other failure.
	        """
	        # Stage 1: decode the client payload. Failures here are the caller's
	        # fault, so they map to 400 rather than 500.
	        try:
	            image_data = base64.b64decode(self._strip_data_url(image_base64))
	            pil_image = PILImage.open(io.BytesIO(image_data)).convert("RGB")
	        except (ValueError, OSError) as e:
	            # binascii.Error is a ValueError; Pillow reports unreadable or
	            # truncated image data as OSError subclasses.
	            raise HTTPException(status_code=400, detail=f"Invalid image data: {e}") from e
	        except Exception as e:
	            raise HTTPException(status_code=500, detail=str(e)) from e

	        # Stage 2: inference and drawing.
	        try:
	            image_np = np.array(pil_image)
	            height, width, _ = image_np.shape
	            resized_image = cv2.resize(
	                image_np, self._fit_size(width, height, self._INPUT_SIZE)
	            )

	            # Ultralytics interprets NumPy input as BGR (OpenCV convention),
	            # while Pillow produced RGB, so swap channels for the model only.
	            results = self.yolo_model(cv2.cvtColor(resized_image, cv2.COLOR_RGB2BGR))

	            # Drawing happens on the RGB copy; colours below are RGB as well.
	            output_image = resized_image.copy()
	            font = cv2.FONT_HERSHEY_SIMPLEX
	            for result in results:
	                for box in result.boxes:
	                    confidence = float(box.conf[0])
	                    if not confidence > confidence_threshold:
	                        continue

	                    x1, y1, x2, y2 = (int(v) for v in box.xyxy[0].cpu().numpy())
	                    class_id = int(box.cls[0])
	                    class_name = self.yolo_model.names[class_id]

	                    # Colormap returns RGBA floats in [0, 1]; keep RGB as 0-255 ints.
	                    color = tuple(int(c * 255) for c in self.color_map(class_id)[:3])

	                    cv2.rectangle(output_image, (x1, y1), (x2, y2), color, 2)

	                    # Filled label background plus white text; label_y keeps
	                    # the label inside the image when the box touches the top.
	                    label = f'{class_name} ({confidence:.2f})'
	                    label_size, baseline = cv2.getTextSize(label, font, 0.5, 1)
	                    label_y = max(y1, label_size[1] + 10)
	                    cv2.rectangle(output_image, (x1, label_y - label_size[1] - 10),
	                                  (x1 + label_size[0], label_y + baseline - 10), color, -1)
	                    cv2.putText(output_image, label, (x1, label_y - 5), font, 0.5,
	                                (255, 255, 255), 1)

	            # Encode the annotated array as PNG, then as Base64 text.
	            buffered = io.BytesIO()
	            PILImage.fromarray(output_image).save(buffered, format="PNG")
	            return base64.b64encode(buffered.getvalue()).decode("utf-8")
	        except Exception as e:
	            raise HTTPException(status_code=500, detail=str(e)) from e

	# Single module-level detector used by the request handlers; constructing
	# it loads the YOLO weights from the given path when this module is imported.
	detector = ObjectDetectionSystem(model_path='Model/yolov8l.pt')

	@app.post("/detect")
	async def detect_objects(request: ImageRequest):
	    """Run object detection on the posted image.

	    Args:
	        request: Body whose ``image`` field is a Base64-encoded image.

	    Returns:
	        A dict with key ``processed_image`` holding the detector's result.

	    Raises:
	        HTTPException: Propagated unchanged when the detector raises one;
	            any other exception is reported with status 500.
	    """
	    try:
	        # Synchronous call: it runs directly inside this coroutine.
	        result_image = detector.detect_objects(request.image)
	    except HTTPException:
	        # Keep the detector's own status code and detail; re-wrapping would
	        # force 500 and replace the detail with str() of the exception.
	        raise
	    except Exception as e:
	        raise HTTPException(status_code=500, detail=str(e)) from e
	    return {"processed_image": result_image}

	@app.get("/")
	async def root():
	    """Return a fixed status message for the API root path."""
	    status = {"message": "Object Detection API is running"}
	    return status