Spaces:
Sleeping
Sleeping
| import numpy as np | |
| import cv2 | |
| class_names = [ | |
| "A", | |
| "B", | |
| "C", | |
| "D", | |
| "E", | |
| "F", | |
| "G", | |
| "H", | |
| "I", | |
| "J", | |
| "K", | |
| "L", | |
| "M", | |
| "N", | |
| "O", | |
| "P", | |
| "Q", | |
| "R", | |
| "S", | |
| "T", | |
| "U", | |
| "V", | |
| "W", | |
| "X", | |
| "Y", | |
| "Z", | |
| ] | |
| # Create a list of colors for each class where each color is a tuple of 3 integer values | |
| rng = np.random.default_rng(3) | |
| colors = rng.uniform(0, 255, size=(len(class_names), 3)) | |
| def nms(boxes, scores, iou_threshold): | |
| # Sort by score | |
| sorted_indices = np.argsort(scores)[::-1] | |
| keep_boxes = [] | |
| while sorted_indices.size > 0: | |
| # Pick the last box | |
| box_id = sorted_indices[0] | |
| keep_boxes.append(box_id) | |
| # Compute IoU of the picked box with the rest | |
| ious = compute_iou(boxes[box_id, :], boxes[sorted_indices[1:], :]) | |
| # Remove boxes with IoU over the threshold | |
| keep_indices = np.where(ious < iou_threshold)[0] | |
| # print(keep_indices.shape, sorted_indices.shape) | |
| sorted_indices = sorted_indices[keep_indices + 1] | |
| return keep_boxes | |
| def multiclass_nms(boxes, scores, class_ids, iou_threshold): | |
| unique_class_ids = np.unique(class_ids) | |
| keep_boxes = [] | |
| for class_id in unique_class_ids: | |
| class_indices = np.where(class_ids == class_id)[0] | |
| class_boxes = boxes[class_indices, :] | |
| class_scores = scores[class_indices] | |
| class_keep_boxes = nms(class_boxes, class_scores, iou_threshold) | |
| keep_boxes.extend(class_indices[class_keep_boxes]) | |
| return keep_boxes | |
| def compute_iou(box, boxes): | |
| # Compute xmin, ymin, xmax, ymax for both boxes | |
| xmin = np.maximum(box[0], boxes[:, 0]) | |
| ymin = np.maximum(box[1], boxes[:, 1]) | |
| xmax = np.minimum(box[2], boxes[:, 2]) | |
| ymax = np.minimum(box[3], boxes[:, 3]) | |
| # Compute intersection area | |
| intersection_area = np.maximum(0, xmax - xmin) * np.maximum(0, ymax - ymin) | |
| # Compute union area | |
| box_area = (box[2] - box[0]) * (box[3] - box[1]) | |
| boxes_area = (boxes[:, 2] - boxes[:, 0]) * (boxes[:, 3] - boxes[:, 1]) | |
| union_area = box_area + boxes_area - intersection_area | |
| # Compute IoU | |
| iou = intersection_area / union_area | |
| return iou | |
| def xywh2xyxy(x): | |
| # Convert bounding box (x, y, w, h) to bounding box (x1, y1, x2, y2) | |
| y = np.copy(x) | |
| y[..., 0] = x[..., 0] - x[..., 2] / 2 | |
| y[..., 1] = x[..., 1] - x[..., 3] / 2 | |
| y[..., 2] = x[..., 0] + x[..., 2] / 2 | |
| y[..., 3] = x[..., 1] + x[..., 3] / 2 | |
| return y | |
| def draw_detections(image, boxes, scores, class_ids, mask_alpha=0.3): | |
| det_img = image.copy() | |
| img_height, img_width = image.shape[:2] | |
| font_size = min([img_height, img_width]) * 0.0006 | |
| text_thickness = int(min([img_height, img_width]) * 0.001) | |
| #det_img = draw_masks(det_img, boxes, class_ids, mask_alpha) | |
| # Draw bounding boxes and labels of detections | |
| for class_id, box, score in zip(class_ids, boxes, scores): | |
| color = colors[class_id] | |
| draw_box(det_img, box, color) | |
| label = class_names[class_id] | |
| caption = f"{label} {int(score * 100)}%" | |
| draw_text(det_img, caption, box, color, font_size, text_thickness) | |
| return det_img | |
| def draw_box( | |
| image: np.ndarray, | |
| box: np.ndarray, | |
| color: tuple[int, int, int] = (0, 0, 255), | |
| thickness: int = 2, | |
| ) -> np.ndarray: | |
| x1, y1, x2, y2 = box.astype(int) | |
| return cv2.rectangle(image, (x1, y1), (x2, y2), color, thickness) | |
| def draw_text( | |
| image: np.ndarray, | |
| text: str, | |
| box: np.ndarray, | |
| color: tuple[int, int, int] = (0, 0, 255), | |
| font_size: float = 0.001, | |
| text_thickness: int = 2, | |
| ) -> np.ndarray: | |
| x1, y1, x2, y2 = box.astype(int) | |
| (tw, th), _ = cv2.getTextSize( | |
| text=text, | |
| fontFace=cv2.FONT_HERSHEY_SIMPLEX, | |
| fontScale=font_size, | |
| thickness=text_thickness, | |
| ) | |
| th = int(th * 1.2) | |
| cv2.rectangle(image, (x1, y1), (x1 + tw, y1 - th), color, -1) | |
| return cv2.putText( | |
| image, | |
| text, | |
| (x1, y1), | |
| cv2.FONT_HERSHEY_SIMPLEX, | |
| font_size, | |
| (255, 255, 255), | |
| text_thickness, | |
| cv2.LINE_AA, | |
| ) | |
| def draw_masks( | |
| image: np.ndarray, boxes: np.ndarray, classes: np.ndarray, mask_alpha: float = 0.3 | |
| ) -> np.ndarray: | |
| mask_img = image.copy() | |
| # Draw bounding boxes and labels of detections | |
| for box, class_id in zip(boxes, classes): | |
| color = colors[class_id] | |
| x1, y1, x2, y2 = box.astype(int) | |
| # Draw fill rectangle in mask image | |
| cv2.rectangle(mask_img, (x1, y1), (x2, y2), color, -1) | |
| return cv2.addWeighted(mask_img, mask_alpha, image, 1 - mask_alpha, 0) |