kebincontreras committed on
Commit
a4ed2cd
·
verified ·
1 Parent(s): 36ab4ca

Upload 5 files

Browse files
Files changed (5) hide show
  1. detection.py +157 -0
  2. image_processing.py +27 -0
  3. notacion.py +30 -0
  4. utils.py +118 -0
  5. yolo_classes.txt +80 -0
detection.py ADDED
@@ -0,0 +1,157 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ from ultralytics import YOLOv10
3
+ import os
4
+ import torch
5
+
6
def yolov10_inference(image, model_id, image_size, conf_threshold):
    """Run a pretrained YOLOv10 model on `image`.

    Returns a tuple (annotated_image, detections): detections is a list of
    dicts with keys 'coords' (xyxy numpy array), 'class' (label string) and
    'conf' (confidence numpy array).  When the model yields no results the
    input image is returned unchanged.
    """
    model = YOLOv10.from_pretrained(f'jameslahm/{model_id}')
    results = model.predict(source=image, imgsz=image_size, conf=conf_threshold)

    detections = []
    for result in results or []:
        names = result.names
        for box in result.boxes:
            detections.append({
                "coords": box.xyxy.cpu().numpy(),
                "class": names[int(box.cls.cpu())],
                "conf": box.conf.cpu().numpy(),
            })

    annotated = results[0].plot() if results and len(results) > 0 else image
    return annotated, detections
20
+
21
def calculate_iou(boxA, boxB):
    """Return the Intersection-over-Union of two axis-aligned boxes.

    Parameters
    ----------
    boxA, boxB : sequence of 4 floats
        Corner coordinates in (x1, y1, x2, y2) order.

    Returns
    -------
    float
        IoU in [0, 1]; 0.0 when the union area is zero (degenerate boxes),
        instead of raising ZeroDivisionError as before.
    """
    # Corners of the intersection rectangle.
    xA = max(boxA[0], boxB[0])
    yA = max(boxA[1], boxB[1])
    xB = min(boxA[2], boxB[2])
    yB = min(boxA[3], boxB[3])
    # Clamp to zero so disjoint boxes contribute no (negative) overlap.
    interArea = max(0, xB - xA) * max(0, yB - yA)
    boxAArea = (boxA[2] - boxA[0]) * (boxA[3] - boxA[1])
    boxBArea = (boxB[2] - boxB[0]) * (boxB[3] - boxB[1])
    unionArea = float(boxAArea + boxBArea - interArea)
    # Guard against division by zero for zero-area boxes.
    if unionArea == 0:
        return 0.0
    return interArea / unionArea
31
+
32
+
33
+
34
def calculate_detection_metrics(detections_true, detections_pred):
    """Compute Precision / Recall / F1 / mean IoU for one image.

    A prediction is a true positive when it shares its class with a
    *still-unmatched* ground truth and their IoU is >= 0.5.  Each ground
    truth can be matched at most once; the previous version never marked
    ground truths as consumed, so duplicate detections of the same object
    inflated true positives and let recall exceed 1.0.

    Both inputs are lists of dicts with keys 'class' (string) and 'coords'
    (array-like with a .flatten() method, xyxy order).  Uses the sibling
    `calculate_iou` helper.
    """
    true_positives = 0
    pred_positives = len(detections_pred)
    real_positives = len(detections_true)
    ious = []
    matched = set()  # indices of ground truths already claimed by a prediction
    for pred in detections_pred:
        for idx, real in enumerate(detections_true):
            if idx in matched:
                continue
            if pred['class'] == real['class']:
                iou = calculate_iou(pred['coords'].flatten(), real['coords'].flatten())
                if iou >= 0.5:
                    true_positives += 1
                    ious.append(iou)
                    matched.add(idx)
                    break
    precision = true_positives / pred_positives if pred_positives > 0 else 0
    recall = true_positives / real_positives if real_positives > 0 else 0
    f1_score = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0
    average_iou = sum(ious) / len(ious) if ious else 0
    return {"Precision": precision, "Recall": recall, "F1-Score": f1_score, "IOU": average_iou}
52
+
53
+
54
+
55
+
56
def read_kitti_annotations(file_path):
    """Parse a KITTI label file into a list of ground-truth dicts.

    Each returned dict has:
      'class' : lower-cased object class (e.g. 'car', 'pedestrian')
      'bbox'  : [left, top, right, bottom] pixel coords (KITTI columns 4-7)

    'DontCare' regions are ignored; blank lines are skipped instead of
    raising IndexError on `parts[0]` as before.
    """
    ground_truths = []
    with open(file_path, 'r') as file:
        for line in file:
            parts = line.strip().split()
            if not parts:
                # Tolerate empty/whitespace-only lines (common at file end).
                continue
            if parts[0] != 'DontCare':  # ignore 'DontCare' regions
                class_label = parts[0].lower()  # class name in lower case
                bbox = [float(parts[4]), float(parts[5]), float(parts[6]), float(parts[7])]
                ground_truths.append({'class': class_label, 'bbox': bbox})
    return ground_truths
66
+
67
+
68
def save_detections(detections, output_dir, filename='detections.txt'):
    """Write detections to <output_dir>/<filename>, one per line.

    Line format: "<class>,[x1,y1,x2,y2]".  Each detection dict must provide
    'class' (string) and 'bbox' (sequence of numbers).  The directory is
    created if missing; exist_ok=True removes the check-then-create race of
    the previous os.path.exists() guard.
    """
    os.makedirs(output_dir, exist_ok=True)
    with open(os.path.join(output_dir, filename), 'w') as file:
        for detection in detections:
            class_label = detection['class']
            bbox = ','.join(map(str, detection['bbox']))
            file.write(f"{class_label},[{bbox}]\n")
76
+
77
+
78
+
79
+
80
+
81
+
82
+
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
def yolov10_inference_1(image, model_id, image_size, conf_threshold):
    """Run a pretrained YOLOv10 model on `image`, using the GPU when one
    is available.

    Returns a tuple (annotated_image, detections): detections is a list of
    dicts with keys 'class' (label string) and 'bbox' (xyxy coordinates as
    a nested list).  Falls back to returning the input image when the model
    produces no results.
    """
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
    model = YOLOv10.from_pretrained(f'jameslahm/{model_id}').to(device)
    results = model.predict(source=image, imgsz=image_size, conf=conf_threshold)

    detections = []
    for result in results or []:
        for box in result.boxes:
            detections.append({
                "class": result.names[int(box.cls.cpu())],
                "bbox": box.xyxy.cpu().numpy().tolist(),
            })

    annotated = results[0].plot() if results and len(results) > 0 else image
    return annotated, detections
107
+
108
+
109
def calculate_iou_1(boxA, boxB):
    """Return the IoU of two boxes given either as flat [x1, y1, x2, y2]
    sequences or as singly-nested lists (e.g. [[x1, y1, x2, y2]]).

    Returns 0.0 when the union area is zero (degenerate boxes) instead of
    raising ZeroDivisionError as before.
    """
    # Flatten one level of nesting if present; max()/min() below need
    # plain scalars to compare.
    boxA = [float(num) for sublist in boxA for num in sublist] if isinstance(boxA[0], list) else [float(num) for num in boxA]
    boxB = [float(num) for sublist in boxB for num in sublist] if isinstance(boxB[0], list) else [float(num) for num in boxB]

    # Corners of the intersection rectangle.
    xA = max(boxA[0], boxB[0])
    yA = max(boxA[1], boxB[1])
    xB = min(boxA[2], boxB[2])
    yB = min(boxA[3], boxB[3])

    # Clamp to zero so disjoint boxes contribute no (negative) overlap.
    interArea = max(0, xB - xA) * max(0, yB - yA)

    # Areas of each box and of their union.
    boxAArea = (boxA[2] - boxA[0]) * (boxA[3] - boxA[1])
    boxBArea = (boxB[2] - boxB[0]) * (boxB[3] - boxB[1])
    unionArea = boxAArea + boxBArea - interArea

    # Degenerate boxes have zero union; define IoU as 0.0 in that case.
    if unionArea == 0:
        return 0.0
    return interArea / float(unionArea)
132
+
133
+
134
def calculate_detection_metrics_1(detections_true, detections_pred):
    """Compute Precision / Recall / F1 / mean IoU for one image, using
    'bbox' (nested or flat xyxy lists) instead of 'coords' arrays.

    A prediction is a true positive when it shares its class with a
    *still-unmatched* ground truth and their IoU is >= 0.5.  Each ground
    truth is matched at most once; the previous version never marked ground
    truths as consumed, so duplicate detections of the same object inflated
    true positives and let recall exceed 1.0.

    Uses the sibling `calculate_iou_1` helper.
    """
    true_positives = 0
    pred_positives = len(detections_pred)
    real_positives = len(detections_true)
    ious = []
    matched = set()  # indices of ground truths already claimed by a prediction
    for pred in detections_pred:
        pred_bbox = pred['bbox']
        pred_class = pred['class']
        for idx, real in enumerate(detections_true):
            if idx in matched:
                continue
            if pred_class == real['class']:
                iou = calculate_iou_1(pred_bbox, real['bbox'])
                if iou >= 0.5:
                    true_positives += 1
                    ious.append(iou)
                    matched.add(idx)
                    break
    precision = true_positives / pred_positives if pred_positives > 0 else 0
    recall = true_positives / real_positives if real_positives > 0 else 0
    f1_score = 2 * (precision * recall) / (precision + recall) if (precision + recall) > 0 else 0
    average_iou = sum(ious) / len(ious) if ious else 0
    return {"Precision": precision, "Recall": recall, "F1-Score": f1_score, "IOU": average_iou}
156
+
157
+
image_processing.py ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ import cv2
3
+ import numpy as np
4
+
5
def modulo(x, L):
    """Wrap `x` into (0, L]: exact positive multiples of L map to L,
    where plain `%` would send them to 0."""
    was_positive = x > 0
    wrapped = x % L
    return np.where((wrapped == 0) & was_positive, L, wrapped)
10
+
11
def apply_blur(image, kernel_size):
    """Gaussian-blur `image` with a square kernel of side `kernel_size`
    (sigma is derived automatically by OpenCV from the kernel size)."""
    ksize = (kernel_size, kernel_size)
    return cv2.GaussianBlur(image, ksize, 0)
14
+
15
def clip_image(image, correction, sat_factor):
    """Gamma-correct `image` by exponent `correction`, scale by
    `sat_factor`, and clip the result into [0, 1]."""
    adjusted = sat_factor * np.power(image, correction)
    return np.clip(adjusted, 0.0, 1.0)
20
+
21
def wrap_image(image, correction, sat_factor):
    """Gamma-correct `image` by exponent `correction`, scale by
    `sat_factor`, and wrap the result into (0, 1].

    Bug fix: the exponent was hard-coded to 1.0, so the `correction`
    parameter was silently ignored despite the docstring.
    """
    processed_image = np.power(image, correction) * sat_factor
    # Wrap into (0, 1]; exact positive multiples of 1 map to 1 rather than
    # 0, matching this module's `modulo` helper (inlined here).
    wrapped = processed_image % 1.0
    wrapped_image = np.where((wrapped == 0) & (processed_image > 0), 1.0, wrapped)
    return wrapped_image
26
+
27
+
notacion.py ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ from PIL import Image
3
+ import torch
4
+ from torchvision import transforms
5
+
6
+ # Mapeo de clases de YOLOv10 a las clases de tu base de datos
7
+
8
+
9
def map_yolo_classes_to_db(yolo_detections):
    """
    Translate YOLO class names to the database's class names.

    Returns a new list of new dicts; the caller's detection dicts are no
    longer mutated in place (the previous version rewrote det['class'] on
    the input objects).  Classes absent from the mapping pass through
    unchanged.
    """
    # YOLO label -> database label.
    mapping = {
        'person': 'pedestrian',
        'bicycle': 'cyclist',
        'car': 'car',
        'motorbike': 'cisc',
        'aeroplane': 'cisc',
        'bus': 'cisc',
        'train': 'tram',
        'truck': 'truck',
        'van': 'van'
    }
    mapped_detections = []
    for det in yolo_detections:
        det = dict(det)  # shallow copy so the caller's dict stays untouched
        det['class'] = mapping.get(det['class'], det['class'])
        mapped_detections.append(det)
    return mapped_detections
30
+
utils.py ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import torch_dct as dct
3
+
4
+ from torchvision.transforms import functional as F
5
+
6
def flip_odd_lines(matrix):
    """Return a copy of `matrix` whose odd-indexed rows (1, 3, ...) along
    the second-to-last dimension are reversed along the last dimension.
    The input tensor is left unmodified."""
    out = matrix.clone()
    odd_rows = out[..., 1::2, :]
    out[..., 1::2, :] = odd_rows.flip(-1)
    return out
15
+
16
# Rotate the last two dims of m by r * 90 degrees (r=0 is the identity).
rotate = lambda m, r: torch.rot90(m, r, [-2, -1])
# Snake-scan ("sequency") flatten of the last two dims: odd rows are
# reversed first so the flattened vector traverses the matrix
# boustrophedon-style, keeping adjacent samples adjacent.
# NOTE(review): rotate(m, 0) is a no-op; presumably kept so a different
# scan orientation can be selected later — confirm before removing.
sequency_vec = lambda m: flip_odd_lines(rotate(m, 0)).flatten(start_dim= m.dim()-2)
# Inverse of sequency_vec: unflatten the last dim back to 2-D shape s and
# undo the odd-row flips.
sequency_mat = lambda v, s: rotate(flip_odd_lines(v.unflatten(-1, s)), 0)
19
+
20
+
21
def modulo(x, L):
    """Wrap tensor `x` into (0, L]: exact positive multiples of L map to L,
    where plain `%` would send them to 0."""
    was_positive = x > 0
    wrapped = x % L
    return torch.where((wrapped == 0) & was_positive, L, wrapped)
26
+
27
+
28
def center_modulo(x, L):
    """Wrap `x` into the symmetric interval (-L/2, L/2] around zero,
    via the module's (0, L]-wrapping `modulo` helper."""
    half = L / 2
    shifted = modulo(x + half, L)
    return shifted - half
30
+
31
+
32
def unmodulo(psi):
    """Integrate a finite-difference signal along the last dimension by
    solving a 1-D Poisson-style problem in the DCT domain.

    Zero-pads both ends, differentiates once more, divides by the
    DCT-domain eigenvalues 2*(cos(pi*k/N) - 1) of the second-difference
    operator, and inverts the transform.  Requires the third-party
    `torch_dct` package (imported at module level as `dct`).
    """

    # Zero-pad both ends so boundary differences are well defined.
    psi = torch.nn.functional.pad(psi, (1,1), mode='constant', value=0)
    psi = torch.diff(psi, 1)
    psi = dct.dct(psi, norm='ortho')
    N = psi.shape[-1]
    k = torch.arange(0, N)
    # Eigenvalues of the discrete second derivative under the DCT.
    denom = 2*( torch.cos( torch.pi * k / N ) - 1 )
    # k = 0 gives a zero eigenvalue (the DC term is unconstrained);
    # replace it to avoid dividing by zero — the DC coefficient is
    # explicitly zeroed below anyway.
    denom[0] = 1.0
    # Small epsilon keeps near-zero eigenvalues numerically stable.
    denom = denom.unsqueeze(0).unsqueeze(0) + 1e-7
    psi = psi / denom
    psi[..., 0] = 0.0
    psi = dct.idct(psi, norm='ortho')
    return psi
46
+
47
# Quantize x to the nearest integer multiple of L.
RD = lambda x, L: torch.round( x / L) * L
48
+
49
+
50
def hard_thresholding(x, t):
    """Zero out every entry of `x` whose magnitude does not exceed `t`;
    entries with |x| > t are kept unchanged."""
    keep = torch.abs(x) > t
    return x * keep
52
+
53
+
54
def stripe_estimation(psi, t=0.15):
    """Estimate a smooth stripe/artifact surface from `psi` by Poisson
    integration of its hard-thresholded gradients, solved in the DCT
    domain.

    psi : tensor whose last two dims are the image plane.
    t   : gradient-magnitude threshold; smaller gradients are discarded
          as noise before integration.

    Requires the third-party `torch_dct` package (module-level `dct`) and
    the sibling `hard_thresholding` helper.
    """

    # Forward differences along x (last dim) and y (second-to-last dim).
    dx = torch.diff(psi, 1, dim=-1)
    dy = torch.diff(psi, 1, dim=-2)

    # Keep only strong gradients; the rest are treated as noise.
    dx = hard_thresholding(dx, t)
    dy = hard_thresholding(dy, t)

    # Pad back to the original spatial size before re-differentiating.
    dx = F.pad(dx, (1, 0, 1, 0))
    dy = F.pad(dy, (0, 1, 0, 1))


    # Divergence of the thresholded gradient field (Poisson right-hand side).
    rho = torch.diff(dx, 1, dim=-1) + torch.diff(dy, 1, dim=-2)
    dct_rho = dct.dct_2d(rho, norm='ortho')


    MX = rho.shape[-2]
    NX = rho.shape[-1]

    I, J = torch.meshgrid(torch.arange(0, MX), torch.arange(0, NX), indexing="ij")
    I = I.to(rho.device)
    J = J.to(rho.device)
    # DCT-domain eigenvalues of the discrete Laplacian.
    denom = 2 * (torch.cos(torch.pi * I / MX ) + torch.cos(torch.pi * J / NX ) - 2)
    denom = denom.unsqueeze(0).unsqueeze(0)
    denom = denom.to(rho.device)
    # NOTE(review): denom[0, 0] is exactly 0, so this division produces
    # inf/nan at the DC term before it is overwritten on the next line —
    # works, but consider guarding the divide.
    dct_phi = dct_rho / denom
    dct_phi[..., 0, 0] = 0
    phi = dct.idct_2d(dct_phi, norm='ortho')
    # Shift so the global minimum is zero.
    phi = phi - torch.min(phi)
    # phi = phi - torch.amin(phi, dim=(-1, -2), keepdim=True)
    # phi = RD(phi, 1.0)
    return phi
86
+
87
+
88
def recons(m_t, DO=1, L=1.0, vertical=False, t=0.3):
    """Reconstruct an unwrapped image from a modulo (wrapped) measurement.

    m_t      : wrapped input tensor; the `vertical` branch permutes dims
               (0, 1, 3, 2), so a 4-D (batch, channel, H, W) layout is
               assumed — TODO confirm with callers.
    DO       : finite-difference order used to expose the wrap jumps.
    L        : modulo period of the acquisition.
    vertical : if True, process along columns instead of rows.
    t        : threshold forwarded to stripe_estimation.

    Relies on the module's sibling helpers (sequency_vec, sequency_mat,
    center_modulo, unmodulo, RD, stripe_estimation).  The result is
    min-max normalized to [0, 1].
    """

    if vertical:
        m_t = m_t.permute(0, 1, 3, 2)

    shape = m_t.shape[-2:]

    # Snake-scan the image into 1-D so row boundaries stay continuous.
    modulo_vec = sequency_vec(m_t)
    # Residual between the wrapped difference and the raw difference:
    # isolates the multiple-of-L jumps introduced by the modulo.
    res = center_modulo( torch.diff(modulo_vec, n=DO), L) - torch.diff(modulo_vec, n=DO)
    bl = res

    # Integrate DO times, snapping to multiples of L after each pass.
    for i in range(DO):
        bl = unmodulo(bl)
        bl = RD(bl, L)

    x_est = bl

    # Back to 2-D and add the wrapped measurement to form the estimate.
    x_est = sequency_mat(x_est, shape)
    x_est = x_est + m_t

    if vertical:
        x_est = x_est.permute(0, 1, 3, 2)

    # Remove residual stripe artifacts.
    stripes = stripe_estimation(x_est, t=t)
    x_est = x_est - stripes

    # if vertical:
    #     x_est = x_est.permute(0, 1, 3, 2)
    # Min-max normalize to [0, 1].
    x_est = x_est - x_est.min()
    x_est = x_est / x_est.max()
    return x_est
yolo_classes.txt ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ person
2
+ bicycle
3
+ car
4
+ motorbike
5
+ aeroplane
6
+ bus
7
+ train
8
+ truck
9
+ boat
10
+ traffic light
11
+ fire hydrant
12
+ stop sign
13
+ parking meter
14
+ bench
15
+ bird
16
+ cat
17
+ dog
18
+ horse
19
+ sheep
20
+ cow
21
+ elephant
22
+ bear
23
+ zebra
24
+ giraffe
25
+ backpack
26
+ umbrella
27
+ handbag
28
+ tie
29
+ suitcase
30
+ frisbee
31
+ skis
32
+ snowboard
33
+ sports ball
34
+ kite
35
+ baseball bat
36
+ baseball glove
37
+ skateboard
38
+ surfboard
39
+ tennis racket
40
+ bottle
41
+ wine glass
42
+ cup
43
+ fork
44
+ knife
45
+ spoon
46
+ bowl
47
+ banana
48
+ apple
49
+ sandwich
50
+ orange
51
+ broccoli
52
+ carrot
53
+ hot dog
54
+ pizza
55
+ donut
56
+ cake
57
+ chair
58
+ sofa
59
+ pottedplant
60
+ bed
61
+ diningtable
62
+ toilet
63
+ tvmonitor
64
+ laptop
65
+ mouse
66
+ remote
67
+ keyboard
68
+ cell phone
69
+ microwave
70
+ oven
71
+ toaster
72
+ sink
73
+ refrigerator
74
+ book
75
+ clock
76
+ vase
77
+ scissors
78
+ teddy bear
79
+ hair drier
80
+ toothbrush