daniel-saed committed on
Commit
2d578e2
verified
1 Parent(s): 40a95d8

Update utils/helper.py

Browse files
Files changed (1) hide show
  1. utils/helper.py +550 -549
utils/helper.py CHANGED
@@ -1,549 +1,550 @@
1
- import cv2
2
- import numpy as np
3
- from typing import Tuple
4
- import tempfile
5
- import os
6
- from PIL import Image
7
- import sys
8
- from pymongo import MongoClient
9
- from dotenv import load_dotenv
10
- import os
11
- import streamlit as st
12
-
13
- try:
14
- if getattr(sys, 'frozen', False):
15
- # En el ejecutable, intentar sys._MEIPASS
16
- BASE_DIR = getattr(sys, '_MEIPASS', os.path.dirname(sys.executable))
17
- print(f"Executable mode - Initial BASE_DIR: {BASE_DIR} (_MEIPASS: {hasattr(sys, '_MEIPASS')})")
18
- # Verificar si BASE_DIR contiene los archivos esperados
19
- expected_dirs = ['navigation', 'models', 'assets', 'img', 'utils']
20
- if not any(os.path.exists(os.path.join(BASE_DIR, d)) for d in expected_dirs):
21
- print(f"Warning: Expected directories not found in {BASE_DIR}")
22
- # Buscar _MEI<random> en el directorio padre
23
- temp_dir = os.path.dirname(BASE_DIR) if BASE_DIR != os.path.dirname(sys.executable) else BASE_DIR
24
- for d in os.listdir(temp_dir):
25
- if d.startswith('_MEI'):
26
- candidate = os.path.join(temp_dir, d)
27
- if any(os.path.exists(os.path.join(candidate, ed)) for ed in expected_dirs):
28
- BASE_DIR = candidate
29
- print(f"Adjusted BASE_DIR to _MEI directory: {BASE_DIR}")
30
- break
31
- else:
32
- print(f"No _MEI directory found in {temp_dir}, using {BASE_DIR}")
33
- else:
34
- # En desarrollo, usar el directorio del proyecto
35
- current_file = os.path.abspath(os.path.realpath(__file__))
36
- print(f"Development mode - Current file: {current_file}")
37
- BASE_DIR = os.path.dirname(os.path.dirname(current_file)) # Subir de utils/ a F1-machine-learning-webapp/
38
- print(f"Development mode - BASE_DIR: {BASE_DIR}")
39
- except Exception as e:
40
- print(f"Error setting BASE_DIR: {e}")
41
- # Fallback
42
- BASE_DIR = os.path.dirname(os.path.abspath(os.path.realpath(__file__)))
43
- BASE_DIR = os.path.dirname(BASE_DIR)
44
- print(f"Fallback BASE_DIR: {BASE_DIR}")
45
-
46
- BASE_DIR = os.path.normpath(BASE_DIR)
47
- print(f"Final BASE_DIR: {BASE_DIR}")
48
-
49
-
50
-
51
-
52
- #load_dotenv() # Carga las variables desde .env
53
- #mongo_uri = os.getenv("MONGO_URI")
54
@st.cache_resource
def get_mongo_client():
    """Return the app-wide MongoDB client built from the Streamlit secret ``MONGO_URI``.

    ``st.cache_resource`` guarantees a single shared instance per process.
    """
    uri = st.secrets["MONGO_URI"]
    return MongoClient(uri)

# Shared client used by the metrics helpers below.
client = get_mongo_client()
58
-
59
-
60
def get_metrics_collections():
    """Return the usage-metrics collection, the visits collection and the DB handle."""
    database = client["f1_data"]
    return database["usage_metrics"], database["visits"], database

# Module-level handles used across the app.
metrics_collection, metrics_page, db = get_metrics_collections()
68
- '''if not metrics_page.find_one({"page": "inicio"}):
69
- metrics_page.insert_one({"page": "inicio", "visits": 0})
70
- if not metrics_collection.find_one({"action": "descargar_app"}):
71
- metrics_collection.insert_one({"action": "descargar_app", "count": 0})'''
72
- '''except:
73
- print("Error loading MongoDB URI from .env file. Please check your configuration.")
74
- client = None
75
- metrics_collection = None
76
- metrics_page = None
77
- db = None'''
78
-
79
-
80
- #-------------YOLO ONNX HELPERS-------------------
81
-
82
def preprocess_image_tensor(image_rgb: np.ndarray) -> np.ndarray:
    """Preprocess an RGB image into an NCHW float tensor (Ultralytics YOLOv8 style).

    Args:
        image_rgb: HxWx3 array in RGB channel order (typically uint8).
            The model expects 224x224, but any spatial size is accepted now —
            the previous hard-coded ``reshape(1, 3, 224, 224)`` raised for
            other sizes.

    Returns:
        1x3xHxW float32 array with values scaled to [0, 1].
    """
    # HWC -> CHW, then add the batch axis.
    chw = np.transpose(image_rgb, (2, 0, 1))
    input_data = np.expand_dims(chw, axis=0)

    # Convert to float32 and normalize to [0, 1].
    return input_data.astype(np.float32) / 255.0
96
-
97
def postprocess_outputs(outputs: list, height: int, width: int) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
    """Decode ONNX YOLOv8-seg outputs for the single-class ("helmet") model.

    Args:
        outputs: [detection head, mask prototypes] as returned by the ONNX
            session; outputs[1] flattens to (32, 56*56) prototype masks.
        height: original image height, used to rescale boxes from 224x224.
        width: original image width.

    Returns:
        (True, detections) where each detection is
        [x1, y1, x2, y2, label, prob, mask, polygon], after NMS at IoU < 0.7.
    """
    res_size = 56
    detections = outputs[0][0].transpose()               # (N, 5 + 32)
    protos = outputs[1][0].reshape(32, res_size * res_size)

    boxes = detections[:, 0:5]
    # Combine the 32 per-box mask coefficients with the prototypes.
    masks = detections[:, 5:] @ protos
    boxes = np.hstack([boxes, masks])

    yolo_classes = [
        "helmet"
    ]

    # Parse and filter all candidate boxes.
    objects = []
    for row in boxes:
        xc, yc, w, h = row[:4]
        # Rescale from the 224x224 model space to the original image size.
        x1 = (xc - w / 2) / 224 * width
        y1 = (yc - h / 2) / 224 * height
        x2 = (xc + w / 2) / 224 * width
        y2 = (yc + h / 2) / 224 * height
        prob = row[4:5].max()            # single class: column 4 is its score
        if prob < 0.2:
            continue
        class_id = row[4:5].argmax()     # always 0 for this one-class model
        label = yolo_classes[class_id]

        # NOTE: the slice end exceeds the row length; NumPy clips it, so this
        # is effectively row[5:] (the flattened 56x56 mask values).
        mask = get_mask(row[5:25684], (x1, y1, x2, y2), width, height)
        try:
            polygon = get_polygon(mask)
        except Exception:
            # No contour could be extracted (e.g. empty mask) — skip the box.
            continue
        objects.append([x1, y1, x2, y2, label, prob, mask, polygon])

    # Non-maximum suppression: keep the best box, drop heavy overlaps.
    objects.sort(key=lambda o: o[5], reverse=True)
    result = []
    while len(objects) > 0:
        best = objects[0]
        result.append(best)
        objects = [obj for obj in objects if iou(obj, best) < 0.7]

    return True, result
152
-
153
def intersection(box1, box2):
    """Return the overlap area of two [x1, y1, x2, y2, ...] boxes.

    Bug fix: disjoint boxes previously multiplied two negative extents,
    which could yield a spurious *positive* "intersection" area. Each
    extent is now clamped at zero, so non-overlapping boxes return 0.
    """
    box1_x1, box1_y1, box1_x2, box1_y2 = box1[:4]
    box2_x1, box2_y1, box2_x2, box2_y2 = box2[:4]
    x1 = max(box1_x1, box2_x1)
    y1 = max(box1_y1, box2_y1)
    x2 = min(box1_x2, box2_x2)
    y2 = min(box1_y2, box2_y2)
    # A negative extent means no overlap along that axis.
    return max(0, x2 - x1) * max(0, y2 - y1)
161
-
162
def union(box1, box2):
    """Area of the union of two [x1, y1, x2, y2, ...] boxes."""
    ax1, ay1, ax2, ay2 = box1[:4]
    bx1, by1, bx2, by2 = box2[:4]
    area_a = (ax2 - ax1) * (ay2 - ay1)
    area_b = (bx2 - bx1) * (by2 - by1)
    return area_a + area_b - intersection(box1, box2)
168
-
169
def iou(box1, box2):
    """Intersection-over-union of two boxes (first four values are coords)."""
    overlap = intersection(box1, box2)
    return overlap / union(box1, box2)
171
-
172
def sigmoid(z):
    """Elementwise logistic function 1 / (1 + e^-z); works on scalars and arrays."""
    denom = 1 + np.exp(-z)
    return 1 / denom
174
-
175
- # parse segmentation mask
176
def get_mask(row, box, img_width, img_height):
    """Build the binary mask for one detection, resized to its bounding box.

    ``row`` holds the flattened 56x56 mask logits for the detection and
    ``box`` is (x1, y1, x2, y2) in original-image coordinates.
    """
    res_size = 56
    # Logits -> probabilities -> binary 0/255 mask at prototype resolution.
    prob_map = sigmoid(row.reshape(res_size, res_size))
    binary = (prob_map > 0.2).astype("uint8") * 255
    # Crop the region covered by the box, expressed in mask coordinates.
    x1, y1, x2, y2 = box
    cx1 = round(x1 / img_width * res_size)
    cy1 = round(y1 / img_height * res_size)
    cx2 = round(x2 / img_width * res_size)
    cy2 = round(y2 / img_height * res_size)
    cropped = binary[cy1:cy2, cx1:cx2]
    # Upscale the crop to the box size in the original image.
    resized = Image.fromarray(cropped, "L").resize((round(x2 - x1), round(y2 - y1)))
    return np.array(resized)
194
-
195
-
196
-
197
- # calculate bounding polygon from mask
198
def get_polygon(mask):
    """Return the first contour of ``mask`` as a list of [x, y] points.

    Raises IndexError when no contour exists — callers catch and skip the box.
    """
    found = cv2.findContours(mask, cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE)
    first_contour = found[0][0]
    return [[point[0][0], point[0][1]] for point in first_contour]
202
-
203
-
204
-
205
-
206
-
207
-
208
-
209
-
210
-
211
-
212
- #------------------VIDEO CONVERSION------------------
213
-
214
def convert_video_to_10fps(video_file):
    """
    Convert an uploaded video to 10 FPS.

    Args:
        video_file: Streamlit uploaded file object (readable bytes).

    Returns:
        io.BytesIO with the converted MP4 (``.name`` set to
        "converted_10fps.mp4") on success; a {"success": False, ...} dict if
        the video cannot be opened; ``None`` on any other error.
        NOTE(review): three different return types — confirm callers handle all.
    """
    try:
        # Spill the upload to disk so cv2.VideoCapture can open it by path.
        orig_tfile = tempfile.NamedTemporaryFile(delete=False, suffix='.mp4')
        orig_tfile.write(video_file.read())
        orig_tfile.close()

        # Open the original video to read its properties.
        orig_cap = cv2.VideoCapture(orig_tfile.name)

        if not orig_cap.isOpened():
            return {"success": False, "error": "Could not open video file"}

        orig_fps = orig_cap.get(cv2.CAP_PROP_FPS)
        width = int(orig_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(orig_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        orig_total_frames = int(orig_cap.get(cv2.CAP_PROP_FRAME_COUNT))

        # Duration / expected frame count at the target rate.
        # NOTE(review): orig_fps can be 0 for some containers — this would
        # raise ZeroDivisionError and fall into the generic except below.
        duration_seconds = orig_total_frames / orig_fps
        expected_frames = int(duration_seconds * 10)  # 10 fps

        # Output path. NOTE(review): tempfile.mktemp is deprecated/racy —
        # consider tempfile.mkstemp instead.
        converted_path = tempfile.mktemp(suffix='.mp4')

        # Writer at a fixed 10 FPS with the original frame size.
        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
        out = cv2.VideoWriter(converted_path, fourcc, 10, (width, height))

        # Frame sampling plan.
        if orig_fps <= 10:
            # Source is slower than target: keep every frame, duplicate each
            # one int(10 / fps) times to approximate 10 FPS.
            step = 1
            duplication = int(10 / orig_fps)
        else:
            # Source is faster: keep roughly every (fps/10)-th frame.
            step = orig_fps / 10
            duplication = 1

        # Convert the video.
        frame_count = 0
        output_count = 0

        while orig_cap.isOpened():
            ret, frame = orig_cap.read()
            if not ret:
                break

            # Keep the frame when the fractional phase wraps around.
            # (modulo < 1 handles non-integer step values)
            if frame_count % step < 1:
                # Write the frame, possibly multiple times.
                for _ in range(duplication):
                    out.write(frame)
                    output_count += 1

            frame_count += 1

        # Release resources and delete the on-disk original.
        orig_cap.release()
        out.release()
        os.unlink(orig_tfile.name)

        # Read the converted file back into memory so no temp file leaks out.
        with open(converted_path, "rb") as f:
            video_data = f.read()

        # Clean up the temporary output file.
        os.unlink(converted_path)

        # Return a named in-memory file-like object.
        from io import BytesIO
        video_io = BytesIO(video_data)
        video_io.name = "converted_10fps.mp4"
        return video_io

    except Exception as e:
        print(f"Error converting video: {e}")
        return None
301
-
302
def recortar_imagen(image, starty_dic, axes_dic):
    """Black out everything except the lower region of a color image.

    The kept region is a full-width rectangle starting slightly above
    ``starty_dic`` (a fraction of the height), topped with a half-ellipse
    whose vertical radius is ``axes_dic`` times the height.
    """
    h, w, _ = image.shape
    roi_mask = np.zeros((h, w), dtype=np.uint8)
    top = int((starty_dic - .02) * h)
    cv2.rectangle(roi_mask, (0, top), (w, h), 255, -1)
    # Half-ellipse (180..360 degrees) sitting on the rectangle's top edge.
    ellipse_center = (w // 2, top)
    ellipse_axes = (w // 2, int(axes_dic * h))
    cv2.ellipse(roi_mask, ellipse_center, ellipse_axes, 0, 180, 360, 255, -1)
    return cv2.bitwise_and(image, image, mask=roi_mask)
312
-
313
def recortar_imagen_again(image, starty_dic, axes_dic):
    """Lower-region crop like ``recortar_imagen`` but grayscale-tolerant.

    Differences from ``recortar_imagen``: accepts 2-D (grayscale) images,
    and the rectangle starts exactly at ``starty_dic`` (no -0.02 offset).
    """
    try:
        height, width, _ = image.shape
    except ValueError:
        # Grayscale input: shape is (height, width) only.
        # (Narrowed from a bare except, which also hid real errors such as
        # image being None.)
        height, width = image.shape

    mask = np.zeros((height, width), dtype=np.uint8)

    start_y = int(starty_dic * height)
    cv2.rectangle(mask, (0, start_y), (width, height), 255, -1)
    center = (width // 2, start_y)
    axes = (width // 2, int(axes_dic * height))
    # Half-ellipse on top of the rectangle's upper edge.
    cv2.ellipse(mask, center, axes, 0, 180, 360, 255, -1)
    result = cv2.bitwise_and(image, image, mask=mask)
    return result
329
-
330
def calculate_black_pixels_percentage(image):
    """Score an image by how *non-black* it is.

    Despite the name, the raw percentage of black pixels is not returned:
    it is mapped to ``(100 - black_pct) * 0.06``, i.e. 6.0 for a fully
    bright image and 0.0 for a fully black one (presumably a weighting used
    by the caller — confirm against call sites).

    Args:
        image: cv2 image, BGR or already grayscale; ``None`` is tolerated.

    Returns:
        float: the transformed score above, or 0 when ``image`` is None.
    """
    if image is None:
        print(f"Error loading image")
        return 0

    # "Black" means intensity below 10 on the grayscale image.
    if len(image.shape) == 3:
        gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    else:
        gray = image.copy()

    rows, cols = gray.shape[:2]
    total_pixels = rows * cols

    black_pixels = np.sum(gray < 10)

    # Percentage of black pixels, then the caller-facing transform.
    percentage = (black_pixels / total_pixels) * 100
    return (100.00 - float(percentage)) * .06
365
-
366
def create_rectangular_roi(height, width, x1=0, y1=0, x2=None, y2=None):
    """Return a uint8 mask with a filled white rectangle (defaults to the whole frame)."""
    right = width if x2 is None else x2
    bottom = height if y2 is None else y2
    roi = np.zeros((height, width), dtype=np.uint8)
    cv2.rectangle(roi, (x1, y1), (right, bottom), 255, -1)
    return roi
374
-
375
def preprocess_image(image, mask=None):
    """Denoise, "sharpen" and min-max normalize a grayscale version of ``image``,
    optionally restricted to ``mask``."""
    if len(image.shape) == 3:
        gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    else:
        gray = image.copy()

    smooth = cv2.bilateralFilter(gray, d=3, sigmaColor=20, sigmaSpace=10)
    # NOTE(review): both addWeighted inputs are the same image, so this is
    # 3x - 2x = x computed in one pass — effectively a no-op; confirm intent.
    crisp = cv2.addWeighted(smooth, 3.0, smooth, -2.0, 0)
    scaled = cv2.normalize(crisp, None, 0, 255, cv2.NORM_MINMAX)

    if mask is None:
        return scaled
    return cv2.bitwise_and(scaled, scaled, mask=mask)
388
-
389
def calculate_robust_rms_contrast(image, mask=None, bright_threshold=240):
    """RMS contrast (std / 255) of the masked region, ignoring near-saturated
    pixels (>= ``bright_threshold``).

    Falls back to whole-image statistics whenever the selection is empty.
    """
    if len(image.shape) == 3:
        image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)

    # Pixels under consideration: masked region, or the entire image.
    pixels = image[mask > 0] if mask is not None else image.ravel()

    # Drop near-saturated pixels so highlights don't inflate the contrast.
    if len(pixels) > 0:
        pixels = pixels[pixels < bright_threshold]

    if len(pixels) == 0:
        # Nothing left to measure — fall back to the whole image.
        mu = np.mean(image)
        sigma = np.sqrt(np.mean((image - mu) ** 2))
    else:
        mu = np.mean(pixels)
        sigma = np.sqrt(np.mean((pixels - mu) ** 2))
    return sigma / 255.0
411
-
412
def adaptive_clahe_iterative(image, roi_mask, initial_clip_limit=1.0, max_clip_limit=10.0, iterations=20, target_rms_min=0.199, target_rms_max=0.5, bright_threshold=230):
    """Search for a CLAHE clip limit that puts the ROI's RMS contrast into
    [target_rms_min, target_rms_max].

    Returns the first enhanced image whose contrast lands inside the band;
    otherwise the highest-contrast candidate seen (which may be the
    unmodified grayscale input).
    """
    if len(image.shape) == 3:
        original_gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    else:
        original_gray = image.copy()

    # Fallback candidate starts as the untouched grayscale image.
    best_image = original_gray.copy()
    best_rms = calculate_robust_rms_contrast(original_gray, roi_mask, bright_threshold)
    clip_limit = initial_clip_limit

    for i in range(iterations):
        # CLAHE is always applied to the *original* gray image, so each
        # iteration tests one clip limit rather than compounding.
        clahe = cv2.createCLAHE(clipLimit=clip_limit, tileGridSize=(8, 8))
        current_image = clahe.apply(original_gray)

        rms_contrast = calculate_robust_rms_contrast(current_image, roi_mask, bright_threshold)

        # Inside the target band: done.
        if target_rms_min <= rms_contrast <= target_rms_max:
            return current_image
        # Track the highest-contrast candidate as the fallback result.
        if rms_contrast > best_rms:
            best_rms = rms_contrast
            best_image = current_image.copy()
        if rms_contrast > target_rms_max:
            # Overshot: cap the clip limit at 1.0.
            # NOTE(review): min(clip_limit, 1.0) can pin the search at the same
            # value for every remaining iteration — confirm this is intended.
            clip_limit = min(clip_limit, 1.0)
        else:
            # Undershot: ramp the clip limit up linearly with the iteration.
            clip_limit = min(initial_clip_limit + (i * 0.5), max_clip_limit)

    return best_image
441
-
442
def adaptive_edge_detection(imagen, min_edge_percentage=5.5, max_edge_percentage=6.5, target_percentage=6.0, max_attempts=5,mode="Default"):
    """
    Edge detection with progressively adjusted parameters, aiming for an
    optimal percentage of edge pixels (~``target_percentage``) in the image.

    Returns (best_enhanced, best_edges, original, best_config), or four
    ``None`` values when ``imagen`` is None.
    """
    # Input image (already expected to be grayscale).
    original = imagen
    if original is None:
        print(f"Error loading image")
        return None, None, None, None

    # Convert to grayscale — assumed already single-channel; no conversion done.
    gray = original

    # Pixel budgets derived from the requested percentages.
    total_pixels = gray.shape[0] * gray.shape[1]
    min_edge_pixels = int((min_edge_percentage / 100) * total_pixels)
    max_edge_pixels = int((max_edge_percentage / 100) * total_pixels)
    target_edge_pixels = int((target_percentage / 100) * total_pixels)

    # Per-attempt parameter schedules.
    # NOTE(review): clip_limits and grid_sizes have only ONE entry but are
    # indexed by `attempt` below — any second attempt raises IndexError
    # unless the early-exit break fires on attempt 0. Confirm/extend.
    clip_limits = [1]
    grid_sizes = [(2, 2)]
    # Start with higher thresholds to restrict the number of edges.
    canny_thresholds = [(55, 170), (45, 160), (35, 150), (25, 140), (20, 130),(20, 130),(20, 130)]

    best_edges = None
    best_enhanced = None
    best_config = None
    best_edge_score = float('inf')  # lower is better (distance to target)
    edge_percentage = 0


    # Try progressively more aggressive parameters.
    for attempt in range(max_attempts):
        # Parameters for this attempt.
        clip_limit = clip_limits[attempt]
        grid_size = grid_sizes[attempt]
        low_threshold, high_threshold = canny_thresholds[attempt]

        if edge_percentage <= max_edge_percentage:
            clahe = cv2.createCLAHE(clipLimit=clip_limit, tileGridSize=grid_size)
        elif edge_count > max_edge_percentage:
            # NOTE(review): two problems here — `edge_count` is a pixel COUNT
            # compared against a PERCENTAGE (unit mismatch), and it is unbound
            # on the first iteration that reaches this branch. In practice the
            # `if` above is always taken first (edge_percentage starts at 0).
            clahe = cv2.createCLAHE(clipLimit=1, tileGridSize=grid_size)

        enhanced = clahe.apply(gray)

        # Derive Canny thresholds from the median intensity of the denoised image.
        # NOTE(review): both branches are identical, and `denoised` is unbound
        # for any other `mode` value — the Canny call below would then raise.
        if mode == "Default":
            denoised = cv2.bilateralFilter(enhanced, d=5, sigmaColor=200, sigmaSpace=200)
            median_intensity = np.median(denoised)
            low_threshold = max(20, (1.0 - .3) * median_intensity)
            high_threshold = max(80, (1.0 + .8) * median_intensity)
        elif mode == "Low ilumination":
            denoised = cv2.bilateralFilter(enhanced, d=5, sigmaColor=200, sigmaSpace=200)
            median_intensity = np.median(denoised)
            low_threshold = max(20, (1.0 - .3) * median_intensity)
            high_threshold = max(80, (1.0 + .8) * median_intensity)

        # Edge detection.
        edges = cv2.Canny(denoised, low_threshold, high_threshold)
        std_intensity = np.std(edges)

        # Reduce noise with a morphological opening (more iterations when noisy).
        kernel = np.ones((1, 1), np.uint8)
        edges = cv2.morphologyEx(
            edges,
            cv2.MORPH_OPEN,
            kernel,
            iterations=0 if std_intensity < 60 else 1
        )


        # Count edge pixels (vectorized).
        edge_count = np.count_nonzero(edges)
        edge_percentage = (edge_count / total_pixels) * 100

        # Distance to the target pixel budget.
        edge_score = abs(edge_count - target_edge_pixels)

        # Record the best attempt (closest to the target percentage).
        if edge_score < best_edge_score:
            best_edge_score = edge_score
            best_edges = edges.copy()  # copy to avoid later overwrites
            best_enhanced = enhanced.copy()
            best_config = {
                'attempt': attempt + 1,
                'clip_limit': clip_limit,
                'grid_size': grid_size,
                'canny_thresholds': (low_threshold, high_threshold),
                'edge_pixels': edge_count,
                'edge_percentage': edge_percentage
            }

        # Early exit when close enough to the target.
        if abs(edge_percentage - target_percentage) < 0.1:
            break

    print(f"Mejor intento: {best_config['attempt']}, porcentaje de bordes: {edge_percentage:.2f}%")
    return best_enhanced, best_edges, original, best_config
 
 
1
+ import cv2
2
+ import numpy as np
3
+ from typing import Tuple
4
+ import tempfile
5
+ import os
6
+ from PIL import Image
7
+ import sys
8
+ from pymongo import MongoClient
9
+ from dotenv import load_dotenv
10
+ import os
11
+ import streamlit as st
12
+
13
+ try:
14
+ if getattr(sys, 'frozen', False):
15
+ # En el ejecutable, intentar sys._MEIPASS
16
+ BASE_DIR = getattr(sys, '_MEIPASS', os.path.dirname(sys.executable))
17
+ print(f"Executable mode - Initial BASE_DIR: {BASE_DIR} (_MEIPASS: {hasattr(sys, '_MEIPASS')})")
18
+ # Verificar si BASE_DIR contiene los archivos esperados
19
+ expected_dirs = ['navigation', 'models', 'assets', 'img', 'utils']
20
+ if not any(os.path.exists(os.path.join(BASE_DIR, d)) for d in expected_dirs):
21
+ print(f"Warning: Expected directories not found in {BASE_DIR}")
22
+ # Buscar _MEI<random> en el directorio padre
23
+ temp_dir = os.path.dirname(BASE_DIR) if BASE_DIR != os.path.dirname(sys.executable) else BASE_DIR
24
+ for d in os.listdir(temp_dir):
25
+ if d.startswith('_MEI'):
26
+ candidate = os.path.join(temp_dir, d)
27
+ if any(os.path.exists(os.path.join(candidate, ed)) for ed in expected_dirs):
28
+ BASE_DIR = candidate
29
+ print(f"Adjusted BASE_DIR to _MEI directory: {BASE_DIR}")
30
+ break
31
+ else:
32
+ print(f"No _MEI directory found in {temp_dir}, using {BASE_DIR}")
33
+ else:
34
+ # En desarrollo, usar el directorio del proyecto
35
+ current_file = os.path.abspath(os.path.realpath(__file__))
36
+ print(f"Development mode - Current file: {current_file}")
37
+ BASE_DIR = os.path.dirname(os.path.dirname(current_file)) # Subir de utils/ a F1-machine-learning-webapp/
38
+ print(f"Development mode - BASE_DIR: {BASE_DIR}")
39
+ except Exception as e:
40
+ print(f"Error setting BASE_DIR: {e}")
41
+ # Fallback
42
+ BASE_DIR = os.path.dirname(os.path.abspath(os.path.realpath(__file__)))
43
+ BASE_DIR = os.path.dirname(BASE_DIR)
44
+ print(f"Fallback BASE_DIR: {BASE_DIR}")
45
+
46
+ BASE_DIR = os.path.normpath(BASE_DIR)
47
+ print(f"Final BASE_DIR: {BASE_DIR}")
48
+
49
+
50
+
51
+
52
+ #load_dotenv() # Carga las variables desde .env
53
+ #mongo_uri = os.getenv("MONGO_URI")
54
@st.cache_resource
def get_mongo_client():
    """Return a cached MongoDB client connected via the MONGO_URI env variable.

    Bug fix: this returned the raw URI string from ``os.getenv``; the
    module-level ``client["f1_data"]`` lookup in ``get_metrics_collections``
    then fails, because a str cannot be indexed by name. The URI must be
    wrapped in a MongoClient.
    """
    return MongoClient(os.getenv('MONGO_URI'))

client = get_mongo_client()
59
+
60
+
61
+ def get_metrics_collections():
62
+
63
+ db = client["f1_data"]
64
+ metrics_collection = db["usage_metrics"]
65
+ metrics_page = db["visits"]
66
+ return metrics_collection, metrics_page, db
67
+
68
+ metrics_collection, metrics_page, db = get_metrics_collections()
69
+ '''if not metrics_page.find_one({"page": "inicio"}):
70
+ metrics_page.insert_one({"page": "inicio", "visits": 0})
71
+ if not metrics_collection.find_one({"action": "descargar_app"}):
72
+ metrics_collection.insert_one({"action": "descargar_app", "count": 0})'''
73
+ '''except:
74
+ print("Error loading MongoDB URI from .env file. Please check your configuration.")
75
+ client = None
76
+ metrics_collection = None
77
+ metrics_page = None
78
+ db = None'''
79
+
80
+
81
+ #-------------YOLO ONNX HELPERS-------------------
82
+
83
+ def preprocess_image_tensor(image_rgb: np.ndarray) -> np.ndarray:
84
+ """Preprocess image to match Ultralytics YOLOv8."""
85
+
86
+ '''input = np.array(image_rgb)
87
+ input = input.transpose(2, 0, 1)
88
+ input = input.reshape(1,3,224,224).astype("float32")
89
+ input = input/255.0'''
90
+
91
+ input_data = image_rgb.transpose(2, 0, 1).reshape(1, 3, 224, 224)
92
+
93
+ # Convert to float32 and normalize to [0, 1]
94
+ input_data = input_data.astype(np.float32) / 255.0
95
+
96
+ return input_data
97
+
98
+ def postprocess_outputs(outputs: list, height: int, width: int) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
99
+ """Process ONNX model outputs for a single-class model."""
100
+ res_size = 56
101
+ output0 = outputs[0]
102
+ output1 = outputs[1]
103
+
104
+ output0 = output0[0].transpose()
105
+ output1 = output1[0]
106
+
107
+ boxes = output0[:,0:5]
108
+ masks = output0[:,5:]
109
+
110
+ output1 = output1.reshape(32,res_size*res_size)
111
+
112
+ masks = masks @ output1
113
+
114
+ boxes = np.hstack([boxes,masks])
115
+
116
+ yolo_classes = [
117
+ "helmet"
118
+ ]
119
+
120
+ # parse and filter all boxes
121
+ objects = []
122
+ for row in boxes:
123
+ xc,yc,w,h = row[:4]
124
+ x1 = (xc-w/2)/224*width
125
+ y1 = (yc-h/2)/224*height
126
+ x2 = (xc+w/2)/224*width
127
+ y2 = (yc+h/2)/224*height
128
+ prob = row[4:5].max()
129
+ if prob < 0.2:
130
+ continue
131
+ class_id = row[4:5].argmax()
132
+ label = yolo_classes[class_id]
133
+
134
+ mask = get_mask(row[5:25684], (x1,y1,x2,y2), width, height)
135
+ try:
136
+ polygon = get_polygon(mask)
137
+ except:
138
+ continue
139
+ objects.append([x1,y1,x2,y2,label,prob,mask,polygon])
140
+
141
+
142
+
143
+ # apply non-maximum suppression
144
+ objects.sort(key=lambda x: x[5], reverse=True)
145
+ result = []
146
+ while len(objects)>0:
147
+ result.append(objects[0])
148
+ objects = [object for object in objects if iou(object,objects[0])<0.7]
149
+
150
+
151
+
152
+ return True,result
153
+
154
+ def intersection(box1,box2):
155
+ box1_x1,box1_y1,box1_x2,box1_y2 = box1[:4]
156
+ box2_x1,box2_y1,box2_x2,box2_y2 = box2[:4]
157
+ x1 = max(box1_x1,box2_x1)
158
+ y1 = max(box1_y1,box2_y1)
159
+ x2 = min(box1_x2,box2_x2)
160
+ y2 = min(box1_y2,box2_y2)
161
+ return (x2-x1)*(y2-y1)
162
+
163
+ def union(box1,box2):
164
+ box1_x1,box1_y1,box1_x2,box1_y2 = box1[:4]
165
+ box2_x1,box2_y1,box2_x2,box2_y2 = box2[:4]
166
+ box1_area = (box1_x2-box1_x1)*(box1_y2-box1_y1)
167
+ box2_area = (box2_x2-box2_x1)*(box2_y2-box2_y1)
168
+ return box1_area + box2_area - intersection(box1,box2)
169
+
170
+ def iou(box1,box2):
171
+ return intersection(box1,box2)/union(box1,box2)
172
+
173
+ def sigmoid(z):
174
+ return 1/(1 + np.exp(-z))
175
+
176
+ # parse segmentation mask
177
+ def get_mask(row, box, img_width, img_height):
178
+ # convert mask to image (matrix of pixels)
179
+ res_size = 56
180
+ mask = row.reshape(res_size,res_size)
181
+ mask = sigmoid(mask)
182
+ mask = (mask > 0.2).astype("uint8")*255
183
+ # crop the object defined by "box" from mask
184
+ x1,y1,x2,y2 = box
185
+ mask_x1 = round(x1/img_width*res_size)
186
+ mask_y1 = round(y1/img_height*res_size)
187
+ mask_x2 = round(x2/img_width*res_size)
188
+ mask_y2 = round(y2/img_height*res_size)
189
+ mask = mask[mask_y1:mask_y2,mask_x1:mask_x2]
190
+ # resize the cropped mask to the size of object
191
+ img_mask = Image.fromarray(mask,"L")
192
+ img_mask = img_mask.resize((round(x2-x1),round(y2-y1)))
193
+ mask = np.array(img_mask)
194
+ return mask
195
+
196
+
197
+
198
+ # calculate bounding polygon from mask
199
+ def get_polygon(mask):
200
+ contours = cv2.findContours(mask, cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE)
201
+ polygon = [[contour[0][0],contour[0][1]] for contour in contours[0][0]]
202
+ return polygon
203
+
204
+
205
+
206
+
207
+
208
+
209
+
210
+
211
+
212
+
213
+ #------------------VIDEO CONVERSION------------------
214
+
215
+ def convert_video_to_10fps(video_file):
216
+ """
217
+ Convert an uploaded video file to 10 FPS and return metadata
218
+
219
+ Args:
220
+ video_file: Streamlit uploaded file object
221
+
222
+ Returns:
223
+ Dictionary with video metadata and path to converted file
224
+ """
225
+ try:
226
+ # Create temporary file for the original upload
227
+ orig_tfile = tempfile.NamedTemporaryFile(delete=False, suffix='.mp4')
228
+ orig_tfile.write(video_file.read())
229
+ orig_tfile.close()
230
+
231
+ # Open the original video to get properties
232
+ orig_cap = cv2.VideoCapture(orig_tfile.name)
233
+
234
+ if not orig_cap.isOpened():
235
+ return {"success": False, "error": "Could not open video file"}
236
+
237
+ orig_fps = orig_cap.get(cv2.CAP_PROP_FPS)
238
+ width = int(orig_cap.get(cv2.CAP_PROP_FRAME_WIDTH))
239
+ height = int(orig_cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
240
+ orig_total_frames = int(orig_cap.get(cv2.CAP_PROP_FRAME_COUNT))
241
+
242
+ # Calculate duration
243
+ duration_seconds = orig_total_frames / orig_fps
244
+ expected_frames = int(duration_seconds * 10) # 10 fps
245
+
246
+ # Create output temp file
247
+ converted_path = tempfile.mktemp(suffix='.mp4')
248
+
249
+ # Create VideoWriter
250
+ fourcc = cv2.VideoWriter_fourcc(*'mp4v')
251
+ out = cv2.VideoWriter(converted_path, fourcc, 10, (width, height))
252
+
253
+ # Calculate frame sampling
254
+ if orig_fps <= 10:
255
+ # If original is slower than target, duplicate frames
256
+ step = 1
257
+ duplication = int(10 / orig_fps)
258
+ else:
259
+ # If original is faster, skip frames
260
+ step = orig_fps / 10
261
+ duplication = 1
262
+
263
+ # Convert the video
264
+ frame_count = 0
265
+ output_count = 0
266
+
267
+ while orig_cap.isOpened():
268
+ ret, frame = orig_cap.read()
269
+ if not ret:
270
+ break
271
+
272
+ # Determine if we should include this frame
273
+ if frame_count % step < 1: # Using modulo < 1 for floating point step values
274
+ # Write frame (possibly multiple times)
275
+ for _ in range(duplication):
276
+ out.write(frame)
277
+ output_count += 1
278
+
279
+ frame_count += 1
280
+
281
+ # Release resources
282
+ orig_cap.release()
283
+ out.release()
284
+ os.unlink(orig_tfile.name) # Delete original temp file
285
+
286
+ # Instead of returning a dictionary, read the file back into memory
287
+ with open(converted_path, "rb") as f:
288
+ video_data = f.read()
289
+
290
+ # Clean up the temporary file
291
+ os.unlink(converted_path)
292
+
293
+ # Return a file-like object
294
+ from io import BytesIO
295
+ video_io = BytesIO(video_data)
296
+ video_io.name = "converted_10fps.mp4"
297
+ return video_io
298
+
299
+ except Exception as e:
300
+ print(f"Error converting video: {e}")
301
+ return None
302
+
303
+ def recortar_imagen(image,starty_dic, axes_dic):
304
+ height, width, _ = image.shape
305
+ mask = np.zeros((height, width), dtype=np.uint8)
306
+ start_y = int((starty_dic-.02) * height)
307
+ cv2.rectangle(mask, (0, start_y), (width, height), 255, -1)
308
+ center = (width // 2, start_y)
309
+ axes = (width // 2, int(axes_dic * height))
310
+ cv2.ellipse(mask, center, axes, 0, 180, 360, 255, -1)
311
+ result = cv2.bitwise_and(image, image, mask=mask)
312
+ return result
313
+
314
+ def recortar_imagen_again(image,starty_dic, axes_dic):
315
+
316
+ try:
317
+ height, width,_ = image.shape
318
+ except :
319
+ height, width = image.shape
320
+
321
+ mask = np.zeros((height, width), dtype=np.uint8)
322
+
323
+ start_y = int(starty_dic * height)
324
+ cv2.rectangle(mask, (0, start_y), (width, height), 255, -1)
325
+ center = (width // 2, start_y)
326
+ axes = (width // 2, int(axes_dic * height))
327
+ cv2.ellipse(mask, center, axes, 0, 180, 360, 255, -1)
328
+ result = cv2.bitwise_and(image, image, mask=mask)
329
+ return result
330
+
331
+ def calculate_black_pixels_percentage(image):
332
+ """
333
+ Calcula el porcentaje de p铆xeles totalmente negros en la imagen.
334
+
335
+ Args:
336
+ image: Imagen cargada con cv2 (BGR o escala de grises).
337
+ is_grayscale: True si la imagen ya est谩 en escala de gruises, False si es a color.
338
+
339
+ Returns:
340
+ float: Porcentaje de p铆xeles negros.
341
+ """
342
+ # Obtener dimensiones
343
+ '''image = cv2.imread(image_path)
344
+ image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)'''
345
+ if image is None:
346
+ print(f"Error loading image")
347
+ return 0
348
+
349
+ if len(image.shape) == 3:
350
+ image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
351
+ else:
352
+ image = image.copy()
353
+ h, w = image.shape[:2]
354
+ total_pixels = h * w
355
+
356
+ black_pixels = np.sum(image < 10)
357
+
358
+ # Calcular porcentaje
359
+ percentage = (black_pixels / total_pixels) * 100
360
+
361
+
362
+ percentage = (100.00 - float(percentage)) * .06
363
+
364
+
365
+ return percentage
366
+
367
+ def create_rectangular_roi(height, width, x1=0, y1=0, x2=None, y2=None):
368
+ if x2 is None:
369
+ x2 = width
370
+ if y2 is None:
371
+ y2 = height
372
+ mask = np.zeros((height, width), dtype=np.uint8)
373
+ cv2.rectangle(mask, (x1, y1), (x2, y2), 255, -1)
374
+ return mask
375
+
376
+ def preprocess_image(image, mask=None):
377
+ if len(image.shape) == 3:
378
+ gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
379
+ else:
380
+ gray = image.copy()
381
+
382
+ denoised = cv2.bilateralFilter(gray, d=3, sigmaColor=20, sigmaSpace=10)
383
+ sharpened = cv2.addWeighted(denoised, 3.0, denoised, -2.0, 0)
384
+ normalized = cv2.normalize(sharpened, None, 0, 255, cv2.NORM_MINMAX)
385
+
386
+ if mask is not None:
387
+ return cv2.bitwise_and(normalized, normalized, mask=mask)
388
+ return normalized
389
+
390
def calculate_robust_rms_contrast(image, mask=None, bright_threshold=240):
    """
    RMS contrast (std / 255) of an image, robust to glare.

    Pixels at or above ``bright_threshold`` are excluded so that saturated
    highlights do not inflate the contrast estimate. When the ROI (or the
    ROI after glare removal) is empty, the statistic falls back to the
    whole image, unfiltered.

    Args:
        image: BGR or grayscale uint8 image.
        mask: Optional ROI mask; only pixels where mask > 0 are considered.
        bright_threshold: Intensity cutoff for the glare filter.

    Returns:
        float: RMS contrast normalized to [0, 1].
    """
    if len(image.shape) == 3:
        image = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)

    pixels = image[mask > 0] if mask is not None else image.ravel()
    if len(pixels) > 0:
        pixels = pixels[pixels < bright_threshold]

    # Fallback: empty ROI or everything filtered out as glare.
    if len(pixels) == 0:
        pixels = image.ravel()

    # np.std computes sqrt(mean((x - mean)**2)) in float64 for integer input,
    # identical to the original hand-rolled formula.
    return float(np.std(pixels)) / 255.0
412
+
413
def adaptive_clahe_iterative(image, roi_mask, initial_clip_limit=1.0, max_clip_limit=10.0, iterations=20, target_rms_min=0.199, target_rms_max=0.5, bright_threshold=230):
    """
    Apply CLAHE repeatedly, adapting the clip limit, until the robust RMS
    contrast of the ROI falls inside [target_rms_min, target_rms_max].

    Returns the first equalized image whose contrast lands in the target
    band, or otherwise the highest-contrast image seen over all iterations
    (which may be the untouched grayscale input).
    """
    base = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY) if len(image.shape) == 3 else image.copy()

    best_image = base.copy()
    best_rms = calculate_robust_rms_contrast(base, roi_mask, bright_threshold)
    clip_limit = initial_clip_limit

    for step in range(iterations):
        equalized = cv2.createCLAHE(clipLimit=clip_limit, tileGridSize=(8, 8)).apply(base)
        rms = calculate_robust_rms_contrast(equalized, roi_mask, bright_threshold)

        # Contrast in band: done.
        if target_rms_min <= rms <= target_rms_max:
            return equalized

        # Keep the best (highest-contrast) candidate seen so far.
        if rms > best_rms:
            best_rms = rms
            best_image = equalized.copy()

        # Overshot the band: cap the clip limit at 1.0; otherwise ramp it
        # up on a fixed schedule bounded by max_clip_limit.
        if rms > target_rms_max:
            clip_limit = min(clip_limit, 1.0)
        else:
            clip_limit = min(initial_clip_limit + step * 0.5, max_clip_limit)

    return best_image
442
+
443
def adaptive_edge_detection(imagen, min_edge_percentage=5.5, max_edge_percentage=6.5, target_percentage=6.0, max_attempts=5, mode="Default"):
    """
    Detect edges with progressive parameter adjustment until the percentage
    of edge pixels is close to ``target_percentage`` of the image.

    Args:
        imagen: Grayscale uint8 image, or None.
        min_edge_percentage: Lower bound of the acceptable edge-pixel band
            (kept for interface compatibility; not used by the heuristic).
        max_edge_percentage: Upper bound; exceeding it switches to the
            stronger re-equalization branch on the next attempt.
        target_percentage: Desired edge-pixel percentage.
        max_attempts: Maximum number of detection attempts.
        mode: "Default" or "Low ilumination"; both previously used identical
            threshold logic, and unknown modes crashed with an unbound
            variable — all modes now share the same median-based thresholds.

    Returns:
        (best_enhanced, best_edges, original, best_config) where best_config
        is a dict describing the winning attempt, or (None, None, None, None)
        when ``imagen`` is None.
    """
    original = imagen
    if original is None:
        print("Error loading image")
        return None, None, None, None

    gray = original  # assumed already single-channel -- TODO confirm callers

    total_pixels = gray.shape[0] * gray.shape[1]
    target_edge_pixels = int((target_percentage / 100) * total_pixels)

    # Parameter schedules. Indexing is clamped to the last entry so that
    # lists shorter than max_attempts no longer raise IndexError (the
    # original code crashed on the second attempt).
    clip_limits = [1]
    grid_sizes = [(2, 2)]

    best_edges = None
    best_enhanced = None
    best_config = None
    best_edge_score = float('inf')
    edge_percentage = 0.0

    for attempt in range(max_attempts):
        clip_limit = clip_limits[min(attempt, len(clip_limits) - 1)]
        grid_size = grid_sizes[min(attempt, len(grid_sizes) - 1)]

        # If the previous attempt produced too many edges, re-equalize with a
        # fixed low clip limit; otherwise use the scheduled one. (The original
        # elif compared a pixel COUNT against a PERCENTAGE and could leave
        # `clahe` unbound.)
        if edge_percentage <= max_edge_percentage:
            clahe = cv2.createCLAHE(clipLimit=clip_limit, tileGridSize=grid_size)
        else:
            clahe = cv2.createCLAHE(clipLimit=1, tileGridSize=grid_size)
        enhanced = clahe.apply(gray)

        # Median-based Canny thresholds on the denoised image. Both modes
        # used identical parameters, so the duplicated branches are merged.
        denoised = cv2.bilateralFilter(enhanced, d=5, sigmaColor=200, sigmaSpace=200)
        median_intensity = np.median(denoised)
        low_threshold = max(20, (1.0 - .3) * median_intensity)
        high_threshold = max(80, (1.0 + .8) * median_intensity)

        edges = cv2.Canny(denoised, low_threshold, high_threshold)
        std_intensity = np.std(edges)

        # Morphological opening to drop isolated edge noise; skipped
        # (iterations=0) when the edge map is already quiet.
        kernel = np.ones((1, 1), np.uint8)
        edges = cv2.morphologyEx(
            edges,
            cv2.MORPH_OPEN,
            kernel,
            iterations=0 if std_intensity < 60 else 1
        )

        edge_count = np.count_nonzero(edges)
        edge_percentage = (edge_count / total_pixels) * 100
        edge_score = abs(edge_count - target_edge_pixels)

        # Track the attempt closest to the target edge density.
        if edge_score < best_edge_score:
            best_edge_score = edge_score
            best_edges = edges.copy()
            best_enhanced = enhanced.copy()
            best_config = {
                'attempt': attempt + 1,
                'clip_limit': clip_limit,
                'grid_size': grid_size,
                'canny_thresholds': (low_threshold, high_threshold),
                'edge_pixels': edge_count,
                'edge_percentage': edge_percentage
            }

        # Early exit when close enough to the target.
        if abs(edge_percentage - target_percentage) < 0.1:
            break

    # Report the BEST attempt's percentage (the original printed the last
    # attempt's value). Guarded so max_attempts=0 does not crash.
    if best_config is not None:
        print(f"Mejor intento: {best_config['attempt']}, porcentaje de bordes: {best_config['edge_percentage']:.2f}%")
    return best_enhanced, best_edges, original, best_config