Spaces:

IntuiAI
/

intelligent-pid

Build error

App Files Community

msIntui committed on Jan 31, 2025

Commit

7f22c74

1 Parent(s): 690b5e4

Fix merge conflict in detectors.py

Browse files

Files changed (1) hide show

detectors.py +103 -1052

detectors.py CHANGED Viewed

@@ -3,12 +3,17 @@ import math
 import torch
 import cv2
 import numpy as np
-from typing import List, Optional, Tuple, Dict
 from dataclasses import replace
 from math import sqrt
 import json
 import uuid
 from pathlib import Path
 # Base classes and utilities
 from base import BaseDetector
@@ -18,7 +23,6 @@ from config import SymbolConfig, TagConfig, LineConfig, PointConfig, JunctionCon
 # DeepLSD model for line detection
 from deeplsd.models.deeplsd_inference import DeepLSD
-from ultralytics import YOLO
 # Detection schema: dataclasses for different objects
 from detection_schema import (
@@ -39,1058 +43,105 @@ from detection_schema import (
 from skimage.morphology import skeletonize
 from skimage.measure import label
-class LineDetector(BaseDetector):
-    """
-    DeepLSD-based line detection that populates newly detected lines (and naive endpoints)
-    directly into a DetectionContext.
-    """
-<<<<<<< HEAD
-    def __init__(self, model_path=None, model=None, model_config=None, device=None, debug_handler=None):
-        self.device = device or torch.device('cpu')
         self.debug_handler = debug_handler
-        if model is not None:
-            self.model = model
-        else:
-            super().__init__(model_path)
-        self.config = model_config or {}
-        self.scale_factor = 8.0  # Inverse of 0.5 scaling
-        self.margin = 10  # BBox expansion margin
-=======
-    def __init__(self,
-                 config: LineConfig,
-                 model_path: str,
-                 model_config: dict,
-                 device: torch.device,
-                 debug_handler: DebugHandler = None):
-        self.device = device
-        self.model_path = model_path
-        self.model_config = model_config
-        super().__init__(config, debug_handler)
-        self._load_params()
-        self.model = self._load_model(model_path)
-        self.scale_factor = 0.75  # For downscaling input to model
-        self.margin = 10
->>>>>>> temp/test-integration
-    # -------------------------------------
-    # BaseDetector requirements
-    # -------------------------------------
-    def _load_model(self, model_path: str) -> DeepLSD:
-        """Load and configure the DeepLSD model."""
-        if not os.path.exists(model_path):
-            raise FileNotFoundError(f"Model file not found: {model_path}")
-        ckpt = torch.load(model_path, map_location=self.device)
-<<<<<<< HEAD
-        model = DeepLSD(self.config)
-        model.load_state_dict(ckpt['model'])
-=======
-        model = DeepLSD(self.model_config)
-        model.load_state_dict(ckpt["model"])
->>>>>>> temp/test-integration
-        return model.to(self.device).eval()
-    def _preprocess(self, image: np.ndarray) -> np.ndarray:
-        """
-        Not used directly here. We'll handle our own
-        masking + threshold steps in the detect() method.
-        """
-        return image
-    def _postprocess(self, image: np.ndarray) -> np.ndarray:
-        """
-        Not used directly. Postprocessing is integrated
-        into detect() after we create lines.
-        """
-        return image
-    # -------------------------------------
-    # Our main detection method
-    # -------------------------------------
-    def detect(self,
-               image: np.ndarray,
-               context: DetectionContext,
-               mask_coords: Optional[List[BBox]] = None,
-               *args,
-               **kwargs) -> None:
-        """
-        Main detection pipeline:
-          1) Apply mask
-          2) Convert to binary & downscale
-          3) Run DeepLSD
-          4) Build minimal Line objects (with naive endpoints)
-          5) Scale lines to original resolution
-          6) Store the lines into the context
-        We do NOT unify endpoints here or classify them as T/L/etc.
-        """
-        mask_coords = mask_coords or []
-        # (A) Preprocess
-        processed_img = self._apply_mask_and_downscale(image, mask_coords)
-        # (B) Inference
-        raw_output = self._run_model_inference(processed_img)
-        # (C) Create lines in downscaled space
-        downscaled_lines = self._create_lines_from_output(raw_output)
-        # (D) Scale them to original resolution
-        lines_scaled = [self._scale_line(ln) for ln in downscaled_lines]
-        # (E) Add them to context
-        for line in lines_scaled:
-            context.add_line(line)
-    # -------------------------------------
-    # Internal helpers
-    # -------------------------------------
-    def _load_params(self):
-        """Load any model_config parameters if needed."""
         pass
-    def _apply_mask_and_downscale(self, image: np.ndarray, mask_coords: List[BBox]) -> np.ndarray:
-        """Apply rectangular mask, then threshold, then downscale."""
-        masked = self._apply_masking(image, mask_coords)
-        gray = cv2.cvtColor(masked, cv2.COLOR_RGB2GRAY)
-<<<<<<< HEAD
-        binary = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)[1]
-        return cv2.resize(binary, None, fx=1/self.scale_factor, fy=1/self.scale_factor)
-=======
-        binary_full = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)[1]
->>>>>>> temp/test-integration
-        kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (1, 1))
-        dilated = cv2.dilate(binary_full, kernel, iterations=2)
-        # Downscale
-        binary_downscaled = cv2.resize(
-            dilated,
-            None,
-            fx=self.scale_factor,
-            fy=self.scale_factor
-        )
-        return binary_downscaled
-    def _apply_masking(self, image: np.ndarray, mask_coords: List[BBox]) -> np.ndarray:
-        """White-out rectangular areas to ignore them."""
-        masked = image.copy()
-        for bbox in mask_coords:
-            x1, y1 = int(bbox.xmin), int(bbox.ymin)
-            x2, y2 = int(bbox.xmax), int(bbox.ymax)
-            cv2.rectangle(masked, (x1, y1), (x2, y2), (255, 255, 255), -1)
-        return masked
-    def _run_model_inference(self, downscaled_binary: np.ndarray) -> np.ndarray:
-        """Run DeepLSD on the downscaled binary image, returning raw lines [N, 2, 2]."""
-        tensor = torch.tensor(downscaled_binary, dtype=torch.float32, device=self.device)[None, None] / 255.0
-        # tensor = torch.tensor(downscaled_binary, dtype=torch.float32, device=self.device)[None, None] / 255.0
-        with torch.no_grad():
-            output = self.model({"image": tensor})
-            # shape: [batch, num_lines, 2, 2]
-            return output["lines"][0]
-    def _create_lines_from_output(self, model_output: np.ndarray) -> List[Line]:
-        """
-        Convert each [2,2] line segment into a minimal Line with naive endpoints (type=END).
-        Coordinates are in downscaled space.
-        """
-        lines = []
-        for endpoints in model_output:
-            (x1, y1), (x2, y2) = endpoints  # shape (2,) each
-            p_start = self._create_point(x1, y1)
-            p_end   = self._create_point(x2, y2)
-            # minimal bounding box in downscaled coords
-            x_min = min(x1, x2)
-            x_max = max(x1, x2)
-            y_min = min(y1, y2)
-            y_max = max(y1, y2)
-            line_obj = Line(
-                start=p_start,
-                end=p_end,
-                bbox=BBox(
-                    xmin=int(x_min),
-                    ymin=int(y_min),
-                    xmax=int(x_max),
-                    ymax=int(y_max)
-                ),
-                # style / confidence / ID assigned by default
-                style=LineStyle(
-                    connection_type=ConnectionType.SOLID,
-                    stroke_width=2,
-                    color="#000000"
-                ),
-                confidence=0.9,
-                topological_links=[]
-            )
-            lines.append(line_obj)
-        return lines
-    def _create_point(self, x: float, y: float) -> Point:
-        """
-        Creates a naive 'END'-type Point at downscaled coords.
-        We'll scale it later.
-        """
-        margin = 2
-        return Point(
-            coords=Coordinates(x=int(x), y=int(y)),
-            bbox=BBox(
-                xmin=int(x - margin),
-                ymin=int(y - margin),
-                xmax=int(x + margin),
-                ymax=int(y + margin)
-            ),
-            type=JunctionType.END,  # no classification here
-            confidence=1.0
-        )
-    def _scale_line(self, line: Line) -> Line:
-        """
-        Scale line's start/end points + bounding box to original resolution.
-        """
-        scaled_start = self._scale_point(line.start)
-        scaled_end = self._scale_point(line.end)
-        # recalc bounding box in original scale
-        new_bbox = BBox(
-            xmin=min(scaled_start.bbox.xmin, scaled_end.bbox.xmin),
-            ymin=min(scaled_start.bbox.ymin, scaled_end.bbox.ymin),
-            xmax=max(scaled_start.bbox.xmax, scaled_end.bbox.xmax),
-            ymax=max(scaled_start.bbox.ymax, scaled_end.bbox.ymax)
-        )
-        return replace(line, start=scaled_start, end=scaled_end, bbox=new_bbox)
-    def _scale_point(self, point: Point) -> Point:
-        sx = int(point.coords.x * 1/self.scale_factor)
-        sy = int(point.coords.y * 1/self.scale_factor)
-        bb = point.bbox
-        scaled_bbox = BBox(
-            xmin=int(bb.xmin * 1/self.scale_factor),
-            ymin=int(bb.ymin * 1/self.scale_factor),
-            xmax=int(bb.xmax * 1/self.scale_factor),
-            ymax=int(bb.ymax * 1/self.scale_factor)
-        )
-        return replace(point, coords=Coordinates(sx, sy), bbox=scaled_bbox)
-class PointDetector(BaseDetector):
-    """
-    A detector that:
-      1) Reads lines from the context
-      2) Clusters endpoints within 'threshold_distance'
-      3) Updates lines so that shared endpoints reference the same Point object
-    """
-    def __init__(self,
-                 config:PointConfig,
-                 debug_handler: DebugHandler = None):
-        super().__init__(config, debug_handler)  # No real model to load
-        self.threshold_distance = config.threshold_distance
-    def _load_model(self, model_path: str):
-        """No model needed for simple point unification."""
-        return None
-    def detect(self, image: np.ndarray, context: DetectionContext, *args, **kwargs) -> None:
-        """
-        Main method called by the pipeline.
-        1) Gather all line endpoints from context
-        2) Cluster them within 'threshold_distance'
-        3) Update the line endpoints so they reference the unified cluster point
-        """
-        # 1) Collect all endpoints
-        endpoints = []
-        for line in context.lines.values():
-            endpoints.append(line.start)
-            endpoints.append(line.end)
-        # 2) Cluster endpoints
-        clusters = self._cluster_points(endpoints, self.threshold_distance)
-        # 3) Build a dictionary of "representative" points
-        #    So that each cluster has one "canonical" point
-        #    Then we link all the points in that cluster to the canonical reference
-        unified_point_map = {}
-        for cluster in clusters:
-            # let's pick the first point in the cluster as the "representative"
-            rep_point = cluster[0]
-            for p in cluster[1:]:
-                unified_point_map[p.id] = rep_point
-        # 4) Update all lines to reference the canonical point
-        for line in context.lines.values():
-            # unify start
-            if line.start.id in unified_point_map:
-                line.start = unified_point_map[line.start.id]
-            # unify end
-            if line.end.id in unified_point_map:
-                line.end = unified_point_map[line.end.id]
-        # We could also store the final set of unique points back in context.points
-        # (e.g. clearing old duplicates).
-        # That step is optional: you might prefer to keep everything in lines only,
-        # or you might want context.points as a separate reference.
-        # If you want to keep unique points in context.points:
-        new_points = {}
-        for line in context.lines.values():
-            new_points[line.start.id] = line.start
-            new_points[line.end.id] = line.end
-        context.points = new_points  # replace the dictionary of points
-    def _preprocess(self, image: np.ndarray) -> np.ndarray:
-        """No specific image preprocessing needed."""
-        return image
-    def _postprocess(self, image: np.ndarray) -> np.ndarray:
-        """No specific image postprocessing needed."""
-        return image
-    # ----------------------
-    # HELPER: clustering
-    # ----------------------
-    def _cluster_points(self, points: List[Point], threshold: float) -> List[List[Point]]:
-        """
-        Very naive clustering:
-         1) Start from the first point
-         2) If it's within threshold of an existing cluster's representative,
-            put it in that cluster
-         3) Otherwise start a new cluster
-        Return: list of clusters, each is a list of Points
-        """
-        clusters = []
-        for pt in points:
-            placed = False
-            for cluster in clusters:
-                # pick the first point in the cluster as reference
-                ref_pt = cluster[0]
-                if self._distance(pt, ref_pt) < threshold:
-                    cluster.append(pt)
-                    placed = True
-                    break
-            if not placed:
-                clusters.append([pt])
-        return clusters
-    def _distance(self, p1: Point, p2: Point) -> float:
-        dx = p1.coords.x - p2.coords.x
-        dy = p1.coords.y - p2.coords.y
-        return sqrt(dx*dx + dy*dy)
-class JunctionDetector(BaseDetector):
-    """
-    Classifies points as 'END', 'L', or 'T' by skeletonizing the binarized image
-    and analyzing local connectivity. Also creates Junction objects in the context.
-    """
-    def __init__(self, config: JunctionConfig, debug_handler: DebugHandler = None):
-        super().__init__(config, debug_handler)  # no real model path
-        self.window_size = config.window_size
-        self.radius = config.radius
-        self.angle_threshold_lb = config.angle_threshold_lb
-        self.angle_threshold_ub = config.angle_threshold_ub
-        self.debug_handler = debug_handler or DebugHandler()
-    def _load_model(self, model_path: str):
-        """Not loading any actual model, just skeleton logic."""
-        return None
-    def detect(self,
-               image: np.ndarray,
-               context: DetectionContext,
-               *args,
-               **kwargs) -> None:
-        """
-        1) Convert to binary & skeletonize
-        2) Classify each point in the context
-        3) Create a Junction for each point and store it in context.junctions
-           (with 'connected_lines' referencing lines that share this point).
-        """
-        # 1) Preprocess -> skeleton
-        skeleton = self._create_skeleton(image)
-        # 2) Classify each point
-        for pt in context.points.values():
-            pt.type = self._classify_point(skeleton, pt)
-        # 3) Create a Junction object for each point
-        #    If you prefer only T or L, you can filter out END points.
-        self._record_junctions_in_context(context)
-    def _preprocess(self, image: np.ndarray) -> np.ndarray:
-        """We might do thresholding; let's do a simple binary threshold."""
-        if image.ndim == 3:
-            gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
-        else:
-            gray = image
-        _, bin_image = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)
-        return bin_image
-    def _postprocess(self, image: np.ndarray) -> np.ndarray:
-        return image
-    def _create_skeleton(self, raw_image: np.ndarray) -> np.ndarray:
-        """Skeletonize the binarized image."""
-        bin_img = self._preprocess(raw_image)
-        # For skeletonize, we need a boolean array
-        inv = cv2.bitwise_not(bin_img)
-        inv_bool = (inv > 127).astype(np.uint8)
-        skel = skeletonize(inv_bool).astype(np.uint8) * 255
-        return skel
-    def _classify_point(self, skeleton: np.ndarray, pt: Point) -> JunctionType:
-        """
-        Given a skeleton image, look around 'pt' in a local window
-        to determine if it's an END, L, or T.
-        """
-        classification = JunctionType.END  # default
-        half_w = self.window_size // 2
-        x, y = pt.coords.x, pt.coords.y
-        top    = max(0, y - half_w)
-        bottom = min(skeleton.shape[0], y + half_w + 1)
-        left   = max(0, x - half_w)
-        right  = min(skeleton.shape[1], x + half_w + 1)
-        patch = (skeleton[top:bottom, left:right] > 127).astype(np.uint8)
-        # create circular mask
-        circle_mask = np.zeros_like(patch, dtype=np.uint8)
-        local_cx = x - left
-        local_cy = y - top
-        cv2.circle(circle_mask, (local_cx, local_cy), self.radius, 1, -1)
-        circle_skel = patch & circle_mask
-        # label connected regions
-        labeled = label(circle_skel, connectivity=2)
-        num_exits = labeled.max()
-        if num_exits == 1:
-            classification = JunctionType.END
-        elif num_exits == 2:
-            # check angle for L
-            classification = self._check_angle_for_L(labeled)
-        elif num_exits == 3:
-            classification = JunctionType.T
-        return classification
-    def _check_angle_for_L(self, labeled_region: np.ndarray) -> JunctionType:
-        """
-        If the angle between two branches is within
-        [angle_threshold_lb, angle_threshold_ub], it's 'L'.
-        Otherwise default to END.
-        """
-        coords = np.argwhere(labeled_region == 1)
-        if len(coords) < 2:
-            return JunctionType.END
-        (y1, x1), (y2, x2) = coords[:2]
-        dx = x2 - x1
-        dy = y2 - y1
-        angle = math.degrees(math.atan2(dy, dx))
-        acute_angle = min(abs(angle), 180 - abs(angle))
-        if self.angle_threshold_lb <= acute_angle <= self.angle_threshold_ub:
-            return JunctionType.L
-        return JunctionType.END
-    # -----------------------------------------
-    #  EXTRA STEP: Create Junction objects
-    # -----------------------------------------
-    def _record_junctions_in_context(self, context: DetectionContext):
-        """
-        Create a Junction object for each point in context.points.
-        If you only want T/L points as junctions, filter them out.
-        Also track any lines that connect to this point.
-        """
-        for pt in context.points.values():
-            # If you prefer to store all points as junction, do it:
-            # or if you want only T or L, do:
-            # if pt.type in {JunctionType.T, JunctionType.L}: ...
-            jn = Junction(
-                center=pt.coords,
-                junction_type=pt.type,
-                # add more properties if needed
-            )
-            # find lines that connect to this point
-            connected_lines = []
-            for ln in context.lines.values():
-                if ln.start.id == pt.id or ln.end.id == pt.id:
-                    connected_lines.append(ln.id)
-            jn.connected_lines = connected_lines
-            # add to context
-            context.add_junction(jn)
-# from loguru import logger
-#
-#
-# class SymbolDetector(BaseDetector):
-#     """
-#     YOLO-based symbol detector using multiple confidence thresholds,
-#     merges final detections, and stores them in the context.
-#     """
-#
-#     def __init__(self, config: SymbolConfig, debug_handler: Optional[DebugHandler] = None):
-#         super().__init__(config, debug_handler)
-#         self.config = config
-#         self.debug_handler = debug_handler or DebugHandler()
-#         self.models = self._load_models()
-#         self.class_map = self._build_class_map()
-#
-#         logger.info("Symbol detector initialized with config: %s", self.config)
-#
-#     # -----------------------------
-#     # BaseDetector Implementation
-#     # -----------------------------
-#     def _load_model(self, model_path: str):
-#         """We won't use this single-model loader; see _load_models()."""
-#         pass
-#
-#     def detect(self,
-#                image: np.ndarray,
-#                context: DetectionContext,
-#                roi_offset: Tuple[int, int],
-#                *args,
-#                **kwargs) -> None:
-#         """
-#         Run multi-threshold YOLO detection for each model, pick best threshold,
-#         merge detections, and store Symbol objects in context.
-#         """
-#         try:
-#             with self.debug_handler.track_performance("symbol_detection"):
-#                 # 1) Possibly preprocess & resize
-#                 processed_img = self._preprocess(image)
-#                 resized_img, scale_factor = self._resize_image(processed_img)
-#
-#                 # 2) Detect with all models, each using multiple thresholds
-#                 all_detections = []
-#                 for model_name, model in self.models.items():
-#                     best_detections = self._detect_best_threshold(
-#                         model, resized_img, image.shape, scale_factor, model_name
-#                     )
-#                     all_detections.extend(best_detections)
-#
-#                 # 3) Merge detections using NMS logic
-#                 merged_detections = self._merge_detections(all_detections)
-#
-#                 # 4) Update context with final symbols
-#                 self._update_context(merged_detections, context)
-#
-#                 # 5) Create optional debug image artifact
-#                 debug_image = self._create_debug_image(processed_img, merged_detections)
-#                 _, debug_img_encoded = cv2.imencode('.jpg', debug_image)
-#                 self.debug_handler.save_artifact(
-#                     name="symbol_detection_debug",
-#                     data=debug_img_encoded.tobytes(),
-#                     extension="jpg"
-#                 )
-#
-#         except Exception as e:
-#             logger.error("Symbol detection failed: %s", str(e), exc_info=True)
-#             self.debug_handler.save_artifact(
-#                 name="symbol_detection_error",
-#                 data=f"Detection error: {str(e)}".encode('utf-8'),
-#                 extension="txt"
-#             )
-#
-#     def _preprocess(self, image: np.ndarray) -> np.ndarray:
-#         """Preprocess if needed (e.g., histogram equalization)."""
-#         if self.config.apply_preprocessing:
-#             gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
-#             equalized = cv2.equalizeHist(gray)
-#             # convert back to BGR for YOLO
-#             return cv2.cvtColor(equalized, cv2.COLOR_GRAY2BGR)
-#         return image.copy()
-#
-#     def _postprocess(self, image: np.ndarray) -> np.ndarray:
-#         return None
-#
-#     # -----------------------------
-#     # Internal Helpers
-#     # -----------------------------
-#     def _load_models(self) -> Dict[str, YOLO]:
-#         """Load multiple YOLO models from config."""
-#         models = {}
-#         for model_name, path_str in self.config.model_paths.items():
-#             path = Path(path_str)
-#             if not path.exists():
-#                 raise FileNotFoundError(f"Model file not found: {path_str}")
-#             models[model_name] = YOLO(str(path))
-#             logger.info(f"Loaded model '{model_name}' from {path_str}")
-#         return models
-#
-#     def _build_class_map(self) -> Dict[int, SymbolType]:
-#         """
-#         Convert config symbol_type_mapping (like {"pump": "PUMP"})
-#         into a dictionary from YOLO class_id to SymbolType.
-#         If you have a fixed list of YOLO classes, you can map them here.
-#         """
-#         # For example, if YOLO has classes like ["valve", "pump", ...],
-#         # you might want to do something more dynamic.
-#         # For now, let's just return an empty dict or handle it in detection.
-#         return {}
-#
-#     def _resize_image(self, image: np.ndarray) -> Tuple[np.ndarray, float]:
-#         """Resize while maintaining aspect ratio if needed."""
-#         h, w = image.shape[:2]
-#         if not self.config.resize_image:
-#             return image, 1.0
-#
-#         if max(w, h) > self.config.max_dimension:
-#             scale = self.config.max_dimension / max(w, h)
-#             new_w, new_h = int(w * scale), int(h * scale)
-#             resized = cv2.resize(image, (new_w, new_h), interpolation=cv2.INTER_LINEAR)
-#             return resized, scale
-#         return image, 1.0
-#
-#     def _detect_best_threshold(self,
-#                                model: YOLO,
-#                                resized_img: np.ndarray,
-#                                orig_shape: Tuple[int, int, int],
-#                                scale_factor: float,
-#                                model_name: str) -> List[Dict]:
-#         """
-#         Run detection across multiple confidence thresholds.
-#         Use the threshold that yields the 'best metric' (currently # of detections).
-#         """
-#         best_metric = -1
-#         best_threshold = 0.5
-#         best_detections_list = []
-#
-#         # Evaluate each threshold
-#         for thresh in self.config.confidence_thresholds:
-#             # Run YOLO detection
-#             # Setting conf=thresh or conf=0.0 + we do filtering ourselves.
-#             results = model.predict(
-#                 source=resized_img,
-#                 imgsz=self.config.max_dimension,
-#                 conf=0.0,  # We'll filter manually below
-#                 verbose=False
-#             )
-#
-#             # Convert to detection dict
-#             detections_list = []
-#             for result in results:
-#                 for box in result.boxes:
-#                     conf_val = float(box.conf[0])
-#                     if conf_val >= thresh:
-#                         # Convert bounding box coords to original (local) coords
-#                         x1, y1, x2, y2 = self._scale_coordinates(
-#                             box.xyxy[0].cpu().numpy(),
-#                             resized_img.shape,  # shape after resizing
-#                             scale_factor
-#                         )
-#                         class_id = int(box.cls[0])
-#                         label = result.names[class_id] if result.names else "unknown_label"
-#
-#                         # parse label (category, type, new_label)
-#                         category, type_str, new_label = self._parse_label(label)
-#
-#                         detection_info = {
-#                             "symbol_id": str(uuid.uuid4()),
-#                             "class_id": class_id,
-#                             "original_label": label,
-#                             "category": category,
-#                             "type": type_str,
-#                             "label": new_label,
-#                             "confidence": conf_val,
-#                             "bbox": [x1, y1, x2, y2],
-#                             "model_source": model_name
-#                         }
-#                         detections_list.append(detection_info)
-#
-#             # Evaluate
-#             metric = self._evaluate_detections(detections_list)
-#             if metric > best_metric:
-#                 best_metric = metric
-#                 best_threshold = thresh
-#                 best_detections_list = detections_list
-#
-#         logger.info(f"For model {model_name}, best threshold={best_threshold:.2f} with {best_metric} detections.")
-#         return best_detections_list
-#
-#     def _evaluate_detections(self, detections_list: List[Dict]) -> int:
-#         """A simple metric: # of detections."""
-#         return len(detections_list)
-#
-#     def _parse_label(self, label: str) -> Tuple[str, str, str]:
-#         """
-#         Attempt to parse the YOLO label into (category, type, new_label).
-#         Example label: "inst_ind_Solenoid_actuator"
-#            -> category=inst, type=ind, new_label="Solenoid_actuator"
-#         If no underscores, we fallback to "Unknown" for type.
-#         """
-#         split_label = label.split('_')
-#         if len(split_label) >= 3:
-#             category = split_label[0]
-#             type_ = split_label[1]
-#             new_label = '_'.join(split_label[2:])
-#         elif len(split_label) == 2:
-#             category = split_label[0]
-#             type_ = split_label[1]
-#             new_label = split_label[1]
-#         elif len(split_label) == 1:
-#             category = split_label[0]
-#             type_ = "Unknown"
-#             new_label = split_label[0]
-#         else:
-#             logger.warning(f"Unexpected label format: {label}")
-#             return ("Unknown", "Unknown", label)
-#
-#         return (category, type_, new_label)
-#
-#     def _scale_coordinates(self,
-#                            coords: np.ndarray,
-#                            resized_shape: Tuple[int, int, int],
-#                            scale_factor: float) -> Tuple[int, int, int, int]:
-#         """
-#         Scale YOLO's [x1,y1,x2,y2] from the resized image back to the original local coords.
-#         """
-#         x1, y1, x2, y2 = coords
-#         # Because we resized by scale_factor
-#         # so original coordinate = coords / scale_factor
-#         return (
-#             int(x1 / scale_factor),
-#             int(y1 / scale_factor),
-#             int(x2 / scale_factor),
-#             int(y2 / scale_factor),
-#         )
-#
-#     def _merge_detections(self, all_detections: List[Dict]) -> List[Dict]:
-#         """Merge using NMS-like approach (IoU-based) across all models."""
-#         if not all_detections:
-#             return []
-#
-#         # Sort by confidence (descending)
-#         all_detections.sort(key=lambda x: x['confidence'], reverse=True)
-#         keep = [True] * len(all_detections)
-#
-#         for i in range(len(all_detections)):
-#             if not keep[i]:
-#                 continue
-#             for j in range(i + 1, len(all_detections)):
-#                 if not keep[j]:
-#                     continue
-#                 # Merge if same class_id & high IoU
-#                 if (all_detections[i]['class_id'] == all_detections[j]['class_id'] and
-#                     self._calculate_iou(all_detections[i]['bbox'], all_detections[j]['bbox']) > 0.5):
-#                     keep[j] = False
-#
-#         return [det for idx, det in enumerate(all_detections) if keep[idx]]
-#
-#     def _calculate_iou(self, box1: List[int], box2: List[int]) -> float:
-#         """Intersection over Union"""
-#         x_left   = max(box1[0], box2[0])
-#         y_top    = max(box1[1], box2[1])
-#         x_right  = min(box1[2], box2[2])
-#         y_bottom = min(box1[3], box2[3])
-#
-#         inter_w = max(0, x_right - x_left)
-#         inter_h = max(0, y_bottom - y_top)
-#         intersection = inter_w * inter_h
-#
-#         area1 = (box1[2] - box1[0]) * (box1[3] - box1[1])
-#         area2 = (box2[2] - box2[0]) * (box2[3] - box2[1])
-#         union = float(area1 + area2 - intersection)
-#         return intersection / union if union > 0 else 0.0
-#
-#     def _update_context(self, detections: List[Dict], context: DetectionContext) -> None:
-#         """Convert final detections into Symbol objects & add to context."""
-#         for det in detections:
-#             x1, y1, x2, y2 = det['bbox']
-#             # Use your Symbol dataclass from detection_schema
-#             symbol_obj = Symbol(
-#                 bbox=BBox(xmin=x1, ymin=y1, xmax=x2, ymax=y2),
-#                 center=Coordinates(x=(x1 + x2) // 2, y=(y1 + y2) // 2),
-#                 symbol_type=SymbolType.OTHER,  # default
-#                 confidence=det['confidence'],
-#                 model_source=det['model_source'],
-#                 class_id=det['class_id'],
-#                 original_label=det['original_label'],
-#                 category=det['category'],
-#                 type=det['type'],
-#                 label=det['label']
-#             )
-#             context.add_symbol(symbol_obj)
-#
-#     def _create_debug_image(self, image: np.ndarray, detections: List[Dict]) -> np.ndarray:
-#         """Optional: draw bounding boxes & labels on a copy of 'image'."""
-#         debug_img = image.copy()
-#         for det in detections:
-#             x1, y1, x2, y2 = det['bbox']
-#             cv2.rectangle(debug_img, (x1, y1), (x2, y2), (0, 255, 0), 2)
-#             txt = f"{det['label']} {det['confidence']:.2f}"
-#             cv2.putText(debug_img, txt, (x1, max(0, y1 - 10)),
-#                         cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 1)
-#         return debug_img
-#
-#
-# class TagDetector(BaseDetector):
-#     """
-#     A placeholder detector that reads precomputed tag data
-#     from a JSON file and populates the context with Tag objects.
-#     """
-#
-#     def __init__(self,
-#                  config: TagConfig,
-#                  debug_handler: Optional[DebugHandler] = None,
-#                  tag_json_path: str = "./tags.json"):
-#         super().__init__(config=config, debug_handler=debug_handler)
-#         self.tag_json_path = tag_json_path
-#
-#     def _load_model(self, model_path: str):
-#         """Not loading an actual model; tag data is read from JSON."""
-#         return None
-#
-#     def detect(self,
-#                image: np.ndarray,
-#                context: DetectionContext,
-#                roi_offset: Tuple[int, int],
-#                *args,
-#                **kwargs) -> None:
-#         """
-#         Reads from a JSON file containing tag info,
-#         adjusts coordinates using roi_offset, and updates context.
-#         """
-#
-#         tag_data = self._load_json_data(self.tag_json_path)
-#         if not tag_data:
-#             return
-#
-#         x_min, y_min = roi_offset  # Offset values from cropping
-#
-#         for record in tag_data.get("detections", []):  # Fix: Use "detections" key
-#             tag_obj = self._parse_tag_record(record, x_min, y_min)
-#             context.add_tag(tag_obj)
-#
-#     def _preprocess(self, image: np.ndarray) -> np.ndarray:
-#         return image
-#
-#     def _postprocess(self, image: np.ndarray) -> np.ndarray:
-#         return image
-#
-#     # --------------
-#     # HELPER METHODS
-#     # --------------
-#     def _load_json_data(self, json_path: str) -> dict:
-#         if not os.path.exists(json_path):
-#             self.debug_handler.save_artifact(name="tag_error",
-#                                              data=b"Missing tag JSON file",
-#                                              extension="txt")
-#             return {}
-#
-#         with open(json_path, "r", encoding="utf-8") as f:
-#             return json.load(f)
-#
-#     def _parse_tag_record(self, record: dict, x_min: int, y_min: int) -> Tag:
-#         """
-#         Builds a Tag object from a JSON record, adjusting coordinates for cropping.
-#         """
-#         bbox_list = record.get("bbox", [0, 0, 0, 0])
-#         bbox_obj = BBox(
-#             xmin=bbox_list[0] - x_min,
-#             ymin=bbox_list[1] - y_min,
-#             xmax=bbox_list[2] - x_min,
-#             ymax=bbox_list[3] - y_min
-#         )
-#
-#         return Tag(
-#             text=record.get("text", ""),
-#             bbox=bbox_obj,
-#             confidence=record.get("confidence", 1.0),
-#             source=record.get("source", ""),
-#             text_type=record.get("text_type", "Unknown"),
-#             id=record.get("id", str(uuid.uuid4())),
-#             font_size=record.get("font_size", 12),
-#             rotation=record.get("rotation", 0.0)
-#         )
-import json
-import uuid
-class SymbolDetector(BaseDetector):
-    """
-    Placeholder detector that loads precomputed symbol records from a JSON
-    file and adds them to the context as Symbol objects. No model is run.
-    """
-    def __init__(self,
-                 config: SymbolConfig,
-                 debug_handler: Optional[DebugHandler] = None,
-                 symbol_json_path: str = "./symbols.json"):
-        """
-        Args:
-            config: Symbol configuration, forwarded to BaseDetector.
-            debug_handler: Optional handler used to record a missing-file artifact.
-            symbol_json_path: Path of the JSON file holding the symbol records.
-        """
-        super().__init__(config=config, debug_handler=debug_handler)
-        self.symbol_json_path = symbol_json_path
-    def _load_model(self, model_path: str):
-        """Not loading an actual model; symbol data is read from JSON."""
-        return None
-    def detect(self,
-               image: np.ndarray,
-               context: DetectionContext,
-               roi_offset: Tuple[int, int],
-               *args,
-               **kwargs) -> None:
-        """
-        Read the symbol JSON file, shift every bbox by roi_offset, and add the
-        resulting Symbol objects to context.
-
-        `image`, `*args` and `**kwargs` are accepted but not read here.
-        Returns None; does nothing when the JSON file is missing or empty.
-        """
-        symbol_data = self._load_json_data(self.symbol_json_path)
-        if not symbol_data:
-            return
-        x_min, y_min = roi_offset  # Offset values from cropping
-        # Records live under the top-level "detections" key of the JSON document.
-        for record in symbol_data.get("detections", []):
-            sym_obj = self._parse_symbol_record(record, x_min, y_min)
-            context.add_symbol(sym_obj)
-    def _preprocess(self, image: np.ndarray) -> np.ndarray:
-        """Return the image unchanged (no preprocessing is needed)."""
-        return image
-    def _postprocess(self, image: np.ndarray) -> np.ndarray:
-        """Return the image unchanged (no postprocessing is needed)."""
-        return image
-    # --------------
-    # HELPER METHODS
-    # --------------
-    def _load_json_data(self, json_path: str) -> dict:
-        """
-        Return the parsed JSON document at json_path, or {} when the file
-        does not exist.
-        """
-        if not os.path.exists(json_path):
-            # debug_handler defaults to None in __init__, so only record the
-            # error artifact when a handler is actually attached.
-            if self.debug_handler is not None:
-                self.debug_handler.save_artifact(name="symbol_error",
-                                                 data=b"Missing symbol JSON file",
-                                                 extension="txt")
-            return {}
-        with open(json_path, "r", encoding="utf-8") as f:
-            return json.load(f)
-    def _parse_symbol_record(self, record: dict, x_min: int, y_min: int) -> Symbol:
-        """
-        Build a Symbol from one JSON record, subtracting (x_min, y_min) from
-        the record's bbox. Missing keys fall back to the defaults given below.
-        """
-        bbox_list = record.get("bbox", [0, 0, 0, 0])
-        bbox_obj = BBox(
-            xmin=bbox_list[0] - x_min,
-            ymin=bbox_list[1] - y_min,
-            xmax=bbox_list[2] - x_min,
-            ymax=bbox_list[3] - y_min
-        )
-        # Center is the floor-divided midpoint of the shifted bbox.
-        center_coords = Coordinates(
-            x=(bbox_obj.xmin + bbox_obj.xmax) // 2,
-            y=(bbox_obj.ymin + bbox_obj.ymax) // 2
-        )
-        return Symbol(
-            id=record.get("symbol_id", ""),
-            class_id=record.get("class_id", -1),
-            original_label=record.get("original_label", ""),
-            category=record.get("category", ""),
-            type=record.get("type", ""),
-            label=record.get("label", ""),
-            bbox=bbox_obj,
-            center=center_coords,
-            confidence=record.get("confidence", 0.95),
-            model_source=record.get("model_source", ""),
-            connections=[]
-        )
-class TagDetector(BaseDetector):
-    """
-    Placeholder detector that loads precomputed tag records from a JSON
-    file and adds them to the context as Tag objects. No model is run.
-    """
-    def __init__(self,
-                 config: TagConfig,
-                 debug_handler: Optional[DebugHandler] = None,
-                 tag_json_path: str = "./tags.json"):
-        """
-        Args:
-            config: Tag configuration, forwarded to BaseDetector.
-            debug_handler: Optional handler used to record a missing-file artifact.
-            tag_json_path: Path of the JSON file holding the tag records.
-        """
-        super().__init__(config=config, debug_handler=debug_handler)
-        self.tag_json_path = tag_json_path
-    def _load_model(self, model_path: str):
-        """Not loading an actual model; tag data is read from JSON."""
-        return None
-    def detect(self,
-               image: np.ndarray,
-               context: DetectionContext,
-               roi_offset: Tuple[int, int],
-               *args,
-               **kwargs) -> None:
-        """
-        Read the tag JSON file, shift every bbox by roi_offset, and add the
-        resulting Tag objects to context.
-
-        `image`, `*args` and `**kwargs` are accepted but not read here.
-        Returns None; does nothing when the JSON file is missing or empty.
-        """
-        tag_data = self._load_json_data(self.tag_json_path)
-        if not tag_data:
-            return
-        x_min, y_min = roi_offset  # Offset values from cropping
-        # Records live under the top-level "detections" key of the JSON document.
-        for record in tag_data.get("detections", []):
-            tag_obj = self._parse_tag_record(record, x_min, y_min)
-            context.add_tag(tag_obj)
-    def _preprocess(self, image: np.ndarray) -> np.ndarray:
-        """Return the image unchanged (no preprocessing is needed)."""
-        return image
-    def _postprocess(self, image: np.ndarray) -> np.ndarray:
-        """Return the image unchanged (no postprocessing is needed)."""
-        return image
-    # --------------
-    # HELPER METHODS
-    # --------------
-    def _load_json_data(self, json_path: str) -> dict:
-        """
-        Return the parsed JSON document at json_path, or {} when the file
-        does not exist.
-        """
-        if not os.path.exists(json_path):
-            # debug_handler defaults to None in __init__, so only record the
-            # error artifact when a handler is actually attached.
-            if self.debug_handler is not None:
-                self.debug_handler.save_artifact(name="tag_error",
-                                                 data=b"Missing tag JSON file",
-                                                 extension="txt")
-            return {}
-        with open(json_path, "r", encoding="utf-8") as f:
-            return json.load(f)
-    def _parse_tag_record(self, record: dict, x_min: int, y_min: int) -> Tag:
-        """
-        Build a Tag from one JSON record, subtracting (x_min, y_min) from the
-        record's bbox. Missing keys fall back to the defaults given below;
-        a record without an "id" receives a freshly generated UUID string.
-        """
-        bbox_list = record.get("bbox", [0, 0, 0, 0])
-        bbox_obj = BBox(
-            xmin=bbox_list[0] - x_min,
-            ymin=bbox_list[1] - y_min,
-            xmax=bbox_list[2] - x_min,
-            ymax=bbox_list[3] - y_min
-        )
-        return Tag(
-            text=record.get("text", ""),
-            bbox=bbox_obj,
-            confidence=record.get("confidence", 1.0),
-            source=record.get("source", ""),
-            text_type=record.get("text_type", "Unknown"),
-            id=record.get("id", str(uuid.uuid4())),
-            font_size=record.get("font_size", 12),
-            rotation=record.get("rotation", 0.0)
-        )

 import torch
 import cv2
 import numpy as np
+from typing import List, Optional, Tuple, Dict, Any
 from dataclasses import replace
 from math import sqrt
 import json
 import uuid
 from pathlib import Path
+from abc import ABC, abstractmethod
+from ultralytics import YOLO
+from PIL import Image
+import matplotlib.pyplot as plt
+from storage import StorageInterface
 # Base classes and utilities
 from base import BaseDetector
 # DeepLSD model for line detection
 from deeplsd.models.deeplsd_inference import DeepLSD
 # Detection schema: dataclasses for different objects
 from detection_schema import (
 from skimage.morphology import skeletonize
 from skimage.measure import label
+# Configure logging
+# NOTE(review): no `import logging` is visible among this module's imports, so
+# it is imported here, next to its only use, to avoid a NameError at import time.
+import logging
+logger = logging.getLogger(__name__)
+class Detector(ABC):
+    """Abstract parent of every detector; holds a config and an optional debug handler."""
+    def __init__(self, config: Any, debug_handler=None):
+        # Stored as plain attributes so subclasses can read them directly.
+        self.config = config
         self.debug_handler = debug_handler
+    @abstractmethod
+    def detect(self, image: np.ndarray) -> Dict:
+        """Run detection on `image`; concrete subclasses must override this."""
         pass
+    def save_debug_image(self, image: np.ndarray, filename: str):
+        """Pass `image` and `filename` to the debug handler's save_image, if a handler is set."""
+        handler = self.debug_handler
+        if not handler:
+            return
+        handler.save_image(image, filename)
+class SymbolDetector(Detector):
+    """Detector for symbols in P&ID diagrams, backed by one or more YOLO models."""
+    def __init__(self, config, debug_handler=None):
+        """
+        Load a YOLO model for every entry of `config.model_paths` whose file exists.
+
+        Entries whose path is missing are logged as warnings and skipped, so
+        `self.models` may end up empty.
+        """
+        super().__init__(config, debug_handler)
+        self.models = {}
+        for name, path in config.model_paths.items():
+            if os.path.exists(path):
+                self.models[name] = YOLO(path)
+            else:
+                # Lazy %-formatting: same message text, built only if the record is emitted.
+                logger.warning("Model not found at %s", path)
+    def detect(self, image: np.ndarray) -> Dict:
+        """
+        Detect symbols using multiple YOLO models.
+
+        Runs every loaded model on `image` with `config.confidence_threshold`
+        and pools the boxes of all models into one list.
+
+        Returns:
+            {'detections': [...]} where each entry has 'bbox' ([x1, y1, x2, y2]
+            as floats), 'confidence', 'class' (name looked up in the result's
+            `names` mapping) and 'model' (key of the model in `self.models`).
+        """
+        results = []
+        # Process with each model
+        for model_name, model in self.models.items():
+            model_results = model(image, conf=self.config.confidence_threshold)[0]
+            boxes = model_results.boxes
+            # `boxes` can be None when the model yields no box output
+            # (e.g. a classification checkpoint); iterating None would raise.
+            if boxes is None:
+                continue
+            # Convert each tensor to a host array once per model, not once per box.
+            coords = boxes.xyxy.cpu().numpy()
+            confs = boxes.conf.cpu().numpy()
+            classes = boxes.cls.cpu().numpy()
+            for (x1, y1, x2, y2), conf, cls in zip(coords, confs, classes):
+                cls_name = model_results.names[int(cls)]
+                results.append({
+                    'bbox': [float(x1), float(y1), float(x2), float(y2)],
+                    'confidence': float(conf),
+                    'class': cls_name,
+                    'model': model_name
+                })
+        return {'detections': results}
+class TagDetector(Detector):
+    """Text-tag detector for P&ID diagrams; currently a stub that reports no tags."""
+    def __init__(self, config, debug_handler=None):
+        """Delegate setup to Detector and leave the OCR engine unset."""
+        super().__init__(config, debug_handler)
+        # Placeholder: no OCR engine is created yet.
+        self.ocr = None
+    def detect(self, image: np.ndarray) -> Dict:
+        """Return an empty detection list; `image` is not inspected yet."""
+        # TODO: implement text detection and recognition
+        detections = []
+        return {'detections': detections}
+class LineDetector(Detector):
+    """Line detector for P&ID diagrams; currently a stub that reports no lines."""
+    def __init__(self, config, model_path=None, model_config=None, device='cpu', debug_handler=None):
+        """Record the model path, model settings and device; no model is loaded here."""
+        super().__init__(config, debug_handler)
+        self.device = device
+        self.model_path = model_path
+        # A missing (or otherwise falsy) model_config becomes a fresh empty dict.
+        self.model_config = model_config if model_config else {}
+    def detect(self, image: np.ndarray) -> Dict:
+        """Return an empty detection list; `image` is not inspected yet."""
+        # TODO: implement line detection (DeepLSD or other methods)
+        detections = []
+        return {'detections': detections}
+class PointDetector(Detector):
+    """Connection-point detector for P&ID diagrams; currently a stub that reports no points."""
+    def detect(self, image: np.ndarray) -> Dict:
+        """Return an empty detection list; `image` is not inspected yet."""
+        # TODO: implement point detection
+        detections = []
+        return {'detections': detections}
+class JunctionDetector(Detector):
+    """Line-junction detector for P&ID diagrams; currently a stub that reports no junctions."""
+    def detect(self, image: np.ndarray) -> Dict:
+        """Return an empty detection list; `image` is not inspected yet."""
+        # TODO: implement junction detection
+        detections = []
+        return {'detections': detections}