Addax-Data-Science
/

NAM-ADS-v1

Model card Files Files and versions

xet

Community

Addax-Data-Science commited on about 1 month ago

Commit

aba2956

verified ·

1 Parent(s): d7437ff

Upload inference.py

Browse files

Files changed (1) hide show

inference.py +211 -219

inference.py CHANGED Viewed

@@ -12,6 +12,7 @@ Training data: 850,000+ images
 Original source: streamlit-AddaxAI/classification/model_types/addax-yolov8/classify_detections.py
 Adapted by: Claude Code on 2026-01-11
 """
 from __future__ import annotations
@@ -24,13 +25,6 @@ import torch
 from PIL import Image, ImageFile, ImageOps
 from ultralytics import YOLO
-# Module-level variables (injected by AddaxAI framework)
-MODEL_DIR: Path | None = None  # Set by CustomInferenceLoader
-MODEL_PATH: Path | None = None  # Set by CustomInferenceLoader
-# Module-level model instance (loaded once at startup)
-animal_model: YOLO | None = None
 # Don't freak out over truncated images
 ImageFile.LOAD_TRUNCATED_IMAGES = True
@@ -40,217 +34,215 @@ if plt != 'Windows':
     pathlib.WindowsPath = pathlib.PosixPath
-def check_gpu() -> bool:
-    """
-    Check GPU availability for YOLOv8 inference.
-    Checks both Apple Metal Performance Shaders (MPS) and CUDA availability.
-    Returns:
-        True if GPU available, False otherwise
-    """
-    # Check Apple MPS (Apple Silicon)
-    try:
-        if torch.backends.mps.is_built() and torch.backends.mps.is_available():
-            return True
-    except Exception:
-        pass
-    # Check CUDA (NVIDIA)
-    return torch.cuda.is_available()
-def load_model() -> None:
-    """
-    Load YOLOv8 classification model into memory.
-    This function is called once during worker initialization.
-    The model is stored in the global `animal_model` variable and reused
-    for all subsequent classification requests.
-    Raises:
-        RuntimeError: If model loading fails
-        FileNotFoundError: If MODEL_PATH is invalid
-    """
-    global animal_model, MODEL_PATH
-    # MODEL_PATH is injected by framework before this function is called
-    # Check that the path exists (framework guarantees it's not None)
-    if not MODEL_PATH.exists():
-        raise FileNotFoundError(f"Model file not found: {MODEL_PATH}")
-    try:
-        animal_model = YOLO(str(MODEL_PATH))
-    except Exception as e:
-        raise RuntimeError(f"Failed to load YOLOv8 model from {MODEL_PATH}: {e}") from e
-def get_crop(image: Image.Image, bbox: tuple[float, float, float, float]) -> Image.Image:
-    """
-    Crop image using model-specific preprocessing.
-    This cropping method was developed by Dan Morris for MegaDetector and is
-    designed to:
-    1. Square the bounding box (max of width/height)
-    2. Add padding to prevent over-enlargement of small animals
-    3. Center the detection within the crop
-    4. Pad with black (0) to maintain square aspect ratio
-    Args:
-        image: PIL Image (full resolution)
-        bbox: Normalized bounding box (x, y, width, height) in range [0.0, 1.0]
-    Returns:
-        Cropped and padded PIL Image ready for classification
-    Raises:
-        ValueError: If bbox is invalid (zero size)
-    """
-    img_w, img_h = image.size
-    # Denormalize bbox coordinates
-    xmin = int(bbox[0] * img_w)
-    ymin = int(bbox[1] * img_h)
-    box_w = int(bbox[2] * img_w)
-    box_h = int(bbox[3] * img_h)
-    # Square the box (use max dimension)
-    box_size = max(box_w, box_h)
-    # Add padding (prevents over-enlargement of small animals)
-    box_size = _pad_crop(box_size)
-    # Center the detection within the squared crop
-    xmin = max(0, min(
-        xmin - int((box_size - box_w) / 2),
-        img_w - box_w
-    ))
-    ymin = max(0, min(
-        ymin - int((box_size - box_h) / 2),
-        img_h - box_h
-    ))
-    # Clip to image boundaries
-    box_w = min(img_w, box_size)
-    box_h = min(img_h, box_size)
-    if box_w == 0 or box_h == 0:
-        raise ValueError(f"Invalid bbox size: {box_w}x{box_h}")
-    # Crop and pad to square
-    crop = image.crop(box=[xmin, ymin, xmin + box_w, ymin + box_h])
-    crop = ImageOps.pad(crop, size=(box_size, box_size), color=0)
-    return crop
-def _pad_crop(box_size: int) -> int:
-    """
-    Calculate padded crop size to prevent over-enlargement of small animals.
-    YOLOv8 expects 224x224 input. This function ensures small detections aren't
-    excessively upscaled while adding consistent padding to larger detections.
-    Args:
-        box_size: Original bounding box size (max of width/height)
-    Returns:
-        Padded box size
-    """
-    input_size_network = 224
-    default_padding = 30
-    if box_size >= input_size_network:
-        # Large detection: add default padding
-        return box_size + default_padding
-    else:
-        # Small detection: ensure minimum size without excessive enlargement
-        diff_size = input_size_network - box_size
-        if diff_size < default_padding:
             return box_size + default_padding
         else:
-            return input_size_network
-def get_classification(crop: Image.Image) -> list[tuple[str, float]]:
-    """
-    Run YOLOv8 classification on cropped image.
-    Args:
-        crop: Cropped and preprocessed PIL Image
-    Returns:
-        List of (class_name, confidence) tuples for ALL classes, sorted by confidence.
-        Example: [("giraffe", 0.99985), ("cattle", 0.00003), ...]
-    Raises:
-        RuntimeError: If model not loaded or inference fails
-    """
-    global animal_model
-    if animal_model is None:
-        raise RuntimeError("Model not loaded - call load_model() first")
-    try:
-        # Run YOLOv8 classification (verbose=False suppresses progress bar)
-        results = animal_model(crop, verbose=False)
-        # Extract class names dict (YOLOv8 uses alphabetical order)
-        # Example: {0: "aardwolf", 1: "african wild cat", ..., 13: "giraffe", ...}
-        names_dict = results[0].names
-        # Extract probabilities: [0.0001, 0.0002, ..., 0.9998, ...]
-        probs = results[0].probs.data.tolist()
-        # Build list of (class_name, confidence) tuples
-        # Return YOLOv8's class names (which will be mapped to taxonomy IDs later)
-        classifications = []
-        for idx, class_name in names_dict.items():
-            confidence = probs[idx]
-            classifications.append((class_name, confidence))
-        # Sort by confidence descending (already sorted by YOLOv8, but ensure it)
-        classifications.sort(key=lambda x: x[1], reverse=True)
-        return classifications
-    except Exception as e:
-        raise RuntimeError(f"YOLOv8 classification failed: {e}") from e
-def get_class_names() -> dict[str, str]:
-    """
-    Get mapping of class IDs to species names from YOLOv8 model.
-    YOLOv8 stores class names in alphabetical order internally. This function
-    extracts those names and creates a 1-indexed mapping for the JSON format.
-    NOTE: taxonomy.csv is NOT used here - it's only for UI taxonomy tree display.
-    The class IDs here are YOLOv8's alphabetical indices (0-based) + 1.
-    Returns:
-        Dict mapping class ID (1-indexed string) to common name
-        Example: {"1": "aardwolf", "2": "african wild cat", ..., "14": "giraffe", ...}
-    Raises:
-        RuntimeError: If model not loaded
-    """
-    global animal_model
-    if animal_model is None:
-        raise RuntimeError("Model not loaded - call load_model() first")
-    try:
-        # YOLOv8 names dict (alphabetical order): {0: "aardwolf", 1: "african wild cat", ...}
-        yolo_names = animal_model.names
-        # Convert to 1-indexed dict for JSON compatibility
-        class_names = {}
-        for idx, name in yolo_names.items():
-            class_id_str = str(idx + 1)  # 1-indexed
-            class_names[class_id_str] = name
-        return class_names
-    except Exception as e:
-        raise RuntimeError(f"Failed to extract class names from model: {e}") from e

 Original source: streamlit-AddaxAI/classification/model_types/addax-yolov8/classify_detections.py
 Adapted by: Claude Code on 2026-01-11
+Updated: 2026-01-13 - Migrated to class-based interface
 """
 from __future__ import annotations
 from PIL import Image, ImageFile, ImageOps
 from ultralytics import YOLO
 # Don't freak out over truncated images
 ImageFile.LOAD_TRUNCATED_IMAGES = True
     pathlib.WindowsPath = pathlib.PosixPath
+class ModelInference:
+    """YOLOv8 inference implementation for Namibian Desert species classifier."""
+    def __init__(self, model_dir: Path, model_path: Path):
+        """
+        Initialize with model paths.
+        Args:
+            model_dir: Directory containing model files
+            model_path: Path to namib_desert_v1.pt file
+        """
+        self.model_dir = model_dir
+        self.model_path = model_path
+        self.model: YOLO | None = None
+    def check_gpu(self) -> bool:
+        """
+        Check GPU availability for YOLOv8 inference.
+        Checks both Apple Metal Performance Shaders (MPS) and CUDA availability.
+        Returns:
+            True if GPU available, False otherwise
+        """
+        # Check Apple MPS (Apple Silicon)
+        try:
+            if torch.backends.mps.is_built() and torch.backends.mps.is_available():
+                return True
+        except Exception:
+            pass
+        # Check CUDA (NVIDIA)
+        return torch.cuda.is_available()
+    def load_model(self) -> None:
+        """
+        Load YOLOv8 classification model into memory.
+        This function is called once during worker initialization.
+        The model is stored in self.model and reused for all subsequent
+        classification requests.
+        Raises:
+            RuntimeError: If model loading fails
+            FileNotFoundError: If model_path is invalid
+        """
+        if not self.model_path.exists():
+            raise FileNotFoundError(f"Model file not found: {self.model_path}")
+        try:
+            self.model = YOLO(str(self.model_path))
+        except Exception as e:
+            raise RuntimeError(f"Failed to load YOLOv8 model from {self.model_path}: {e}") from e
+    def get_crop(
+        self, image: Image.Image, bbox: tuple[float, float, float, float]
+    ) -> Image.Image:
+        """
+        Crop image using model-specific preprocessing.
+        This cropping method was developed by Dan Morris for MegaDetector and is
+        designed to:
+        1. Square the bounding box (max of width/height)
+        2. Add padding to prevent over-enlargement of small animals
+        3. Center the detection within the crop
+        4. Pad with black (0) to maintain square aspect ratio
+        Args:
+            image: PIL Image (full resolution)
+            bbox: Normalized bounding box (x, y, width, height) in range [0.0, 1.0]
+        Returns:
+            Cropped and padded PIL Image ready for classification
+        Raises:
+            ValueError: If bbox is invalid (zero size)
+        """
+        img_w, img_h = image.size
+        # Denormalize bbox coordinates
+        xmin = int(bbox[0] * img_w)
+        ymin = int(bbox[1] * img_h)
+        box_w = int(bbox[2] * img_w)
+        box_h = int(bbox[3] * img_h)
+        # Square the box (use max dimension)
+        box_size = max(box_w, box_h)
+        # Add padding (prevents over-enlargement of small animals)
+        box_size = self._pad_crop(box_size)
+        # Center the detection within the squared crop
+        xmin = max(0, min(xmin - int((box_size - box_w) / 2), img_w - box_w))
+        ymin = max(0, min(ymin - int((box_size - box_h) / 2), img_h - box_h))
+        # Clip to image boundaries
+        box_w = min(img_w, box_size)
+        box_h = min(img_h, box_size)
+        if box_w == 0 or box_h == 0:
+            raise ValueError(f"Invalid bbox size: {box_w}x{box_h}")
+        # Crop and pad to square
+        crop = image.crop(box=[xmin, ymin, xmin + box_w, ymin + box_h])
+        crop = ImageOps.pad(crop, size=(box_size, box_size), color=0)
+        return crop
+    def _pad_crop(self, box_size: int) -> int:
+        """
+        Calculate padded crop size to prevent over-enlargement of small animals.
+        YOLOv8 expects 224x224 input. This function ensures small detections aren't
+        excessively upscaled while adding consistent padding to larger detections.
+        Args:
+            box_size: Original bounding box size (max of width/height)
+        Returns:
+            Padded box size
+        """
+        input_size_network = 224
+        default_padding = 30
+        if box_size >= input_size_network:
+            # Large detection: add default padding
             return box_size + default_padding
         else:
+            # Small detection: ensure minimum size without excessive enlargement
+            diff_size = input_size_network - box_size
+            if diff_size < default_padding:
+                return box_size + default_padding
+            else:
+                return input_size_network
+    def get_classification(self, crop: Image.Image) -> list[tuple[str, float]]:
+        """
+        Run YOLOv8 classification on cropped image.
+        Args:
+            crop: Cropped and preprocessed PIL Image
+        Returns:
+            List of (class_name, confidence) tuples for ALL classes, sorted by confidence.
+            Example: [("giraffe", 0.99985), ("cattle", 0.00003), ...]
+        Raises:
+            RuntimeError: If model not loaded or inference fails
+        """
+        if self.model is None:
+            raise RuntimeError("Model not loaded - call load_model() first")
+        try:
+            # Run YOLOv8 classification (verbose=False suppresses progress bar)
+            results = self.model(crop, verbose=False)
+            # Extract class names dict (YOLOv8 uses alphabetical order)
+            # Example: {0: "aardwolf", 1: "african wild cat", ..., 13: "giraffe", ...}
+            names_dict = results[0].names
+            # Extract probabilities: [0.0001, 0.0002, ..., 0.9998, ...]
+            probs = results[0].probs.data.tolist()
+            # Build list of (class_name, confidence) tuples
+            # Return YOLOv8's class names (which will be mapped to taxonomy IDs later)
+            classifications = []
+            for idx, class_name in names_dict.items():
+                confidence = probs[idx]
+                classifications.append((class_name, confidence))
+            # Sort by confidence descending (already sorted by YOLOv8, but ensure it)
+            classifications.sort(key=lambda x: x[1], reverse=True)
+            return classifications
+        except Exception as e:
+            raise RuntimeError(f"YOLOv8 classification failed: {e}") from e
+    def get_class_names(self) -> dict[str, str]:
+        """
+        Get mapping of class IDs to species names from YOLOv8 model.
+        YOLOv8 stores class names in alphabetical order internally. This function
+        extracts those names and creates a 1-indexed mapping for the JSON format.
+        NOTE: taxonomy.csv is NOT used here - it's only for UI taxonomy tree display.
+        The class IDs here are YOLOv8's alphabetical indices (0-based) + 1.
+        Returns:
+            Dict mapping class ID (1-indexed string) to common name
+            Example: {"1": "aardwolf", "2": "african wild cat", ..., "14": "giraffe", ...}
+        Raises:
+            RuntimeError: If model not loaded
+        """
+        if self.model is None:
+            raise RuntimeError("Model not loaded - call load_model() first")
+        try:
+            # YOLOv8 names dict (alphabetical order): {0: "aardwolf", 1: "african wild cat", ...}
+            yolo_names = self.model.names
+            # Convert to 1-indexed dict for JSON compatibility
+            class_names = {}
+            for idx, name in yolo_names.items():
+                class_id_str = str(idx + 1)  # 1-indexed
+                class_names[class_id_str] = name
+            return class_names
+        except Exception as e:
+            raise RuntimeError(f"Failed to extract class names from model: {e}") from e