coolroman
/

ScoreVision

ONNX

Model card Files Files and versions

xet

Community

coolroman committed 13 days ago

Commit

4524d7b

verified ·

1 Parent(s): a0571d3

scorevision: push artifact

Browse files

Files changed (1) hide show

miner.py +34 -10

miner.py CHANGED Viewed

@@ -98,7 +98,7 @@ class Miner:
         # Tuning matched to alfred's deployed model — bias toward precision to dodge
         # the false_positive pillar penalty (validator weights FP heavily on this element).
-        self.conf_thres = 0.50
         self.iou_thres = 0.4
         self.cross_iou_thresh = 0.7
         self.max_det = 100
@@ -337,9 +337,14 @@ class Miner:
         ratio: float,
         pad: tuple[float, float],
         orig_size: tuple[int, int],
     ) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
         """Decode end2end NMS output and return (boxes, scores, cls_ids)
-        in original image coordinates, after conf-threshold + remap + letterbox-reverse + sanity."""
         if preds.ndim == 3 and preds.shape[0] == 1:
             preds = preds[0]
         if preds.ndim != 2 or preds.shape[1] < 6:
@@ -349,14 +354,15 @@ class Miner:
         scores = preds[:, 4].astype(np.float32)
         cls_ids = preds[:, 5].astype(np.int32)
-        valid = (cls_ids >= 0) & (cls_ids < len(self.cls_remap))
         boxes, scores, cls_ids = boxes[valid], scores[valid], cls_ids[valid]
         cls_ids = self.cls_remap[cls_ids]
-        keep = scores >= self.conf_thres
-        boxes = boxes[keep]
-        scores = scores[keep]
-        cls_ids = cls_ids[keep]
         if len(boxes) == 0:
             return (
                 np.empty((0, 4), dtype=np.float32),
@@ -381,11 +387,29 @@ class Miner:
         out = self.session.run(self.output_names, {self.input_name: x})[0]
         return self._decode_raw_dets(out, ratio, pad, orig_size)
     def _predict_single(self, image: np.ndarray) -> list[BoundingBox]:
-        boxes, scores, cls_ids = self._forward(image)
-        if len(boxes) == 0:
             return []
-        return self._build_results(boxes, scores, cls_ids)
     def _predict_tta(self, image: np.ndarray) -> list[BoundingBox]:
         """Hflip TTA: merge primary + flipped via per-class hard-NMS,

         # Tuning matched to alfred's deployed model — bias toward precision to dodge
         # the false_positive pillar penalty (validator weights FP heavily on this element).
+        self.conf_thres = 0.40
         self.iou_thres = 0.4
         self.cross_iou_thresh = 0.7
         self.max_det = 100
         ratio: float,
         pad: tuple[float, float],
         orig_size: tuple[int, int],
+        *,
+        apply_conf_thresh: bool = True,
     ) -> tuple[np.ndarray, np.ndarray, np.ndarray]:
         """Decode end2end NMS output and return (boxes, scores, cls_ids)
+        in original image coordinates, after conf-threshold + remap + letterbox-reverse + sanity.
+        When apply_conf_thresh=False, the conf-threshold filter is skipped (used for
+        the no-detection fallback path: take the single top-conf raw box)."""
         if preds.ndim == 3 and preds.shape[0] == 1:
             preds = preds[0]
         if preds.ndim != 2 or preds.shape[1] < 6:
         scores = preds[:, 4].astype(np.float32)
         cls_ids = preds[:, 5].astype(np.int32)
+        valid = (cls_ids >= 0) & (cls_ids < len(self.cls_remap)) & (scores > 0)
         boxes, scores, cls_ids = boxes[valid], scores[valid], cls_ids[valid]
         cls_ids = self.cls_remap[cls_ids]
+        if apply_conf_thresh:
+            keep = scores >= self.conf_thres
+            boxes = boxes[keep]
+            scores = scores[keep]
+            cls_ids = cls_ids[keep]
         if len(boxes) == 0:
             return (
                 np.empty((0, 4), dtype=np.float32),
         out = self.session.run(self.output_names, {self.input_name: x})[0]
         return self._decode_raw_dets(out, ratio, pad, orig_size)
+    def _forward_with_fallback(
+        self, image: np.ndarray
+    ) -> tuple[
+        tuple[np.ndarray, np.ndarray, np.ndarray],
+        tuple[np.ndarray, np.ndarray, np.ndarray],
+    ]:
+        """Run ONNX once, decode twice: (filtered @ conf_thres, all-survived sanity)."""
+        x, ratio, pad, orig_size = self._preprocess(image)
+        out = self.session.run(self.output_names, {self.input_name: x})[0]
+        primary = self._decode_raw_dets(out, ratio, pad, orig_size, apply_conf_thresh=True)
+        fallback = self._decode_raw_dets(out, ratio, pad, orig_size, apply_conf_thresh=False)
+        return primary, fallback
     def _predict_single(self, image: np.ndarray) -> list[BoundingBox]:
+        (boxes, scores, cls_ids), (fb_b, fb_s, fb_c) = self._forward_with_fallback(image)
+        if len(boxes) > 0:
+            return self._build_results(boxes, scores, cls_ids)
+        # FALLBACK: nothing passed conf_thres — return single top-conf box
+        # (any class, any conf > 0) so the validator's mAP isn't a hard zero.
+        if len(fb_b) == 0:
             return []
+        i = int(np.argmax(fb_s))
+        return self._build_results(fb_b[i:i + 1], fb_s[i:i + 1], fb_c[i:i + 1])
     def _predict_tta(self, image: np.ndarray) -> list[BoundingBox]:
         """Hflip TTA: merge primary + flipped via per-class hard-NMS,