Spaces:

ivanm151
/

fruits

Runtime error

App Files Files Community

ivanm151 committed on Jan 19

Commit

b7d2f0a

1 Parent(s): 9672426

1st classifier upd

Browse files

Files changed (4) hide show

app.py +6 -3
models.py +1 -1
utils.py +39 -63
weights/{class1.pth → class.pth} +1 -1

app.py CHANGED Viewed

@@ -78,7 +78,9 @@ async def predict2(
     mask_256 = decode_base64_mask(mask_256_base64)
     # 3. Letterbox + маска + crop + resize до 100×100
-    cropped_100 = apply_mask_and_crop_letterbox(original_np, mask_256)
     # 4. Препроцессинг для классификатора
     input_tensor = preprocess_for_classifier(cropped_100).unsqueeze(0).to(DEVICE)
@@ -112,10 +114,11 @@ async def predict3(
     mask_256 = decode_base64_mask(mask_256_base64)
     # Вырезаем и готовим 224×224
-    cropped_224 = apply_mask_and_crop_letterbox_224(
         original_np,
         mask_256,
-        margin_ratio=0.05,          # подбери под свои тесты
         bg_color=(255, 255, 255)
     )

     mask_256 = decode_base64_mask(mask_256_base64)
     # 3. Letterbox + маска + crop + resize до 100×100
+    cropped_100 = apply_mask_and_crop_letterbox(original_np, mask_256, margin_ratio=0.02,
+    target_size=100,
+    bg_color=(255, 255, 255))
     # 4. Препроцессинг для классификатора
     input_tensor = preprocess_for_classifier(cropped_100).unsqueeze(0).to(DEVICE)
     mask_256 = decode_base64_mask(mask_256_base64)
     # Вырезаем и готовим 224×224
+    cropped_224 = apply_mask_and_crop_letterbox(
         original_np,
         mask_256,
+        margin_ratio=0.05,
+        target_size=224,
         bg_color=(255, 255, 255)
     )

models.py CHANGED Viewed

@@ -24,7 +24,7 @@ def load_model1(weights_path='weights/seg.pth'):
     return model1
-def load_model2(weights_path='weights/class1.pth'):
     global model2
     if model2 is None:
         model2 = models.mobilenet_v2(pretrained=False)

     return model1
+def load_model2(weights_path='weights/class.pth'):
     global model2
     if model2 is None:
         model2 = models.mobilenet_v2(pretrained=False)

utils.py CHANGED Viewed

@@ -44,8 +44,7 @@ def mask_to_base64(mask: np.ndarray) -> str:
 # ────────────────────────────────────────────────
 # Новые для классификации
-FRUIT_CLASSES = ['apple', 'banana', 'orange', 'grape', 'strawberry',
-                 'tomato', 'pear', 'peach', 'cherry', 'lemon']
 def decode_base64_mask(base64_str: str) -> np.ndarray:
@@ -81,36 +80,56 @@ def letterbox_resize(img: np.ndarray, target_size: int = 256) -> tuple[np.ndarra
     return padded, scale, (top, bottom, left, right)
 def apply_mask_and_crop_letterbox(
-    orig_img: np.ndarray,          # оригинал любой размер
-    mask_256: np.ndarray           # маска 256×256 [0..1]
 ) -> np.ndarray:
-    """
-    1. Делаем letterbox-версию оригинала 256×256
-    2. Применяем маску
-    3. Находим bbox
-    4. Вырезаем + margin
-    5. Ресайзим до 100×100
-    """
-    letterbox_img, scale, paddings = letterbox_resize(orig_img, 256)
     top, bottom, left, right = paddings
-    # Маска уже 256×256 — применяем напрямую
     masked = letterbox_img.copy()
-    masked[mask_256 < 0.5] = [255, 255, 255]
-    # Находим контуры / bbox
     mask_bin = (mask_256 > 0.5).astype(np.uint8) * 255
     contours, _ = cv2.findContours(mask_bin, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
     if not contours:
-        return np.zeros((100, 100, 3), dtype=np.uint8)
     cnt = max(contours, key=cv2.contourArea)
     x, y, bw, bh = cv2.boundingRect(cnt)
-    # margin ~10%
-    margin = int(max(bw, bh) * 0.02)
     x1 = max(0, x - margin)
     y1 = max(0, y - margin)
     x2 = min(256, x + bw + margin)
@@ -118,8 +137,8 @@ def apply_mask_and_crop_letterbox(
     cropped = masked[y1:y2, x1:x2]
-    # Финальный ресайз до 100×100 для классификатора
-    final = cv2.resize(cropped, (100, 100), interpolation=cv2.INTER_AREA)
     return final
@@ -149,46 +168,3 @@ def preprocess_for_freshness(img_224: np.ndarray) -> torch.Tensor:
         transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
     ])
     return transform(img_224)
-def apply_mask_and_crop_letterbox_224(
-    orig_img: np.ndarray,
-    mask_256: np.ndarray,
-    margin_ratio: float = 0.05,           # можно подкрутить
-    bg_color: tuple = (255, 255, 255)     # белый фон — важно!
-) -> np.ndarray:
-    """
-    Аналог apply_mask_and_crop_letterbox, но для 224×224
-    """
-    # Letterbox до 224×224
-    letterbox_img, scale, paddings = letterbox_resize(orig_img, target_size=224)
-    top, bottom, left, right = paddings
-    # Применяем маску (маска 256→ресайзим до 224)
-    mask_resized = cv2.resize(mask_256, (224, 224), interpolation=cv2.INTER_NEAREST)
-    masked = letterbox_img.copy()
-    masked[mask_resized < 0.5] = bg_color   # белый фон
-    # Контуры
-    mask_bin = (mask_resized > 0.5).astype(np.uint8) * 255
-    contours, _ = cv2.findContours(mask_bin, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
-    if not contours:
-        return np.full((224, 224, 3), bg_color, dtype=np.uint8)
-    cnt = max(contours, key=cv2.contourArea)
-    x, y, bw, bh = cv2.boundingRect(cnt)
-    margin = int(max(bw, bh) * margin_ratio)
-    x1 = max(0, x - margin)
-    y1 = max(0, y - margin)
-    x2 = min(224, x + bw + margin)
-    y2 = min(224, y + bh + margin)
-    cropped = masked[y1:y2, x1:x2]
-    # Финальный resize до 224×224 (если обрезали меньше)
-    final = cv2.resize(cropped, (224, 224), interpolation=cv2.INTER_AREA)
-    return final

 # ────────────────────────────────────────────────
 # Новые для классификации
+FRUIT_CLASSES = ['apple', 'banana', 'orange', 'strawberry', 'pear', 'lemon', 'cucumber', 'plum', 'raspberry', 'watermelon']
 def decode_base64_mask(base64_str: str) -> np.ndarray:
     return padded, scale, (top, bottom, left, right)
+def letterbox_any_size(
+    img: np.ndarray,
+    target_size: int = 100,          # или 224
+    bg_color: tuple = (255, 255, 255)
+) -> np.ndarray:
+    """ Универсальный letterbox для любого входного изображения """
+    h, w = img.shape[:2]
+    scale = min(target_size / h, target_size / w)
+    new_h, new_w = int(h * scale), int(w * scale)
+    resized = cv2.resize(img, (new_w, new_h), interpolation=cv2.INTER_AREA)
+    pad_h = target_size - new_h
+    pad_w = target_size - new_w
+    top = pad_h // 2
+    bottom = pad_h - top
+    left = pad_w // 2
+    right = pad_w - left
+    padded = cv2.copyMakeBorder(
+        resized, top, bottom, left, right,
+        cv2.BORDER_CONSTANT, value=bg_color
+    )
+    return padded
 def apply_mask_and_crop_letterbox(
+    orig_img: np.ndarray,
+    mask_256: np.ndarray,
+    margin_ratio: float = 0.02,
+    target_size: int = 100,
+    bg_color: tuple = (255, 255, 255)
 ) -> np.ndarray:
+    # Letterbox оригинала до 256×256 (для совместимости с маской)
+    letterbox_img, _, paddings = letterbox_resize(orig_img, target_size=256)
     top, bottom, left, right = paddings
     masked = letterbox_img.copy()
+    masked[mask_256 < 0.5] = bg_color
     mask_bin = (mask_256 > 0.5).astype(np.uint8) * 255
     contours, _ = cv2.findContours(mask_bin, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
     if not contours:
+        return np.full((target_size, target_size, 3), bg_color, dtype=np.uint8)
     cnt = max(contours, key=cv2.contourArea)
     x, y, bw, bh = cv2.boundingRect(cnt)
+    margin = int(max(bw, bh) * margin_ratio)
     x1 = max(0, x - margin)
     y1 = max(0, y - margin)
     x2 = min(256, x + bw + margin)
     cropped = masked[y1:y2, x1:x2]
+    # Самое важное: letterbox вместо force-resize
+    final = letterbox_any_size(cropped, target_size=target_size, bg_color=bg_color)
     return final
         transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
     ])
     return transform(img_224)

weights/{class1.pth → class.pth} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c5767f1246bfe8ee0077a0eefda6c8a1a66e8639de3fc1d94bacf7254633a5f2
 size 9205515

 version https://git-lfs.github.com/spec/v1
+oid sha256:0720a4afc5d0649b9af6e1532947af363f7230276172f6345aae6b951be071e5
 size 9205515