Spaces:

coderuday21
/

satdetect

Sleeping

App Files Community

coderuday21 committed on Mar 2

Commit

ce1e651

1 Parent(s): bd1ea11

Code review fixes: SSIM stability, symmetric CLAHE, confidence scoring, KMeans perf, auth hardening, remove debug endpoint

Browse files

Files changed (3) hide show

app/auth.py +9 -17
app/detection_engine.py +60 -26
app/main.py +16 -18

app/auth.py CHANGED Viewed

@@ -1,5 +1,6 @@
 import os
-from datetime import datetime, timedelta
 from typing import Optional
 from jose import JWTError, jwt
@@ -11,6 +12,8 @@ from sqlalchemy.orm import Session
 from .database import get_db
 from .models import User
 SECRET_KEY = os.environ.get("SECRET_KEY", "dev-fallback-key-change-in-production")
 ALGORITHM = "HS256"
 ACCESS_TOKEN_EXPIRE_MINUTES = 60 * 24 * 7  # 7 days
@@ -30,7 +33,7 @@ def get_password_hash(password: str) -> str:
 def create_access_token(data: dict, expires_delta: Optional[timedelta] = None) -> str:
     to_encode = data.copy()
-    expire = datetime.utcnow() + (expires_delta or timedelta(minutes=ACCESS_TOKEN_EXPIRE_MINUTES))
     to_encode.update({"exp": expire})
     return jwt.encode(to_encode, SECRET_KEY, algorithm=ALGORITHM)
@@ -44,26 +47,22 @@ def get_user_by_id(db: Session, user_id: int) -> Optional[User]:
 def get_user_from_token(token: str, db: Session) -> Optional[User]:
-    """Resolve user from JWT token (used as fallback when header/cookie not sent)."""
     if not token:
-        print("[AUTH] get_user_from_token: token is empty/None")
         return None
     try:
         payload = jwt.decode(token, SECRET_KEY, algorithms=[ALGORITHM])
         user_id_str = payload.get("sub")
-        print(f"[AUTH] decoded token OK, sub={user_id_str}")
         if user_id_str is None:
             return None
         try:
             user_id = int(user_id_str)
         except (ValueError, TypeError):
             return None
-    except JWTError as e:
-        print(f"[AUTH] JWT decode FAILED: {e}")
         return None
-    user = get_user_by_id(db, user_id)
-    print(f"[AUTH] DB lookup: user={'found' if user else 'NOT FOUND'}")
-    return user
 def get_current_user(
@@ -71,18 +70,11 @@ def get_current_user(
     credentials: Optional[HTTPAuthorizationCredentials] = Depends(security),
     db: Session = Depends(get_db),
 ) -> Optional[User]:
-    print(f"[AUTH] get_current_user called")
-    print(f"[AUTH]   credentials present: {credentials is not None}")
-    print(f"[AUTH]   cookie present: {request.cookies.get(COOKIE_NAME) is not None}")
-    print(f"[AUTH]   Authorization header: {request.headers.get('authorization', 'MISSING')[:50]}")
-    # 1) Try Bearer header
     if credentials:
         user = get_user_from_token(credentials.credentials, db)
         if user:
             return user
-    # 2) Try cookie (sent automatically by browser on same-origin requests)
     token = request.cookies.get(COOKIE_NAME)
     if token:
         return get_user_from_token(token, db)
-    print("[AUTH] No valid auth found, returning None")
     return None

+import logging
 import os
+from datetime import datetime, timedelta, timezone
 from typing import Optional
 from jose import JWTError, jwt
 from .database import get_db
 from .models import User
+logger = logging.getLogger(__name__)
 SECRET_KEY = os.environ.get("SECRET_KEY", "dev-fallback-key-change-in-production")
 ALGORITHM = "HS256"
 ACCESS_TOKEN_EXPIRE_MINUTES = 60 * 24 * 7  # 7 days
 def create_access_token(data: dict, expires_delta: Optional[timedelta] = None) -> str:
     to_encode = data.copy()
+    expire = datetime.now(timezone.utc) + (expires_delta or timedelta(minutes=ACCESS_TOKEN_EXPIRE_MINUTES))
     to_encode.update({"exp": expire})
     return jwt.encode(to_encode, SECRET_KEY, algorithm=ALGORITHM)
 def get_user_from_token(token: str, db: Session) -> Optional[User]:
+    """Resolve user from JWT token."""
     if not token:
         return None
     try:
         payload = jwt.decode(token, SECRET_KEY, algorithms=[ALGORITHM])
         user_id_str = payload.get("sub")
         if user_id_str is None:
             return None
         try:
             user_id = int(user_id_str)
         except (ValueError, TypeError):
+            logger.warning("JWT 'sub' claim is not a valid integer")
             return None
+    except JWTError:
         return None
+    return get_user_by_id(db, user_id)
 def get_current_user(
     credentials: Optional[HTTPAuthorizationCredentials] = Depends(security),
     db: Session = Depends(get_db),
 ) -> Optional[User]:
     if credentials:
         user = get_user_from_token(credentials.credentials, db)
         if user:
             return user
     token = request.cookies.get(COOKIE_NAME)
     if token:
         return get_user_from_token(token, db)
     return None

app/detection_engine.py CHANGED Viewed

@@ -21,13 +21,16 @@ def preprocess_image(image):
     img_array = np.array(image)
     if img_array.ndim == 2:
         img_array = cv2.cvtColor(img_array, cv2.COLOR_GRAY2RGB)
-    if img_array.shape[2] == 4:
         img_array = cv2.cvtColor(img_array, cv2.COLOR_RGBA2RGB)
     max_size = 2000
     height, width = img_array.shape[:2]
     if max(height, width) > max_size:
         scale = max_size / max(height, width)
-        img_array = cv2.resize(img_array, (int(width * scale), int(height * scale)), interpolation=cv2.INTER_AREA)
     return img_array
@@ -68,11 +71,15 @@ def register_images(img1, img2, max_features=2000):
     if homography is None:
         return img1, img2, False
-    # Only accept if enough inliers
     inlier_ratio = np.sum(mask) / len(mask) if mask is not None else 0
     if inlier_ratio < 0.3:
         return img1, img2, False
     h, w = img1.shape[:2]
     img2_aligned = cv2.warpPerspective(img2, homography, (w, h), borderMode=cv2.BORDER_REFLECT)
     return img1, img2_aligned, True
@@ -83,7 +90,7 @@ def register_images(img1, img2, max_features=2000):
 # ---------------------------------------------------------------------------
 def normalize_radiometry(img1, img2):
-    """Histogram-matching normalization in LAB space for all channels."""
     lab1 = cv2.cvtColor(img1, cv2.COLOR_RGB2LAB).astype(np.float32)
     lab2 = cv2.cvtColor(img2, cv2.COLOR_RGB2LAB).astype(np.float32)
@@ -94,13 +101,17 @@ def normalize_radiometry(img1, img2):
         if std2 > 1e-6:
             result[:, :, ch] = (lab2[:, :, ch] - mean2) * (std1 / std2) + mean1
-    # Also apply CLAHE on L channel for contrast equalization
     result_uint8 = np.clip(result, 0, 255).astype(np.uint8)
     clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
     result_uint8[:, :, 0] = clahe.apply(result_uint8[:, :, 0])
-    img2_normalized = cv2.cvtColor(result_uint8, cv2.COLOR_LAB2RGB)
-    return img1, img2_normalized
 # ---------------------------------------------------------------------------
@@ -122,12 +133,13 @@ def compute_ssim_change_map(img1, img2, win_size=7):
     mu2_sq = mu2 * mu2
     mu1_mu2 = mu1 * mu2
-    sigma1_sq = cv2.GaussianBlur(gray1 * gray1, (win_size, win_size), 1.5) - mu1_sq
-    sigma2_sq = cv2.GaussianBlur(gray2 * gray2, (win_size, win_size), 1.5) - mu2_sq
     sigma12 = cv2.GaussianBlur(gray1 * gray2, (win_size, win_size), 1.5) - mu1_mu2
-    ssim_map = ((2 * mu1_mu2 + C1) * (2 * sigma12 + C2)) / \
-               ((mu1_sq + mu2_sq + C1) * (sigma1_sq + sigma2_sq + C2))
     # Structural dissimilarity: 0 = identical, 1 = completely different
     dssim = np.clip((1.0 - ssim_map) / 2.0, 0, 1)
@@ -224,7 +236,6 @@ def feature_based_method(img1, img2, num_clusters=4, sensitivity=0.5):
     if img1.shape != img2.shape:
         img2 = cv2.resize(img2, (img1.shape[1], img1.shape[0]))
-    # Combine LAB and HSV differences for richer features
     lab1 = cv2.cvtColor(img1, cv2.COLOR_RGB2LAB).astype(np.float32)
     lab2 = cv2.cvtColor(img2, cv2.COLOR_RGB2LAB).astype(np.float32)
     hsv1 = cv2.cvtColor(img1, cv2.COLOR_RGB2HSV).astype(np.float32)
@@ -234,19 +245,41 @@ def feature_based_method(img1, img2, num_clusters=4, sensitivity=0.5):
     diff_hsv = np.abs(hsv1 - hsv2)
     h, w, _ = diff_lab.shape
-    features = np.concatenate([diff_lab, diff_hsv[:, :, 1:]], axis=2)  # 5 channels
-    features_flat = features.reshape(-1, features.shape[2])
     scaler = StandardScaler()
     features_scaled = scaler.fit_transform(features_flat)
     kmeans = KMeans(n_clusters=num_clusters, random_state=42, n_init=10)
-    labels = kmeans.fit_predict(features_scaled)
-    # Find the cluster with highest mean difference (= change)
-    cluster_means = [np.mean(np.linalg.norm(features_flat[labels == i], axis=1)) for i in range(num_clusters)]
     change_cluster_idx = np.argmax(cluster_means)
     change_mask = (labels == change_cluster_idx).astype(np.uint8) * 255
     change_mask = change_mask.reshape(h, w)
@@ -667,12 +700,8 @@ def classify_object_type(image_region, bbox):
         soil += 0.10
     scores["Bare Land/Soil Change"] = soil
-    # Normalize scores
-    max_score = max(scores.values()) if scores else 0
-    if max_score > 0:
-        for k in scores:
-            scores[k] /= max_score
     best = max(scores, key=scores.get)
     conf = scores[best]
@@ -698,14 +727,20 @@ def classify_with_ensemble(image_region, bbox, num_sub=4):
     classifications = []
     confidences = []
     for sb in sub_boxes:
         obj_type, conf = classify_object_type(image_region, sb)
         if obj_type is None:
-            return None, 0.0  # transient → exclude
         if obj_type != "Unclassified":
             classifications.append(obj_type)
             confidences.append(conf)
     if not classifications:
         return classify_object_type(image_region, (x, y, w, h))
@@ -795,8 +830,7 @@ def run_detection(before_pil, after_pil, method="AI-Based Deep Learning",
     else:
         change_mask = hybrid_method(before_array, after_array)
-    # Classify regions
-    change_regions = analyze_change_regions(change_mask, after_array, min_area=80)
     # Color-coded visualization using region classifications
     result_image = visualize_changes(before_array, after_array, change_mask, regions=change_regions)

     img_array = np.array(image)
     if img_array.ndim == 2:
         img_array = cv2.cvtColor(img_array, cv2.COLOR_GRAY2RGB)
+    elif img_array.ndim == 3 and img_array.shape[2] == 4:
         img_array = cv2.cvtColor(img_array, cv2.COLOR_RGBA2RGB)
+    elif img_array.ndim != 3 or img_array.shape[2] != 3:
+        raise ValueError(f"Unsupported image shape: {img_array.shape}")
     max_size = 2000
     height, width = img_array.shape[:2]
     if max(height, width) > max_size:
         scale = max_size / max(height, width)
+        new_w, new_h = max(1, int(width * scale)), max(1, int(height * scale))
+        img_array = cv2.resize(img_array, (new_w, new_h), interpolation=cv2.INTER_AREA)
     return img_array
     if homography is None:
         return img1, img2, False
     inlier_ratio = np.sum(mask) / len(mask) if mask is not None else 0
     if inlier_ratio < 0.3:
         return img1, img2, False
+    # Reject degenerate homographies (near-singular or extreme distortion)
+    det = np.linalg.det(homography)
+    if abs(det) < 0.1 or abs(det) > 10.0:
+        return img1, img2, False
     h, w = img1.shape[:2]
     img2_aligned = cv2.warpPerspective(img2, homography, (w, h), borderMode=cv2.BORDER_REFLECT)
     return img1, img2_aligned, True
 # ---------------------------------------------------------------------------
 def normalize_radiometry(img1, img2):
+    """Histogram-matching normalization in LAB space. CLAHE applied symmetrically."""
     lab1 = cv2.cvtColor(img1, cv2.COLOR_RGB2LAB).astype(np.float32)
     lab2 = cv2.cvtColor(img2, cv2.COLOR_RGB2LAB).astype(np.float32)
         if std2 > 1e-6:
             result[:, :, ch] = (lab2[:, :, ch] - mean2) * (std1 / std2) + mean1
     result_uint8 = np.clip(result, 0, 255).astype(np.uint8)
+    # CLAHE on L channel of BOTH images so downstream comparison is symmetric
     clahe = cv2.createCLAHE(clipLimit=2.0, tileGridSize=(8, 8))
+    lab1_uint8 = cv2.cvtColor(img1, cv2.COLOR_RGB2LAB)
+    lab1_uint8[:, :, 0] = clahe.apply(lab1_uint8[:, :, 0])
     result_uint8[:, :, 0] = clahe.apply(result_uint8[:, :, 0])
+    img1_out = cv2.cvtColor(lab1_uint8, cv2.COLOR_LAB2RGB)
+    img2_out = cv2.cvtColor(result_uint8, cv2.COLOR_LAB2RGB)
+    return img1_out, img2_out
 # ---------------------------------------------------------------------------
     mu2_sq = mu2 * mu2
     mu1_mu2 = mu1 * mu2
+    # Clamp to zero: E[X²]-E[X]² can go slightly negative from float rounding
+    sigma1_sq = np.maximum(cv2.GaussianBlur(gray1 * gray1, (win_size, win_size), 1.5) - mu1_sq, 0)
+    sigma2_sq = np.maximum(cv2.GaussianBlur(gray2 * gray2, (win_size, win_size), 1.5) - mu2_sq, 0)
     sigma12 = cv2.GaussianBlur(gray1 * gray2, (win_size, win_size), 1.5) - mu1_mu2
+    denom = (mu1_sq + mu2_sq + C1) * (sigma1_sq + sigma2_sq + C2)
+    ssim_map = ((2 * mu1_mu2 + C1) * (2 * sigma12 + C2)) / (denom + 1e-12)
     # Structural dissimilarity: 0 = identical, 1 = completely different
     dssim = np.clip((1.0 - ssim_map) / 2.0, 0, 1)
     if img1.shape != img2.shape:
         img2 = cv2.resize(img2, (img1.shape[1], img1.shape[0]))
     lab1 = cv2.cvtColor(img1, cv2.COLOR_RGB2LAB).astype(np.float32)
     lab2 = cv2.cvtColor(img2, cv2.COLOR_RGB2LAB).astype(np.float32)
     hsv1 = cv2.cvtColor(img1, cv2.COLOR_RGB2HSV).astype(np.float32)
     diff_hsv = np.abs(hsv1 - hsv2)
     h, w, _ = diff_lab.shape
+    features = np.concatenate([diff_lab, diff_hsv[:, :, 1:]], axis=2)
+    # Downsample for KMeans (full-res is too slow for >1M pixels)
+    MAX_PIXELS = 250_000
+    total = h * w
+    if total > MAX_PIXELS:
+        scale = np.sqrt(MAX_PIXELS / total)
+        sh, sw = max(1, int(h * scale)), max(1, int(w * scale))
+        features_small = cv2.resize(features, (sw, sh))
+    else:
+        features_small = features
+        sh, sw = h, w
+    features_flat = features_small.reshape(-1, features_small.shape[2])
     scaler = StandardScaler()
     features_scaled = scaler.fit_transform(features_flat)
     kmeans = KMeans(n_clusters=num_clusters, random_state=42, n_init=10)
+    labels_small = kmeans.fit_predict(features_scaled)
+    cluster_means = [
+        np.mean(np.linalg.norm(features_flat[labels_small == i], axis=1))
+        if np.any(labels_small == i) else 0.0
+        for i in range(num_clusters)
+    ]
     change_cluster_idx = np.argmax(cluster_means)
+    # Map labels back to full resolution by predicting on all pixels
+    if total > MAX_PIXELS:
+        full_flat = features.reshape(-1, features.shape[2])
+        full_scaled = scaler.transform(full_flat)
+        labels = kmeans.predict(full_scaled)
+    else:
+        labels = labels_small
     change_mask = (labels == change_cluster_idx).astype(np.uint8) * 255
     change_mask = change_mask.reshape(h, w)
         soil += 0.10
     scores["Bare Land/Soil Change"] = soil
+    # Use raw scores as confidence (each rule set sums to ~1.0 max)
+    # Do NOT normalize by max_score — that inflates weak matches to 1.0
     best = max(scores, key=scores.get)
     conf = scores[best]
     classifications = []
     confidences = []
+    transient_count = 0
     for sb in sub_boxes:
         obj_type, conf = classify_object_type(image_region, sb)
         if obj_type is None:
+            transient_count += 1
+            continue
         if obj_type != "Unclassified":
             classifications.append(obj_type)
             confidences.append(conf)
+    # Only exclude if majority of sub-regions are transient
+    if transient_count > len(sub_boxes) // 2:
+        return None, 0.0
     if not classifications:
         return classify_object_type(image_region, (x, y, w, h))
     else:
         change_mask = hybrid_method(before_array, after_array)
+    change_regions = analyze_change_regions(change_mask, after_array, min_area=200)
     # Color-coded visualization using region classifications
     result_image = visualize_changes(before_array, after_array, change_mask, regions=change_regions)

app/main.py CHANGED Viewed

@@ -132,12 +132,18 @@ def reset_password(data: PasswordReset, db: Session = Depends(get_db)):
         raise HTTPException(status_code=400, detail="Password must be at least 6 characters")
     user = get_user_by_email(db, data.email)
     if not user:
         raise HTTPException(status_code=404, detail="No account found with that email")
     user.hashed_password = get_password_hash(data.new_password)
     db.commit()
     return {"ok": True, "message": "Password has been reset. You can now sign in."}
 @app.get("/api/me")
 def me(user: Optional[User] = Depends(get_current_user)):
     if not user:
@@ -145,22 +151,6 @@ def me(user: Optional[User] = Depends(get_current_user)):
     return {"id": user.id, "email": user.email, "full_name": user.full_name}
-@app.get("/api/debug-auth")
-def debug_auth(request: Request, user: Optional[User] = Depends(get_current_user)):
-    """Debug endpoint to see what auth info the server receives."""
-    auth_header = request.headers.get("authorization", "")
-    cookie_val = request.cookies.get(COOKIE_NAME, "")
-    return {
-        "has_auth_header": bool(auth_header),
-        "auth_header_preview": auth_header[:40] + "..." if len(auth_header) > 40 else auth_header,
-        "has_cookie": bool(cookie_val),
-        "cookie_preview": cookie_val[:20] + "..." if len(cookie_val) > 20 else cookie_val,
-        "authenticated": user is not None,
-        "user_id": user.id if user else None,
-        "user_email": user.email if user else None,
-    }
 # --- Detection route ---
 @app.post("/api/detect")
 async def detect(
@@ -186,9 +176,17 @@ async def detect(
     user = get_user_from_token(token, db) if token else None
     if not user:
         raise HTTPException(status_code=401, detail="Login required")
     try:
-        before_pil = Image.open(io.BytesIO(await before.read())).convert("RGB")
-        after_pil = Image.open(io.BytesIO(await after.read())).convert("RGB")
     except Exception as e:
         raise HTTPException(status_code=400, detail=f"Invalid image: {e}")
     change_mask, result_image, stats, change_regions = run_detection(

         raise HTTPException(status_code=400, detail="Password must be at least 6 characters")
     user = get_user_by_email(db, data.email)
     if not user:
+        # NOTE: this 404 and its message reveal whether an email is registered (enumeration risk)
         raise HTTPException(status_code=404, detail="No account found with that email")
     user.hashed_password = get_password_hash(data.new_password)
     db.commit()
     return {"ok": True, "message": "Password has been reset. You can now sign in."}
+# NOTE: This reset flow has no email verification. In production, implement
+# a token-based flow: POST /forgot sends email with one-time link,
+# GET /reset?token=... validates token, POST /reset sets new password.
 @app.get("/api/me")
 def me(user: Optional[User] = Depends(get_current_user)):
     if not user:
     return {"id": user.id, "email": user.email, "full_name": user.full_name}
 # --- Detection route ---
 @app.post("/api/detect")
 async def detect(
     user = get_user_from_token(token, db) if token else None
     if not user:
         raise HTTPException(status_code=401, detail="Login required")
+    MAX_UPLOAD_BYTES = 20 * 1024 * 1024  # 20 MB
     try:
+        before_bytes = await before.read()
+        after_bytes = await after.read()
+        if len(before_bytes) > MAX_UPLOAD_BYTES or len(after_bytes) > MAX_UPLOAD_BYTES:
+            raise HTTPException(status_code=400, detail="Image too large (max 20 MB)")
+        before_pil = Image.open(io.BytesIO(before_bytes)).convert("RGB")
+        after_pil = Image.open(io.BytesIO(after_bytes)).convert("RGB")
+        del before_bytes, after_bytes
+    except HTTPException:
+        raise
     except Exception as e:
         raise HTTPException(status_code=400, detail=f"Invalid image: {e}")
     change_mask, result_image, stats, change_regions = run_detection(