Spaces:

ExistedYear
/

smishing_detector_api

Paused

App Files Files Community

ExistedYear committed on about 12 hours ago

Commit

abdf9b3

1 Parent(s): 348b3a4

balls

Browse files

Files changed (1) hide show

smishing_detector/predictor.py +45 -67

smishing_detector/predictor.py CHANGED Viewed

@@ -265,56 +265,38 @@ class SmishingPredictor:
                         spam_rule: float, ham_rule: float,
                         uf: dict) -> Tuple[str, str, float, bool, str]:
         """
-        Green Channel — distinguishes SCAMS from harmless promotional spam.
-        This project detects smishing (scam SMS), NOT general spam.
-        A message like "Congratulations! Free 5G SIM upgrade. Visit your nearest
-        Airtel store" is promotional spam, not a scam — it has no phishing URL,
-        no threats, no urgency to click a link.
-        Logic:
-        1. Hard scam signals (spam_rule >= 0.55) → NEVER clear. These have
-           explicit phishing patterns like "account suspended", "KYC update",
-           "digital arrest" with suspicious URLs.
-        2. Soft spam (spam_rule < 0.55) + ALL URLs are verified legit domains
-           → GREEN CHANNEL → downgrade to "safe" (it's just an ad/promo).
-        3. Soft spam + NO URLs at all + ham patterns detected → also GREEN
-           CHANNEL (legit transactional or brand notification).
-        Returns: (label, risk, final_prob, green_cleared, green_reason)
-        """
-        # Never green-channel if hard scam patterns are present
-        if spam_rule >= 0.55:
-            risk = "high" if final_prob >= 0.75 else "medium" if final_prob >= self.threshold else "low"
-            return label, risk, final_prob, False, ""
-        # Only applies to messages that would otherwise be classified as spam
-        if label != "spam":
-            risk = "low"
-            return label, risk, final_prob, False, ""
-        # Build static legit domain set (fallback whitelist)
-        static_legit = set()
-        try:
-            from utils.safe_browsing import get_checker
-            static_legit |= get_checker().fallback_legit_domains
-        except Exception:
-            pass
-        try:
-            from utils.data_loader import LEGIT_DOMAINS
-            static_legit |= LEGIT_DOMAINS
-        except Exception:
-            pass
         has_url = bool(uf.get("has_url"))
-        has_suspicious = bool(uf.get("suspicious_tld") or uf.get("has_ip_url"))
-        # Case 1: Message has URLs — check each via GSB then static whitelist
-        if has_url and not has_suspicious:
             try:
                 import tldextract
                 urls = extract_urls(message)
                 if urls:
                     checker = None
                     try:
                         from utils.safe_browsing import get_checker as _gc
@@ -322,15 +304,14 @@ class SmishingPredictor:
                     except Exception:
                         pass
-                    all_legit = True
-                    malicious_found = False
                     for url in urls:
                         ext = tldextract.extract(url)
                         full_domain = f"{ext.domain}.{ext.suffix}".lower().strip(".")
                         if not full_domain:
                             continue
-                        # GSB first (cached, live lookup if needed)
                         status = "unknown"
                         if checker:
                             try:
@@ -339,36 +320,33 @@ class SmishingPredictor:
                                 pass
                         if status == "known_malicious":
-                            malicious_found = True
-                            break
-                        elif status == "known_safe":
-                            continue  # GSB verified safe
-                        elif full_domain in static_legit:
-                            continue  # static whitelist
-                        else:
-                            all_legit = False
-                            break
-                    if malicious_found:
-                        return "spam", "high", max(final_prob, 0.90), False, ""
-                    if all_legit:
                         return "safe", "low", min(final_prob, 0.40), True, \
                             "all URLs verified as legitimate domains"
             except Exception:
                 pass
-        # Case 2: No URL + ham patterns present + low spam rule score
-        # e.g. "Airtel: Congratulations! Eligible for free 5G upgrade. Visit store."
-        if not has_url and ham_rule >= 0.35 and spam_rule < 0.35:
             return "safe", "low", min(final_prob, 0.35), True, \
                 "no URLs + legitimate transactional patterns detected"
-        # Case 3: Has legit domain URL + ham patterns dominate spam patterns
-        if has_url and uf.get("has_legit_domain") and ham_rule > spam_rule:
-            return "safe", "low", min(final_prob, 0.42), True, \
-                "legit domain URL + stronger ham signals than scam signals"
-        risk = "high" if final_prob >= 0.75 else "medium" if final_prob >= self.threshold else "low"
         return label, risk, final_prob, False, ""
     def predict(self, message: str) -> dict:

                         spam_rule: float, ham_rule: float,
                         uf: dict) -> Tuple[str, str, float, bool, str]:
         """
+        Unified URL-aware channel checking.
+        For EVERY message that has URLs, check ALL of them against
+        GSB first, then static whitelist:
+         1. ANY URL → known_malicious  => SPAM (escalate)
+         2. ALL URLs → known_safe      => SAFE (green channel)
+         3. ANY URL → unverified       => keep model verdict (no override)
+         4. No URLs + ham patterns     => SAFE (promo/ad without links)
+        """
         has_url = bool(uf.get("has_url"))
+        risk = "high" if final_prob >= 0.75 else "medium" if final_prob >= self.threshold else "low"
+        # ── URL checking (runs for ALL messages with URLs) ──────────────────
+        if has_url:
             try:
                 import tldextract
                 urls = extract_urls(message)
                 if urls:
+                    # static whitelist
+                    static_legit = set()
+                    try:
+                        from utils.safe_browsing import get_checker
+                        static_legit |= get_checker().fallback_legit_domains
+                    except Exception:
+                        pass
+                    try:
+                        from utils.data_loader import LEGIT_DOMAINS
+                        static_legit |= LEGIT_DOMAINS
+                    except Exception:
+                        pass
                     checker = None
                     try:
                         from utils.safe_browsing import get_checker as _gc
                     except Exception:
                         pass
+                    all_safe = True
                     for url in urls:
                         ext = tldextract.extract(url)
                         full_domain = f"{ext.domain}.{ext.suffix}".lower().strip(".")
                         if not full_domain:
                             continue
+                        # 1. GSB first
                         status = "unknown"
                         if checker:
                             try:
                                 pass
                         if status == "known_malicious":
+                            return "spam", "high", max(final_prob, 0.90), False, ""
+                        if status == "known_safe":
+                            continue
+                        if full_domain in static_legit:
+                            continue
+                        # unverified — don't green-channel
+                        all_safe = False
+                        break
+                    if all_safe:
+                        if label == "spam" and spam_rule >= 0.35:
+                            # message looks scammy but all URLs are legit → cap at medium
+                            return "spam", "medium", min(final_prob, 0.55), True, \
+                                "URLs verified legitimate but message content is suspicious"
                         return "safe", "low", min(final_prob, 0.40), True, \
                             "all URLs verified as legitimate domains"
             except Exception:
                 pass
+            # URLs exist but at least one is unverified → keep model verdict
+            return label, risk, final_prob, False, ""
+        # ── No URLs: check for harmless promo/ad patterns ───────────────────
+        if ham_rule >= 0.35 and spam_rule < 0.35 and label == "spam":
             return "safe", "low", min(final_prob, 0.35), True, \
                 "no URLs + legitimate transactional patterns detected"
         return label, risk, final_prob, False, ""
     def predict(self, message: str) -> dict: