Spaces:

princemaxp
/

CySecGuardians

Sleeping

App Files Community

princemaxp committed on Jan 8

Commit

8ff3ffa

verified ·

1 Parent(s): 734dc8c

Update analyze_email_main.py

Browse files

Files changed (1) hide show

analyze_email_main.py +20 -52

analyze_email_main.py CHANGED Viewed

@@ -11,10 +11,6 @@ from scoring_engine import compute_final_score
 from behavioral_analyzer import analyze_behavior, behavioral_summary
-# =========================
-# MAIN ANALYSIS FUNCTION
-# =========================
 def analyze(file_path):
     start_time = time.time()
@@ -26,51 +22,52 @@ def analyze(file_path):
     # =========================
     # 🧠 ANALYZERS
     # =========================
-    # Header analysis (auth, spoofing, BEC signals)
-    header_findings, header_score, auth_summary = analyze_headers(headers)
-    # Body heuristic / NLP analysis
     body_findings, body_score, highlighted_body, body_verdict = analyze_body(
         subject, body, urls, images
     )
-    # URL analysis
     url_findings, url_score = analyze_urls(urls)
-    # Attachment analysis
     attachment_findings, attachment_score, attachment_hashes = analyze_attachments(
         attachments
     )
     # =========================
-    # 🧠 BEHAVIORAL ANALYSIS (PHASE 4.3 – CORE FIX)
     # =========================
     behavior_result = analyze_behavior(body)
     behavior_score = behavior_result["confidence_score"]
     behavior_attack = behavior_result["dominant_attack"]
     behavior_verdict = behavior_result["verdict"]
     behavior_text = behavioral_summary(behavior_result)
     # =========================
-    # 🧮 FINAL CORRELATION SCORING
     # =========================
     final_score, verdict, reasoning = compute_final_score(
         header_score=header_score,
         body_score=body_score,
         url_score=url_score,
         attachment_score=attachment_score,
-        behavior_score=behavior_score,  # 🔥 NEW
         header_findings=header_findings,
         body_findings=body_findings,
         url_findings=url_findings,
         attachment_findings=attachment_findings,
-        auth_results=auth_summary,
-        behavior_result=behavior_result,  # 🔥 NEW
     )
     # =========================
-    # 🏷 TAGGING ENGINE
     # =========================
     tags = set()
@@ -79,36 +76,30 @@ def analyze(file_path):
     ):
         fl = finding.lower()
-        if "attachment" in fl or "macro" in fl or "html" in fl:
             tags.add("Malicious Attachment")
         if "reply-to" in fl or "bec" in fl:
             tags.add("BEC Indicator")
         if "url" in fl or "phishing" in fl:
-            tags.add("Malicious / Phishing URL")
         if "spf" in fl or "dkim" in fl or "dmarc" in fl:
             tags.add("Email Authentication Failure")
         if "brand" in fl or "look-alike" in fl:
             tags.add("Brand Spoofing")
-        if "urgent" in fl or "immediately" in fl:
             tags.add("Urgency / Social Engineering")
-    # Behavioral tags (VERY IMPORTANT)
     if behavior_attack != "None":
-        tags.add(behavior_attack.upper())
         tags.add("Behavioral Threat")
     # =========================
-    # ⏱ PROCESSING TIME
     # =========================
     processing_time = round(time.time() - start_time, 2)
     # =========================
-    # 📊 SUMMARY OUTPUT
     # =========================
     summary = {
         "Final Verdict": verdict,
@@ -119,9 +110,6 @@ def analyze(file_path):
         "Main Tags": ", ".join(sorted(tags)) if tags else "No special tags",
     }
-    # =========================
-    # 🔍 DETAILED OUTPUT
-    # =========================
     details = {
         "Header Findings": header_findings,
         "Body Findings": body_findings,
@@ -129,30 +117,10 @@ def analyze(file_path):
         "Attachment Findings": attachment_findings,
         "Attachment Hashes": attachment_hashes,
         "Highlighted Body": highlighted_body,
-        "Auth Results": auth_summary,
         "Behavioral Analysis": behavior_result,
         "Behavioral Summary": behavior_text,
         "Scoring Reasoning": reasoning,
     }
     return summary, details
-# =========================
-# 🧪 LOCAL TEST
-# =========================
-if __name__ == "__main__":
-    summary, details = analyze("sample.eml")
-    print("\n===== SUMMARY =====")
-    for k, v in summary.items():
-        print(f"{k}: {v}")
-    print("\n===== DETAILS =====")
-    for k, v in details.items():
-        print(f"\n{k}:")
-        if isinstance(v, list):
-            for item in v:
-                print(f"  - {item}")
-        else:
-            print(v)

 from behavioral_analyzer import analyze_behavior, behavioral_summary
 def analyze(file_path):
     start_time = time.time()
     # =========================
     # 🧠 ANALYZERS
     # =========================
+    header_findings, header_score, auth_summary = analyze_headers(headers, body)
+    auth_results = auth_summary  # must be dict
     body_findings, body_score, highlighted_body, body_verdict = analyze_body(
         subject, body, urls, images
     )
     url_findings, url_score = analyze_urls(urls)
     attachment_findings, attachment_score, attachment_hashes = analyze_attachments(
         attachments
     )
     # =========================
+    # 🧠 BEHAVIORAL ANALYSIS
     # =========================
     behavior_result = analyze_behavior(body)
     behavior_score = behavior_result["confidence_score"]
     behavior_attack = behavior_result["dominant_attack"]
     behavior_verdict = behavior_result["verdict"]
+    behavior_findings = behavior_result.get("findings", [])
     behavior_text = behavioral_summary(behavior_result)
     # =========================
+    # 🧮 FINAL SCORING
     # =========================
     final_score, verdict, reasoning = compute_final_score(
         header_score=header_score,
         body_score=body_score,
         url_score=url_score,
         attachment_score=attachment_score,
+        behavior_score=behavior_score,
         header_findings=header_findings,
         body_findings=body_findings,
         url_findings=url_findings,
         attachment_findings=attachment_findings,
+        behavior_findings=behavior_findings,
+        auth_results=auth_results,
     )
+    # 🔐 Safety override
+    if behavior_verdict == "Malicious" and verdict == "✅ Safe":
+        verdict = "⚠️ Suspicious"
     # =========================
+    # 🏷 TAGGING
     # =========================
     tags = set()
     ):
         fl = finding.lower()
+        if "attachment" in fl or "macro" in fl:
             tags.add("Malicious Attachment")
         if "reply-to" in fl or "bec" in fl:
             tags.add("BEC Indicator")
         if "url" in fl or "phishing" in fl:
+            tags.add("Malicious URL")
         if "spf" in fl or "dkim" in fl or "dmarc" in fl:
             tags.add("Email Authentication Failure")
         if "brand" in fl or "look-alike" in fl:
             tags.add("Brand Spoofing")
+        if "urgent" in fl:
             tags.add("Urgency / Social Engineering")
     if behavior_attack != "None":
         tags.add("Behavioral Threat")
+        tags.add(behavior_attack.upper())
     # =========================
+    # ⏱ TIME
     # =========================
     processing_time = round(time.time() - start_time, 2)
     # =========================
+    # 📊 OUTPUT
     # =========================
     summary = {
         "Final Verdict": verdict,
         "Main Tags": ", ".join(sorted(tags)) if tags else "No special tags",
     }
     details = {
         "Header Findings": header_findings,
         "Body Findings": body_findings,
         "Attachment Findings": attachment_findings,
         "Attachment Hashes": attachment_hashes,
         "Highlighted Body": highlighted_body,
+        "Auth Results": auth_results,
         "Behavioral Analysis": behavior_result,
         "Behavioral Summary": behavior_text,
         "Scoring Reasoning": reasoning,
     }
     return summary, details