Spaces:

testpj
/

email-classification

Configuration error

sajadup

Merge remote files and add my email app

591f049 16 days ago

21.2 kB

	import os
	import gc
	import re
	import torch
	import numpy as np
	import firebase_admin
	from firebase_admin import credentials, db
	from fastapi import FastAPI, Form, Request
	from fastapi.responses import HTMLResponse
	from transformers import (
	AutoTokenizer,
	AutoConfig,
	DistilBertForSequenceClassification,
	T5ForConditionalGeneration,
	T5Tokenizer
	)
	from lime.lime_text import LimeTextExplainer
	import uuid
	from datetime import datetime

	# FIREBASE INITIALIZATION
	# Ensure your serviceAccountKey.json is in the same directory
	if not firebase_admin._apps:
	cred = credentials.Certificate("serviceAccountKey.json")
	firebase_admin.initialize_app(cred, {
	'databaseURL': 'https://your-project-id.firebaseio.com/' # <--- Add Firebase URL here
	})

	app = FastAPI()

	# Global variables
	tokenizer = None
	model = None
	explainer = LimeTextExplainer(class_names=["LEGITIMATE", "PHISHING"])
	gen_tokenizer = None
	gen_model = None
	MODEL_DIR = "phishing_model_optimized"
	WEIGHTS_NAME = "quantized_model.pt"


	# PHISHING INDICATOR PATTERNS (Original Rule-Based)

	PHISHING_PATTERNS = {
	"urgency": [
	r"\bimmediate(ly)?\b", r"\burgent(ly)?\b", r"\bact now\b",
	r"\baction required\b", r"\bwithin \d+ (hour\|minute\|day)s?\b",
	r"\bexpir(e\|es\|ing\|ed)\b", r"\bsuspended\b", r"\bcompromised\b",
	r"\bverify (now\|immediately\|your)\b", r"\bfailure to\b",
	r"\bpermanent(ly)?\b", r"\bdelete(d)?\b", r"\block(ed)?\b"
	],
	"threat": [
	r"\baccount.(suspend\|terminat\|delet\|lock\|compromis)\w",
	r"\b(suspend\|terminat\|delet\|lock\|compromis)\w.account\b",
	r"\blegal action\b", r"\bpenalt(y\|ies)\b", r"\bconsequences\b"
	],
	"credential_request": [
	r"\bpassword\b", r"\bverify your (identity\|account\|email)\b",
	r"\bconfirm your\b", r"\bupdate.*(payment\|billing\|account)\b",
	r"\bssn\b", r"\bcredit card\b", r"\bbank account\b"
	],
	"suspicious_links": [
	r"https?://[^\s]*\.(xyz\|tk\|ml\|ga\|cf\|gq\|top\|club\|online)/",
	r"https?://[^\s]-[^\s]\.(com\|net\|org)/",
	r"https?://\d+\.\d+\.\d+\.\d+",
	r"bit\.ly\|tinyurl\|short\.link\|t\.co",
	r"click.here\|click.below\|click.*link"
	],
	"impersonation": [
	r"\b(paypal\|amazon\|netflix\|apple\|microsoft\|google\|bank)\b",
	r"\bcustomer (service\|support)\b", r"\bsecurity (team\|department)\b"
	]
	}

	def detect_phishing_indicators(text: str) -> dict:
	text_lower = text.lower()
	detected = {cat: [] for cat in PHISHING_PATTERNS}
	for category, patterns in PHISHING_PATTERNS.items():
	for pattern in patterns:
	matches = re.findall(pattern, text_lower, re.IGNORECASE)
	if matches:
	detected[category].extend(matches if isinstance(matches[0], str) else [m[0] for m in matches])
	for category in detected:
	detected[category] = list(set(detected[category]))
	return detected

	def calculate_phishing_score(indicators: dict) -> float:
	weights = {"urgency": 0.25, "threat": 0.25, "credential_request": 0.20, "suspicious_links": 0.20, "impersonation": 0.10}
	score = 0.0
	for category, weight in weights.items():
	if indicators[category]:
	category_score = min(len(indicators[category]) * 0.4, 1.0)
	score += weight * category_score
	return min(score, 1.0)

	def get_confidence_label(confidence: float) -> str:
	"""Determine confidence level descriptor based on score"""
	if confidence >= 0.90:
	return "high confidence"
	elif confidence >= 0.70:
	return "moderate confidence"
	else:
	return "low confidence"

	def generate_explanation_with_flan(indicators: dict, label: str, confidence: float, email_text: str) -> str:
	"""Generate high-quality natural language explanation using FLAN-T5"""

	# Get confidence level descriptor
	confidence_level = get_confidence_label(confidence)

	# Build detailed indicator analysis
	indicator_details = []
	urgency_count = len(indicators["urgency"])
	threat_count = len(indicators["threat"])
	cred_count = len(indicators["credential_request"])
	link_count = len(indicators["suspicious_links"])
	imperson_count = len(indicators["impersonation"])

	if urgency_count > 0:
	urgency_examples = ', '.join([f'"{item}"' for item in indicators['urgency'][:2]])
	indicator_details.append(f"high urgency language ({urgency_count} instances: {urgency_examples})")
	if threat_count > 0:
	threat_examples = ', '.join([f'"{item}"' for item in indicators['threat'][:2]])
	indicator_details.append(f"threatening tone ({threat_count} instances: {threat_examples})")
	if cred_count > 0:
	cred_examples = ', '.join([f'"{item}"' for item in indicators['credential_request'][:2]])
	indicator_details.append(f"credential requests ({cred_count} instances: {cred_examples})")
	if link_count > 0:
	indicator_details.append(f"suspicious links ({link_count} detected)")
	if imperson_count > 0:
	brands = ', '.join(indicators['impersonation'][:2])
	indicator_details.append(f"brand impersonation attempts ({brands})")

	# Create sophisticated prompts based on label
	if label == "PHISHING":
	indicators_summary = "; ".join(indicator_details) if indicator_details else "general phishing patterns"

	prompt = f"""You are a cybersecurity expert. Explain why this email is phishing:

	Email sample: "{email_text[:250]}"

	Detected threats: {indicators_summary}

	Write a clear 2-sentence explanation that:
	1. States the classification with confidence level
	2. Describes specific malicious tactics (urgency, social engineering, credential harvesting, clickbait)
	3. Uses professional security terminology

	Explanation:"""
	else: # LEGITIMATE
	safe_indicators = []
	if not indicators["urgency"] and not indicators["threat"]:
	safe_indicators.append("no urgency or threat language")
	if not indicators["credential_request"]:
	safe_indicators.append("no credential requests")
	if not indicators["suspicious_links"]:
	safe_indicators.append("no suspicious links")
	if not indicators["impersonation"]:
	safe_indicators.append("no brand impersonation")

	safety_summary = ", ".join(safe_indicators) if safe_indicators else "standard communication patterns"

	prompt = f"""You are a cybersecurity expert. Explain why this email is legitimate:

	Email sample: "{email_text[:250]}"

	Safety indicators: {safety_summary}

	Write a clear 2-sentence explanation that:
	1. States the classification with confidence level
	2. Notes the absence of social-engineering cues, suspicious tokens, or phishing tactics
	3. Uses professional security terminology

	Explanation:"""

	try:
	# Tokenize the prompt
	inputs = gen_tokenizer(
	prompt,
	return_tensors="pt",
	max_length=512,
	truncation=True
	)

	# Generate explanation with optimized parameters
	with torch.no_grad():
	outputs = gen_model.generate(
	inputs.input_ids,
	max_length=180,
	min_length=40,
	num_beams=5,
	length_penalty=1.2,
	early_stopping=True,
	temperature=0.8,
	top_p=0.92,
	do_sample=False,
	no_repeat_ngram_size=3
	)

	# Decode the generated text
	explanation = gen_tokenizer.decode(outputs[0], skip_special_tokens=True)

	# Post-process: add confidence level prefix
	explanation = f"The email was classified as {label} with {confidence_level} ({confidence:.2f}). {explanation}"

	return explanation

	except Exception as e:
	print(f"FLAN-T5 generation error: {e}")
	# Enhanced fallback explanations
	if label == "PHISHING":
	reasons = []
	if indicators["urgency"]: reasons.append("uses high urgency tactics")
	if indicators["threat"]: reasons.append("contains threatening language")
	if indicators["credential_request"]: reasons.append("attempts credential harvesting")
	if indicators["suspicious_links"]: reasons.append("includes clickbait keywords")

	reason_text = " and ".join(reasons) if reasons else "exhibits fraudulent patterns"
	return f"The email was classified as PHISHING with {confidence_level} ({confidence:.2f}). The email {reason_text} suggesting a social-engineering attempt to capture sensitive information."
	else:
	return f"The email was classified as LEGITIMATE with {confidence_level} ({confidence:.2f}). The message appears routine and contains no social-engineering cues or suspicious tokens."

	@app.on_event("startup")
	def load_models():
	global tokenizer, model, gen_tokenizer, gen_model
	base_path = os.path.dirname(os.path.abspath(__file__))
	model_path = os.path.join(base_path, MODEL_DIR)
	weights_path = os.path.join(model_path, WEIGHTS_NAME)
	gc.collect()
	try:
	# Load DistilBERT for classification
	tokenizer = AutoTokenizer.from_pretrained(model_path, local_files_only=True)
	config = AutoConfig.from_pretrained(model_path, local_files_only=True)
	base_model = DistilBertForSequenceClassification(config)
	model = torch.quantization.quantize_dynamic(base_model, {torch.nn.Linear}, dtype=torch.qint8)
	if os.path.exists(weights_path):
	model.load_state_dict(torch.load(weights_path, map_location='cpu'))
	model.eval()

	# Load FLAN-T5 for explanation generation
	print("Loading FLAN-T5 for explanation generation...")
	gen_tokenizer = T5Tokenizer.from_pretrained("google/flan-t5-small", legacy=False)
	gen_model = T5ForConditionalGeneration.from_pretrained("google/flan-t5-small")
	gen_model.eval()
	print("FLAN-T5 loaded successfully!")

	except Exception as e:
	print(f"Load Error: {e}")

	def predictor(texts):
	probs_list = []
	for text in texts:
	inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True, max_length=256)
	with torch.no_grad():
	outputs = model(**inputs)
	probs = torch.softmax(outputs.logits, dim=1).numpy()
	probs_list.append(probs[0])
	return np.array(probs_list)

	def hybrid_predict(email_text: str) -> tuple:
	ml_probs = predictor([email_text])[0]
	indicators = detect_phishing_indicators(email_text)
	rule_score = calculate_phishing_score(indicators)
	# Combine scores based on your logic
	if rule_score > 0.5: combined_prob = (ml_probs[1] * 0.3) + (rule_score * 0.7)
	elif rule_score > 0.2: combined_prob = (ml_probs[1] * 0.5) + (rule_score * 0.5)
	else: combined_prob = (ml_probs[1] * 0.7) + (rule_score * 0.3)

	label = "PHISHING" if combined_prob >= 0.5 else "LEGITIMATE"
	confidence = combined_prob if label == "PHISHING" else 1 - combined_prob
	return label, confidence, indicators

	@app.get("/", response_class=HTMLResponse)
	async def index():
	return """
	<html>
	<head><title>Robust Explainable Phishing Classification</title></head>
	<body style="font-family: sans-serif; background: #f4f7f6; display: flex; justify-content: center; padding-top: 50px;">
	<div style="background: white; padding: 40px; border-radius: 15px; box-shadow: 0 10px 30px rgba(0,0,0,0.1); width: 800px;">
	<form action="/predict" method="post">
	<textarea name="email_text" rows="10" style="width: 100%; padding: 10px;" placeholder="Paste email here..." required></textarea>
	<button type="submit" style="width: 100%; background: #007bff; color: white; padding: 15px; margin-top: 10px; border: none; cursor: pointer; border-radius: 8px;">Analyze & Explain</button>
	</form>
	</div>
	</body>
	</html>
	"""

	@app.post("/predict", response_class=HTMLResponse)
	async def predict(email_text: str = Form(...)):
	label, confidence, indicators = hybrid_predict(email_text)

	# Generate unique token for this analysis
	unique_token = str(uuid.uuid4())[:8].upper()
	timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

	# Store analysis data in Firebase for reference
	analysis_ref = db.reference('/analysis_records')
	analysis_ref.child(unique_token).set({
	'timestamp': timestamp,
	'label': label,
	'confidence': float(confidence),
	'email_length': len(email_text)
	})

	# Get LIME explanation for technical keywords
	try:
	exp = explainer.explain_instance(email_text, predictor, num_features=6, num_samples=100)
	keyword_str = ", ".join([word for word, weight in exp.as_list() if abs(weight) > 0.01])
	except:
	keyword_str = "analysis unavailable"

	# Generate natural language explanation using FLAN-T5
	clean_explanation = generate_explanation_with_flan(indicators, label, confidence, email_text)

	color = "#dc3545" if label == "PHISHING" else "#28a745"

	# HTML Result with Enhanced Feedback Form
	return f"""
	<div style="font-family: sans-serif; max-width: 900px; margin: auto; padding: 20px;">
	<div style="background: {color}; color: white; padding: 20px; border-radius: 20px; text-align: center;">
	<h1 style="margin: 0;">{label}</h1>
	<p>Confidence: {confidence:.2%}</p>
	</div>
	<div style="background: white; padding: 30px; border-radius: 15px; margin-top: 30px; box-shadow: 0 5px 15px rgba(0,0,0,0.05);">
	<h3>Security Analysis (FLAN-T5 Generated)</h3>
	<p style="font-size: 1.1em;">{clean_explanation}</p>
	<p><b>Technical Triggers (LIME):</b> {keyword_str}</p>

	<hr style="margin: 40px 0;">

	<h3>Help Us Improve (XAI Evaluation)</h3>
	<div style="background: #f8f9fa; padding: 15px; border-radius: 8px; margin-bottom: 20px;">
	<p style="margin: 5px 0;"><b>Analysis Token:</b> <span style="font-family: monospace; font-size: 1.2em; color: {color}; font-weight: bold;">{unique_token}</span></p>
	<p style="margin: 5px 0; font-size: 0.9em; color: #666;">Please save this token for your records</p>
	</div>

	<form action="/feedback" method="post">
	<input type="hidden" name="token" value="{unique_token}">

	<table style="width: 100%; border-collapse: collapse; margin: 20px 0;">
	<thead>
	<tr style="background: #f1f3f5;">
	<th style="padding: 15px; text-align: left; border: 1px solid #dee2e6; width: 50%;">Evaluation Criteria</th>
	<th style="padding: 10px; text-align: center; border: 1px solid #dee2e6; width: 10%;">1</th>
	<th style="padding: 10px; text-align: center; border: 1px solid #dee2e6; width: 10%;">2</th>
	<th style="padding: 10px; text-align: center; border: 1px solid #dee2e6; width: 10%;">3</th>
	<th style="padding: 10px; text-align: center; border: 1px solid #dee2e6; width: 10%;">4</th>
	<th style="padding: 10px; text-align: center; border: 1px solid #dee2e6; width: 10%;">5</th>
	</tr>
	</thead>
	<tbody>
	<tr>
	<td style="padding: 15px; border: 1px solid #dee2e6; background: #fff;">
	<b>1. Decision Clarity:</b><br>
	<span style="font-size: 0.9em; color: #666;">The explanation helped me understand the result.</span>
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6;">
	<input type="radio" name="understanding" value="1" required style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6;">
	<input type="radio" name="understanding" value="2" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6;">
	<input type="radio" name="understanding" value="3" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6;">
	<input type="radio" name="understanding" value="4" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6;">
	<input type="radio" name="understanding" value="5" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	</tr>
	<tr>
	<td style="padding: 15px; border: 1px solid #dee2e6; background: #f8f9fa;">
	<b>2. Information Focus:</b><br>
	<span style="font-size: 0.9em; color: #666;">The explanation was concise and essential.</span>
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6; background: #f8f9fa;">
	<input type="radio" name="clarity" value="1" required style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6; background: #f8f9fa;">
	<input type="radio" name="clarity" value="2" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6; background: #f8f9fa;">
	<input type="radio" name="clarity" value="3" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6; background: #f8f9fa;">
	<input type="radio" name="clarity" value="4" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	<td style="padding: 10px; text-align: center; border: 1px solid #dee2e6; background: #f8f9fa;">
	<input type="radio" name="clarity" value="5" style="width: 20px; height: 20px; cursor: pointer;">
	</td>
	</tr>
	</tbody>
	</table>

	<p style="font-size: 0.85em; color: #666; text-align: center; margin-top: 10px;">
	Rating Scale: 1 = Strongly Disagree \| 5 = Strongly Agree
	</p>

	<button type="submit" style="width: 100%; background: #28a745; color: white; padding: 12px; border: none; border-radius: 5px; cursor: pointer; font-size: 1.05em; margin-top: 15px;">Submit Feedback to Firebase</button>
	</form>
	</div>

	<div style="text-align: center; margin-top: 20px;">
	<a href="/" style="color: #007bff; text-decoration: none;">← Analyze Another Email</a>
	</div>
	</div>
	"""

	@app.post("/feedback")
	async def save_feedback(token: str = Form(...), understanding: int = Form(...), clarity: int = Form(...)):
	timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

	# Save feedback with token reference
	feedback_ref = db.reference('/xai_feedback')
	feedback_ref.push({
	'token': token,
	'understanding': understanding,
	'clarity': clarity,
	'timestamp': timestamp
	})

	return HTMLResponse(f"""
	<div style="font-family: sans-serif; max-width: 800px; margin: 100px auto; padding: 40px; background: white; border-radius: 15px; box-shadow: 0 10px 30px rgba(0,0,0,0.1); text-align: center;">
	<h2 style="color: #28a745;">Feedback Received!</h2>
	<p>Thank you for contributing to our research.</p>
	<p><b>Your Token:</b> <span style="font-family: monospace; font-size: 1.2em; color: #007bff;">{token}</span></p>
	<a href="/" style="display: inline-block; margin-top: 20px; padding: 12px 30px; background: #007bff; color: white; text-decoration: none; border-radius: 5px;">Go back to Home</a>
	</div>
	""")

	if __name__ == "__main__":
	import uvicorn
	uvicorn.run(app, host="127.0.0.1", port=8000)