# Fraud_Detection / app.py
# Uploaded by padmanabhbosamia — commit 5253576 (verified), "Update app.py"
import gradio as gr
import pandas as pd
import numpy as np
from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score, confusion_matrix
import pickle
import os
# Global variables to store the model and data
# Shared mutable state: written by load_and_train_model(), read by the
# prediction callbacks below.
model = None            # fitted RandomForestClassifier, or None until training runs
feature_columns = None  # list of training feature column names, or None until training runs
def load_and_train_model(csv_file):
    """Load a labeled transaction CSV and train a Random Forest fraud model.

    Args:
        csv_file: Uploaded file object from gr.File; its ``.name`` attribute
            holds the path of the CSV on disk.

    Returns:
        str: Markdown summary of the training run (dataset stats, metrics,
        confusion matrix), or an error message starting with "❌".
    """
    global model, feature_columns
    try:
        # Read the uploaded CSV
        df = pd.read_csv(csv_file.name)
        # The target column is mandatory.
        if 'fraud' not in df.columns:
            return "❌ Error: CSV must contain a 'fraud' column as the target variable."
        # Features = everything except the label and the optional id column.
        X = df.drop(['fraud', 'transaction_id'], axis=1, errors='ignore')
        y = df['fraud']
        # Guard: stratified splitting and the 2x2 confusion-matrix report below
        # both need at least two samples of each class; fail with a clear
        # message instead of an opaque sklearn exception.
        if y.nunique() < 2 or y.value_counts().min() < 2:
            return "❌ Error: the 'fraud' column must contain at least two samples of each class (0 and 1)."
        feature_columns = X.columns.tolist()
        # Split data (stratified so the rare fraud class appears in both splits)
        X_train, X_test, y_train, y_test = train_test_split(
            X, y, test_size=0.2, random_state=42, stratify=y
        )
        # Train Random Forest model
        model = RandomForestClassifier(n_estimators=100, random_state=42, max_depth=10)
        model.fit(X_train, y_train)
        # Evaluate on the held-out split. zero_division=0 keeps the metrics
        # defined (and warning-free) when the model flags no transactions.
        y_pred = model.predict(X_test)
        accuracy = accuracy_score(y_test, y_pred)
        precision = precision_score(y_test, y_pred, zero_division=0)
        recall = recall_score(y_test, y_pred, zero_division=0)
        f1 = f1_score(y_test, y_pred, zero_division=0)
        # labels=[0, 1] guarantees a 2x2 matrix even if one class is absent
        # from the test predictions, so cm[1][1] etc. never go out of range.
        cm = confusion_matrix(y_test, y_pred, labels=[0, 1])
        # Format results
        results = f"""
✅ **Model Trained Successfully!**
📊 **Dataset Information:**
- Total Samples: {len(df)}
- Training Samples: {len(X_train)}
- Test Samples: {len(X_test)}
- Fraud Cases: {y.sum()} ({y.mean()*100:.1f}%)
- Legitimate Cases: {(y==0).sum()} ({(y==0).mean()*100:.1f}%)
📈 **Model Performance:**
- **Accuracy:** {accuracy*100:.2f}%
- **Precision:** {precision*100:.2f}%
- **Recall:** {recall*100:.2f}%
- **F1-Score:** {f1*100:.2f}%
🔢 **Confusion Matrix:**
```
Predicted
Fraud Legitimate
Actual Fraud {cm[1][1]} {cm[1][0]}
Legit {cm[0][1]} {cm[0][0]}
```
**Key Metrics Explained:**
- **True Positives (TP):** {cm[1][1]} frauds correctly detected
- **False Negatives (FN):** {cm[1][0]} frauds missed (⚠️ costly!)
- **False Positives (FP):** {cm[0][1]} false alarms
- **True Negatives (TN):** {cm[0][0]} legitimate transactions correctly identified
✅ Model is ready! You can now make predictions below.
"""
        return results
    except Exception as e:
        return f"❌ Error: {str(e)}"
def predict_single_transaction(amount, hour, dist_home, dist_last, ratio_median,
                               repeat_retailer, used_chip, used_pin, online_order):
    """Make a prediction for a single transaction.

    Args:
        amount, hour, dist_home, dist_last, ratio_median: numeric inputs
            from the UI (gr.Number / gr.Slider).
        repeat_retailer, used_chip, used_pin, online_order: booleans from
            gr.Checkbox; cast to 0/1 so they match the training dtype.

    Returns:
        tuple[str, str]: (detailed markdown report, short verdict string),
        or an error/warning message and "" when prediction is impossible.
    """
    global model, feature_columns
    if model is None:
        return "⚠️ Please upload and train a model first!", ""
    try:
        # Create input dataframe (checkbox booleans cast to ints to mirror
        # the expected 0/1 encoding of the training CSV).
        input_data = pd.DataFrame({
            'transaction_amount': [amount],
            'transaction_hour': [hour],
            'distance_from_home_km': [dist_home],
            'distance_from_last_transaction_km': [dist_last],
            'ratio_to_median_purchase': [ratio_median],
            'repeat_retailer': [int(repeat_retailer)],
            'used_chip': [int(used_chip)],
            'used_pin': [int(used_pin)],
            'online_order': [int(online_order)]
        })
        # Align column order with the features seen at fit() time — sklearn
        # validates feature names/order of DataFrame inputs.
        if feature_columns is not None:
            input_data = input_data[feature_columns]
        # Make prediction
        prediction = model.predict(input_data)[0]
        probability = model.predict_proba(input_data)[0]
        # predict_proba columns are ordered [P(class 0), P(class 1)]
        fraud_prob = probability[1] * 100
        legit_prob = probability[0] * 100
        if prediction == 1:
            result = "🚨 **FRAUD DETECTED**"
            confidence = fraud_prob
        else:
            result = "✅ **LEGITIMATE TRANSACTION**"
            confidence = legit_prob
        details = f"""
{result}
**Confidence:** {confidence:.1f}%
**Probability Distribution:**
- Fraud: {fraud_prob:.1f}%
- Legitimate: {legit_prob:.1f}%
**Risk Level:** {'🔴 HIGH' if fraud_prob > 70 else '🟡 MEDIUM' if fraud_prob > 40 else '🟢 LOW'}
**Transaction Details:**
- Amount: ${amount:,.2f}
- Time: {hour}:00
- Distance from home: {dist_home:.1f} km
- Distance from last transaction: {dist_last:.1f} km
- Ratio to median: {ratio_median:.2f}x
- Repeat retailer: {'Yes' if repeat_retailer else 'No'}
- Used chip: {'Yes' if used_chip else 'No'}
- Used PIN: {'Yes' if used_pin else 'No'}
- Online order: {'Yes' if online_order else 'No'}
"""
        return details, result
    except Exception as e:
        return f"❌ Error: {str(e)}", ""
def predict_batch(csv_file):
    """Score a CSV of transactions and return a downloadable results file.

    Args:
        csv_file: Uploaded file object from gr.File (path in ``.name``).

    Returns:
        tuple: (path to the results CSV, markdown summary) on success, or
        (None, error/warning message) on failure.
    """
    global model, feature_columns
    if model is None:
        return None, "⚠️ Please upload and train a model first!"
    try:
        import tempfile  # local import: only needed for the output path

        # Read CSV
        df = pd.read_csv(csv_file.name)
        # Keep an untouched copy so predictions can be appended alongside
        # every original column (including ids the model never sees).
        original_df = df.copy()
        # Prepare features (drop label/id if present)
        X = df.drop(['fraud', 'transaction_id'], axis=1, errors='ignore')
        # Align column order with the features seen at fit() time.
        if feature_columns is not None:
            X = X[feature_columns]
        # Make predictions
        predictions = model.predict(X)
        probabilities = model.predict_proba(X)
        # Add predictions to dataframe
        original_df['predicted_fraud'] = predictions
        original_df['fraud_probability'] = probabilities[:, 1] * 100
        original_df['confidence'] = np.max(probabilities, axis=1) * 100
        # Report accuracy metrics only when ground-truth labels are present.
        # zero_division=0 keeps precision/recall defined with no positives.
        if 'fraud' in original_df.columns:
            accuracy = accuracy_score(original_df['fraud'], predictions)
            precision = precision_score(original_df['fraud'], predictions, zero_division=0)
            recall = recall_score(original_df['fraud'], predictions, zero_division=0)
            f1 = f1_score(original_df['fraud'], predictions, zero_division=0)
            metrics = f"""
📊 **Batch Prediction Results:**
- Total Transactions: {len(df)}
- Predicted Fraud: {predictions.sum()} ({predictions.mean()*100:.1f}%)
- Predicted Legitimate: {(predictions==0).sum()} ({(predictions==0).mean()*100:.1f}%)
📈 **Performance Metrics:**
- Accuracy: {accuracy*100:.2f}%
- Precision: {precision*100:.2f}%
- Recall: {recall*100:.2f}%
- F1-Score: {f1*100:.2f}%
✅ Results are ready for download!
"""
        else:
            metrics = f"""
📊 **Batch Prediction Results:**
- Total Transactions: {len(df)}
- Predicted Fraud: {predictions.sum()} ({predictions.mean()*100:.1f}%)
- Predicted Legitimate: {(predictions==0).sum()} ({(predictions==0).mean()*100:.1f}%)
✅ Results are ready for download!
"""
        # Write results to the temp dir: the working directory may be
        # read-only in hosted environments (e.g. Hugging Face Spaces).
        output_file = os.path.join(tempfile.gettempdir(), "predictions_output.csv")
        original_df.to_csv(output_file, index=False)
        return output_file, metrics
    except Exception as e:
        return None, f"❌ Error: {str(e)}"
def calculate_business_impact(total_transactions, fraud_rate_percent, precision, recall,
                              fraud_loss_per_transaction, review_cost_per_transaction):
    """Calculate the financial business impact of a fraud detection model.

    Args:
        total_transactions: transactions processed per month.
        fraud_rate_percent: share of transactions that are fraud, in percent.
        precision: model precision in [0, 1].
        recall: model recall in [0, 1].
        fraud_loss_per_transaction: average $ loss per undetected fraud.
        review_cost_per_transaction: $ cost to manually review one flag.

    Returns:
        str: Markdown report of the monthly/annual financial impact, or an
        error message starting with "❌".
    """
    try:
        # gr.Number may deliver a float; cast so {:,} renders "1,000,000"
        # rather than "1,000,000.0".
        total_transactions = int(total_transactions)
        # Convert fraud rate to decimal
        fraud_rate = fraud_rate_percent / 100
        # Calculate actual frauds in the dataset
        total_frauds = int(total_transactions * fraud_rate)
        total_legitimate = total_transactions - total_frauds
        # Calculate confusion matrix components
        # Recall = TP / (TP + FN) = TP / total_frauds  =>  TP = recall * total_frauds
        true_positives = int(recall * total_frauds)
        false_negatives = total_frauds - true_positives
        # Precision = TP / (TP + FP)  =>  FP = TP * (1/precision - 1)
        false_positives = int(true_positives / precision - true_positives) if precision > 0 else 0
        true_negatives = total_legitimate - false_positives
        # Calculate financial impact
        # Frauds caught (prevented losses)
        fraud_losses_prevented = true_positives * fraud_loss_per_transaction
        # Frauds missed (actual losses)
        fraud_losses_incurred = false_negatives * fraud_loss_per_transaction
        # Review costs (for all flagged transactions)
        total_flagged = true_positives + false_positives
        total_review_costs = total_flagged * review_cost_per_transaction
        # Net benefit
        net_benefit = fraud_losses_prevented - fraud_losses_incurred - total_review_costs
        # Without model (baseline - all frauds go through)
        baseline_losses = total_frauds * fraud_loss_per_transaction
        savings_vs_baseline = baseline_losses - fraud_losses_incurred - total_review_costs
        # Calculate percentages (guarded against empty classes)
        fraud_detection_rate = (true_positives / total_frauds * 100) if total_frauds > 0 else 0
        false_positive_rate = (false_positives / total_legitimate * 100) if total_legitimate > 0 else 0
        # Cost-efficiency ratio for the report; guard against division by
        # zero when the model catches no fraud at all (recall == 0).
        review_cost_per_dollar_saved = (total_review_costs / fraud_losses_prevented) if fraud_losses_prevented > 0 else 0
        # Format results
        results = f"""
## 💰 Business Impact Analysis
### 📊 Transaction Breakdown
- **Total Transactions:** {total_transactions:,} per month
- **Actual Frauds:** {total_frauds:,} ({fraud_rate_percent:.2f}%)
- **Legitimate Transactions:** {total_legitimate:,} ({100-fraud_rate_percent:.2f}%)
### 🎯 Model Performance
- **Precision:** {precision*100:.1f}% (of flagged, {precision*100:.1f}% are actually fraud)
- **Recall:** {recall*100:.1f}% (catches {recall*100:.1f}% of all frauds)
### 🔍 Detection Results
- **✅ True Positives (Frauds Caught):** {true_positives:,} ({fraud_detection_rate:.1f}% of frauds)
- **❌ False Negatives (Frauds Missed):** {false_negatives:,} ({100-fraud_detection_rate:.1f}% of frauds)
- **⚠️ False Positives (False Alarms):** {false_positives:,} ({false_positive_rate:.2f}% of legitimate)
- **✅ True Negatives (Correctly Allowed):** {true_negatives:,}
### 💵 Financial Impact (Monthly)
**Fraud Prevention:**
- **Losses Prevented:** ${fraud_losses_prevented:,.2f}
- ({true_positives:,} frauds caught × ${fraud_loss_per_transaction:,.2f})
**Losses Incurred:**
- **Missed Fraud Losses:** ${fraud_losses_incurred:,.2f}
- ({false_negatives:,} frauds missed × ${fraud_loss_per_transaction:,.2f})
**Operational Costs:**
- **Manual Review Costs:** ${total_review_costs:,.2f}
- ({total_flagged:,} flagged transactions × ${review_cost_per_transaction:,.2f})
### 📈 **Net Benefit: ${net_benefit:,.2f} per month**
### 🎯 **Primary Benefit:**
**The model saves ${savings_vs_baseline:,.2f} per month compared to having no fraud detection system.**
**Annual Impact:** ${net_benefit * 12:,.2f}
### 📊 Key Insights:
1. **Fraud Detection Rate:** {fraud_detection_rate:.1f}% of frauds are caught
2. **Cost Efficiency:** Every ${review_cost_per_dollar_saved:.2f} spent on reviews prevents ${fraud_loss_per_transaction:.2f} in fraud
3. **ROI:** {((net_benefit / total_review_costs) * 100) if total_review_costs > 0 else 0:.1f}% return on review investment
4. **Remaining Risk:** {false_negatives:,} frauds still slip through (${fraud_losses_incurred:,.2f} in losses)
### ⚠️ Recommendations:
- **Current Recall ({recall*100:.1f}%):** Missing {false_negatives:,} frauds costs ${fraud_losses_incurred:,.2f}/month
- Consider improving recall to reduce missed frauds
- Balance precision to control review costs
"""
        return results
    except Exception as e:
        return f"❌ Error calculating business impact: {str(e)}"
def analyze_model_drift(initial_precision, current_precision, months_deployed,
                        initial_recall, current_recall):
    """Analyze model drift and provide recommendations.

    Args:
        initial_precision: precision at deployment time, in [0, 1].
        current_precision: precision measured now, in [0, 1].
        months_deployed: months the model has been in production.
        initial_recall: recall at deployment time, in [0, 1].
        current_recall: recall measured now, in [0, 1].

    Returns:
        str: Markdown report (severity, likely causes, prioritized actions),
        or an error message starting with "❌".
    """
    try:
        # Absolute and relative degradation; relative values guarded
        # against zero initial metrics.
        precision_drop = initial_precision - current_precision
        precision_drop_pct = (precision_drop / initial_precision * 100) if initial_precision > 0 else 0
        recall_change = current_recall - initial_recall
        recall_change_pct = (recall_change / initial_recall * 100) if initial_recall > 0 else 0
        # Determine severity from the relative precision drop.
        if precision_drop_pct > 20:
            severity = "🔴 CRITICAL"
            urgency = "Immediate action required"
        elif precision_drop_pct > 10:
            severity = "🟠 HIGH"
            urgency = "Action needed within 1-2 weeks"
        else:
            severity = "🟡 MODERATE"
            urgency = "Monitor closely, plan retraining"
        # Most likely causes (in order of probability); the first entry is
        # worded more strongly for large drops.
        causes = []
        if precision_drop_pct > 15:
            causes.append({
                "rank": 1,
                "cause": "**Data Drift / Distribution Shift**",
                "description": "The statistical distribution of incoming transactions has changed. Legitimate customer behavior patterns have shifted (e.g., new spending habits, new products, seasonal changes, post-pandemic behavior changes).",
                "probability": "Very High (80-90%)"
            })
        else:
            causes.append({
                "rank": 1,
                "cause": "**Data Drift / Distribution Shift**",
                "description": "Gradual changes in transaction patterns over time.",
                "probability": "High (70-80%)"
            })
        causes.append({
            "rank": 2,
            "cause": "**Concept Drift**",
            "description": "The relationship between features and fraud has changed. Fraudsters have adapted their tactics to evade detection, or new fraud patterns have emerged that weren't in training data.",
            "probability": "Medium-High (50-60%)"
        })
        causes.append({
            "rank": 3,
            "cause": "**Feature Drift**",
            "description": "Individual features have changed meaning or distribution. Examples: new payment methods, changes in merchant categories, updated transaction processing systems.",
            "probability": "Medium (30-40%)"
        })
        causes.append({
            "rank": 4,
            "cause": "**Label Quality Issues**",
            "description": "Ground truth labels may have become less accurate, or fraud definition has changed. This is less common but can cause apparent precision drops.",
            "probability": "Low (10-20%)"
        })
        # Appropriate actions, rendered below in priority order.
        actions = [
            {
                "priority": "🔴 IMMEDIATE",
                "action": "**Data Distribution Analysis**",
                "steps": [
                    "Compare feature distributions of recent data vs training data",
                    "Use statistical tests (KS test, PSI - Population Stability Index)",
                    "Identify which features have drifted most significantly",
                    "Check for missing values, outliers, or data quality issues"
                ]
            },
            {
                "priority": "🔴 IMMEDIATE",
                "action": "**Model Retraining**",
                "steps": [
                    "Collect recent labeled data (last 1-3 months)",
                    "Retrain model with updated dataset",
                    "Use time-based train/test splits (not random)",
                    "Consider ensemble with older model for stability",
                    "Validate on holdout set before deployment"
                ]
            },
            {
                "priority": "🟠 HIGH",
                "action": "**Implement Monitoring**",
                "steps": [
                    "Set up automated drift detection (PSI, feature drift alerts)",
                    "Track precision/recall on rolling windows (daily/weekly)",
                    "Monitor false positive rate trends",
                    "Alert when metrics drop below thresholds",
                    "Dashboard for real-time model health"
                ]
            },
            {
                "priority": "🟠 HIGH",
                "action": "**Threshold Adjustment**",
                "steps": [
                    "Temporarily adjust classification threshold to maintain precision",
                    "Use probability scores instead of binary predictions",
                    "Implement adaptive thresholds based on recent performance",
                    "Balance precision vs recall based on business needs"
                ]
            },
            {
                "priority": "🟡 MEDIUM",
                "action": "**Feature Engineering Updates**",
                "steps": [
                    "Review and update feature engineering logic",
                    "Add new features that capture current fraud patterns",
                    "Remove obsolete features",
                    "Consider interaction features or time-based features"
                ]
            },
            {
                "priority": "🟡 MEDIUM",
                "action": "**Continuous Learning Pipeline**",
                "steps": [
                    "Implement periodic retraining schedule (monthly/quarterly)",
                    "Use online learning or incremental updates if applicable",
                    "A/B test new model versions before full deployment",
                    "Maintain model versioning and rollback capability"
                ]
            }
        ]
        # Format results (header + most likely cause first).
        results = f"""
## 🔍 Model Drift Analysis
### 📉 Performance Degradation
- **Initial Precision:** {initial_precision*100:.1f}%
- **Current Precision:** {current_precision*100:.1f}%
- **Precision Drop:** {precision_drop*100:.1f} percentage points ({precision_drop_pct:.1f}% relative decrease)
- **Deployment Duration:** {months_deployed} months
- **Initial Recall:** {initial_recall*100:.1f}%
- **Current Recall:** {current_recall*100:.1f}%
- **Recall Change:** {recall_change*100:+.1f} percentage points ({recall_change_pct:+.1f}% relative change)
### {severity} - {urgency}
---
## 🎯 Most Likely Cause
### {causes[0]['rank']}. {causes[0]['cause']}
**Probability:** {causes[0]['probability']}
**Explanation:**
{causes[0]['description']}
**Why This Matters:**
- Lower precision = More false positives
- More legitimate transactions flagged for review
- Increased operational costs and customer friction
- Model is becoming less reliable over time
---
## 🔧 Appropriate Actions (Priority Order)
"""
        # Render each action as a heading plus a numbered step list.
        for action in actions:
            results += f"""
### {action['priority']} {action['action']}
"""
            for i, step in enumerate(action['steps'], 1):
                results += f"{i}. {step}\n"
            results += "\n"
        results += f"""
---
## 📊 Additional Considerations
### Why Precision Drops Are Critical:
1. **Financial Impact:** More false positives = higher review costs
2. **Customer Experience:** Legitimate customers face more friction
3. **Operational Burden:** Review teams overwhelmed with false alarms
4. **Trust Erosion:** Model loses credibility if too many false alarms
### Prevention Strategy:
- **Proactive Monitoring:** Don't wait for metrics to drop
- **Regular Retraining:** Schedule periodic model updates (every 1-3 months)
- **Data Quality:** Ensure incoming data matches training data characteristics
- **Feedback Loops:** Incorporate labeled outcomes back into training data
### Expected Timeline:
- **Immediate (Week 1):** Data analysis, threshold adjustment
- **Short-term (Weeks 2-4):** Model retraining, validation
- **Long-term (Ongoing):** Continuous monitoring, scheduled retraining
---
## 💡 Key Takeaway
**The most likely cause is DATA DRIFT** - your model was trained on data from 3+ months ago, and transaction patterns have changed. The model needs to be retrained on recent data to adapt to current patterns.
**Action:** Implement a retraining pipeline with recent labeled data and set up continuous monitoring to catch drift early.
"""
        return results
    except Exception as e:
        return f"❌ Error analyzing model drift: {str(e)}"
# Create Gradio interface
# Top-level UI: one tab per workflow (train, single prediction, batch
# prediction, business-impact calculator, drift analysis, about). Each tab
# wires its button to one of the callbacks defined above via .click().
with gr.Blocks(title="Fraud Detection System") as demo:
    gr.Markdown("""
# 💳 Credit Card Fraud Detection System
### AI Infinity Programme | TalentSprint
This interactive demo allows you to train a fraud detection model and make predictions on credit card transactions.
**How to use:**
1. Upload your training dataset (CSV file)
2. Train the model
3. Make single predictions or batch predictions
""")
    # --- Tab 1: upload a labeled CSV and train the Random Forest ---
    with gr.Tab("📤 Upload & Train Model"):
        gr.Markdown("### Step 1: Upload Training Dataset")
        gr.Markdown("Upload a CSV file containing transaction data with a 'fraud' column (0 = legitimate, 1 = fraud)")
        with gr.Row():
            with gr.Column():
                train_file = gr.File(label="Upload Training CSV", file_types=[".csv"])
                train_button = gr.Button("🚀 Train Model", variant="primary", size="lg")
            with gr.Column():
                train_output = gr.Markdown(label="Training Results")
        train_button.click(
            fn=load_and_train_model,
            inputs=[train_file],
            outputs=[train_output]
        )
        gr.Markdown("""
---
**Expected CSV format:**
- `transaction_amount`, `transaction_hour`, `distance_from_home_km`, `distance_from_last_transaction_km`,
- `ratio_to_median_purchase`, `repeat_retailer`, `used_chip`, `used_pin`, `online_order`, `fraud`
""")
    # --- Tab 2: score a single hand-entered transaction ---
    with gr.Tab("🔍 Single Prediction"):
        gr.Markdown("### Test Individual Transactions")
        gr.Markdown("Enter transaction details to check if it's fraudulent")
        with gr.Row():
            with gr.Column():
                amount = gr.Number(label="Transaction Amount ($)", value=100)
                hour = gr.Slider(0, 23, step=1, label="Transaction Hour (0-23)", value=14)
                dist_home = gr.Number(label="Distance from Home (km)", value=10)
                dist_last = gr.Number(label="Distance from Last Transaction (km)", value=5)
                ratio_median = gr.Number(label="Ratio to Median Purchase", value=1.0)
            with gr.Column():
                repeat_retailer = gr.Checkbox(label="Repeat Retailer", value=True)
                used_chip = gr.Checkbox(label="Used Chip", value=True)
                used_pin = gr.Checkbox(label="Used PIN", value=True)
                online_order = gr.Checkbox(label="Online Order", value=False)
        predict_button = gr.Button("🔮 Predict", variant="primary", size="lg")
        with gr.Row():
            prediction_output = gr.Markdown(label="Prediction Result")
            prediction_label = gr.Markdown(label="Quick Result")
        predict_button.click(
            fn=predict_single_transaction,
            inputs=[amount, hour, dist_home, dist_last, ratio_median,
                    repeat_retailer, used_chip, used_pin, online_order],
            outputs=[prediction_output, prediction_label]
        )
        gr.Markdown("---")
        gr.Markdown("### 🧪 Quick Test Scenarios")
        with gr.Row():
            gr.Markdown("""
**Scenario 1: Obvious Fraud**
- Amount: $4500, Hour: 3, Dist Home: 800km
- New retailer, no chip/PIN, online
""")
            gr.Markdown("""
**Scenario 2: Normal Transaction**
- Amount: $45, Hour: 14, Dist Home: 5km
- Repeat retailer, chip + PIN, in-person
""")
            gr.Markdown("""
**Scenario 3: Suspicious**
- Amount: $350, Hour: 22, Dist Home: 60km
- New retailer, chip but no PIN, online
""")
    # --- Tab 3: score a whole CSV and offer the results for download ---
    with gr.Tab("📊 Batch Predictions"):
        gr.Markdown("### Upload Multiple Transactions")
        gr.Markdown("Upload a CSV file with multiple transactions to get predictions for all of them")
        with gr.Row():
            with gr.Column():
                batch_file = gr.File(label="Upload Test CSV", file_types=[".csv"])
                batch_button = gr.Button("📈 Predict Batch", variant="primary", size="lg")
            with gr.Column():
                batch_output = gr.Markdown(label="Batch Results")
                download_file = gr.File(label="Download Results CSV")
        batch_button.click(
            fn=predict_batch,
            inputs=[batch_file],
            outputs=[download_file, batch_output]
        )
    # --- Tab 4: what-if financial analysis from metrics alone ---
    with gr.Tab("💰 Business Impact Calculator"):
        gr.Markdown("### Calculate Financial Impact of Your Fraud Detection Model")
        gr.Markdown("Enter your model's performance metrics and business parameters to see the financial impact")
        with gr.Row():
            with gr.Column():
                gr.Markdown("#### 📊 Model Performance Metrics")
                precision_input = gr.Slider(0, 1, step=0.01, value=0.85, label="Precision (0-1)", info="Of flagged transactions, what % are actually fraud?")
                recall_input = gr.Slider(0, 1, step=0.01, value=0.90, label="Recall (0-1)", info="Of all frauds, what % does the model catch?")
                gr.Markdown("#### 🏦 Business Parameters")
                total_transactions = gr.Number(label="Total Transactions per Month", value=1000000, precision=0)
                fraud_rate = gr.Slider(0, 10, step=0.01, value=1.0, label="Fraud Rate (%)", info="Percentage of transactions that are fraudulent")
                gr.Markdown("#### 💵 Cost Parameters")
                fraud_loss = gr.Number(label="Average Fraud Loss per Transaction ($)", value=500, precision=2)
                review_cost = gr.Number(label="Manual Review Cost per Flagged Transaction ($)", value=2.00, precision=2)
                calc_button = gr.Button("💰 Calculate Business Impact", variant="primary", size="lg")
            with gr.Column():
                impact_output = gr.Markdown(label="Business Impact Analysis")
        calc_button.click(
            fn=calculate_business_impact,
            inputs=[total_transactions, fraud_rate, precision_input, recall_input, fraud_loss, review_cost],
            outputs=[impact_output]
        )
        gr.Markdown("---")
        gr.Markdown("""
### 📚 How to Use This Calculator
**Example Scenario:**
- Bank processes 1 million transactions/month
- Model has 85% precision and 90% recall
- 1% of transactions are fraudulent
- Average fraud loss: $500 per transaction
- Manual review cost: $2 per flagged transaction
**What This Calculates:**
1. **True Positives:** Frauds caught by the model
2. **False Negatives:** Frauds missed (costly!)
3. **False Positives:** Legitimate transactions flagged (review costs)
4. **Net Benefit:** Total financial impact of using the model
**Key Insight:** The primary benefit is the **net savings** compared to having no fraud detection system.
""")
    # --- Tab 5: diagnose precision/recall degradation over time ---
    with gr.Tab("📉 Model Drift Analysis"):
        gr.Markdown("### Analyze Model Performance Degradation")
        gr.Markdown("If your model's precision or recall has dropped over time, use this tool to identify likely causes and appropriate actions")
        with gr.Row():
            with gr.Column():
                gr.Markdown("#### 📊 Initial Performance (At Deployment)")
                initial_precision = gr.Slider(0, 1, step=0.01, value=0.85, label="Initial Precision", info="Model precision when first deployed")
                initial_recall = gr.Slider(0, 1, step=0.01, value=0.90, label="Initial Recall", info="Model recall when first deployed")
                gr.Markdown("#### 📉 Current Performance (Now)")
                current_precision = gr.Slider(0, 1, step=0.01, value=0.70, label="Current Precision", info="Model precision after deployment period")
                current_recall = gr.Slider(0, 1, step=0.01, value=0.90, label="Current Recall", info="Model recall now (may have changed)")
                gr.Markdown("#### ⏱️ Deployment Information")
                months_deployed = gr.Number(label="Months Since Deployment", value=3, precision=1, info="How long has the model been in production?")
                analyze_button = gr.Button("🔍 Analyze Model Drift", variant="primary", size="lg")
            with gr.Column():
                drift_output = gr.Markdown(label="Drift Analysis & Recommendations")
        analyze_button.click(
            fn=analyze_model_drift,
            inputs=[initial_precision, current_precision, months_deployed, initial_recall, current_recall],
            outputs=[drift_output]
        )
        gr.Markdown("---")
        gr.Markdown("""
### 📚 Understanding Model Drift
**What is Model Drift?**
Model drift occurs when a machine learning model's performance degrades over time because the data it encounters in production differs from the data it was trained on.
**Common Scenarios:**
- **Precision drops from 85% to 70%** → More false positives (legitimate transactions flagged)
- **Recall drops** → More frauds missed (false negatives)
- **Both drop** → Model is becoming unreliable
**Why It Happens:**
1. Customer behavior changes (new spending patterns, seasonal trends)
2. Fraudsters adapt their tactics
3. New products/services introduced
4. Changes in transaction processing systems
5. External factors (economic changes, regulations)
**Example:**
After 3 months, precision drops from 85% to 70%. This means:
- Previously: 85 out of 100 flagged transactions were fraud
- Now: Only 70 out of 100 flagged transactions are fraud
- **30% increase in false positives** = Higher review costs, customer friction
""")
    # --- Tab 6: static documentation about the demo ---
    with gr.Tab("ℹ️ About"):
        gr.Markdown("""
## About This Demo
This fraud detection system uses a **Random Forest Classifier** to identify potentially fraudulent credit card transactions.
### Features Used:
1. **transaction_amount**: Transaction value in dollars
2. **transaction_hour**: Hour of day (0-23)
3. **distance_from_home_km**: Distance from cardholder's home
4. **distance_from_last_transaction_km**: Distance from previous transaction
5. **ratio_to_median_purchase**: Ratio compared to typical spending
6. **repeat_retailer**: Whether customer used this merchant before
7. **used_chip**: Whether chip card was used
8. **used_pin**: Whether PIN was entered
9. **online_order**: Whether transaction was online
### Model Performance:
The model is trained to maximize **recall** (catching frauds) while maintaining reasonable **precision** (avoiding false alarms).
### Important Metrics:
- **Precision**: Of flagged transactions, how many are actually fraud?
- **Recall**: Of all frauds, how many do we catch?
- **F1-Score**: Balance between precision and recall
### Business Impact:
- **False Negative (missed fraud)**: Very costly - customer loses money
- **False Positive (false alarm)**: Moderately costly - customer inconvenience
---
**Created for:** AI Infinity Programme | TalentSprint
**Target Audience:** Software engineers transitioning to AI roles
**Educational Purpose:** Understanding classification, metrics, and business logic
""")
# Launch the app
# Entry point when executed directly (e.g. `python app.py` or a HF Space).
if __name__ == "__main__":
    demo.launch()