Spaces:

Ariyan-Pro
/

Self-Healing-ML-Pipelines

Sleeping

App Files Files Community

Self-Healing-ML-Pipelines / experiments /concept_shift_simulator.py

Ariyan-Pro

🚀 Initial upload: Self-Healing ML Pipelines

11898c7 verified 4 months ago

raw

history blame contribute delete

9.86 kB

	"""
	Concept Shift Simulator for ML pipeline testing
	"""
	import numpy as np
	import pandas as pd
	from sklearn.linear_model import LogisticRegression
	from sklearn.model_selection import train_test_split
	from sklearn.metrics import accuracy_score
	import time
	import json
	from datetime import datetime

	class ConceptShiftSimulator:
	"""Simulates concept shift (relationship changes) in ML data"""

	def __init__(self, seed=42):
	self.seed = seed
	np.random.seed(seed)
	self.results = []

	def generate_synthetic_data(self, n_samples=1000, n_features=10):
	"""Generate synthetic classification data"""
	X = np.random.randn(n_samples, n_features)

	# Create meaningful coefficients
	coefficients = np.random.randn(n_features)
	coefficients = coefficients / np.linalg.norm(coefficients)

	# Generate labels with some noise
	logits = X @ coefficients
	probabilities = 1 / (1 + np.exp(-logits))
	y = (probabilities > 0.5).astype(int)

	# Add some label noise
	noise_mask = np.random.random(n_samples) < 0.1
	y[noise_mask] = 1 - y[noise_mask]

	return X, y, coefficients

	def induce_concept_shift(self, X, coefficients, shift_type='abrupt', magnitude=0.3):
	"""Induce concept shift by changing feature relationships"""
	n_samples, n_features = X.shape

	if shift_type == 'abrupt':
	# Abrupt change: flip signs of some coefficients
	new_coefficients = coefficients.copy()
	# Fix: Use len(new_coefficients) instead of n_features
	new_coefficients[:int(len(new_coefficients) * magnitude)] *= -1

	elif shift_type == 'gradual':
	# Gradual change: interpolate between original and flipped
	new_coefficients = coefficients.copy()
	flip_indices = np.random.choice(
	n_features,
	size=int(n_features * magnitude),
	replace=False
	)
	for idx in flip_indices:
	new_coefficients[idx] = -coefficients[idx] * magnitude

	elif shift_type == 'recurring':
	# Recurring: oscillate between patterns
	new_coefficients = coefficients.copy()
	oscillation = np.sin(np.arange(n_features) * 0.5) * magnitude
	new_coefficients *= (1 + oscillation)

	# Generate new labels with shifted concept
	logits = X @ new_coefficients
	probabilities = 1 / (1 + np.exp(-logits))
	y_shifted = (probabilities > 0.5).astype(int)

	# Add noise
	noise_mask = np.random.random(n_samples) < 0.1
	y_shifted[noise_mask] = 1 - y_shifted[noise_mask]

	return X, y_shifted, new_coefficients

	def train_model(self, X_train, y_train):
	"""Train a simple classifier"""
	model = LogisticRegression(random_state=self.seed, max_iter=1000)
	model.fit(X_train, y_train)
	return model

	def evaluate_shift(self, model, X_test, y_original, y_shifted):
	"""Evaluate impact of concept shift"""
	# Predictions on original and shifted data
	y_pred_original = model.predict(X_test)
	y_pred_shifted = model.predict(X_test)

	# Calculate metrics
	acc_original = accuracy_score(y_original, y_pred_original)
	acc_shifted = accuracy_score(y_shifted, y_pred_shifted)

	accuracy_drop = acc_original - acc_shifted

	# Calculate drift score (difference in prediction distributions)
	drift_score = np.abs(y_pred_original - y_pred_shifted).mean()

	return {
	'accuracy_original': acc_original,
	'accuracy_shifted': acc_shifted,
	'accuracy_drop': accuracy_drop,
	'drift_score': drift_score,
	'shift_detected': accuracy_drop > 0.1 # Threshold for detection
	}

	def run_experiment(self, shift_type='abrupt', magnitude=0.3):
	"""Run a complete concept shift experiment"""
	print(f"\n🔍 Running Concept Shift Experiment:")
	print(f" Type: {shift_type}")
	print(f" Magnitude: {magnitude}")

	# 1. Generate data
	X, y_original, coefficients = self.generate_synthetic_data()
	X_train, X_test, y_train, y_test = train_test_split(
	X, y_original, test_size=0.3, random_state=self.seed
	)

	# 2. Train initial model
	start_time = time.time()
	model = self.train_model(X_train, y_train)
	training_time = (time.time() - start_time) * 1000 # ms

	# 3. Induce concept shift in test data
	X_test_shifted, y_test_shifted, _ = self.induce_concept_shift(
	X_test, coefficients, shift_type, magnitude
	)

	# 4. Evaluate shift
	start_time = time.time()
	evaluation = self.evaluate_shift(model, X_test, y_test, y_test_shifted)
	evaluation_time = (time.time() - start_time) * 1000 # ms

	# 5. Record results
	result = {
	'shift_type': shift_type,
	'magnitude': magnitude,
	'training_time_ms': training_time,
	'evaluation_time_ms': evaluation_time,
	**evaluation
	}

	self.results.append(result)

	# 6. Print results
	print(f"📊 Results:")
	print(f" Accuracy drop: {result['accuracy_drop']:.3f}")
	print(f" Drift score: {result['drift_score']:.3f}")
	print(f" Shift detected: {result['shift_detected']}")
	print(f" Training time: {training_time:.2f} ms")
	print(f" Evaluation time: {evaluation_time:.2f} ms")

	return result

	def run_comprehensive_test(self):
	"""Run multiple concept shift scenarios"""
	print("🧪 Running comprehensive concept shift experiments...")

	scenarios = [
	('abrupt', 0.1),
	('abrupt', 0.3),
	('abrupt', 0.5),
	('gradual', 0.2),
	('gradual', 0.4),
	('recurring', 0.3)
	]

	for shift_type, magnitude in scenarios:
	try:
	self.run_experiment(shift_type, magnitude)
	except Exception as e:
	print(f"❌ Error in scenario ({shift_type}, {magnitude}): {e}")
	# Continue with other scenarios
	continue

	return self.generate_summary_report()

	def generate_summary_report(self):
	"""Generate comprehensive experiment report"""
	if not self.results:
	print("⚠️ No results to summarize")
	return None

	print("\n" + "="*60)
	print("📈 CONCEPT SHIFT EXPERIMENT SUMMARY")
	print("="*60)

	# Calculate statistics
	detected = [r for r in self.results if r['shift_detected']]
	not_detected = [r for r in self.results if not r['shift_detected']]

	print(f"\nDetection Performance:")
	print(f" Shifts detected: {len(detected)}/{len(self.results)} scenarios")

	if detected:
	avg_accuracy_drop = np.mean([r['accuracy_drop'] for r in detected])
	avg_drift_score = np.mean([r['drift_score'] for r in detected])
	avg_eval_time = np.mean([r['evaluation_time_ms'] for r in detected])

	print(f"\n📊 Metrics (detected scenarios):")
	print(f" Average accuracy drop: {avg_accuracy_drop:.3f}")
	print(f" Average drift score: {avg_drift_score:.3f}")
	print(f" Average evaluation time: {avg_eval_time:.2f} ms")

	# Save detailed results
	timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
	output_file = f"concept_shift_results_{timestamp}.json"

	with open(output_file, 'w') as f:
	json.dump({
	'timestamp': datetime.now().isoformat(),
	'scenarios': len(self.results),
	'detected': len(detected),
	'results': self.results,
	'summary': {
	'detection_rate': len(detected)/len(self.results) if self.results else 0,
	'avg_accuracy_drop': float(avg_accuracy_drop) if detected else 0,
	'avg_drift_score': float(avg_drift_score) if detected else 0
	}
	}, f, indent=2, default=str)

	print(f"\n📁 Detailed results saved to: {output_file}")

	return {
	'detection_rate': len(detected)/len(self.results) if self.results else 0,
	'avg_accuracy_drop': avg_accuracy_drop if detected else 0,
	'avg_drift_score': avg_drift_score if detected else 0,
	'output_file': output_file
	}

	def main():
	"""Command-line interface"""
	import argparse

	parser = argparse.ArgumentParser(description='Run concept shift experiments')
	parser.add_argument('--scenario', type=str, default='comprehensive',
	choices=['abrupt', 'gradual', 'recurring', 'comprehensive'],
	help='Concept shift scenario to run')
	parser.add_argument('--magnitude', type=float, default=0.3,
	help='Shift magnitude (0.1 to 0.5)')

	args = parser.parse_args()

	simulator = ConceptShiftSimulator()

	if args.scenario == 'comprehensive':
	print("🧪 Running comprehensive concept shift experiments...")
	simulator.run_comprehensive_test()
	else:
	print(f"🧪 Running {args.scenario} concept shift experiment...")
	simulator.run_experiment(args.scenario, args.magnitude)

	if __name__ == "__main__":
	main()