Spaces:
Sleeping
Sleeping
Dyuti Dasmahapatra
committed on
Commit
Β·
dd5a03c
1
Parent(s):
a01dc02
Phase 2: Dashboard Integrated
Browse files- app.py +443 -0
- src/auditor.py +471 -0
- tests/test_advanced_features.py +140 -0
app.py
CHANGED
|
@@ -0,0 +1,443 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# app.py
|
| 2 |
+
|
| 3 |
+
import gradio as gr
|
| 4 |
+
import sys
|
| 5 |
+
import os
|
| 6 |
+
import matplotlib.pyplot as plt
|
| 7 |
+
from PIL import Image
|
| 8 |
+
import numpy as np
|
| 9 |
+
import time
|
| 10 |
+
import torch
|
| 11 |
+
|
| 12 |
+
# Add src to path
|
| 13 |
+
sys.path.append(os.path.join(os.path.dirname(__file__), 'src'))
|
| 14 |
+
|
| 15 |
+
from model_loader import load_model_and_processor, SUPPORTED_MODELS
|
| 16 |
+
from predictor import predict_image, create_prediction_plot
|
| 17 |
+
from explainer import explain_attention, explain_gradcam, explain_gradient_shap
|
| 18 |
+
from auditor import create_auditors
|
| 19 |
+
from utils import preprocess_image, get_top_predictions_dict
|
| 20 |
+
|
| 21 |
+
# Global variables to cache model and processor
|
| 22 |
+
model = None
|
| 23 |
+
processor = None
|
| 24 |
+
current_model_name = None
|
| 25 |
+
auditors = None
|
| 26 |
+
|
| 27 |
+
def load_selected_model(model_name):
    """Load the selected model and cache it globally.

    Caches model/processor/auditors in module-level globals so repeated
    calls with the same model name are no-ops.

    Args:
        model_name: checkpoint identifier (a value of SUPPORTED_MODELS).

    Returns:
        str: human-readable status message. Callers detect failure by
        checking for the error marker in this string.
    """
    global model, processor, current_model_name, auditors

    try:
        # Only reload when nothing is cached or a different model is requested.
        if model is None or current_model_name != model_name:
            print(f"Loading model: {model_name}")
            model, processor = load_model_and_processor(model_name)
            current_model_name = model_name

            # Auditors wrap the freshly loaded model, so rebuild them here.
            auditors = create_auditors(model, processor)
            print("✅ Model and auditors loaded successfully!")

        return f"✅ Model loaded: {model_name}"

    except Exception as e:
        # NOTE(review): ✅/❌ markers reconstructed from a garbled source;
        # callers scan the returned string for the error marker — keep
        # these emoji in sync with the checks in the analyze_* callbacks.
        return f"❌ Error loading model: {str(e)}"
|
| 45 |
+
|
| 46 |
+
def analyze_image_basic(image, model_choice, xai_method, layer_index, head_index):
    """
    Basic explainability analysis - the core function for Tab 1.

    Args:
        image: PIL image uploaded by the user (or None).
        model_choice: display key into SUPPORTED_MODELS selected in the UI.
        xai_method: one of "Attention Visualization", "GradCAM", "GradientSHAP".
        layer_index: attention layer to visualize (attention method only).
        head_index: attention head to visualize (attention method only).

    Returns:
        tuple: (processed_image, prediction_figure, explanation_figure, status)
               matching the four Gradio outputs; the first three are None
               when the analysis cannot run.
    """
    try:
        # Load (or reuse the cached) model first; bail out on failure.
        model_status = load_selected_model(SUPPORTED_MODELS[model_choice])
        if "❌" in model_status:
            return None, None, None, model_status

        if image is None:
            return None, None, None, "⚠️ Please upload an image first."

        processed_image = preprocess_image(image)

        # Forward pass + bar plot of the top predictions.
        probs, indices, labels = predict_image(processed_image, model, processor)
        pred_fig = create_prediction_plot(probs, labels)

        # Generate the explanation for the selected XAI method.
        explanation_fig = None

        if xai_method == "Attention Visualization":
            explanation_fig = explain_attention(
                model, processor, processed_image,
                layer_index=layer_index, head_index=head_index
            )

        elif xai_method == "GradCAM":
            # explain_gradcam also returns an overlay image; only the figure
            # is displayed by this tab, so the image is discarded.
            explanation_fig, _ = explain_gradcam(
                model, processor, processed_image
            )

        elif xai_method == "GradientSHAP":
            explanation_fig = explain_gradient_shap(
                model, processor, processed_image, n_samples=3
            )

        # (Removed dead code: get_top_predictions_dict() result was computed
        # here but never used or returned.)
        return processed_image, pred_fig, explanation_fig, f"✅ Analysis complete! Top prediction: {labels[0]} ({probs[0]:.2%})"

    except Exception as e:
        error_msg = f"❌ Analysis failed: {str(e)}"
        print(error_msg)
        return None, None, None, error_msg
|
| 95 |
+
|
| 96 |
+
def analyze_counterfactual(image, model_choice, patch_size, perturbation_type):
    """
    Counterfactual analysis for Tab 2.

    Perturbs patches of the uploaded image and reports how the model's
    top prediction reacts.

    Args:
        image: PIL image uploaded by the user (or None).
        model_choice: display key into SUPPORTED_MODELS.
        patch_size: side length (px) of the square patches to perturb.
        perturbation_type: 'blur', 'blackout', 'gray', or 'noise'.

    Returns:
        tuple: (figure, status_message) — exactly the two Gradio outputs
               wired to this callback. `figure` is None on error.
    """
    try:
        model_status = load_selected_model(SUPPORTED_MODELS[model_choice])
        if "❌" in model_status:
            # BUGFIX: previously returned three values on the error paths,
            # but this callback is wired to only two Gradio outputs
            # ([cf_explanation_display, cf_status_output]); the arity
            # mismatch broke error reporting in the UI.
            return None, model_status

        if image is None:
            return None, "⚠️ Please upload an image first."

        processed_image = preprocess_image(image)

        # Run the patch-perturbation auditor.
        results = auditors['counterfactual'].patch_perturbation_analysis(
            processed_image,
            patch_size=patch_size,
            perturbation_type=perturbation_type
        )

        # Human-readable summary of the key metrics.
        summary = (
            f"🔄 Counterfactual Analysis Complete!\n"
            f"• Avg confidence change: {results['avg_confidence_change']:.4f}\n"
            f"• Prediction flip rate: {results['prediction_flip_rate']:.2%}\n"
            f"• Most sensitive patch: {results['most_sensitive_patch']}"
        )

        return results['figure'], summary

    except Exception as e:
        error_msg = f"❌ Counterfactual analysis failed: {str(e)}"
        print(error_msg)
        return None, error_msg
|
| 132 |
+
|
| 133 |
+
def analyze_calibration(image, model_choice, n_bins):
    """
    Confidence calibration analysis for Tab 3.

    Builds a small demo test set by duplicating the uploaded image and
    runs the calibration auditor over it.

    Args:
        image: PIL image uploaded by the user (or None).
        model_choice: display key into SUPPORTED_MODELS.
        n_bins: number of bins for the calibration curve.

    Returns:
        tuple: (figure, status_message) — exactly the two Gradio outputs
               wired to this callback. `figure` is None on error.
    """
    try:
        model_status = load_selected_model(SUPPORTED_MODELS[model_choice])
        if "❌" in model_status:
            # BUGFIX: was `return None, None, model_status` — a three-value
            # return for a callback wired to two outputs.
            return None, model_status

        if image is None:
            return None, "⚠️ Please upload an image first."

        processed_image = preprocess_image(image)

        # Demo-only: duplicate the uploaded image to fake a test set.
        # A real calibration audit must use a proper validation set.
        test_images = [processed_image] * 10

        results = auditors['calibration'].analyze_calibration(
            test_images, n_bins=n_bins
        )

        # Summarize the calibration metrics for the status box.
        metrics = results['metrics']
        summary = (
            f"📊 Calibration Analysis Complete!\n"
            f"• Mean confidence: {metrics['mean_confidence']:.3f}\n"
            f"• Overconfident rate: {metrics['overconfident_rate']:.2%}\n"
            f"• Underconfident rate: {metrics['underconfident_rate']:.2%}"
        )

        return results['figure'], summary

    except Exception as e:
        error_msg = f"❌ Calibration analysis failed: {str(e)}"
        print(error_msg)
        return None, error_msg
|
| 172 |
+
|
| 173 |
+
def analyze_bias_detection(image, model_choice):
    """
    Bias detection analysis for Tab 4.

    Builds demo subgroups (brightness/contrast variants of the uploaded
    image) and compares model behavior across them.

    Args:
        image: PIL image uploaded by the user (or None).
        model_choice: display key into SUPPORTED_MODELS.

    Returns:
        tuple: (figure, status_message) — exactly the two Gradio outputs
               wired to this callback. `figure` is None on error.
    """
    try:
        model_status = load_selected_model(SUPPORTED_MODELS[model_choice])
        if "❌" in model_status:
            # BUGFIX: was a three-value return for a two-output callback.
            return None, model_status

        if image is None:
            return None, "⚠️ Please upload an image first."

        processed_image = preprocess_image(image)

        # Demo subgroups derived from the single uploaded image; a real
        # audit should use predefined subgroups from the dataset.
        subsets = []
        subset_names = ['Original', 'Brightness+', 'Brightness-', 'Contrast+']

        # Original image
        subsets.append([processed_image])

        # Brightness increased (explicitly clamped at 255).
        bright_image = processed_image.copy().point(lambda p: min(255, p * 1.5))
        subsets.append([bright_image])

        # Brightness decreased.
        dark_image = processed_image.copy().point(lambda p: p * 0.7)
        subsets.append([dark_image])

        # Contrast increased around mid-gray.
        # NOTE(review): this expression can leave [0, 255] before PIL
        # coerces the value — confirm the clamping behavior is acceptable.
        contrast_image = processed_image.copy().point(lambda p: 128 + (p - 128) * 1.5)
        subsets.append([contrast_image])

        results = auditors['bias'].analyze_subgroup_performance(
            subsets, subset_names
        )

        # Per-subgroup confidence summary for the status box.
        subgroup_metrics = results['subgroup_metrics']
        summary = f"⚖️ Bias Detection Complete!\nAnalyzed {len(subgroup_metrics)} subgroups:\n"

        for name, metrics in subgroup_metrics.items():
            summary += f"• {name}: confidence={metrics['mean_confidence']:.3f}\n"

        return results['figure'], summary

    except Exception as e:
        error_msg = f"❌ Bias detection failed: {str(e)}"
        print(error_msg)
        return None, error_msg
|
| 226 |
+
|
| 227 |
+
def create_demo_image():
    """Create a demo image for first-time users.

    Returns:
        PIL.Image.Image: a 224x224 RGB image with a reddish background,
        a green square and a blue square — simple spatial structure for
        the explanation methods to highlight.
    """
    img = Image.new('RGB', (224, 224), color=(150, 100, 100))

    # Fill the squares with Image.paste(color, box) instead of the original
    # per-pixel putpixel() double loops — identical pixels, but two C-level
    # fills instead of ~11,600 Python-level calls. Boxes are half-open
    # (right/lower exclusive), matching the original range() bounds.
    img.paste((100, 200, 100), (50, 50, 150, 150))    # Green square
    img.paste((100, 100, 200), (160, 160, 200, 200))  # Blue square

    return img
|
| 242 |
+
|
| 243 |
+
# Create the Gradio interface.
# Layout: a shared model selector row, four analysis tabs, and a footer.
# Each tab wires one button to one of the analyze_* callbacks above.
with gr.Blocks(theme=gr.themes.Soft(), title="ViT Auditing Toolkit") as demo:
    gr.Markdown(
        """
        # π― ViT Auditing Toolkit
        ### An Interactive Dashboard for Model Explainability and Validation

        Upload an image or use the demo image to analyze Vision Transformer model predictions
        and explore various explanation methods.
        """
    )

    # Model selection (shared across all tabs)
    with gr.Row():
        model_choice = gr.Dropdown(
            choices=list(SUPPORTED_MODELS.keys()),
            value="ViT-Base",
            label="π― Select Model",
            info="Choose which Vision Transformer model to use"
        )

        load_btn = gr.Button("π Load Model", variant="primary")
        model_status = gr.Textbox(label="Model Status", interactive=False)

    # Resolve the display name to the underlying checkpoint id before loading.
    load_btn.click(
        fn=lambda model: load_selected_model(SUPPORTED_MODELS[model]),
        inputs=[model_choice],
        outputs=[model_status]
    )

    # Tabbed interface
    with gr.Tabs():
        # Tab 1: Basic Explainability — predictions + one XAI visualization.
        with gr.TabItem("π Basic Explainability"):
            with gr.Row():
                with gr.Column(scale=1):
                    image_input = gr.Image(
                        label="π Upload Image",
                        type="pil",
                        value=create_demo_image()
                    )

                    with gr.Accordion("βοΈ Explanation Settings", open=False):
                        xai_method = gr.Dropdown(
                            choices=[
                                "Attention Visualization",
                                "GradCAM",
                                "GradientSHAP"
                            ],
                            value="Attention Visualization",
                            label="Explanation Method"
                        )

                        # Layer/head sliders only affect "Attention Visualization".
                        with gr.Row():
                            layer_index = gr.Slider(
                                minimum=0, maximum=11, value=6, step=1,
                                label="Attention Layer Index"
                            )
                            head_index = gr.Slider(
                                minimum=0, maximum=11, value=0, step=1,
                                label="Attention Head Index"
                            )

                    analyze_btn = gr.Button("π Analyze Image", variant="primary")
                    status_output = gr.Textbox(label="Status", interactive=False)

                with gr.Column(scale=2):
                    with gr.Row():
                        original_display = gr.Image(
                            label="πΈ Processed Image",
                            interactive=False
                        )
                        prediction_display = gr.Plot(
                            label="π Model Predictions"
                        )

                    explanation_display = gr.Plot(
                        label="π Explanation Visualization"
                    )

            # Connect the analyze button (4 outputs — matches analyze_image_basic).
            analyze_btn.click(
                fn=analyze_image_basic,
                inputs=[image_input, model_choice, xai_method, layer_index, head_index],
                outputs=[original_display, prediction_display, explanation_display, status_output]
            )

        # Tab 2: Counterfactual Analysis — patch perturbation sensitivity.
        with gr.TabItem("π Counterfactual Analysis"):
            with gr.Row():
                with gr.Column(scale=1):
                    cf_image_input = gr.Image(
                        label="π Upload Image",
                        type="pil",
                        value=create_demo_image()
                    )

                    with gr.Accordion("βοΈ Counterfactual Settings", open=True):
                        patch_size = gr.Slider(
                            minimum=16, maximum=64, value=32, step=16,
                            label="Patch Size"
                        )
                        perturbation_type = gr.Dropdown(
                            choices=["blur", "blackout", "gray", "noise"],
                            value="blur",
                            label="Perturbation Type"
                        )

                    cf_analyze_btn = gr.Button("π Run Counterfactual Analysis", variant="primary")
                    cf_status_output = gr.Textbox(label="Status", interactive=False)

                with gr.Column(scale=2):
                    cf_explanation_display = gr.Plot(
                        label="π Counterfactual Analysis Results"
                    )

            # NOTE(review): two outputs here — analyze_counterfactual must
            # return exactly two values on every path.
            cf_analyze_btn.click(
                fn=analyze_counterfactual,
                inputs=[cf_image_input, model_choice, patch_size, perturbation_type],
                outputs=[cf_explanation_display, cf_status_output]
            )

        # Tab 3: Confidence Calibration — reliability of confidence scores.
        with gr.TabItem("π Confidence Calibration"):
            with gr.Row():
                with gr.Column(scale=1):
                    cal_image_input = gr.Image(
                        label="π Upload Sample Image (Used to generate demo test set)",
                        type="pil",
                        value=create_demo_image()
                    )

                    with gr.Accordion("βοΈ Calibration Settings", open=True):
                        n_bins = gr.Slider(
                            minimum=5, maximum=20, value=10, step=1,
                            label="Number of Bins"
                        )

                    cal_analyze_btn = gr.Button("π Analyze Calibration", variant="primary")
                    cal_status_output = gr.Textbox(label="Status", interactive=False)

                with gr.Column(scale=2):
                    cal_explanation_display = gr.Plot(
                        label="π Calibration Analysis Results"
                    )

            # Two outputs — analyze_calibration must match this arity.
            cal_analyze_btn.click(
                fn=analyze_calibration,
                inputs=[cal_image_input, model_choice, n_bins],
                outputs=[cal_explanation_display, cal_status_output]
            )

        # Tab 4: Bias Detection — performance across image subgroups.
        with gr.TabItem("βοΈ Bias Detection"):
            with gr.Row():
                with gr.Column(scale=1):
                    bias_image_input = gr.Image(
                        label="π Upload Sample Image (Used to generate demo subgroups)",
                        type="pil",
                        value=create_demo_image()
                    )

                    bias_analyze_btn = gr.Button("βοΈ Detect Bias", variant="primary")
                    bias_status_output = gr.Textbox(label="Status", interactive=False)

                with gr.Column(scale=2):
                    bias_explanation_display = gr.Plot(
                        label="βοΈ Bias Detection Results"
                    )

            # Two outputs — analyze_bias_detection must match this arity.
            bias_analyze_btn.click(
                fn=analyze_bias_detection,
                inputs=[bias_image_input, model_choice],
                outputs=[bias_explanation_display, bias_status_output]
            )

    # Footer
    gr.Markdown(
        """
        ---
        ### π οΈ About This Toolkit

        This interactive dashboard provides comprehensive auditing capabilities for Vision Transformer models:

        - **π Basic Explainability**: Understand model predictions with attention maps, GradCAM, and SHAP
        - **π Counterfactual Analysis**: Test how predictions change with image perturbations
        - **π Confidence Calibration**: Evaluate if the model is properly calibrated
        - **βοΈ Bias Detection**: Identify performance variations across different subgroups

        Built with β€οΈ using Gradio, Transformers, and Captum.
        """
    )

# Launch the application (local-only: binds localhost, no public share link).
if __name__ == "__main__":
    demo.launch(
        server_name="localhost",  # Changed from "0.0.0.0"
        server_port=7860,
        share=False,
        show_error=True
    )
|
src/auditor.py
ADDED
|
@@ -0,0 +1,471 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# src/auditor.py
|
| 2 |
+
|
| 3 |
+
import torch
|
| 4 |
+
import numpy as np
|
| 5 |
+
import matplotlib.pyplot as plt
|
| 6 |
+
from PIL import Image, ImageDraw, ImageFilter
|
| 7 |
+
import torch.nn.functional as F
|
| 8 |
+
from scipy import stats
|
| 9 |
+
from sklearn.calibration import calibration_curve
|
| 10 |
+
from sklearn.metrics import brier_score_loss
|
| 11 |
+
import pandas as pd
|
| 12 |
+
|
| 13 |
+
class CounterfactualAnalyzer:
    """Analyze how predictions change with image perturbations.

    Perturbs the input image one patch at a time and measures how the
    model's top prediction (label and confidence) reacts, producing a
    per-patch sensitivity heatmap and summary statistics.
    """

    def __init__(self, model, processor):
        self.model = model
        self.processor = processor
        # Device where the model weights live.
        self.device = next(model.parameters()).device

    def patch_perturbation_analysis(self, image, patch_size=16, perturbation_type='blur'):
        """
        Analyze how predictions change when different patches are perturbed.

        Args:
            image: PIL Image
            patch_size: Size of patches to perturb
            perturbation_type: Type of perturbation ('blur', 'noise', 'blackout', 'gray')

        Returns:
            dict: 'figure' (matplotlib summary), 'patch_heatmap'
                (patches_y x patches_x confidence deltas),
                'avg_confidence_change', 'prediction_flip_rate', and
                'most_sensitive_patch' — the (row, col) whose perturbation
                lowers confidence the most.
        """
        # Baseline prediction on the unmodified image.
        original_probs, _, original_labels = self._predict_image(image)
        original_top_label = original_labels[0]
        original_confidence = original_probs[0]

        width, height = image.size

        # Grid dimensions; a trailing partial patch (image size not a
        # multiple of patch_size) is simply never perturbed.
        patches_x = width // patch_size
        patches_y = height // patch_size

        confidence_changes = []
        prediction_changes = []
        patch_heatmap = np.zeros((patches_y, patches_x))

        for i in range(patches_y):
            for j in range(patches_x):
                # Perturb a copy so the caller's image is never mutated.
                perturbed_img = self._perturb_patch(
                    image.copy(), j, i, patch_size, perturbation_type
                )

                perturbed_probs, _, perturbed_labels = self._predict_image(perturbed_img)
                perturbed_confidence = perturbed_probs[0]
                perturbed_label = perturbed_labels[0]

                # Negative change => the patch supported the prediction.
                confidence_change = perturbed_confidence - original_confidence
                prediction_change = 1 if perturbed_label != original_top_label else 0

                confidence_changes.append(confidence_change)
                prediction_changes.append(prediction_change)
                patch_heatmap[i, j] = confidence_change

        fig = self._create_counterfactual_visualization(
            image, patch_heatmap, patch_size, original_top_label,
            original_confidence, confidence_changes, prediction_changes
        )

        return {
            'figure': fig,
            'patch_heatmap': patch_heatmap,
            'avg_confidence_change': np.mean(confidence_changes),
            'prediction_flip_rate': np.mean(prediction_changes),
            'most_sensitive_patch': np.unravel_index(np.argmin(patch_heatmap), patch_heatmap.shape)
        }

    def _perturb_patch(self, image, patch_x, patch_y, patch_size, perturbation_type):
        """Apply the requested perturbation to one patch of *image* in place.

        Returns the (mutated) image for convenience. An unknown
        perturbation_type leaves the image untouched.
        """
        left = patch_x * patch_size
        upper = patch_y * patch_size
        right = left + patch_size
        lower = upper + patch_size

        patch_box = (left, upper, right, lower)

        if perturbation_type == 'blur':
            # Extract patch, blur it, and paste back
            patch = image.crop(patch_box)
            blurred_patch = patch.filter(ImageFilter.GaussianBlur(5))
            image.paste(blurred_patch, patch_box)

        elif perturbation_type == 'blackout':
            # Black out the patch
            draw = ImageDraw.Draw(image)
            draw.rectangle(patch_box, fill='black')

        elif perturbation_type == 'gray':
            # Convert patch to grayscale (round-trip through 'L' mode)
            patch = image.crop(patch_box)
            gray_patch = patch.convert('L').convert('RGB')
            image.paste(gray_patch, patch_box)

        elif perturbation_type == 'noise':
            # Add Gaussian noise to the patch.
            # BUGFIX: do the arithmetic in float and clip BEFORE casting to
            # uint8. The old code did `noise.astype(np.uint8)` first, which
            # wrapped negative noise samples around to ~255, and then
            # `patch + noise` overflowed uint8 — producing corrupted rather
            # than mildly noisy patches.
            patch = np.asarray(image.crop(patch_box), dtype=np.float64)
            noise = np.random.normal(0, 50, patch.shape)
            noisy_patch = np.clip(patch + noise, 0, 255).astype(np.uint8)
            image.paste(Image.fromarray(noisy_patch), patch_box)

        return image

    def _predict_image(self, image):
        """Helper: run the shared prediction function (top-5)."""
        # Local import keeps module load order flexible.
        # NOTE(review): presumed to avoid a circular import — confirm.
        from predictor import predict_image
        return predict_image(image, self.model, self.processor, top_k=5)

    def _create_counterfactual_visualization(self, image, patch_heatmap, patch_size,
                                             original_label, original_confidence,
                                             confidence_changes, prediction_changes):
        """Create the 2x2 matplotlib summary figure for the analysis."""
        fig, ((ax1, ax2), (ax3, ax4)) = plt.subplots(2, 2, figsize=(15, 12))

        # Original image
        ax1.imshow(image)
        ax1.set_title(f'Original Image\nPrediction: {original_label} ({original_confidence:.2%})',
                      fontweight='bold')
        ax1.axis('off')

        # Patch sensitivity heatmap (diverging colormap centered at 0)
        im = ax2.imshow(patch_heatmap, cmap='RdBu_r', vmin=-0.5, vmax=0.5)
        ax2.set_title('Patch Sensitivity Heatmap\n(Confidence Change When Perturbed)',
                      fontweight='bold')
        ax2.set_xlabel('Patch X')
        ax2.set_ylabel('Patch Y')
        plt.colorbar(im, ax=ax2, label='Confidence Change')

        # Overlay the patch grid on the original image
        width, height = image.size
        for i in range(patch_heatmap.shape[0]):
            for j in range(patch_heatmap.shape[1]):
                rect = plt.Rectangle((j * patch_size, i * patch_size),
                                     patch_size, patch_size,
                                     linewidth=1, edgecolor='red',
                                     facecolor='none', alpha=0.3)
                ax1.add_patch(rect)

        # Confidence change distribution
        ax3.hist(confidence_changes, bins=20, alpha=0.7, color='skyblue')
        ax3.axvline(0, color='red', linestyle='--', label='No Change')
        ax3.set_xlabel('Confidence Change')
        ax3.set_ylabel('Frequency')
        ax3.set_title('Distribution of Confidence Changes', fontweight='bold')
        ax3.legend()
        ax3.grid(alpha=0.3)

        # Prediction flip analysis
        flip_rate = np.mean(prediction_changes)
        ax4.bar(['No Flip', 'Flip'], [1 - flip_rate, flip_rate], color=['green', 'red'])
        ax4.set_ylabel('Proportion')
        ax4.set_title(f'Prediction Flip Rate: {flip_rate:.2%}', fontweight='bold')
        ax4.grid(alpha=0.3)

        plt.tight_layout()
        return fig
|
| 171 |
+
|
| 172 |
+
class ConfidenceCalibrationAnalyzer:
|
| 173 |
+
"""Analyze model calibration and confidence metrics."""
|
| 174 |
+
|
| 175 |
+
    def __init__(self, model, processor):
        # Keep references to the shared model/processor; the analyzer does
        # not own, copy, or reload them.
        self.model = model
        self.processor = processor
        # Device where the model weights live (taken from the first parameter).
        self.device = next(model.parameters()).device
|
| 179 |
+
|
| 180 |
+
    def analyze_calibration(self, test_images, test_labels=None, n_bins=10):
        """
        Analyze model calibration using confidence scores.

        Args:
            test_images: List of PIL Images for testing
            test_labels: Optional true labels for accuracy calculation
            n_bins: Number of bins for calibration curve

        Returns:
            dict: Calibration analysis results with keys 'figure',
                  'metrics', and 'confidence_distribution' (array of
                  top-1 confidences, one per test image).
        """
        confidences = []       # full top-k probability arrays (collected, not returned)
        predictions = []       # top-1 predicted label per image
        max_confidences = []   # top-1 probability per image

        # Get predictions and confidences
        for img in test_images:
            probs, indices, labels = self._predict_image(img)
            # probs is sorted by the predictor, so index 0 is the top prediction.
            max_confidences.append(probs[0])
            predictions.append(labels[0])
            confidences.append(probs)

        max_confidences = np.array(max_confidences)

        # Create calibration analysis figure (reliability diagram etc.).
        fig = self._create_calibration_visualization(
            max_confidences, test_labels, predictions, n_bins
        )

        # Calculate calibration metrics (mean confidence, over/under-confidence).
        calibration_metrics = self._calculate_calibration_metrics(
            max_confidences, test_labels, predictions
        )

        return {
            'figure': fig,
            'metrics': calibration_metrics,
            'confidence_distribution': max_confidences
        }
|
| 220 |
+
|
| 221 |
+
def _predict_image(self, image):
|
| 222 |
+
"""Helper function to get predictions."""
|
| 223 |
+
from predictor import predict_image
|
| 224 |
+
return predict_image(image, self.model, self.processor, top_k=5)
|
| 225 |
+
|
| 226 |
+
def _create_calibration_visualization(self, confidences, true_labels, predictions, n_bins):
|
| 227 |
+
"""Create calibration visualization."""
|
| 228 |
+
fig, ((ax1, ax2), (ax3, ax4)) = plt.subplots(2, 2, figsize=(15, 12))
|
| 229 |
+
|
| 230 |
+
# Confidence distribution
|
| 231 |
+
ax1.hist(confidences, bins=20, alpha=0.7, color='lightblue', edgecolor='black')
|
| 232 |
+
ax1.set_xlabel('Confidence Score')
|
| 233 |
+
ax1.set_ylabel('Frequency')
|
| 234 |
+
ax1.set_title('Distribution of Confidence Scores', fontweight='bold')
|
| 235 |
+
ax1.axvline(np.mean(confidences), color='red', linestyle='--',
|
| 236 |
+
label=f'Mean: {np.mean(confidences):.3f}')
|
| 237 |
+
ax1.legend()
|
| 238 |
+
ax1.grid(alpha=0.3)
|
| 239 |
+
|
| 240 |
+
# Reliability diagram (if true labels available)
|
| 241 |
+
if true_labels is not None:
|
| 242 |
+
# Convert to binary correctness
|
| 243 |
+
correct = np.array([pred == true for pred, true in zip(predictions, true_labels)])
|
| 244 |
+
|
| 245 |
+
fraction_of_positives, mean_predicted_prob = calibration_curve(
|
| 246 |
+
correct, confidences, n_bins=n_bins, strategy='uniform'
|
| 247 |
+
)
|
| 248 |
+
|
| 249 |
+
ax2.plot(mean_predicted_prob, fraction_of_positives, "s-", label='Model')
|
| 250 |
+
ax2.plot([0, 1], [0, 1], "k:", label="Perfectly calibrated")
|
| 251 |
+
ax2.set_xlabel('Mean Predicted Probability')
|
| 252 |
+
ax2.set_ylabel('Fraction of Positives')
|
| 253 |
+
ax2.set_title('Reliability Diagram', fontweight='bold')
|
| 254 |
+
ax2.legend()
|
| 255 |
+
ax2.grid(alpha=0.3)
|
| 256 |
+
|
| 257 |
+
# Calculate ECE
|
| 258 |
+
bin_edges = np.linspace(0, 1, n_bins + 1)
|
| 259 |
+
bin_indices = np.digitize(confidences, bin_edges) - 1
|
| 260 |
+
bin_indices = np.clip(bin_indices, 0, n_bins - 1)
|
| 261 |
+
|
| 262 |
+
ece = 0
|
| 263 |
+
for bin_idx in range(n_bins):
|
| 264 |
+
mask = bin_indices == bin_idx
|
| 265 |
+
if np.sum(mask) > 0:
|
| 266 |
+
bin_conf = np.mean(confidences[mask])
|
| 267 |
+
bin_acc = np.mean(correct[mask])
|
| 268 |
+
ece += (np.sum(mask) / len(confidences)) * np.abs(bin_acc - bin_conf)
|
| 269 |
+
|
| 270 |
+
ax2.text(0.1, 0.9, f'ECE: {ece:.3f}', transform=ax2.transAxes,
|
| 271 |
+
bbox=dict(boxstyle="round,pad=0.3", facecolor="yellow", alpha=0.7))
|
| 272 |
+
|
| 273 |
+
# Confidence vs accuracy (if true labels available)
|
| 274 |
+
if true_labels is not None:
|
| 275 |
+
confidence_bins = np.linspace(0, 1, n_bins + 1)
|
| 276 |
+
bin_accuracies = []
|
| 277 |
+
bin_confidences = []
|
| 278 |
+
|
| 279 |
+
for i in range(n_bins):
|
| 280 |
+
mask = (confidences >= confidence_bins[i]) & (confidences < confidence_bins[i+1])
|
| 281 |
+
if np.sum(mask) > 0:
|
| 282 |
+
bin_acc = np.mean(correct[mask])
|
| 283 |
+
bin_conf = np.mean(confidences[mask])
|
| 284 |
+
bin_accuracies.append(bin_acc)
|
| 285 |
+
bin_confidences.append(bin_conf)
|
| 286 |
+
|
| 287 |
+
ax3.plot(bin_confidences, bin_accuracies, 'o-', label='Model')
|
| 288 |
+
ax3.plot([0, 1], [0, 1], 'k--', label='Ideal')
|
| 289 |
+
ax3.set_xlabel('Average Confidence')
|
| 290 |
+
ax3.set_ylabel('Average Accuracy')
|
| 291 |
+
ax3.set_title('Confidence vs Accuracy', fontweight='bold')
|
| 292 |
+
ax3.legend()
|
| 293 |
+
ax3.grid(alpha=0.3)
|
| 294 |
+
|
| 295 |
+
# Top-1 vs Top-5 confidence gap
|
| 296 |
+
if len(confidences) > 0 and isinstance(confidences[0], np.ndarray):
|
| 297 |
+
top1_conf = [c[0] for c in confidences]
|
| 298 |
+
top5_conf = [np.sum(c[:5]) for c in confidences]
|
| 299 |
+
confidence_gap = [t1 - (t5 - t1)/4 for t1, t5 in zip(top1_conf, top5_conf)]
|
| 300 |
+
|
| 301 |
+
ax4.hist(confidence_gap, bins=20, alpha=0.7, color='lightgreen', edgecolor='black')
|
| 302 |
+
ax4.set_xlabel('Confidence Gap (Top-1 vs Rest)')
|
| 303 |
+
ax4.set_ylabel('Frequency')
|
| 304 |
+
ax4.set_title('Distribution of Confidence Gaps', fontweight='bold')
|
| 305 |
+
ax4.grid(alpha=0.3)
|
| 306 |
+
|
| 307 |
+
plt.tight_layout()
|
| 308 |
+
return fig
|
| 309 |
+
|
| 310 |
+
def _calculate_calibration_metrics(self, confidences, true_labels, predictions):
|
| 311 |
+
"""Calculate calibration metrics."""
|
| 312 |
+
metrics = {
|
| 313 |
+
'mean_confidence': float(np.mean(confidences)),
|
| 314 |
+
'confidence_std': float(np.std(confidences)),
|
| 315 |
+
'overconfident_rate': float(np.mean(confidences > 0.8)),
|
| 316 |
+
'underconfident_rate': float(np.mean(confidences < 0.2)),
|
| 317 |
+
}
|
| 318 |
+
|
| 319 |
+
if true_labels is not None:
|
| 320 |
+
correct = np.array([pred == true for pred, true in zip(predictions, true_labels)])
|
| 321 |
+
accuracy = np.mean(correct)
|
| 322 |
+
avg_confidence = np.mean(confidences)
|
| 323 |
+
|
| 324 |
+
metrics.update({
|
| 325 |
+
'accuracy': float(accuracy),
|
| 326 |
+
'confidence_gap': float(avg_confidence - accuracy),
|
| 327 |
+
'brier_score': float(brier_score_loss(correct, confidences))
|
| 328 |
+
})
|
| 329 |
+
|
| 330 |
+
return metrics
|
| 331 |
+
|
| 332 |
+
class BiasDetector:
    """Detect potential biases in model performance across subgroups."""

    def __init__(self, model, processor):
        self.model = model
        self.processor = processor
        # Infer the device from the model parameters so callers need not pass it.
        self.device = next(model.parameters()).device

    def analyze_subgroup_performance(self, image_subsets, subset_names, true_labels_subsets=None):
        """
        Analyze performance across different subgroups.

        Args:
            image_subsets: List of image subsets for each subgroup
            subset_names: Names for each subgroup
            true_labels_subsets: Optional true labels for each subset

        Returns:
            dict: Bias analysis results with keys ``'figure'``,
                ``'subgroup_metrics'`` and ``'fairness_metrics'``.
        """
        subgroup_metrics = {}

        for i, (subset, name) in enumerate(zip(image_subsets, subset_names)):
            confidences = []
            predictions = []

            for img in subset:
                probs, indices, labels = self._predict_image(img)
                confidences.append(probs[0])
                predictions.append(labels[0])

            # Cast to plain floats so results are JSON-serializable and
            # consistent with the calibration analyzer's metrics; guard the
            # empty-subset case (np.mean([]) would yield NaN with a warning).
            metrics = {
                'mean_confidence': float(np.mean(confidences)) if confidences else 0.0,
                'confidence_std': float(np.std(confidences)) if confidences else 0.0,
                'sample_size': len(subset)
            }

            # Calculate accuracy if true labels provided for this subset.
            if true_labels_subsets is not None and i < len(true_labels_subsets):
                true_labels = true_labels_subsets[i]
                correct = [pred == true for pred, true in zip(predictions, true_labels)]
                metrics['accuracy'] = float(np.mean(correct)) if correct else 0.0
                metrics['error_rate'] = 1 - metrics['accuracy']

            subgroup_metrics[name] = metrics

        # Create bias analysis visualization
        fig = self._create_bias_visualization(subgroup_metrics, true_labels_subsets is not None)

        # Calculate fairness metrics
        fairness_metrics = self._calculate_fairness_metrics(subgroup_metrics)

        return {
            'figure': fig,
            'subgroup_metrics': subgroup_metrics,
            'fairness_metrics': fairness_metrics
        }

    def _predict_image(self, image):
        """Helper returning ``(probs, indices, labels)`` for one image."""
        from predictor import predict_image
        return predict_image(image, self.model, self.processor, top_k=5)

    def _create_bias_visualization(self, subgroup_metrics, has_accuracy):
        """Create bar charts of per-subgroup confidence, sample size and
        (optionally) accuracy."""
        if has_accuracy:
            fig, (ax1, ax2, ax3) = plt.subplots(1, 3, figsize=(18, 5))
        else:
            fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))

        subgroups = list(subgroup_metrics.keys())

        # Confidence by subgroup
        confidences = [metrics['mean_confidence'] for metrics in subgroup_metrics.values()]
        ax1.bar(subgroups, confidences, color='lightblue', alpha=0.7)
        ax1.set_ylabel('Mean Confidence')
        ax1.set_title('Mean Confidence by Subgroup', fontweight='bold')
        ax1.tick_params(axis='x', rotation=45)
        ax1.grid(axis='y', alpha=0.3)

        # Annotate bars with their values.
        for i, v in enumerate(confidences):
            ax1.text(i, v + 0.01, f'{v:.3f}', ha='center', va='bottom')

        # Sample sizes
        sample_sizes = [metrics['sample_size'] for metrics in subgroup_metrics.values()]
        ax2.bar(subgroups, sample_sizes, color='lightgreen', alpha=0.7)
        ax2.set_ylabel('Sample Size')
        ax2.set_title('Sample Size by Subgroup', fontweight='bold')
        ax2.tick_params(axis='x', rotation=45)
        ax2.grid(axis='y', alpha=0.3)

        for i, v in enumerate(sample_sizes):
            ax2.text(i, v + max(sample_sizes) * 0.01, f'{v}', ha='center', va='bottom')

        # Accuracy by subgroup (if available)
        if has_accuracy:
            accuracies = [metrics.get('accuracy', 0) for metrics in subgroup_metrics.values()]
            ax3.bar(subgroups, accuracies, color='lightcoral', alpha=0.7)
            ax3.set_ylabel('Accuracy')
            ax3.set_title('Accuracy by Subgroup', fontweight='bold')
            ax3.tick_params(axis='x', rotation=45)
            ax3.grid(axis='y', alpha=0.3)

            for i, v in enumerate(accuracies):
                ax3.text(i, v + 0.01, f'{v:.3f}', ha='center', va='bottom')

        plt.tight_layout()
        return fig

    def _calculate_fairness_metrics(self, subgroup_metrics):
        """Calculate disparity metrics across subgroups.

        Returns an empty dict unless every subgroup has an accuracy value
        and there are at least two subgroups to compare.
        """
        fairness_metrics = {}

        # Accuracy-based disparity only makes sense with ground truth.
        has_accuracy = all('accuracy' in metrics for metrics in subgroup_metrics.values())

        if has_accuracy and len(subgroup_metrics) >= 2:
            accuracies = [metrics['accuracy'] for metrics in subgroup_metrics.values()]
            confidences = [metrics['mean_confidence'] for metrics in subgroup_metrics.values()]

            fairness_metrics = {
                'accuracy_range': float(max(accuracies) - min(accuracies)),
                'accuracy_std': float(np.std(accuracies)),
                'confidence_range': float(max(confidences) - min(confidences)),
                # Ratio best/worst; infinite when some subgroup is at 0.
                'max_accuracy_disparity': float(max(accuracies) / min(accuracies) if min(accuracies) > 0 else float('inf')),
            }

        return fairness_metrics
|
| 463 |
+
|
| 464 |
+
# Convenience function to create all auditors
|
| 465 |
+
def create_auditors(model, processor):
    """Create all auditing analyzers, keyed by analysis type."""
    analyzer_classes = {
        'counterfactual': CounterfactualAnalyzer,
        'calibration': ConfidenceCalibrationAnalyzer,
        'bias': BiasDetector,
    }
    return {name: cls(model, processor) for name, cls in analyzer_classes.items()}
|
tests/test_advanced_features.py
ADDED
|
@@ -0,0 +1,140 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# test_advanced_features.py
|
| 2 |
+
|
| 3 |
+
import sys
|
| 4 |
+
import os
|
| 5 |
+
sys.path.append(os.path.join(os.path.dirname(__file__), 'src'))
|
| 6 |
+
|
| 7 |
+
from model_loader import load_model_and_processor
|
| 8 |
+
from auditor import create_auditors, CounterfactualAnalyzer, ConfidenceCalibrationAnalyzer, BiasDetector
|
| 9 |
+
from PIL import Image
|
| 10 |
+
import matplotlib.pyplot as plt
|
| 11 |
+
import numpy as np
|
| 12 |
+
|
| 13 |
+
def create_test_subsets():
    """Create dummy test subsets for bias detection demo."""
    # Solid colors simulate visually distinct subgroups; the mixed subset
    # varies per image index.
    solid_colors = {
        'Red Dominant': (200, 50, 50),
        'Green Dominant': (50, 200, 50),
        'Blue Dominant': (50, 50, 200),
    }
    subset_names = ['Red Dominant', 'Green Dominant', 'Blue Dominant', 'Mixed Colors']

    subsets = []
    for name in subset_names:
        images = []
        for j in range(10):  # 10 images per subset
            if name in solid_colors:
                color = solid_colors[name]
            else:  # Mixed
                color = (50 + j * 20, 100 + j * 10, 150 - j * 15)
            images.append(Image.new('RGB', (224, 224), color=color))
        subsets.append(images)

    return subsets, subset_names
|
| 35 |
+
|
| 36 |
+
def test_advanced_features():
    """
    Test the advanced auditing features.

    Runs the counterfactual, calibration, and bias auditors end to end on
    synthetic images, shows their figures, and prints detailed metrics.

    Returns:
        bool: True when every analysis completed, False on any exception.
    """
    # NOTE(review): the original output strings were mojibake-corrupted
    # (broken UTF-8 emoji); they are restored to valid characters here.
    print("🔬 Testing Advanced Auditing Features")
    print("=" * 50)

    try:
        # Load model
        model, processor = load_model_and_processor()

        # Create auditors
        auditors = create_auditors(model, processor)
        print("✅ Auditors created: Counterfactual, Calibration, Bias Detection")

        # Create test image: reddish background with a green square.
        test_image = Image.new('RGB', (224, 224), color=(150, 100, 100))
        for x in range(50, 150):
            for y in range(50, 150):
                test_image.putpixel((x, y), (100, 200, 100))

        print("\n1. Testing Counterfactual Analysis...")
        counterfactual_results = auditors['counterfactual'].patch_perturbation_analysis(
            test_image, patch_size=32, perturbation_type='blur'
        )
        print("   ✅ Counterfactual analysis completed")
        print(f"   📊 Avg confidence change: {counterfactual_results['avg_confidence_change']:.4f}")
        print(f"   🔄 Prediction flip rate: {counterfactual_results['prediction_flip_rate']:.2%}")

        print("\n2. Testing Confidence Calibration...")
        # Create dummy test set (same image repeated keeps the test fast).
        test_images = [test_image] * 5
        calibration_results = auditors['calibration'].analyze_calibration(test_images)
        print("   ✅ Calibration analysis completed")
        print(f"   📊 Mean confidence: {calibration_results['metrics']['mean_confidence']:.3f}")
        print(f"   🎯 Overconfident rate: {calibration_results['metrics']['overconfident_rate']:.2%}")

        print("\n3. Testing Bias Detection...")
        test_subsets, subset_names = create_test_subsets()
        bias_results = auditors['bias'].analyze_subgroup_performance(test_subsets, subset_names)
        print("   ✅ Bias detection analysis completed")
        print(f"   📊 Analyzed {len(subset_names)} subgroups")

        # Display results
        print("\n📈 DISPLAYING ADVANCED ANALYSIS RESULTS:")
        print("=" * 40)

        # Counterfactual results
        plt.figure(counterfactual_results['figure'].number)
        plt.suptitle("1. Counterfactual Analysis - Patch Sensitivity", fontweight='bold', y=0.98)
        plt.show()

        # Calibration results
        plt.figure(calibration_results['figure'].number)
        plt.suptitle("2. Confidence Calibration Analysis", fontweight='bold', y=0.98)
        plt.show()

        # Bias detection results
        plt.figure(bias_results['figure'].number)
        plt.suptitle("3. Bias Detection - Subgroup Analysis", fontweight='bold', y=0.98)
        plt.show()

        # Print detailed metrics
        print("\n📋 DETAILED METRICS:")
        print("-" * 20)

        print("\n🎯 Counterfactual Analysis:")
        for key, value in counterfactual_results.items():
            if key != 'figure':  # figures are shown above, not printed
                print(f"   {key}: {value}")

        print("\n📊 Calibration Analysis:")
        for key, value in calibration_results['metrics'].items():
            print(f"   {key}: {value}")

        print("\n⚖️ Bias Detection:")
        print("   Subgroup Metrics:")
        for subgroup, metrics in bias_results['subgroup_metrics'].items():
            print(f"     {subgroup}:")
            for metric, value in metrics.items():
                print(f"       {metric}: {value}")

        print("\n🚀 ADVANCED FEATURES SUMMARY:")
        print("=" * 35)
        print("✅ Counterfactual Analysis - Patch Sensitivity")
        print("✅ Confidence Calibration - Reliability Analysis")
        print("✅ Bias Detection - Subgroup Performance")
        print("✅ All advanced auditing features working!")

        return True

    except Exception as e:
        # Top-level test boundary: report and signal failure to the caller.
        print(f"❌ Advanced features test failed: {e}")
        import traceback
        traceback.print_exc()
        return False
|
| 132 |
+
|
| 133 |
+
if __name__ == "__main__":
    # Run the full advanced-feature suite and report the outcome.
    # NOTE(review): original status strings were mojibake-corrupted; restored.
    success = test_advanced_features()

    if success:
        print("\n🎉 All Phase 1 + Advanced Features Complete!")
        print("   Ready for Phase 2: Dashboard Integration!")
    else:
        print("\n⚠️ Some advanced features need debugging")
|