📖 Add example usage script

- Demonstrates BYOL model loading and feature extraction
- Shows preprocessing pipeline for inference
- Includes batch processing examples
- Adds a feature similarity computation example
- Provides complete documentation for model usage

Ready-to-use code for:
✅ Loading pre-trained BYOL model
✅ Feature extraction from mammogram tiles
✅ Batch processing capabilities
✅ Downstream task preparation

Files changed (1) hide show

example_usage.py +143 -0

example_usage.py ADDED Viewed

	@@ -0,0 +1,143 @@

+#!/usr/bin/env python3
+"""
+example_usage.py
+Demonstrates how to use the BYOL Mammogram model for feature extraction
+and classification tasks.
+"""
+import torch
+import torch.nn as nn
+from torchvision import models, transforms
+from PIL import Image
+import numpy as np
+from pathlib import Path
+# Import the BYOL model classes
+from train_byol_mammo import MammogramBYOL
+def load_byol_model(checkpoint_path: str, device: torch.device):
+    """Load the pre-trained BYOL model for feature extraction."""
+    print(f"📥 Loading BYOL model from: {checkpoint_path}")
+    # Create ResNet50 backbone (same as training)
+    resnet = models.resnet50(weights=None)
+    backbone = nn.Sequential(*list(resnet.children())[:-1])
+    # Initialize BYOL model with same architecture
+    model = MammogramBYOL(
+        backbone=backbone,
+        input_dim=2048,      # ResNet50 feature dimension
+        hidden_dim=4096,     # BYOL projection head hidden dim
+        proj_dim=256         # BYOL projection dimension
+    ).to(device)
+    # Load the trained weights
+    checkpoint = torch.load(checkpoint_path, map_location=device)
+    model.load_state_dict(checkpoint['model_state_dict'])
+    model.eval()
+    print(f"✅ Model loaded successfully!")
+    print(f"   Epoch: {checkpoint.get('epoch', 'Unknown')}")
+    print(f"   Final loss: {checkpoint.get('loss', 'Unknown'):.4f}")
+    return model
+def create_inference_transform(tile_size: int = 512):
+    """Create the preprocessing transform for inference."""
+    return transforms.Compose([
+        transforms.Resize((tile_size, tile_size), antialias=True),
+        transforms.ToTensor(),
+        transforms.Normalize(mean=[0.5, 0.5, 0.5], std=[0.5, 0.5, 0.5])
+    ])
+def extract_features(model, image_tensor, device):
+    """Extract 2048-dimensional features from mammogram tiles."""
+    with torch.no_grad():
+        image_tensor = image_tensor.to(device)
+        features = model.get_features(image_tensor)
+    return features.cpu().numpy()
+def main():
+    """Demonstrate model usage."""
+    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+    print(f"🖥️  Using device: {device}")
+    # Load the pre-trained BYOL model
+    model = load_byol_model("mammogram_byol_best.pth", device)
+    # Create preprocessing transform
+    transform = create_inference_transform(tile_size=512)
+    # Example 1: Feature extraction from a single image
+    print("\n📊 Example 1: Feature Extraction")
+    print("-" * 40)
+    # Create a dummy mammogram tile (replace with actual image loading)
+    dummy_image = Image.fromarray(np.random.randint(0, 255, (512, 512), dtype=np.uint8))
+    dummy_image = dummy_image.convert('RGB')  # Convert to RGB as expected
+    # Preprocess the image
+    image_tensor = transform(dummy_image).unsqueeze(0)  # Add batch dimension
+    # Extract features
+    features = extract_features(model, image_tensor, device)
+    print(f"✅ Input shape: {image_tensor.shape}")
+    print(f"✅ Feature shape: {features.shape}")
+    print(f"✅ Feature vector (first 10 values): {features[0][:10]}")
+    # Example 2: Batch processing multiple images
+    print("\n📊 Example 2: Batch Feature Extraction")
+    print("-" * 40)
+    # Create a batch of dummy images
+    batch_size = 4
+    dummy_batch = torch.stack([
+        transform(Image.fromarray(np.random.randint(0, 255, (512, 512), dtype=np.uint8)).convert('RGB'))
+        for _ in range(batch_size)
+    ])
+    # Extract features for the entire batch
+    batch_features = extract_features(model, dummy_batch, device)
+    print(f"✅ Batch input shape: {dummy_batch.shape}")
+    print(f"✅ Batch features shape: {batch_features.shape}")
+    print(f"✅ Features per image: {batch_features.shape[1]} dimensions")
+    # Example 3: Similarity computation
+    print("\n📊 Example 3: Feature Similarity")
+    print("-" * 40)
+    # Compute cosine similarity between first two images
+    from sklearn.metrics.pairwise import cosine_similarity
+    similarity = cosine_similarity(
+        batch_features[0:1],
+        batch_features[1:2]
+    )[0][0]
+    print(f"✅ Cosine similarity between image 1 and 2: {similarity:.4f}")
+    print("\n🎯 Next Steps:")
+    print("- Use these 2048D features for downstream classification")
+    print("- Train a classifier using train_classification.py")
+    print("- Fine-tune the entire model for specific tasks")
+    print("- Use for similarity search or clustering")
+    print(f"\n📚 Model Summary:")
+    print(f"- Architecture: ResNet50 + BYOL")
+    print(f"- Input: 512x512 RGB mammogram tiles")
+    print(f"- Output: 2048-dimensional feature vectors")
+    print(f"- Training: Self-supervised on breast tissue tiles")
+    print(f"- Use case: Medical image analysis and classification")
+if __name__ == "__main__":
+    main()