Lab-Rasool
/

sybil

@@ -135,6 +135,405 @@ for i, score in enumerate(output.risk_scores.numpy()):
     print(f"Year {i+1}: {float(score)}")
 ```
 ## 📈 Performance Metrics
 | Dataset | 1-Year AUC | 6-Year AUC | Sample Size |
@@ -215,7 +614,7 @@ This Hugging Face implementation is based on the original work by:
 MIT License - See [LICENSE](LICENSE) file
 - Original Model © 2022 Peter Mikhael & Jeremy Wohlwend
-- HF Adaptation © 2025 Aakash Tripathi
 ## 🔧 Troubleshooting

     print(f"Year {i+1}: {float(score)}")
 ```
+## 🔬 Advanced Usage: Embedding Extraction
+### Extract Embeddings Before Dropout Layer
+You can extract 512-dimensional embedding vectors from the ReLU layer, which sits immediately before the dropout layer. These embeddings capture the learned risk features before the final prediction layer is applied.
+```python
+from huggingface_hub import snapshot_download
+import sys
+import os
+import torch
+import numpy as np
+# Download and setup model
+model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+sys.path.append(model_path)
+from modeling_sybil_hf import SybilHFWrapper
+from configuration_sybil import SybilConfig
+def extract_embeddings(dicom_paths):
+    """
+    Extract embeddings from the layer after ReLU, before Dropout.
+    Args:
+        dicom_paths: List of DICOM file paths
+    Returns:
+        numpy array of shape (512,) - averaged embeddings across ensemble
+    """
+    # Initialize model
+    config = SybilConfig()
+    model = SybilHFWrapper(config)
+    # Set each model in ensemble to eval mode
+    for m in model.models:
+        m.eval()
+    # Storage for embeddings from each model in ensemble
+    all_embeddings = []
+    # Register hooks on each model in the ensemble
+    for model_idx, ensemble_model in enumerate(model.models):
+        embeddings_buffer = []
+        def create_hook(buffer):
+            def hook(module, input, output):
+                # Capture the output of ReLU layer (before dropout)
+                buffer.append(output.detach().cpu())
+            return hook
+        # Register hook on the ReLU layer
+        hook_handle = ensemble_model.relu.register_forward_hook(create_hook(embeddings_buffer))
+        # Run forward pass
+        with torch.no_grad():
+            _ = model(dicom_paths=dicom_paths)
+        # Remove hook
+        hook_handle.remove()
+        # Get the embeddings (should be shape [1, 512])
+        if embeddings_buffer:
+            embedding = embeddings_buffer[0].numpy().squeeze()
+            all_embeddings.append(embedding)
+            print(f"Model {model_idx + 1}: Embedding shape = {embedding.shape}")
+    # Average embeddings across ensemble
+    averaged_embedding = np.mean(all_embeddings, axis=0)
+    return averaged_embedding
+# Usage
+dicom_dir = "path/to/volume"
+dicom_paths = [os.path.join(dicom_dir, f) for f in os.listdir(dicom_dir) if f.endswith('.dcm')]
+embeddings = extract_embeddings(dicom_paths)
+print(f"\nEmbedding vector shape: {embeddings.shape}")
+print(f"Embedding statistics:")
+print(f"  Mean: {np.mean(embeddings):.6f}")
+print(f"  Std: {np.std(embeddings):.6f}")
+print(f"  Min: {np.min(embeddings):.6f}")
+print(f"  Max: {np.max(embeddings):.6f}")
+```
+## 🎯 Extracting Embeddings at Other Layers
+### Available Extraction Points
+The Sybil model has several key layers where you can extract intermediate representations:
+```python
+import torch
+from huggingface_hub import snapshot_download
+import sys
+model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+sys.path.append(model_path)
+from modeling_sybil_hf import SybilHFWrapper
+from configuration_sybil import SybilConfig
+# Build the ensemble wrapper from a default SybilConfig
+config = SybilConfig()
+model = SybilHFWrapper(config)
+# Get first model from ensemble for demonstration
+# (not referenced by extract_layer_output below; handy for interactive inspection)
+first_model = model.models[0]
+# Model architecture flow:
+# Input → image_encoder → pool → relu → dropout → prob_of_failure_layer → Output
+def extract_layer_output(model, layer_name, dicom_paths):
+    """
+    Extract output from any layer in the model.
+    Args:
+        model: SybilHFWrapper model
+        layer_name: Name of the layer to extract from
+        dicom_paths: List of DICOM file paths
+    Returns:
+        Extracted features from the specified layer
+    """
+    features = []
+    def hook_fn(module, input, output):
+        features.append(output.detach().cpu())
+    # Register hook on the specified layer
+    for m in model.models:
+        layer = dict(m.named_modules())[layer_name]
+        hook_handle = layer.register_forward_hook(hook_fn)
+    # Run forward pass
+    with torch.no_grad():
+        _ = model(dicom_paths=dicom_paths)
+    # Remove hook
+    hook_handle.remove()
+    return features
+# NOTE: `dicom_paths` is not defined in this snippet; build the list of DICOM
+# file paths for one scan before running these examples.
+# extract_layer_output returns a list of captured tensors; index 0 is the
+# first tensor captured during the forward pass.
+# Example 1: Extract from image encoder (3D feature maps)
+# Shape: (batch, 512, time, height, width)
+encoder_features = extract_layer_output(model, 'image_encoder', dicom_paths)
+print(f"Image encoder output shape: {encoder_features[0].shape}")
+# Example 2: Extract from pooling layer (before ReLU)
+# Shape: (batch, 512)
+pool_features = extract_layer_output(model, 'pool', dicom_paths)
+print(f"Pool layer output shape: {pool_features[0].shape}")
+# Example 3: Extract from ReLU layer (before dropout) - RECOMMENDED
+# Shape: (batch, 512)
+relu_features = extract_layer_output(model, 'relu', dicom_paths)
+print(f"ReLU layer output shape: {relu_features[0].shape}")
+# Example 4: Extract from dropout layer (before final prediction)
+# Shape: (batch, 512)
+dropout_features = extract_layer_output(model, 'dropout', dicom_paths)
+print(f"Dropout layer output shape: {dropout_features[0].shape}")
+```
+### Custom Layer Extraction Template
+```python
+def extract_custom_layer(dicom_paths, target_layer_name):
+    """
+    Template for extracting features from any layer.
+    Args:
+        dicom_paths: List of DICOM file paths
+        target_layer_name: Name of target layer (e.g., 'relu', 'pool', 'image_encoder')
+    Returns:
+        Extracted features averaged across ensemble
+    """
+    from huggingface_hub import snapshot_download
+    import sys
+    import torch
+    import numpy as np
+    model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+    sys.path.append(model_path)
+    from modeling_sybil_hf import SybilHFWrapper
+    from configuration_sybil import SybilConfig
+    config = SybilConfig()
+    model = SybilHFWrapper(config)
+    all_features = []
+    for ensemble_model in model.models:
+        ensemble_model.eval()
+        features_buffer = []
+        # Get the target layer
+        target_layer = dict(ensemble_model.named_modules())[target_layer_name]
+        # Register hook
+        def hook(module, input, output):
+            features_buffer.append(output.detach().cpu())
+        hook_handle = target_layer.register_forward_hook(hook)
+        # Forward pass
+        with torch.no_grad():
+            _ = model(dicom_paths=dicom_paths)
+        hook_handle.remove()
+        if features_buffer:
+            all_features.append(features_buffer[0])
+    # Average across ensemble
+    averaged_features = torch.stack(all_features).mean(dim=0)
+    return averaged_features.numpy()
+```
+## 🔍 Model Architecture Inspection
+### Print Full Model Architecture
+```python
+from huggingface_hub import snapshot_download
+import sys
+model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+sys.path.append(model_path)
+from modeling_sybil_hf import SybilHFWrapper
+from configuration_sybil import SybilConfig
+config = SybilConfig()
+model = SybilHFWrapper(config)
+# Print configuration
+print("=" * 80)
+print("MODEL CONFIGURATION:")
+print("=" * 80)
+print(config)
+# Print ensemble information
+print("\n" + "=" * 80)
+print("ENSEMBLE INFORMATION:")
+print("=" * 80)
+print(f"Number of models in ensemble: {len(model.models)}")
+print(f"Device: {model.device}")
+# Print architecture of first model
+print("\n" + "=" * 80)
+print("MODEL ARCHITECTURE (First model in ensemble):")
+print("=" * 80)
+first_model = model.models[0]
+print(first_model)
+```
+### Count Model Parameters
+```python
+from huggingface_hub import snapshot_download
+import sys
+model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+sys.path.append(model_path)
+from modeling_sybil_hf import SybilHFWrapper
+from configuration_sybil import SybilConfig
+config = SybilConfig()
+model = SybilHFWrapper(config)
+print("=" * 80)
+print("MODEL PARAMETERS:")
+print("=" * 80)
+# Parameters per model in ensemble
+for i, ensemble_model in enumerate(model.models):
+    total_params = sum(p.numel() for p in ensemble_model.parameters())
+    trainable_params = sum(p.numel() for p in ensemble_model.parameters() if p.requires_grad)
+    print(f"\nModel {i+1}:")
+    print(f"  Total parameters: {total_params:,}")
+    print(f"  Trainable parameters: {trainable_params:,}")
+    print(f"  Non-trainable parameters: {total_params - trainable_params:,}")
+# Total ensemble parameters
+total_ensemble = sum(
+    sum(p.numel() for p in m.parameters())
+    for m in model.models
+)
+print(f"\nTotal ensemble parameters: {total_ensemble:,}")
+```
+### List Model Components
+```python
+from huggingface_hub import snapshot_download
+import sys
+model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+sys.path.append(model_path)
+from modeling_sybil_hf import SybilHFWrapper
+from configuration_sybil import SybilConfig
+config = SybilConfig()
+model = SybilHFWrapper(config)
+first_model = model.models[0]
+print("=" * 80)
+print("MODEL COMPONENTS:")
+print("=" * 80)
+# Print each component with parameter count
+for name, module in first_model.named_children():
+    num_params = sum(p.numel() for p in module.parameters())
+    print(f"{name}: {module.__class__.__name__} ({num_params:,} parameters)")
+print("\n" + "=" * 80)
+print("DETAILED LAYER NAMES:")
+print("=" * 80)
+# Print all named modules (including nested layers)
+for name, module in first_model.named_modules():
+    if name:  # Skip the root module
+        print(f"  {name}: {module.__class__.__name__}")
+```
+### Model Architecture Overview
+The Sybil model consists of the following key components:
+```
+Input (3D CT Volume)
+    ↓
+image_encoder (R3D-18 backbone)
+    - 3D convolutional neural network
+    - Pretrained on Kinetics-400
+    - Output: (batch, 512, time, height, width)
+    ↓
+pool (MultiAttentionPool)
+    - Attention-based pooling mechanisms
+    - Combines multiple pooling strategies
+    - Output: (batch, 512)
+    ↓
+relu (ReLU activation)
+    - Non-linear activation
+    - Output: (batch, 512) ← EMBEDDING EXTRACTION POINT
+    ↓
+dropout (Dropout layer)
+    - Regularization (p=0.0 in inference)
+    - Output: (batch, 512)
+    ↓
+prob_of_failure_layer (CumulativeProbabilityLayer)
+    - Hazard function prediction
+    - Output: (batch, 6) - one score per year
+    ↓
+sigmoid (applied post-forward)
+    ↓
+Risk Scores (final output)
+```
+### Get Layer-by-Layer Summary
+```python
+def print_model_summary(model):
+    """Print a detailed summary of the model architecture."""
+    from huggingface_hub import snapshot_download
+    import sys
+    model_path = snapshot_download(repo_id="Lab-Rasool/sybil")
+    sys.path.append(model_path)
+    from modeling_sybil_hf import SybilHFWrapper
+    from configuration_sybil import SybilConfig
+    config = SybilConfig()
+    model = SybilHFWrapper(config)
+    first_model = model.models[0]
+    print(f"{'Layer Name':<40} {'Type':<30} {'Parameters':>15}")
+    print("=" * 85)
+    total_params = 0
+    for name, module in first_model.named_modules():
+        if name:  # Skip root
+            num_params = sum(p.numel() for p in module.parameters())
+            if num_params > 0:
+                print(f"{name:<40} {module.__class__.__name__:<30} {num_params:>15,}")
+                total_params += num_params
+    print("=" * 85)
+    print(f"{'TOTAL':<40} {'':<30} {total_params:>15,}")
+# Usage
+# NOTE: `model` is not defined in this snippet; it must already exist in the
+# session, otherwise this call raises NameError.
+print_model_summary(model)
+```
 ## 📈 Performance Metrics
 | Dataset | 1-Year AUC | 6-Year AUC | Sample Size |
 MIT License - See [LICENSE](LICENSE) file
 - Original Model © 2022 Peter Mikhael & Jeremy Wohlwend
+- HF Adaptation with Embeddings © 2025 [Aakash Tripathi](https://github.com/Aakash-Tripathi)
 ## 🔧 Troubleshooting