Update model.py
Browse files
model.py
CHANGED
|
@@ -1,74 +1,128 @@
|
|
| 1 |
import torch
|
| 2 |
import torch.nn as nn
|
|
|
|
| 3 |
|
| 4 |
class MutationPredictorCNN(nn.Module):
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
|
| 6 |
def __init__(self):
|
| 7 |
super().__init__()
|
| 8 |
|
| 9 |
-
#
|
| 10 |
-
self.conv1 = nn.Conv1d(11, 64, kernel_size=7, padding=3)
|
| 11 |
-
self.bn1
|
| 12 |
-
|
| 13 |
-
self.conv2 = nn.Conv1d(64, 128, kernel_size=5, padding=2)
|
| 14 |
-
self.bn2
|
| 15 |
-
|
| 16 |
-
self.conv3 = nn.Conv1d(128, 256, kernel_size=3, padding=1)
|
| 17 |
-
self.bn3
|
| 18 |
-
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
|
| 27 |
-
#
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
self.
|
| 33 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
|
| 35 |
def forward(self, x):
|
| 36 |
-
|
| 37 |
-
|
| 38 |
-
|
| 39 |
-
|
| 40 |
-
|
| 41 |
-
|
| 42 |
-
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
import torch
|
| 2 |
import torch.nn as nn
|
| 3 |
+
import torch.nn.functional as F
|
| 4 |
|
| 5 |
class MutationPredictorCNN(nn.Module):
    """
    CNN for predicting mutation pathogenicity.

    Layer shapes are chosen to line up with the trained checkpoint weights
    (kernel sizes 7/5/3, fc1 of shape (128, 288), importance head (1, 256)).

    Input is a flat (batch, 1101) vector laid out as:
        [0:990]     per-position sequence features (99 positions x 10)
        [990:1089]  difference mask (99)
        [1089:1101] one-hot mutation type (12)
    """

    def __init__(self):
        super().__init__()

        # Sequence encoder: three conv/bn stages over 11 input channels
        # (10 sequence features + 1 difference mask per position).
        # Kernel sizes 7 / 5 / 3 match the checkpoint's conv weight shapes.
        self.conv1 = nn.Conv1d(11, 64, kernel_size=7, padding=3)
        self.bn1 = nn.BatchNorm1d(64)
        self.conv2 = nn.Conv1d(64, 128, kernel_size=5, padding=2)
        self.bn2 = nn.BatchNorm1d(128)
        self.conv3 = nn.Conv1d(128, 256, kernel_size=3, padding=1)
        self.bn3 = nn.BatchNorm1d(256)

        # Halves the sequence length after each conv stage: 99 -> 49 -> 24 -> 12.
        self.pool = nn.MaxPool1d(kernel_size=2, stride=2)

        # Dense embedding of the 12-dim one-hot mutation type.
        self.mut_fc = nn.Linear(12, 32)

        # Collapse the remaining spatial axis to one value per channel so the
        # conv branch always yields exactly 256 features; together with the
        # 32 mutation features that gives the 288-dim input fc1 expects.
        self.adaptive_pool = nn.AdaptiveAvgPool1d(1)

        # Classification head: 288 -> 128 -> 64 -> 1.
        self.fc1 = nn.Linear(288, 128)
        self.fc2 = nn.Linear(128, 64)
        self.fc3 = nn.Linear(64, 1)

        # Scalar importance score computed from the conv features alone.
        self.importance_head = nn.Linear(256, 1)

    def forward(self, x):
        """
        Run one batch through the network.

        Args:
            x: (batch, 1101) tensor; see the class docstring for the layout.

        Returns:
            Tuple of (cls, importance), each of shape (batch, 1) and
            sigmoid-squashed into [0, 1].
        """
        n = x.size(0)

        # Split the flat input: the one-hot mutation type occupies the tail;
        # everything before it reshapes to (batch, 11 channels, 99 positions).
        mutation_onehot = x[:, 1089:1101]
        seq = x[:, :1089].view(n, 11, 99)

        # Three conv/bn/relu stages, each followed by a halving max-pool.
        feat = self.pool(F.relu(self.bn1(self.conv1(seq))))   # 99 -> 49
        feat = self.pool(F.relu(self.bn2(self.conv2(feat))))  # 49 -> 24
        feat = self.pool(F.relu(self.bn3(self.conv3(feat))))  # 24 -> 12

        # Collapse the spatial axis: one averaged value per channel.
        pooled = self.adaptive_pool(feat).view(n, 256)

        # Embed the mutation type and join both branches.
        mut_emb = F.relu(self.mut_fc(mutation_onehot))        # (n, 32)
        joint = torch.cat([pooled, mut_emb], dim=1)           # (n, 288)

        # Classification branch.
        hidden = F.relu(self.fc2(F.relu(self.fc1(joint))))
        cls = torch.sigmoid(self.fc3(hidden))                 # (n, 1)

        # Importance branch uses only the conv features.
        importance = torch.sigmoid(self.importance_head(pooled))  # (n, 1)

        return cls, importance
|
| 101 |
+
|
| 102 |
+
|
| 103 |
+
if __name__ == "__main__":
    # Smoke test: instantiate the model, push a dummy batch through it, and
    # print parameter shapes for eyeball comparison against the checkpoint.
    print("Testing MutationPredictorCNN...")

    net = MutationPredictorCNN()

    # Two samples of the flat 1101-dim feature vector.
    dummy = torch.randn(2, 1101)
    cls, importance = net(dummy)

    print(f"Input shape: {dummy.shape}")
    print(f"Classification output shape: {cls.shape}")
    print(f"Importance output shape: {importance.shape}")

    print("\nModel parameter shapes (should match checkpoint):")
    for name, param in net.named_parameters():
        print(f"{name:30s}: {str(param.shape):20s}")

    print("\nExpected parameter shapes from checkpoint:")
    for expected in (
        "conv1.weight : torch.Size([64, 11, 7])",
        "conv3.weight : torch.Size([256, 128, 3])",
        "mut_fc.weight : torch.Size([32, 12])",
        "fc1.weight : torch.Size([128, 288])",
        "importance_head.weight : torch.Size([1, 256])",
    ):
        print(expected)