toderian committed
Commit b915bae · verified · 1 Parent(s): 4e1d398

Upload folder using huggingface_hub

Files changed (5)
  1. README.md +164 -0
  2. config.json +36 -0
  3. model.py +244 -0
  4. model.safetensors +3 -0
  5. pytorch_model.bin +3 -0
README.md ADDED
@@ -0,0 +1,164 @@
---
license: mit
tags:
- image-classification
- medical-imaging
- cervical-cancer
- pytorch
- safetensors
datasets:
- custom
metrics:
- accuracy
- f1
pipeline_tag: image-classification
library_name: pytorch
---

# Cervical Type Classification Model

## Model Description

This model classifies cervical images into 3 transformation zone types, which is important for colposcopy evaluation and cervical cancer screening.

| Label | Type | Description |
|-------|------|-------------|
| 0 | Type 1 | Transformation zone fully visible on ectocervix |
| 1 | Type 2 | Transformation zone partially visible (extends into endocervical canal) |
| 2 | Type 3 | Transformation zone not visible (entirely within endocervical canal) |

## Model Architecture

Simple CNN with 4 convolutional layers:

```
Input (256x256x3)

Conv2d(3→32) + BN + ReLU + MaxPool
Conv2d(32→64) + BN + ReLU + MaxPool
Conv2d(64→128) + BN + ReLU + MaxPool
Conv2d(128→256) + BN + ReLU + MaxPool

AdaptiveAvgPool2d(1)

FC(256→256) + ReLU + Dropout(0.4)
FC(256→128) + ReLU + Dropout(0.4)

FC(128→3) → Output
```

**Parameters:** 488,451

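The parameter count can be reproduced from `model.py` in this repository; a minimal check (run from the repo root so `model.py` is importable):

```python
import torch
from model import BaseCNN  # model.py ships in this repo

# Defaults match the diagram above: layers=[32, 64, 128, 256], fc_layers=[256, 128]
model = BaseCNN()
print(f"{sum(p.numel() for p in model.parameters()):,}")  # 488,451

# Sanity-check the output shape on a dummy 256x256 RGB batch
logits = model(torch.randn(1, 3, 256, 256))
assert logits.shape == (1, 3)
```
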
## Training

| Parameter | Value |
|-----------|-------|
| Learning Rate | 1e-4 |
| Batch Size | 32 |
| Dropout | 0.4 |
| Optimizer | Adam |
| Epochs | 50 |

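The training script itself is not part of this upload; the sketch below shows how these hyperparameters fit together for one epoch. The `train_loader` and the cross-entropy loss are assumptions here, standing in for whatever data pipeline and objective were actually used:

```python
import torch
import torch.nn as nn
from model import BaseCNN

model = BaseCNN()  # dropout=0.4 by default
optimizer = torch.optim.Adam(model.parameters(), lr=1e-4)
criterion = nn.CrossEntropyLoss()  # assumed loss; a standard choice for 3-class logits

model.train()
for images, labels in train_loader:  # hypothetical loader yielding (32, 3, 256, 256) batches
    optimizer.zero_grad()
    loss = criterion(model(images), labels)
    loss.backward()
    optimizer.step()
```
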
## Performance

| Metric | Value |
|--------|-------|
| **Validation Accuracy** | 61.69% |
| **Macro F1 Score** | 61.81% |

### Per-Class F1 Scores

| Type | F1 Score |
|------|----------|
| Type 1 | 68.32% |
| Type 2 | 56.41% |
| Type 3 | 60.69% |

## Usage

### Installation

```bash
pip install torch torchvision safetensors
```

### Quick Start

```python
import torch
from PIL import Image
from torchvision import transforms

# Load model
from model import BaseCNN
model = BaseCNN.from_pretrained("./")
model.eval()

# Preprocess image
transform = transforms.Compose([
    transforms.Resize((256, 256)),
    transforms.ToTensor(),
])

image = Image.open("cervical_image.jpg").convert("RGB")
input_tensor = transform(image).unsqueeze(0)

# Inference
with torch.no_grad():
    output = model(input_tensor)
    probabilities = torch.softmax(output, dim=1)
    prediction = output.argmax(dim=1).item()

labels = ["Type 1", "Type 2", "Type 3"]
print(f"Prediction: {labels[prediction]}")
print(f"Confidence: {probabilities[0][prediction]:.2%}")
```
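
The hard-coded `labels` list above mirrors `id2label` in `config.json`. If you prefer to read the mapping from the config, note that `json.load` leaves the keys as strings, so the predicted index must be converted first:

```python
import json

with open("config.json") as f:
    config = json.load(f)

# id2label keys are strings ("0", "1", "2") after json.load,
# so index with str(prediction) rather than the raw int
print(f"Prediction: {config['id2label'][str(prediction)]}")
```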

### Using with Hugging Face Hub

```python
from huggingface_hub import hf_hub_download
import torch

# Download model files
model_path = hf_hub_download(repo_id="your-username/cervical-type-classifier", filename="model.safetensors")
config_path = hf_hub_download(repo_id="your-username/cervical-type-classifier", filename="config.json")
# model.py must also be available locally so BaseCNN can be imported;
# fetching it into the working directory is one way to do that
hf_hub_download(repo_id="your-username/cervical-type-classifier", filename="model.py", local_dir=".")

# Load using safetensors
from safetensors.torch import load_file
state_dict = load_file(model_path)

# Create model and load weights
from model import BaseCNN
import json

with open(config_path) as f:
    config = json.load(f)

model = BaseCNN(**config['model_config'])
model.load_state_dict(state_dict)
model.eval()
```

## Limitations

- Model was trained on a specific dataset and may not generalize to all cervical imaging equipment
- Type 2 is the weakest class (56.41% F1), which is expected since it represents an intermediate state between Types 1 and 3
- Input images should be 256x256 RGB

## Citation

If you use this model, please cite:

```bibtex
@misc{cervical-type-classifier,
  title={Cervical Type Classification Model},
  author={Your Name},
  year={2026},
  howpublished={\url{https://huggingface.co/your-username/cervical-type-classifier}}
}
```

## License

MIT License
config.json ADDED
@@ -0,0 +1,36 @@
{
  "model_type": "BaseCNN",
  "model_config": {
    "layers": [
      32,
      64,
      128,
      256
    ],
    "kernel": 3,
    "padding": 1,
    "stride": 1,
    "batchnorm": true,
    "bn_pre_activ": true,
    "activation": "ReLU",
    "dropout": 0.4,
    "pool": true,
    "fc_layers": [
      256,
      128
    ],
    "nr_classes": 3,
    "in_channels": 3
  },
  "num_labels": 3,
  "id2label": {
    "0": "Type 1",
    "1": "Type 2",
    "2": "Type 3"
  },
  "label2id": {
    "Type 1": 0,
    "Type 2": 1,
    "Type 3": 2
  }
}
model.py ADDED
@@ -0,0 +1,244 @@
"""
Cervical Type Classification Model

This module contains the BaseCNN model for classifying cervical images
into 3 transformation zone types.

Usage:
    from model import BaseCNN

    # Load pretrained model
    model = BaseCNN.from_pretrained("./")

    # Or create from scratch
    model = BaseCNN(
        layers=[32, 64, 128, 256],
        fc_layers=[256, 128],
        nr_classes=3
    )
"""

import json
from pathlib import Path

import torch
import torch.nn as nn

try:
    from safetensors.torch import load_file, save_file
    HAS_SAFETENSORS = True
except ImportError:
    HAS_SAFETENSORS = False


class BaseCNN(nn.Module):
    """
    Simple CNN for cervical type classification.

    Classifies cervical images into 3 transformation zone types:
    - Type 1: Transformation zone fully visible on ectocervix
    - Type 2: Transformation zone partially visible
    - Type 3: Transformation zone not visible (within endocervical canal)

    Args:
        layers: List of output channels for each conv layer. Default: [32, 64, 128, 256]
        kernel: Kernel size for conv layers. Default: 3
        padding: Padding for conv layers. Default: 1
        stride: Stride for conv layers. Default: 1
        batchnorm: Whether to use batch normalization. Default: True
        bn_pre_activ: Whether to apply BN before activation. Default: True
        activation: Activation function name. Default: 'ReLU'
        dropout: Dropout rate for FC layers. Default: 0.4
        pool: Whether to use max pooling after each conv. Default: True
        fc_layers: List of FC layer sizes. Default: [256, 128]
        nr_classes: Number of output classes. Default: 3
        in_channels: Number of input channels. Default: 3
    """

    def __init__(
        self,
        layers: list = None,
        kernel: int = 3,
        padding: int = 1,
        stride: int = 1,
        batchnorm: bool = True,
        bn_pre_activ: bool = True,
        activation: str = 'ReLU',
        dropout: float = 0.4,
        pool: bool = True,
        fc_layers: list = None,
        nr_classes: int = 3,
        in_channels: int = 3,
    ):
        super().__init__()

        # Store config for serialization
        self.config = {
            'layers': layers or [32, 64, 128, 256],
            'kernel': kernel,
            'padding': padding,
            'stride': stride,
            'batchnorm': batchnorm,
            'bn_pre_activ': bn_pre_activ,
            'activation': activation,
            'dropout': dropout,
            'pool': pool,
            'fc_layers': fc_layers or [256, 128],
            'nr_classes': nr_classes,
            'in_channels': in_channels,
        }

        layers = self.config['layers']
        fc_layers = self.config['fc_layers']

        # Activation function
        activation_fn = getattr(nn, activation)

        # Build convolutional layers (ModuleList to match original)
        self.conv_layers = nn.ModuleList()
        prev_channels = in_channels

        for out_channels in layers:
            self.conv_layers.append(
                nn.Conv2d(prev_channels, out_channels, kernel, stride, padding)
            )
            if batchnorm and bn_pre_activ:
                self.conv_layers.append(nn.BatchNorm2d(out_channels))
            self.conv_layers.append(activation_fn())
            if batchnorm and not bn_pre_activ:
                self.conv_layers.append(nn.BatchNorm2d(out_channels))
            if pool:
                self.conv_layers.append(nn.MaxPool2d(2, 2))
            prev_channels = out_channels

        # Global average pooling
        self.adaptive_pool = nn.AdaptiveAvgPool2d(1)

        # Build fully connected layers (ModuleList to match original)
        self.fc_layers = nn.ModuleList()
        prev_features = layers[-1]

        for fc_size in fc_layers:
            self.fc_layers.append(nn.Linear(prev_features, fc_size))
            self.fc_layers.append(activation_fn())
            self.fc_layers.append(nn.Dropout(dropout))
            prev_features = fc_size

        # Final classifier (separate, to match original)
        self.classifier = nn.Linear(prev_features, nr_classes)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Forward pass.

        Args:
            x: Input tensor of shape (batch_size, 3, 256, 256)

        Returns:
            Logits tensor of shape (batch_size, num_classes)
        """
        for layer in self.conv_layers:
            x = layer(x)

        x = self.adaptive_pool(x)
        x = x.view(x.size(0), -1)

        for layer in self.fc_layers:
            x = layer(x)

        x = self.classifier(x)
        return x

    @classmethod
    def from_pretrained(cls, model_path: str, device: str = 'cpu') -> 'BaseCNN':
        """
        Load a pretrained model from a directory.

        Args:
            model_path: Path to directory containing model files
            device: Device to load model on ('cpu' or 'cuda')

        Returns:
            Loaded model in eval mode
        """
        model_path = Path(model_path)

        # Load config
        config_path = model_path / 'config.json'
        with open(config_path, 'r') as f:
            config = json.load(f)

        # Create model
        model = cls(**config['model_config'])

        # Load weights (prefer safetensors)
        safetensors_path = model_path / 'model.safetensors'
        pytorch_path = model_path / 'pytorch_model.bin'

        if safetensors_path.exists() and HAS_SAFETENSORS:
            state_dict = load_file(str(safetensors_path), device=device)
        elif pytorch_path.exists():
            state_dict = torch.load(pytorch_path, map_location=device, weights_only=True)
        else:
            raise FileNotFoundError(f"No model weights found in {model_path}")

        model.load_state_dict(state_dict)
        model.to(device)
        model.eval()
        return model

    def save_pretrained(self, save_path: str) -> None:
        """
        Save model in Hugging Face compatible format.

        Args:
            save_path: Directory to save model files
        """
        save_path = Path(save_path)
        save_path.mkdir(parents=True, exist_ok=True)

        # Save config
        config = {
            'model_type': 'BaseCNN',
            'model_config': self.config,
            'num_labels': self.config['nr_classes'],
            'id2label': {
                '0': 'Type 1',
                '1': 'Type 2',
                '2': 'Type 3'
            },
            'label2id': {
                'Type 1': 0,
                'Type 2': 1,
                'Type 3': 2
            }
        }
        with open(save_path / 'config.json', 'w') as f:
            json.dump(config, f, indent=2)

        # Save weights
        state_dict = {k: v.contiguous() for k, v in self.state_dict().items()}

        # SafeTensors format (recommended)
        if HAS_SAFETENSORS:
            save_file(state_dict, str(save_path / 'model.safetensors'))

        # PyTorch format (backup)
        torch.save(state_dict, save_path / 'pytorch_model.bin')


# Label mappings
ID2LABEL = {0: 'Type 1', 1: 'Type 2', 2: 'Type 3'}
LABEL2ID = {'Type 1': 0, 'Type 2': 1, 'Type 3': 2}


if __name__ == '__main__':
    # Quick test
    model = BaseCNN()
    print(f"Model parameters: {sum(p.numel() for p in model.parameters()):,}")

    # Test forward pass
    x = torch.randn(1, 3, 256, 256)
    y = model(x)
    print(f"Input shape: {x.shape}")
    print(f"Output shape: {y.shape}")
model.safetensors ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:beb3e17da6b94596232aa18078b9d22872f4711c7c1ef21a35f3277175d14063
size 1960588
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:3d88b2345cde9dcdc7fc2b8ba76edb2c64abfbc274f320bd55ad9e12801c9b00
size 1969453