Spaces:
Sleeping
Sleeping
demo to spaces
Browse files- LICENSE +21 -0
- README.md +19 -13
- __pycache__/custom_unet.cpython-310.pyc +0 -0
- __pycache__/early_stopper.cpython-310.pyc +0 -0
- __pycache__/model.cpython-310.pyc +0 -0
- __pycache__/unet.cpython-310.pyc +0 -0
- app.py +55 -0
- custom_unet.py +135 -0
- early_stopper.py +23 -0
- examples/example_1.jpg +0 -0
- examples/example_2.jpg +0 -0
- examples/example_3.jpg +0 -0
- model.py +130 -0
- models/custom_unet.pth +3 -0
- models/unet.pth +3 -0
- requirements.txt +9 -0
- unet.py +67 -0
LICENSE
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MIT License
|
| 2 |
+
|
| 3 |
+
Copyright (c) 2023 i4ata
|
| 4 |
+
|
| 5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
| 6 |
+
of this software and associated documentation files (the "Software"), to deal
|
| 7 |
+
in the Software without restriction, including without limitation the rights
|
| 8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
| 9 |
+
copies of the Software, and to permit persons to whom the Software is
|
| 10 |
+
furnished to do so, subject to the following conditions:
|
| 11 |
+
|
| 12 |
+
The above copyright notice and this permission notice shall be included in all
|
| 13 |
+
copies or substantial portions of the Software.
|
| 14 |
+
|
| 15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
| 16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
| 17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
| 18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
| 19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
| 20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
| 21 |
+
SOFTWARE.
|
README.md
CHANGED
|
@@ -1,13 +1,19 @@
|
|
| 1 |
-
|
| 2 |
-
|
| 3 |
-
|
| 4 |
-
|
| 5 |
-
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# UnetSegmentation
|
| 2 |
+
|
| 3 |
+
My own implementation of the U-net architecture compared to a pretrained model from PyTorch Segmentation Models.
|
| 4 |
+
|
| 5 |
+
To train:
|
| 6 |
+
|
| 7 |
+
```python train.py```
|
| 8 |
+
|
| 9 |
+
To visualize training:
|
| 10 |
+
|
| 11 |
+
```tesnorboard --logdir runs```
|
| 12 |
+
|
| 13 |
+
To visually compare models on some examples:
|
| 14 |
+
|
| 15 |
+
```python compare_models.py```
|
| 16 |
+
|
| 17 |
+
To launch a Gradio application:
|
| 18 |
+
|
| 19 |
+
```python3 gradio_app.py```
|
__pycache__/custom_unet.cpython-310.pyc
ADDED
|
Binary file (5.68 kB). View file
|
|
|
__pycache__/early_stopper.cpython-310.pyc
ADDED
|
Binary file (956 Bytes). View file
|
|
|
__pycache__/model.cpython-310.pyc
ADDED
|
Binary file (4.59 kB). View file
|
|
|
__pycache__/unet.cpython-310.pyc
ADDED
|
Binary file (2.81 kB). View file
|
|
|
app.py
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import gradio as gr
|
| 2 |
+
from PIL import Image
|
| 3 |
+
import os
|
| 4 |
+
|
| 5 |
+
import torch
|
| 6 |
+
import numpy as np
|
| 7 |
+
|
| 8 |
+
from model import SegmentationModel
|
| 9 |
+
from custom_unet import CustomUnet
|
| 10 |
+
from unet import Unet
|
| 11 |
+
|
| 12 |
+
from typing import Dict, Union, Tuple, List
|
| 13 |
+
|
| 14 |
+
class GradioApp:
    """Gradio demo that segments people in images with one of two U-nets.

    Models are referenced by display name and loaded lazily on first use:
    the values in ``self.models`` start out as model file names (``str``)
    and are replaced in place by the loaded ``SegmentationModel`` instances.
    """

    def __init__(self) -> None:
        # Display name -> model file name (str) until the first prediction,
        # after which the value becomes the loaded model instance.
        self.models: Dict[str, Union[str, SegmentationModel]] = {
            'Custom': 'custom_unet',
            'Pretrained': 'unet'
        }

    def predict(self, img_file: str, model_name: str) -> Tuple[str, List[Tuple[np.ndarray, str]]]:
        """Segment the image at ``img_file`` with the chosen model.

        Returns the input path and a list of ``(mask, label)`` pairs in the
        format expected by ``gr.AnnotatedImage``.
        """
        # Lazy loading of models: a str value means "not loaded yet".
        if isinstance(self.models[model_name], str):
            model_class = CustomUnet if model_name == 'Custom' else Unet
            self.models[model_name] = model_class(self.models[model_name], from_file=True, device='cpu')
            self.models[model_name].eval()
        # `* 1` casts the boolean mask to an integer array for display.
        prediction = self.models[model_name].predict(img_file, option='mask')[0] * 1
        return img_file, [(prediction, 'person')]

    def launch(self):
        """Build and launch the Gradio interface with the bundled examples."""
        examples_list = [['examples/' + example] for example in os.listdir('examples')]

        demo = gr.Interface(
            fn=self.predict,
            inputs=[
                gr.Image(type='filepath', label='Input image to segment'),
                gr.Radio(choices=('Custom', 'Pretrained'), label='Available models')
            ],
            outputs=gr.AnnotatedImage(label='Model predictions'),
            examples=examples_list,
            cache_examples=False,
        )
        demo.launch()
|
| 52 |
+
|
| 53 |
+
# Entry point: start the Gradio demo when run as a script.
if __name__ == '__main__':
    GradioApp().launch()
|
custom_unet.py
ADDED
|
@@ -0,0 +1,135 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""This python module implements the Unet architecture as defined in https://arxiv.org/pdf/1505.04597.
|
| 2 |
+
Only, I use padded convolutions. That way, there is no need for center cropping and the output mask
|
| 3 |
+
is the same shape as the input image.
|
| 4 |
+
|
| 5 |
+
Additional things: https://towardsdatascience.com/understanding-u-net-61276b10f360
|
| 6 |
+
"""
|
| 7 |
+
|
| 8 |
+
import torch
|
| 9 |
+
import torch.nn as nn
|
| 10 |
+
from torchinfo import summary
|
| 11 |
+
|
| 12 |
+
from model import SegmentationModel
|
| 13 |
+
from early_stopper import EarlyStopper
|
| 14 |
+
|
| 15 |
+
from typing import Tuple, Union, Optional
|
| 16 |
+
|
| 17 |
+
device = 'cuda' if torch.cuda.is_available() else 'cpu'
|
| 18 |
+
|
| 19 |
+
class DiceLoss(nn.Module):
    """Soft (differentiable) Dice loss for binary segmentation logits.

    Returns ``1 - dice_coefficient`` so that *minimizing* the loss
    maximizes the overlap between predicted and true masks. Predictions
    are kept as probabilities (no thresholding) so gradients can flow.

    Fixes over the previous version: it returned the Dice coefficient
    itself (so adding it to BCE rewarded low overlap), it thresholded the
    sigmoid output (killing all gradients), and it could divide by zero
    for empty masks.
    """

    def forward(self, logits: torch.Tensor, mask_true: torch.Tensor) -> torch.Tensor:
        # Smoothing term avoids division by zero when both masks are empty.
        eps = 1e-6
        probs = torch.sigmoid(logits)
        intersection = (probs * mask_true).sum()
        union = probs.sum() + mask_true.sum()
        # Dice coefficient lies in [0, 1]; its complement is the loss.
        return 1 - (2 * intersection + eps) / (union + eps)
|
| 26 |
+
|
| 27 |
+
class DoubleConv(nn.Module):
    """Two 3x3 'same'-padded convolutions, each followed by a ReLU.

    'same' padding keeps the spatial size unchanged, so no center
    cropping is needed anywhere in the network.
    """

    def __init__(self, in_channels: int, out_channels: int) -> None:
        super().__init__()
        # Attribute names are kept stable so pickled checkpoints keep working.
        self.conv1 = nn.Conv2d(in_channels, out_channels, kernel_size=3, padding='same')
        self.conv2 = nn.Conv2d(out_channels, out_channels, kernel_size=3, padding='same')
        self.relu = nn.ReLU()

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Apply conv -> ReLU twice, preserving the spatial dimensions."""
        x = self.relu(self.conv1(x))
        x = self.relu(self.conv2(x))
        return x
|
| 38 |
+
|
| 39 |
+
class Up(nn.Module):
    """Decoder stage: upsample the deeper features and fuse them with the skip connection."""

    def __init__(self, in_channels: int, out_channels: int) -> None:
        super().__init__()
        # 2x2 transposed convolution doubles the spatial resolution while
        # halving the channel count. Attribute names kept for checkpoint
        # compatibility.
        self.upconv = nn.ConvTranspose2d(in_channels=in_channels, out_channels=out_channels, kernel_size=2, stride=2)
        self.conv = DoubleConv(in_channels=in_channels, out_channels=out_channels)

    def forward(self, x_left: torch.Tensor, x_right: torch.Tensor) -> torch.Tensor:
        """Upsample ``x_right``, concatenate with ``x_left`` along channels, then convolve."""
        upsampled = self.upconv(x_right)
        fused = torch.cat((x_left, upsampled), dim=1)
        return self.conv(fused)
|
| 48 |
+
|
| 49 |
+
class UnetModel(nn.Module):
    """Plain U-net: an encoder that doubles channels while halving the
    spatial size at each stage, mirrored by a decoder with skip
    connections, ending in a 1-channel (binary) output map.
    """

    def __init__(self, in_channels: int = 3, depth: int = 3, start_channels: int = 16) -> None:
        super().__init__()

        # Channel widths at each resolution level: start, 2*start, 4*start, ...
        widths = [start_channels * 2 ** i for i in range(depth + 1)]

        # Attribute names are kept stable so pickled checkpoints keep working.
        self.input_conv = DoubleConv(in_channels, widths[0])

        self.encoder_layers = nn.ModuleList(
            DoubleConv(narrow, wide) for narrow, wide in zip(widths, widths[1:])
        )

        # Decoder mirrors the encoder: widest pair first, narrowest last.
        self.decoder_layers = nn.ModuleList(
            Up(wide, narrow) for wide, narrow in zip(widths[:0:-1], widths[-2::-1])
        )

        # 1x1 convolution maps back to a single-channel logit map.
        self.output_conv = nn.Conv2d(widths[0], 1, kernel_size=1)

        self.pool = nn.MaxPool2d(2, 2)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Encode, then decode with skip connections; return per-pixel logits."""
        x = self.input_conv(x)
        skip_connections = [x]

        for encode in self.encoder_layers:
            x = encode(self.pool(x))
            skip_connections.append(x)

        # The deepest features are already in `x`; the rest are the skips,
        # consumed shallowest-last (pop() yields them deepest-first).
        skip_connections.pop()
        for decode in self.decoder_layers:
            x = decode(skip_connections.pop(), x)

        return self.output_conv(x)
|
| 84 |
+
|
| 85 |
+
class CustomUnet(SegmentationModel):
    """Hand-written U-net (``UnetModel``) wrapped in the ``SegmentationModel``
    training/prediction interface, with a combined BCE + Dice objective.
    """

    def __init__(self,
                 name: str = 'default_name',
                 from_file: bool = True,
                 image_size: Tuple[int, int] = (320, 320),
                 in_channels: int = 3,
                 start_channels: int = 16,
                 encoder_depth: int = 5,
                 device: str = 'cuda' if torch.cuda.is_available() else 'cpu') -> None:
        """Load a saved model from ``models/{name}.pth`` (``from_file=True``)
        or build a fresh ``UnetModel`` with the given architecture parameters.
        """

        super().__init__()

        # Each encoder stage halves the spatial size, so both dimensions must
        # divide evenly by 2**encoder_depth.
        # NOTE(review): `assert` is stripped under `python -O`; consider raising ValueError instead.
        assert image_size[0] % (2**encoder_depth) == 0
        assert image_size[1] % (2**encoder_depth) == 0

        self.name = name
        self.image_size = image_size
        self.in_channels = in_channels
        self.device = device

        self.save_path = f'models/{name}.pth'

        if from_file:
            # Loads the whole pickled module (see save()); only load trusted files.
            self.unet = torch.load(self.save_path, map_location=device)
        else:
            self.unet = UnetModel(in_channels=in_channels, depth=encoder_depth, start_channels=start_channels).to(device)

        # Combined objective: pixel-wise BCE on logits plus the Dice term.
        self.bce_loss = nn.BCEWithLogitsLoss()
        self.dice_loss = DiceLoss()
        self.loss_fn = lambda logits, masks: self.bce_loss(logits, masks) + self.dice_loss(logits, masks)

    def configure_optimizers(self, **kwargs):
        """Create the Adam optimizer and early stopper (expects 'lr' and 'patience' kwargs)."""
        self.optimizer = torch.optim.Adam(params=self.unet.parameters(), lr=kwargs['lr'])
        self.early_stopper = EarlyStopper(patience=kwargs['patience'])

    def forward(self, images: torch.Tensor, masks: Optional[torch.Tensor] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
        """Return logits; when ``masks`` is provided, also return the loss."""
        logits = self.unet(images)
        if masks is None:
            return logits
        return logits, self.loss_fn(logits, masks)

    def save(self) -> None:
        # Save the whole model, not only the state dict, so that it will work for different unets
        torch.save(self.unet, self.save_path)

    def print_summary(self, batch_size: int = 16) -> None:
        """Print a torchinfo summary of the underlying unet for the given batch size."""

        print(summary(self.unet, input_size=(batch_size, self.in_channels, *self.image_size),
                      col_names=['input_size', 'output_size', 'num_params'],
                      row_settings=['var_names']))
|
early_stopper.py
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""This module contains a class that implements early stopping regularization technique"""
|
| 2 |
+
|
| 3 |
+
class EarlyStopper:
    """Tracks the validation loss and signals when training should stop early."""

    def __init__(self, patience: int = 2):
        # Number of consecutive non-improving epochs tolerated before stopping.
        self.patience = patience
        # Best (lowest) validation loss seen so far.
        self.best_loss = float('inf')
        # Consecutive epochs without improvement.
        self.counter = 0
        # True right after an improving epoch: the caller should checkpoint then.
        self.save_model = False

    def check(self, validation_loss: float) -> bool:
        """Record one epoch's validation loss; return True when training should stop."""
        self.save_model = False
        if validation_loss <= self.best_loss:
            # Improvement (ties count as improvement): reset and request a save.
            self.best_loss = validation_loss
            self.counter = 0
            self.save_model = True
            return False
        self.counter += 1
        return self.counter == self.patience
|
examples/example_1.jpg
ADDED
|
examples/example_2.jpg
ADDED
|
examples/example_3.jpg
ADDED
|
model.py
ADDED
|
@@ -0,0 +1,130 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""This module contains the base class for segmentation models"""
|
| 2 |
+
|
| 3 |
+
import torch
|
| 4 |
+
import torch.nn as nn
|
| 5 |
+
from torch.utils.data import DataLoader
|
| 6 |
+
from torchvision.utils import draw_segmentation_masks
|
| 7 |
+
from torchvision.transforms.functional import resize
|
| 8 |
+
from torch.utils.tensorboard.writer import SummaryWriter
|
| 9 |
+
|
| 10 |
+
import numpy as np
|
| 11 |
+
import cv2 as cv
|
| 12 |
+
import albumentations as A
|
| 13 |
+
|
| 14 |
+
from typing import Optional, Union, Tuple, Literal
|
| 15 |
+
|
| 16 |
+
from early_stopper import EarlyStopper
|
| 17 |
+
|
| 18 |
+
class SegmentationModel(nn.Module):
    """Base class for binary segmentation models.

    Subclasses implement ``configure_optimizers``, ``forward``, ``save`` and
    ``print_summary`` and are expected to set the attributes declared below
    in their ``__init__``.
    """

    # Display name; also used as the TensorBoard run sub-directory.
    name: str = "base name"
    # Device to which batches are moved; set by the subclass.
    device: Literal['cpu', 'cuda'] = None

    # Training components, populated by configure_optimizers() in subclasses.
    optimizer: torch.optim.Optimizer = None
    early_stopper: EarlyStopper = None
    lr_scheduler: torch.optim.lr_scheduler.LRScheduler = None
    # Where save() persists the model.
    save_path: str = None
    # (height, width) the input image is resized to before inference.
    image_size: Tuple[int, int] = None

    def configure_optimizers(self, **kwargs) -> None:
        """Create the optimizer (and optionally early stopper / scheduler). Subclass hook."""
        raise NotImplementedError()

    def forward(self, images: torch.Tensor, masks: Optional[torch.Tensor] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
        """Return logits, or ``(logits, loss)`` when ``masks`` is provided. Subclass hook."""

        raise NotImplementedError()

    def _train_step(self, data_loader: DataLoader) -> float:
        """Run one training epoch; return the mean per-batch loss."""

        self.train()
        total_loss = 0.
        for images, masks in data_loader:
            images, masks = images.to(self.device), masks.to(self.device)

            self.optimizer.zero_grad()
            logits, loss = self(images, masks)
            loss.backward()
            self.optimizer.step()

            total_loss += loss.item()

        return total_loss / len(data_loader)

    def _test_step(self, data_loader: DataLoader) -> float:
        """Evaluate one epoch without gradient tracking; return the mean per-batch loss."""

        self.eval()
        total_loss = 0.
        with torch.inference_mode():
            for images, masks in data_loader:
                images, masks = images.to(self.device), masks.to(self.device)
                logits, loss = self(images, masks)
                total_loss += loss.item()
        return total_loss / len(data_loader)

    def train_model(self, train_loader: DataLoader, test_loader: DataLoader, epochs: int, log_dir: str) -> None:
        """Train for up to ``epochs`` epochs, logging both losses to TensorBoard.

        When an early stopper is configured, training stops once the test
        loss stops improving, and the model is checkpointed on each
        improving epoch. If the loop completes without early stopping, the
        final model is saved instead (see the ``for``/``else`` below).
        """

        writer = SummaryWriter(log_dir=f'{log_dir}/{self.name}')

        for i in range(epochs):
            train_loss = self._train_step(train_loader)
            test_loss = self._test_step(test_loader)

            if self.early_stopper is not None:
                if self.early_stopper.check(test_loss):
                    print(f'Model stopped early due to risk of overfitting')
                    break

                # The stopper flags epochs where the test loss improved.
                if self.early_stopper.save_model:
                    self.save()
                    print('saved model')

            if self.lr_scheduler is not None:
                self.lr_scheduler.step()

            print(f'{i}: Train loss: {train_loss :.2} | Test loss: {test_loss :.2}')

            writer.add_scalars(main_tag='Loss over time',
                               tag_scalar_dict={'train loss': train_loss, 'test loss': test_loss},
                               global_step=i)

        else:
            # for/else: this branch runs only when the loop was NOT broken,
            # i.e. training ran all epochs without early stopping.
            if self.early_stopper is not None:
                print('Model did not converge. Possibility of underfitting')
            self.save()
        writer.close()

    def save(self) -> None:
        """Persist the model to ``self.save_path``. Subclass hook."""
        raise NotImplementedError()

    def predict(self,
                test_image_path: str,
                option: Literal['mask', 'image_with_mask', 'mask_and_image_with_mask'] = 'image_with_mask'
                ) -> Union[np.ndarray, Tuple[np.ndarray, np.ndarray]]:
        """Segment the image stored at ``test_image_path``.

        Depending on ``option``, returns the boolean mask (at the original
        image resolution), the original image with the mask drawn on top,
        or both. Falls through and returns None for any other option value.
        """

        self.eval()
        input_resizer = A.Resize(*self.image_size)

        # Read as RGB; keep the original-resolution image for the overlay.
        original_image = cv.cvtColor(cv.imread(test_image_path), cv.COLOR_BGR2RGB)
        original_image_tensor = torch.from_numpy(original_image).permute(2,0,1).type(torch.uint8)
        # Resize to the network's input size and scale pixels to [0, 1].
        resized_image_tensor = (torch.from_numpy(input_resizer(image=original_image)['image']).float() / 255.).permute(2,0,1)

        with torch.inference_mode():
            logits = self(resized_image_tensor.unsqueeze(0).to(self.device)).squeeze(0).cpu().detach()
            probs = torch.sigmoid(logits)
            resized_mask_tensor = probs > .5

        # Scale the predicted mask back to the original image resolution.
        original_mask_tensor = resize(resized_mask_tensor, size=original_image.shape[:-1], antialias=True)

        image_with_mask = draw_segmentation_masks(image=original_image_tensor,
                                                  masks=original_mask_tensor,
                                                  alpha=.5,
                                                  colors='white')

        if option == 'mask':
            return original_mask_tensor.numpy()
        if option == 'image_with_mask':
            return image_with_mask.permute(1,2,0).numpy()
        if option == 'mask_and_image_with_mask':
            return original_mask_tensor.numpy(), image_with_mask.permute(1,2,0).numpy()

    def print_summary(self) -> None:
        """Print an architecture summary. Subclass hook."""
        raise NotImplementedError()
|
models/custom_unet.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eeca616e3026a77a2125e4c880f5335e1efa4a2c53b1ad4dad0082e227e49b85
|
| 3 |
+
size 7812958
|
models/unet.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d26354f766301bc980c66f3984599491a4c3dc35706dc3e31a95f115e30a74c6
|
| 3 |
+
size 25378610
|
requirements.txt
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
torch
|
| 2 |
+
torchinfo
|
| 3 |
+
segmentation-models-pytorch
|
| 4 |
+
albumentations
|
| 5 |
+
opencv-python
|
| 6 |
+
gradio
|
| 7 |
+
numpy
|
| 8 |
+
matplotlib
|
| 9 |
+
tensorboard
|
unet.py
ADDED
|
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
"""This module defines a Unet architecture"""
|
| 2 |
+
|
| 3 |
+
import torch.nn as nn
|
| 4 |
+
import torch
|
| 5 |
+
from torchinfo import summary
|
| 6 |
+
import segmentation_models_pytorch as smp
|
| 7 |
+
from early_stopper import EarlyStopper
|
| 8 |
+
|
| 9 |
+
from model import SegmentationModel
|
| 10 |
+
|
| 11 |
+
from typing import Optional, Union, Tuple
|
| 12 |
+
|
| 13 |
+
class Unet(SegmentationModel):
    """Pretrained U-net from ``segmentation_models_pytorch`` wrapped in the
    ``SegmentationModel`` interface, with a combined BCE + Dice objective.
    """

    def __init__(self,
                 name: str = 'default_name',
                 from_file: bool = True,
                 image_size: Tuple[int, int] = (320, 320),
                 encoder_name: str = 'timm-efficientnet-b0',
                 pretrained: bool = True,
                 in_channels: int = 3,
                 encoder_depth: int = 5,
                 device: str = 'cuda' if torch.cuda.is_available() else 'cpu') -> None:
        """Load a saved model from ``models/{name}.pth`` (``from_file=True``)
        or build an smp.Unet with the given encoder configuration.
        """

        super().__init__()

        self.name = name
        self.image_size = image_size
        self.in_channels = in_channels
        self.device = device

        self.save_path = f'models/{name}.pth'

        if from_file:
            # Loads the whole pickled module (see save()); only load trusted files.
            self.unet = torch.load(self.save_path, map_location=device)
        else:
            # classes=1 / activation=None: raw single-channel logits output.
            self.unet = smp.Unet(
                encoder_name=encoder_name,
                encoder_weights='imagenet' if pretrained else None,
                in_channels=in_channels,
                encoder_depth=encoder_depth,
                classes=1,
                activation=None
            ).to(device)

        # Combined objective: pixel-wise BCE on logits plus binary Dice loss.
        bce_loss_fn = nn.BCEWithLogitsLoss()
        dice_loss_fn = smp.losses.DiceLoss(mode='binary')
        self.loss_fn = lambda logits, masks: bce_loss_fn(logits, masks) + dice_loss_fn(logits, masks)

    def configure_optimizers(self, **kwargs):
        """Create the Adam optimizer and early stopper (expects 'lr' and 'patience' kwargs)."""
        self.optimizer = torch.optim.Adam(params=self.unet.parameters(), lr=kwargs['lr'])
        self.early_stopper = EarlyStopper(patience=kwargs['patience'])

    def forward(self, images: torch.Tensor, masks: Optional[torch.Tensor] = None) -> Union[torch.Tensor, Tuple[torch.Tensor, torch.Tensor]]:
        """Return logits; when ``masks`` is provided, also return the loss."""
        logits = self.unet(images)
        if masks is None:
            return logits
        return logits, self.loss_fn(logits, masks)

    def save(self) -> None:
        # Save the whole model, not only the state dict, so that it will work for different unets
        torch.save(self.unet, self.save_path)

    def print_summary(self, batch_size: int = 16) -> None:
        """Print a torchinfo summary of the wrapped unet for the given batch size."""
        print(summary(self.unet, input_size=(batch_size, self.in_channels, *self.image_size),
                      col_names=['input_size', 'output_size', 'num_params'],
                      row_settings=['var_names']))
|