| from huggingface_hub import PyTorchModelHubMixin |
| from torch import nn |
|
|
| class SurfinBird(nn.Module, PyTorchModelHubMixin): |
| def __init__(self, config: dict) -> None: |
| super().__init__() |
| self.conv1 = nn.Conv2d( |
| in_channels=config["num_channels"], |
| out_channels=64, |
| kernel_size=7, |
| stride=2, |
| padding=3) |
| self.bn1 = nn.BatchNorm2d(64) |
| self.relu1 = nn.ReLU() |
| self.mp1 = nn.MaxPool2d(kernel_size=2, |
| stride=2) |
| self.conv_block_2 = nn.Sequential( |
| nn.Conv2d( |
| in_channels=64, |
| out_channels=64, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(64), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=64, |
| out_channels=64, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(64), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=64, |
| out_channels=64, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(64), |
| nn.ReLU(), |
| nn.MaxPool2d(kernel_size=2, |
| stride=2) |
| ) |
| self.conv_block_3 = nn.Sequential( |
| nn.Conv2d( |
| in_channels=64, |
| out_channels=128, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(128), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=128, |
| out_channels=128, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(128), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=128, |
| out_channels=128, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(128), |
| nn.ReLU(), |
| nn.MaxPool2d(kernel_size=2, |
| stride=2) |
| ) |
| self.conv_block_4 = nn.Sequential( |
| nn.Conv2d( |
| in_channels=128, |
| out_channels=128, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(128), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=128, |
| out_channels=128, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(128), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=128, |
| out_channels=128, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(128), |
| nn.ReLU(), |
| nn.MaxPool2d(kernel_size=2, |
| stride=2) |
| ) |
| self.conv_block_5 = nn.Sequential( |
| nn.Conv2d( |
| in_channels=128, |
| out_channels=256, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(256), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=256, |
| out_channels=256, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(256), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=256, |
| out_channels=256, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(256), |
| nn.ReLU(), |
| nn.MaxPool2d(kernel_size=2, |
| stride=2) |
| ) |
| self.conv_block_6 = nn.Sequential( |
| nn.Conv2d( |
| in_channels=256, |
| out_channels=256, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(256), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=256, |
| out_channels=256, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(256), |
| nn.ReLU(), |
| nn.Conv2d( |
| in_channels=256, |
| out_channels=256, |
| kernel_size=3, |
| stride=1, |
| padding=1 |
| ), |
| nn.BatchNorm2d(256), |
| nn.ReLU(), |
| nn.MaxPool2d(kernel_size=2, |
| stride=2) |
| ) |
|
|
| self.avgpool = nn.Sequential( |
| nn.AdaptiveAvgPool2d(output_size=(1, 1)) |
| ) |
|
|
| self.classifier = nn.Sequential( |
| nn.Flatten(), |
| nn.Linear(in_features=config["hidden_units"]*1*1, |
| out_features=config["num_classes"]) |
| ) |
| def forward(self, x: torch.Tensor): |
| return self.classifier(self.avgpool(self.conv_block_6(self.conv_block_5(self.conv_block_4(self.conv_block_3(self.conv_block_2(self.mp1(self.relu1(self.bn1(self.conv1(x))))))))))) |
|
|
| config = {"num_channels": 3, "hidden_units": 256, "num_classes": 525} |