# uniflowmatch/models/unet_encoder.py
import torch
import torch.nn as nn
import torch.nn.functional as F


class DoubleConv(nn.Module):
    """(Conv2d => ReLU) * 2 with padding."""

    def __init__(self, in_channels, out_channels):
        super().__init__()
        self.conv = nn.Sequential(
            nn.Conv2d(in_channels, out_channels, kernel_size=3, padding=1),  # preserve spatial size
            nn.ReLU(inplace=True),
            nn.Conv2d(out_channels, out_channels, kernel_size=3, padding=1),  # preserve spatial size
            nn.ReLU(inplace=True),
        )

    def forward(self, x):
        return self.conv(x)
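

# A minimal shape sanity check (sketch): with kernel_size=3 and padding=1 each
# conv preserves H x W, so DoubleConv only changes the channel count.
#
#   block = DoubleConv(in_channels=3, out_channels=64)
#   out = block(torch.randn(1, 3, 64, 64))
#   assert out.shape == (1, 64, 64, 64)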


class UNet(nn.Module):
    def __init__(self, in_channels, out_channels, features=(64, 128, 256, 512)):
        super().__init__()
        self.downs = nn.ModuleList()
        self.ups = nn.ModuleList()

        # Encoder: one DoubleConv per level, widening the channel count
        for feature in features:
            self.downs.append(DoubleConv(in_channels, feature))
            in_channels = feature
        self.pool = nn.MaxPool2d(kernel_size=2, stride=2)

        # Bottleneck between encoder and decoder
        self.bottleneck = DoubleConv(features[-1], features[-1] * 2)

        # Decoder: transposed conv upsamples 2x, DoubleConv fuses the skip connection
        for feature in reversed(features):
            self.ups.append(nn.ConvTranspose2d(feature * 2, feature, kernel_size=2, stride=2))
            self.ups.append(DoubleConv(feature * 2, feature))

        # 1x1 conv maps the final feature map to out_channels
        self.final_conv = nn.Conv2d(features[0], out_channels, kernel_size=1)
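
    # Channel flow with the default features and a 3-channel input:
    # encoder 3 -> 64 -> 128 -> 256 -> 512, bottleneck 512 -> 1024,
    # decoder 1024 -> 512 -> 256 -> 128 -> 64, final 1x1 conv 64 -> out_channels.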

    def forward(self, x):
        skip_connections = []

        # Encoder: store each level's pre-pool activation as a skip connection
        for down in self.downs:
            x = down(x)
            skip_connections.append(x)
            x = self.pool(x)

        x = self.bottleneck(x)

        # Decoder: consume skip connections from deepest to shallowest
        skip_connections = skip_connections[::-1]
        for idx in range(0, len(self.ups), 2):
            x = self.ups[idx](x)  # ConvTranspose2d: upsample 2x
            skip_connection = skip_connections[idx // 2]
            if x.shape != skip_connection.shape:
                # MaxPool2d floors odd extents, so the upsampled tensor can be
                # one pixel smaller than the skip; resize to match.
                x = F.interpolate(x, size=skip_connection.shape[2:])
            x = torch.cat((skip_connection, x), dim=1)
            x = self.ups[idx + 1](x)  # DoubleConv on the concatenated features

        return self.final_conv(x)


if __name__ == "__main__":
    # Smoke test: the output should keep the input's spatial size.
    model = UNet(in_channels=3, out_channels=16)
    x = torch.randn(1, 3, 256, 256)
    out = model(x)
    print(out.shape)  # torch.Size([1, 16, 256, 256])
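
    # Odd, non-power-of-two sizes also work: the F.interpolate call in
    # forward() resizes each upsampled tensor to match its skip connection
    # (a sketch with an arbitrary size):
    x_odd = torch.randn(1, 3, 250, 250)
    print(model(x_odd).shape)  # torch.Size([1, 16, 250, 250])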