depthsplat / MinkowskiEngine /examples /stack_unet.py

Upload folder using huggingface_hub

a6dd040 verified 5 months ago

3.84 kB

	# Copyright (c) Chris Choy (chrischoy@ai.stanford.edu).
	#
	# Permission is hereby granted, free of charge, to any person obtaining a copy of
	# this software and associated documentation files (the "Software"), to deal in
	# the Software without restriction, including without limitation the rights to
	# use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
	# of the Software, and to permit persons to whom the Software is furnished to do
	# so, subject to the following conditions:
	#
	# The above copyright notice and this permission notice shall be included in all
	# copies or substantial portions of the Software.
	#
	# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
	# SOFTWARE.
	#
	# Please cite "4D Spatio-Temporal ConvNets: Minkowski Convolutional Neural
	# Networks", CVPR'19 (https://arxiv.org/abs/1904.08755) if you use any part
	# of the code.
	import torch
	import torch.nn as nn

	import MinkowskiEngine as ME
	import MinkowskiEngine.MinkowskiFunctional as MF

	from tests.python.common import data_loader


	class StackUNet(ME.MinkowskiNetwork):
	def __init__(self, in_nchannel, out_nchannel, D):
	ME.MinkowskiNetwork.__init__(self, D)
	channels = [in_nchannel, 16, 32]
	self.net = nn.Sequential(
	ME.MinkowskiStackSum(
	ME.MinkowskiConvolution(
	channels[0],
	channels[1],
	kernel_size=3,
	stride=1,
	dimension=D,
	),
	nn.Sequential(
	ME.MinkowskiConvolution(
	channels[0],
	channels[1],
	kernel_size=3,
	stride=2,
	dimension=D,
	),
	ME.MinkowskiStackSum(
	nn.Identity(),
	nn.Sequential(
	ME.MinkowskiConvolution(
	channels[1],
	channels[2],
	kernel_size=3,
	stride=2,
	dimension=D,
	),
	ME.MinkowskiConvolutionTranspose(
	channels[2],
	channels[1],
	kernel_size=3,
	stride=1,
	dimension=D,
	),
	ME.MinkowskiPoolingTranspose(
	kernel_size=2, stride=2, dimension=D
	),
	),
	),
	ME.MinkowskiPoolingTranspose(kernel_size=2, stride=2, dimension=D),
	),
	),
	ME.MinkowskiToFeature(),
	nn.Linear(channels[1], out_nchannel, bias=True),
	)

	def forward(self, x):
	return self.net(x)


	if __name__ == "__main__":
	# loss and network
	net = StackUNet(3, 5, D=2)
	print(net)

	# a data loader must return a tuple of coords, features, and labels.
	coords, feat, label = data_loader()
	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

	net = net.to(device)
	input = ME.SparseTensor(feat, coords, device=device)

	# Forward
	output = net(input)