Yeqing0814's picture
Upload folder using huggingface_hub
a6dd040 verified
# Copyright (c) Chris Choy (chrischoy@ai.stanford.edu).
#
# Permission is hereby granted, free of charge, to any person obtaining a copy of
# this software and associated documentation files (the "Software"), to deal in
# the Software without restriction, including without limitation the rights to
# use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
# of the Software, and to permit persons to whom the Software is furnished to do
# so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
#
# Please cite "4D Spatio-Temporal ConvNets: Minkowski Convolutional Neural
# Networks", CVPR'19 (https://arxiv.org/abs/1904.08755) if you use any part
# of the code.
import torch
import MinkowskiEngine as ME
from tests.python.common import data_loader
def get_random_coords(dimension=2, tensor_stride=2):
torch.manual_seed(0)
# Create random coordinates with tensor stride == 2
coords = torch.rand(10, dimension + 1)
coords[:, :dimension] *= 5 # random coords
coords[:, -1] *= 2 # random batch index
coords = coords.floor().int()
coords = ME.utils.sparse_quantize(coords)
coords[:, :dimension] *= tensor_stride # make the tensor stride 2
return coords, tensor_stride
def print_sparse_tensor(tensor):
for c, f in zip(tensor.C.numpy(), tensor.F.detach().numpy()):
print(f"Coordinate {c} : Feature {f}")
def conv():
in_channels, out_channels, D = 2, 3, 2
coords, feats, labels = data_loader(in_channels, batch_size=1)
# Convolution
input = ME.SparseTensor(features=feats, coordinates=coords)
conv = ME.MinkowskiConvolution(
in_channels,
out_channels,
kernel_size=3,
stride=2,
bias=False,
dimension=D)
output = conv(input)
print('Input:')
print_sparse_tensor(input)
print('Output:')
print_sparse_tensor(output)
# Convolution transpose and generate new coordinates
strided_coords, tensor_stride = get_random_coords()
input = ME.SparseTensor(
features=torch.rand(len(strided_coords), in_channels), #
coordinates=strided_coords,
tensor_stride=tensor_stride)
conv_tr = ME.MinkowskiConvolutionTranspose(
in_channels,
out_channels,
kernel_size=3,
stride=2,
bias=False,
dimension=D)
output = conv_tr(input)
print('\nInput:')
print_sparse_tensor(input)
print('Convolution Transpose Output:')
print_sparse_tensor(output)
def conv_on_coords():
in_channels, out_channels, D = 2, 3, 2
coords, feats, labels = data_loader(in_channels, batch_size=1)
# Create input with tensor stride == 4
strided_coords4, tensor_stride4 = get_random_coords(tensor_stride=4)
strided_coords2, tensor_stride2 = get_random_coords(tensor_stride=2)
input = ME.SparseTensor(
features=torch.rand(len(strided_coords4), in_channels), #
coordinates=strided_coords4,
tensor_stride=tensor_stride4)
cm = input.coordinate_manager
# Convolution transpose and generate new coordinates
conv_tr = ME.MinkowskiConvolutionTranspose(
in_channels,
out_channels,
kernel_size=3,
stride=2,
bias=False,
dimension=D)
pool_tr = ME.MinkowskiPoolingTranspose(
kernel_size=2,
stride=2,
dimension=D)
# If the there is no coordinates defined for the tensor stride, it will create one
# tensor stride 4 -> conv_tr with stride 2 -> tensor stride 2
output1 = conv_tr(input)
# output1 = pool_tr(input)
# convolution on the specified coords
output2 = conv_tr(input, coords)
# output2 = pool_tr(input, coords)
# convolution on the specified coords with tensor stride == 2
coords_key, _ = cm.insert_and_map(strided_coords2, tensor_stride=2)
output3 = conv_tr(input, coords_key)
# output3 = pool_tr(input, coords_key)
# convolution on the coordinates of a sparse tensor
output4 = conv_tr(input, output1)
# output4 = pool_tr(input, output1)
if __name__ == '__main__':
conv()
conv_on_coords()