camenduru's picture
ceres-solver and colmap
2b5a2b6
// Copyright (c) 2022, ETH Zurich and UNC Chapel Hill.
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// * Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// * Neither the name of ETH Zurich and UNC Chapel Hill nor the names of
// its contributors may be used to endorse or promote products derived
// from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// Author: Johannes L. Schoenberger (jsch-at-demuc-dot-de)
#ifndef COLMAP_SRC_MVS_CUDA_ROTATE_H_
#define COLMAP_SRC_MVS_CUDA_ROTATE_H_
#include <cuda_runtime.h>
namespace colmap {
namespace mvs {
// Rotate the input matrix by 90 degrees in counter-clockwise direction.
template <typename T>
void CudaRotate(const T* input, T* output, const int width, const int height,
const int pitch_input, const int pitch_output);
////////////////////////////////////////////////////////////////////////////////
// Implementation
////////////////////////////////////////////////////////////////////////////////
#ifdef __CUDACC__
#define TILE_DIM_ROTATE 32
namespace internal {
template <typename T>
__global__ void CudaRotateKernel(T* output_data, const T* input_data,
const int width, const int height,
const int input_pitch,
const int output_pitch) {
int input_x = blockDim.x * blockIdx.x + threadIdx.x;
int input_y = blockDim.y * blockIdx.y + threadIdx.y;
if (input_x >= width || input_y >= height) {
return;
}
int output_x = input_y;
int output_y = width - 1 - input_x;
*((T*)((char*)output_data + output_y * output_pitch) + output_x) =
*((T*)((char*)input_data + input_y * input_pitch) + input_x);
}
} // namespace internal
template <typename T>
void CudaRotate(const T* input, T* output, const int width, const int height,
const int pitch_input, const int pitch_output) {
dim3 block_dim(TILE_DIM_ROTATE, 1, 1);
dim3 grid_dim;
grid_dim.x = (width - 1) / TILE_DIM_ROTATE + 1;
grid_dim.y = height;
internal::CudaRotateKernel<<<grid_dim, block_dim>>>(
output, input, width, height, pitch_input, pitch_output);
}
#undef TILE_DIM_ROTATE
#endif // __CUDACC__
} // namespace mvs
} // namespace colmap
#endif // COLMAP_SRC_MVS_CUDA_ROTATE_H_