// Copyright (c) 2022, ETH Zurich and UNC Chapel Hill. // All rights reserved. // // Redistribution and use in source and binary forms, with or without // modification, are permitted provided that the following conditions are met: // // * Redistributions of source code must retain the above copyright // notice, this list of conditions and the following disclaimer. // // * Redistributions in binary form must reproduce the above copyright // notice, this list of conditions and the following disclaimer in the // documentation and/or other materials provided with the distribution. // // * Neither the name of ETH Zurich and UNC Chapel Hill nor the names of // its contributors may be used to endorse or promote products derived // from this software without specific prior written permission. // // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDERS OR CONTRIBUTORS BE // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE // POSSIBILITY OF SUCH DAMAGE. // // Author: Johannes L. Schoenberger (jsch-at-demuc-dot-de) #ifndef COLMAP_SRC_MVS_PATCH_MATCH_H_ #define COLMAP_SRC_MVS_PATCH_MATCH_H_ #include #include #include #include "mvs/depth_map.h" #include "mvs/image.h" #include "mvs/model.h" #include "mvs/normal_map.h" #ifndef __CUDACC__ #include "util/threading.h" #endif namespace colmap { namespace mvs { // Maximum possible window radius for the photometric consistency cost. This // value is equal to THREADS_PER_BLOCK in patch_match_cuda.cu and the limit // arises from the shared memory implementation. const static size_t kMaxPatchMatchWindowRadius = 32; class ConsistencyGraph; class PatchMatchCuda; class Workspace; struct PatchMatchOptions { // Maximum image size in either dimension. int max_image_size = -1; // Index of the GPU used for patch match. For multi-GPU usage, // you should separate multiple GPU indices by comma, e.g., "0,1,2,3". std::string gpu_index = "-1"; // Depth range in which to randomly sample depth hypotheses. double depth_min = -1.0f; double depth_max = -1.0f; // Half window size to compute NCC photo-consistency cost. int window_radius = 5; // Number of pixels to skip when computing NCC. For a value of 1, every // pixel is used to compute the NCC. For larger values, only every n-th row // and column is used and the computation speed thereby increases roughly by // a factor of window_step^2. Note that not all combinations of window sizes // and steps produce nice results, especially if the step is greather than 2. int window_step = 1; // Parameters for bilaterally weighted NCC. double sigma_spatial = -1; double sigma_color = 0.2f; // Number of random samples to draw in Monte Carlo sampling. int num_samples = 15; // Spread of the NCC likelihood function. double ncc_sigma = 0.6f; // Minimum triangulation angle in degrees. double min_triangulation_angle = 1.0f; // Spread of the incident angle likelihood function. double incident_angle_sigma = 0.9f; // Number of coordinate descent iterations. Each iteration consists // of four sweeps from left to right, top to bottom, and vice versa. int num_iterations = 5; // Whether to add a regularized geometric consistency term to the cost // function. If true, the `depth_maps` and `normal_maps` must not be null. bool geom_consistency = true; // The relative weight of the geometric consistency term w.r.t. to // the photo-consistency term. double geom_consistency_regularizer = 0.3f; // Maximum geometric consistency cost in terms of the forward-backward // reprojection error in pixels. double geom_consistency_max_cost = 3.0f; // Whether to enable filtering. bool filter = true; // Minimum NCC coefficient for pixel to be photo-consistent. double filter_min_ncc = 0.1f; // Minimum triangulation angle to be stable. double filter_min_triangulation_angle = 3.0f; // Minimum number of source images have to be consistent // for pixel not to be filtered. int filter_min_num_consistent = 2; // Maximum forward-backward reprojection error for pixel // to be geometrically consistent. double filter_geom_consistency_max_cost = 1.0f; // Cache size in gigabytes for patch match, which keeps the bitmaps, depth // maps, and normal maps of this number of images in memory. A higher value // leads to less disk access and faster computation, while a lower value // leads to reduced memory usage. Note that a single image can consume a lot // of memory, if the consistency graph is dense. double cache_size = 32.0; // Whether to tolerate missing images/maps in the problem setup bool allow_missing_files = false; // Whether to write the consistency graph. bool write_consistency_graph = false; void Print() const; bool Check() const { if (depth_min != -1.0f || depth_max != -1.0f) { CHECK_OPTION_LE(depth_min, depth_max); CHECK_OPTION_GE(depth_min, 0.0f); } CHECK_OPTION_LE(window_radius, static_cast(kMaxPatchMatchWindowRadius)); CHECK_OPTION_GT(sigma_color, 0.0f); CHECK_OPTION_GT(window_radius, 0); CHECK_OPTION_GT(window_step, 0); CHECK_OPTION_LE(window_step, 2); CHECK_OPTION_GT(num_samples, 0); CHECK_OPTION_GT(ncc_sigma, 0.0f); CHECK_OPTION_GE(min_triangulation_angle, 0.0f); CHECK_OPTION_LT(min_triangulation_angle, 180.0f); CHECK_OPTION_GT(incident_angle_sigma, 0.0f); CHECK_OPTION_GT(num_iterations, 0); CHECK_OPTION_GE(geom_consistency_regularizer, 0.0f); CHECK_OPTION_GE(geom_consistency_max_cost, 0.0f); CHECK_OPTION_GE(filter_min_ncc, -1.0f); CHECK_OPTION_LE(filter_min_ncc, 1.0f); CHECK_OPTION_GE(filter_min_triangulation_angle, 0.0f); CHECK_OPTION_LE(filter_min_triangulation_angle, 180.0f); CHECK_OPTION_GE(filter_min_num_consistent, 0); CHECK_OPTION_GE(filter_geom_consistency_max_cost, 0.0f); CHECK_OPTION_GT(cache_size, 0); return true; } }; // This is a wrapper class around the actual PatchMatchCuda implementation. This // class is necessary to hide Cuda code from any boost or Eigen code, since // NVCC/MSVC cannot compile complex C++ code. class PatchMatch { public: struct Problem { // Index of the reference image. int ref_image_idx = -1; // Indices of the source images. std::vector src_image_idxs; // Input images for the photometric consistency term. std::vector* images = nullptr; // Input depth maps for the geometric consistency term. std::vector* depth_maps = nullptr; // Input normal maps for the geometric consistency term. std::vector* normal_maps = nullptr; // Print the configuration to stdout. void Print() const; }; PatchMatch(const PatchMatchOptions& options, const Problem& problem); ~PatchMatch(); // Check the options and the problem for validity. void Check() const; // Run the patch match algorithm. void Run(); // Get the computed values after running the algorithm. DepthMap GetDepthMap() const; NormalMap GetNormalMap() const; ConsistencyGraph GetConsistencyGraph() const; Mat GetSelProbMap() const; private: const PatchMatchOptions options_; const Problem problem_; std::unique_ptr patch_match_cuda_; }; // This thread processes all problems in a workspace. A workspace has the // following file structure, if the workspace format is "COLMAP": // // images/* // sparse/{cameras.txt, images.txt, points3D.txt} // stereo/ // depth_maps/* // normal_maps/* // consistency_graphs/* // patch-match.cfg // // The `patch-match.cfg` file specifies the images to be processed as: // // image_name1.jpg // __all__ // image_name2.jpg // __auto__, 20 // image_name3.jpg // image_name1.jpg, image_name2.jpg // // Two consecutive lines specify the images used to compute one patch match // problem. The first line specifies the reference image and the second line the // source images. Image names are relative to the `images` directory. In this // example, the first reference image uses all other images as source images, // the second reference image uses the 20 most connected images as source // images, and the third reference image uses the first and second as source // images. Note that all specified images must be reconstructed in the COLMAP // reconstruction provided in the `sparse` folder. #ifndef __CUDACC__ class PatchMatchController : public Thread { public: PatchMatchController(const PatchMatchOptions& options, const std::string& workspace_path, const std::string& workspace_format, const std::string& pmvs_option_name, const std::string& config_path = ""); private: void Run(); void ReadWorkspace(); void ReadProblems(); void ReadGpuIndices(); void ProcessProblem(const PatchMatchOptions& options, const size_t problem_idx); const PatchMatchOptions options_; const std::string workspace_path_; const std::string workspace_format_; const std::string pmvs_option_name_; const std::string config_path_; std::unique_ptr thread_pool_; std::mutex workspace_mutex_; std::unique_ptr workspace_; std::vector problems_; std::vector gpu_indices_; std::vector> depth_ranges_; }; #endif } // namespace mvs } // namespace colmap #endif // COLMAP_SRC_MVS_PATCH_MATCH_H_