Merge pull request #2619 from akashsharma02:submap

[GSoC] Add Submaps and PoseGraph optimization for Large Scale Depth Fusion * - Add HashTSDF class - Implement Integrate function (untested) * Integration seems to be working, raycasting does not * Update integration code * Integration and Raycasting fixes, (both work now) * - Format code - Clean up comments and few fixes * Add Kinect Fusion backup file * - Add interpolation for vertices and normals (slow and unreliable!) - Format code - Delete kinfu_back.cpp * Bug fix for integration and noisy odometry * - Create volume abstract class - Address Review comments * - Add getPoints and getNormals function - Fix formatting according to comments - Move volume abstract class to include/opencv2/rgbd/ - Write factory method for creating TSDFVolumes - Small bug fixes - Minor fixes according to comments * - Add tests for hashTSDF - Fix raycasting bug causing to loop forever - Suppress warnings by explicit conversion - Disable hashTsdf test until we figure out memory leak - style changes - Add missing license in a few files, correct precomp.hpp usage * - Use CRTP based static polymorphism to choose between CPU and GPU for HashTSDF volume * Create submap and submapMgr Implement overlap_ratio check to create new submaps * Early draft of posegraph and submaps (Doesn't even compile) * Minor cleanup (no compilation) * Track all submaps (no posegraph update yet) * Return inliers from ICP for weighting the constraints (Huber threshold based inliers pending) * Add updating constraints between submaps and retain same current map * Fix constraints creation between submaps and allow for switching between submaps * - Fix bug in allocate volumeUnits - Simplify calculation of visibleBlocks * Remove inlier calculation in fast_icp (not required) * Modify readFile to allow reading other datasets easily * - Implement posegraph update, Gauss newton is unstable - Minor changes to Gauss newton and Sparse matrix. 
Residual still increases slightly over iterations * Implement simplified levenberg marquardt * Bug fixes for Levenberg Marquardt and minor changes * minor changes * Fixes, but Optimizer is still not well behaved * Working Ceres optimizer * - Reorganize IO code for samples in a separate file - Minor fix for Ceres preprocessor definition - Remove unused generatorJacobian, will be used for opencv implementation of levenberg marquardt - Doxygen docs fix - Minor preprocessor fixes * - Reorganize IO code for samples in a separate file - Minor fix for Ceres preprocessor definition - Remove unused generatorJacobian, will be used for opencv implementation of levenberg marquardt - Doxygen docs fix - Minor preprocessor fixes - Move inline functions to header, and make function params const references * - Add Python bindings for volume struct - Remove makeVolume(const VolumeParams&) Python binding due to compilation issues - Minor changes according to comments * - Remove dynafu::Params() since it is identical to kinfu::Params() - Use common functions for dynafu_demo - Suppress "unreachable code" in volume.cpp * Minor API changes * Minor * Remove CRTP for HashTSDF class * Bug fixes for HashTSDF integration
2025-10-22 07:31:26 +08:00 · 2020-10-13 15:19:15 -04:00
parent ef0c722f56
commit 7022f4e3e0
25 changed files with 2655 additions and 845 deletions
--- a/modules/rgbd/samples/io_utils.hpp
+++ b/modules/rgbd/samples/io_utils.hpp
@@ -0,0 +1,313 @@
+// This file is part of OpenCV project.
+// It is subject to the license terms in the LICENSE file found in the top-level directory
+// of this distribution and at http://opencv.org/license.html
+
+#ifndef OPENCV_RGBS_IO_UTILS_HPP
+#define OPENCV_RGBS_IO_UTILS_HPP
+
+#include <fstream>
+#include <iostream>
+#include <opencv2/calib3d.hpp>
+#include <opencv2/core.hpp>
+#include <opencv2/highgui.hpp>
+#include <opencv2/rgbd/kinfu.hpp>
+#include <opencv2/rgbd/large_kinfu.hpp>
+#include <sstream>
+#include <stdexcept>
+#include <string>
+#include <vector>
+
+namespace cv
+{
+namespace io_utils
+{
+
+/** @brief Reads a depth list file and returns the image paths it references.
+ *
+ * Each useful row has the form `<number> <relative image path>`. Empty rows and rows starting
+ * with '#' are ignored, as are rows from which a number and a path cannot both be parsed.
+ * Returned paths are prefixed with the directory part of @p fileList ("." when the path
+ * contains no directory separator).
+ *
+ * @param fileList path of the list file
+ * @return image paths in the order they appear in the list
+ * @throws std::runtime_error if the list file cannot be opened
+ */
+static std::vector<std::string> readDepth(const std::string& fileList)
+{
+    // Input-only stream: the list is never written here, so write access must not be required.
+    std::ifstream file(fileList);
+    if (!file.is_open())
+        throw std::runtime_error("Failed to read depth list");
+
+    // '/' takes precedence, '\\' is only consulted when no '/' is present.
+    size_t slashIdx = fileList.rfind('/');
+    if (slashIdx == std::string::npos)
+        slashIdx = fileList.rfind('\\');
+    // Without any separator the list lives in the current directory; substr(0, npos) would
+    // otherwise turn the list's own file name into the "directory".
+    const std::string dir = slashIdx != std::string::npos ? fileList.substr(0, slashIdx) : ".";
+
+    std::vector<std::string> paths;
+    std::string line;
+    // Loop on the read itself so that any stream failure ends the loop, not only EOF.
+    while (std::getline(file, line))
+    {
+        if (line.empty() || line[0] == '#')
+            continue;
+
+        std::istringstream fields(line);
+        double leadingNumber;  // first column of the row, parsed but not used
+        std::string imgPath;
+        // Skip malformed rows instead of emitting a bare "dir/" entry.
+        if (!(fields >> leadingNumber >> imgPath))
+            continue;
+
+        paths.push_back(dir + '/' + imgPath);
+    }
+
+    return paths;
+}
+
+/** @brief Saves depth frames as numbered PNG files and records them in a list file.
+ *
+ * The list file is opened for writing on construction and receives two '#' header lines.
+ * Every append() writes one image next to the list file and adds one `<index> <file name>`
+ * row to the list.
+ */
+struct DepthWriter
+{
+    /** @brief Opens the list file and writes its header.
+     *
+     * @param fileList path of the list file; images are stored in its directory
+     * @throws std::runtime_error if the list file cannot be opened for writing
+     */
+    DepthWriter(std::string fileList) : file(fileList, std::ios::out), count(0), dir()
+    {
+        // '/' takes precedence, '\\' is only consulted when no '/' is present.
+        size_t slashIdx = fileList.rfind('/');
+        if (slashIdx == std::string::npos)
+            slashIdx = fileList.rfind('\\');
+        // Without any separator the images go to the current directory; substr(0, npos)
+        // would otherwise use the list's own file name as the output directory.
+        dir = slashIdx != std::string::npos ? fileList.substr(0, slashIdx) : ".";
+
+        if (!file.is_open())
+            throw std::runtime_error("Failed to write depth list");
+
+        file << "# depth maps saved from device" << std::endl;
+        file << "# useless_number filename" << std::endl;
+    }
+
+    /** @brief Writes one depth frame to disk and registers it in the list file.
+     *
+     * @param _depth frame to store; it is passed to imwrite() unchanged
+     * @throws std::runtime_error if the image cannot be written
+     */
+    void append(InputArray _depth)
+    {
+        Mat depth                  = _depth.getMat();
+        std::string depthFname     = cv::format("%04d.png", count);
+        std::string fullDepthFname = dir + '/' + depthFname;
+        if (!imwrite(fullDepthFname, depth))
+            throw std::runtime_error("Failed to write depth to file " + fullDepthFname);
+        // The counter only advances after a successful write, so indices stay contiguous.
+        file << count++ << " " << depthFname << std::endl;
+    }
+
+    std::fstream file;  // list file being written
+    int count;          // index of the next frame
+    std::string dir;    // directory that receives the images
+};
+
+// Hard-coded Kinect 2 depth camera parameters used by DepthSource.
+namespace Kinect2Params
+{
+// size of the depth frame region that is kept
+static const Size frameSize(512, 424);
+
+// approximate values, no guarantee to be correct
+// focal length (used for both fx and fy) and principal point
+static const float focal = 366.1f;
+static const float cx    = 258.2f;
+static const float cy    = 204.f;
+// distortion coefficients, stored at indices 0, 1 and 4 of the coefficient vector
+static const float k1 = 0.12f;
+static const float k2 = -0.34f;
+static const float k3 = 0.12f;
+}  // namespace Kinect2Params
+
+/** @brief Supplies depth frames either from a list of image files or from a capture device.
+ *
+ * When a non-negative camera index is given, an OpenNI2 capture is tried first and a RealSense
+ * capture second. Whenever no capture is open, frames are read from the file list instead.
+ */
+struct DepthSource
+{
+   public:
+    enum Type
+    {
+        DEPTH_LIST,
+        DEPTH_KINECT2_LIST,
+        DEPTH_KINECT2,
+        DEPTH_REALSENSE
+    };
+
+    /** @brief Uses camera number @p cam and no file list. */
+    DepthSource(int cam) : DepthSource("", cam) {}
+
+    /** @brief Uses the list file @p fileListName and no camera. */
+    DepthSource(String fileListName) : DepthSource(fileListName, -1) {}
+
+    /** @brief Loads the file list (if any) and tries to open the camera (if requested).
+     *
+     * @param fileListName path of a depth list file, or an empty string for none
+     * @param cam camera index; a negative value means "do not open a camera"
+     * @throws std::runtime_error if a non-empty @p fileListName cannot be read
+     */
+    DepthSource(String fileListName, int cam)
+        : depthFileList(fileListName.empty() ? std::vector<std::string>()
+                                             : readDepth(fileListName)),
+          frameIdx(0),
+          vc(),
+          undistortMap1(),
+          undistortMap2(),
+          sourceType(Type::DEPTH_KINECT2_LIST)
+    {
+        // sourceType starts with the file-list value so that it is never left indeterminate
+        // when a camera was requested but neither backend could open it.
+        if (cam < 0)
+            return;
+
+        vc = VideoCapture(VideoCaptureAPIs::CAP_OPENNI2 + cam);
+        if (vc.isOpened())
+        {
+            sourceType = Type::DEPTH_KINECT2;
+            return;
+        }
+
+        vc = VideoCapture(VideoCaptureAPIs::CAP_REALSENSE + cam);
+        if (vc.isOpened())
+            sourceType = Type::DEPTH_REALSENSE;
+    }
+
+    /** @brief Returns the next depth frame.
+     *
+     * @return the next frame, or an empty UMat once the file list is exhausted
+     * @throws std::runtime_error if a frame was expected but turned out empty
+     */
+    UMat getDepth()
+    {
+        UMat out;
+        if (!vc.isOpened())
+        {
+            if (frameIdx < depthFileList.size())
+            {
+                Mat f = cv::imread(depthFileList[frameIdx++], IMREAD_ANYDEPTH);
+                f.copyTo(out);
+            }
+            else
+            {
+                return UMat();
+            }
+        }
+        else
+        {
+            vc.grab();
+            switch (sourceType)
+            {
+                case Type::DEPTH_KINECT2: vc.retrieve(out, CAP_OPENNI_DEPTH_MAP); break;
+                case Type::DEPTH_REALSENSE: vc.retrieve(out, CAP_INTELPERC_DEPTH_MAP); break;
+                default:
+                    // unknown depth source
+                    vc.retrieve(out);
+            }
+
+            // workaround for Kinect 2
+            if (sourceType == Type::DEPTH_KINECT2)
+            {
+                out = out(Rect(Point(), Kinect2Params::frameSize));
+
+                UMat outCopy;
+                // linear remap adds gradient between valid and invalid pixels
+                // which causes garbage, use nearest instead
+                // NOTE(review): the undistort maps are only filled by updateParams();
+                // presumably it must be called before the first Kinect 2 frame - confirm.
+                remap(out, outCopy, undistortMap1, undistortMap2, cv::INTER_NEAREST);
+
+                cv::flip(outCopy, out, 1);
+            }
+        }
+        if (out.empty())
+            throw std::runtime_error("Matrix is empty");
+        return out;
+    }
+
+    /** @brief True when there is neither a file list nor an opened capture device. */
+    bool empty() const { return depthFileList.empty() && !(vc.isOpened()); }
+
+    /** @brief Fills camera intrinsics, frame size and depth factor from the opened device.
+     *
+     * Does nothing (outputs untouched) when no capture device is open.
+     */
+    void updateIntrinsics(Matx33f& _intrinsics, Size& _frameSize, float& _depthFactor)
+    {
+        if (!vc.isOpened())
+            return;
+
+        // this should be set according to the user's depth sensor
+        const int w = (int)vc.get(VideoCaptureProperties::CAP_PROP_FRAME_WIDTH);
+        const int h = (int)vc.get(VideoCaptureProperties::CAP_PROP_FRAME_HEIGHT);
+
+        // it's recommended to calibrate the sensor to obtain its intrinsics
+        float fx, fy, cx, cy;
+        float depthFactor = 1000.f;
+        Size frameSize;
+        if (sourceType == Type::DEPTH_KINECT2)
+        {
+            fx = fy = Kinect2Params::focal;
+            cx      = Kinect2Params::cx;
+            cy      = Kinect2Params::cy;
+
+            frameSize = Kinect2Params::frameSize;
+        }
+        else
+        {
+            if (sourceType == Type::DEPTH_REALSENSE)
+            {
+                fx          = (float)vc.get(CAP_PROP_INTELPERC_DEPTH_FOCAL_LENGTH_HORZ);
+                fy          = (float)vc.get(CAP_PROP_INTELPERC_DEPTH_FOCAL_LENGTH_VERT);
+                depthFactor = 1.f / (float)vc.get(CAP_PROP_INTELPERC_DEPTH_SATURATION_VALUE);
+            }
+            else
+            {
+                fx = fy =
+                    (float)vc.get(CAP_OPENNI_DEPTH_GENERATOR | CAP_PROP_OPENNI_FOCAL_LENGTH);
+            }
+
+            // principal point is placed at the frame centre (integer halves, as before)
+            cx = w / 2 - 0.5f;
+            cy = h / 2 - 0.5f;
+
+            frameSize = Size(w, h);
+        }
+
+        _intrinsics  = Matx33f(fx, 0, cx, 0, fy, cy, 0, 0, 1);
+        _frameSize   = frameSize;
+        _depthFactor = depthFactor;
+    }
+
+    /** @brief Adjusts volume-related parameters for the current source type.
+     *
+     * @p _volumePose and @p _depthTruncateThreshold are always overwritten;
+     * @p _voxelSize and @p _tsdfTruncDist are only changed for a RealSense source.
+     */
+    void updateVolumeParams(const Vec3i& _resolution, float& _voxelSize, float& _tsdfTruncDist,
+                            Affine3f& _volumePose, float& _depthTruncateThreshold)
+    {
+        float volumeSize        = 3.0f;
+        _depthTruncateThreshold = 0.0f;
+        // RealSense has shorter depth range, some params should be tuned
+        if (sourceType == Type::DEPTH_REALSENSE)
+        {
+            volumeSize              = 1.f;
+            _voxelSize              = volumeSize / _resolution[0];
+            _tsdfTruncDist          = 0.01f;
+            _depthTruncateThreshold = 2.5f;
+        }
+        _volumePose = Affine3f().translate(Vec3f(-volumeSize / 2.f, -volumeSize / 2.f, 0.05f));
+    }
+
+    /** @brief Sets the ICP distance threshold and bilateral depth sigma for the source type. */
+    void updateICPParams(float& _icpDistThresh, float& _bilateralSigmaDepth)
+    {
+        _icpDistThresh       = 0.1f;
+        _bilateralSigmaDepth = 0.04f;
+        // RealSense has shorter depth range, some params should be tuned
+        if (sourceType == Type::DEPTH_REALSENSE)
+        {
+            _icpDistThresh       = 0.01f;
+            _bilateralSigmaDepth = 0.01f;
+        }
+    }
+
+    /** @brief Updates large_kinfu parameters from the opened device; no-op without one. */
+    void updateParams(large_kinfu::Params& params)
+    {
+        if (!vc.isOpened())
+            return;
+
+        updateIntrinsics(params.intr, params.frameSize, params.depthFactor);
+        updateVolumeParams(params.volumeParams.resolution, params.volumeParams.voxelSize,
+                           params.volumeParams.tsdfTruncDist, params.volumeParams.pose,
+                           params.truncateThreshold);
+        updateICPParams(params.icpDistThresh, params.bilateral_sigma_depth);
+
+        if (sourceType == Type::DEPTH_KINECT2)
+            initKinect2UndistortMaps(params.intr, params.frameSize);
+    }
+
+    /** @brief Updates kinfu parameters from the opened device; no-op without one. */
+    void updateParams(kinfu::Params& params)
+    {
+        if (!vc.isOpened())
+            return;
+
+        updateIntrinsics(params.intr, params.frameSize, params.depthFactor);
+        updateVolumeParams(params.volumeDims, params.voxelSize, params.tsdf_trunc_dist,
+                           params.volumePose, params.truncateThreshold);
+        updateICPParams(params.icpDistThresh, params.bilateral_sigma_depth);
+
+        if (sourceType == Type::DEPTH_KINECT2)
+            initKinect2UndistortMaps(params.intr, params.frameSize);
+    }
+
+    std::vector<std::string> depthFileList;  // image paths read from the list file
+    size_t frameIdx;                         // index of the next file to read
+    VideoCapture vc;                         // capture device, unopened in file-list mode
+    UMat undistortMap1, undistortMap2;       // Kinect 2 undistortion maps used by getDepth()
+    Type sourceType;                         // kind of source selected by the constructor
+
+   private:
+    // Builds the Kinect 2 undistortion maps shared by both updateParams() overloads.
+    void initKinect2UndistortMaps(const Matx33f& intr, const Size& frameSize)
+    {
+        Matx<float, 1, 5> distCoeffs;
+        distCoeffs(0) = Kinect2Params::k1;
+        distCoeffs(1) = Kinect2Params::k2;
+        distCoeffs(4) = Kinect2Params::k3;
+
+        initUndistortRectifyMap(intr, distCoeffs, cv::noArray(), intr, frameSize, CV_16SC2,
+                                undistortMap1, undistortMap2);
+    }
+};
+}  // namespace io_utils
+
+}  // namespace cv
+#endif /* ifndef OPENCV_RGBS_IO_UTILS_HPP */