cpp_api/api/cloudViewer_2t_2pipelines_2kernel_2Registration_8cpp_source.html

 // ----------------------------------------------------------------------------

 // -                        CloudViewer: www.cloudViewer.org                  -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2024 www.cloudViewer.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #include "cloudViewer/t/pipelines/kernel/Registration.h"


 #include "cloudViewer/core/Dispatch.h"

 #include "cloudViewer/core/TensorCheck.h"

 #include "cloudViewer/t/pipelines/kernel/RegistrationImpl.h"


 namespace cloudViewer {

 namespace t {

 namespace pipelines {

 namespace kernel {


 // Computes the pose for the point-to-plane registration method by handing the
 // inputs to the CPU or CUDA kernel that matches the device of source_points.
 //
 // The device and dtype forwarded to the kernel are both read from
 // source_points. Every input tensor is passed to the kernel in contiguous
 // form. The returned tensor has shape {6} and dtype Float64 and is allocated
 // on the device of source_points; the kernel fills it through the reference
 // it receives.
 core::Tensor ComputePosePointToPlane(const core::Tensor &source_points,
                                      const core::Tensor &target_points,
                                      const core::Tensor &target_normals,
                                      const core::Tensor &correspondence_indices,
                                      const registration::RobustKernel &kernel) {
     const core::Device device = source_points.GetDevice();
     const core::Dtype dtype = source_points.GetDtype();

     // Scalars written by the kernel; this function only logs them.
     int inlier_count = 0;
     float residual = 0;

     // [Output] pose tensor of shape {6}.
     core::Tensor pose = core::Tensor::Empty({6}, core::Float64, device);

     if (source_points.IsCUDA()) {
         // Keep the device of the inputs selected while the kernel runs.
         core::CUDAScopedDevice scoped_device(device);
         CUDA_CALL(ComputePosePointToPlaneCUDA, source_points.Contiguous(),
                   target_points.Contiguous(), target_normals.Contiguous(),
                   correspondence_indices.Contiguous(), pose, residual,
                   inlier_count, dtype, device, kernel);
     } else if (source_points.IsCPU()) {
         const core::Tensor source = source_points.Contiguous();
         const core::Tensor target = target_points.Contiguous();
         const core::Tensor normals = target_normals.Contiguous();
         const core::Tensor correspondences =
                 correspondence_indices.Contiguous();
         ComputePosePointToPlaneCPU(source, target, normals, correspondences,
                                    pose, residual, inlier_count, dtype,
                                    device, kernel);
     } else {
         utility::LogError("Unimplemented device.");
     }

     utility::LogDebug("PointToPlane Transform: residual {}, inlier_count {}",
                       residual, inlier_count);

     return pose;
 }


 // Computes the pose for the colored-ICP registration method by dispatching to
 // the CPU or CUDA kernel that matches the device of source_points.
 //
 // The device and dtype forwarded to the kernel are both read from
 // source_points. Every input tensor is passed to the kernel in contiguous
 // form, and kernel / lambda_geometric are forwarded unchanged. The returned
 // tensor has shape {6} and dtype Float64 and lives on the device of
 // source_points; the kernel fills it through the reference it receives.
 core::Tensor ComputePoseColoredICP(const core::Tensor &source_points,
                                    const core::Tensor &source_colors,
                                    const core::Tensor &target_points,
                                    const core::Tensor &target_normals,
                                    const core::Tensor &target_colors,
                                    const core::Tensor &target_color_gradients,
                                    const core::Tensor &correspondence_indices,
                                    const registration::RobustKernel &kernel,
                                    const double &lambda_geometric) {
     const core::Device device = source_points.GetDevice();

     // Pose {6,} tensor [output].
     core::Tensor pose = core::Tensor::Empty({6}, core::Dtype::Float64, device);

     // Written by the kernel; only used for the debug log below.
     float residual = 0;
     int inlier_count = 0;

     if (source_points.IsCPU()) {
         ComputePoseColoredICPCPU(
                 source_points.Contiguous(), source_colors.Contiguous(),
                 target_points.Contiguous(), target_normals.Contiguous(),
                 target_colors.Contiguous(), target_color_gradients.Contiguous(),
                 correspondence_indices.Contiguous(), pose, residual,
                 inlier_count, source_points.GetDtype(), device, kernel,
                 lambda_geometric);
     } else if (source_points.IsCUDA()) {
         // Keep the device of the inputs selected while the kernel runs.
         core::CUDAScopedDevice scoped_device(source_points.GetDevice());
         CUDA_CALL(ComputePoseColoredICPCUDA, source_points.Contiguous(),
                   source_colors.Contiguous(), target_points.Contiguous(),
                   target_normals.Contiguous(), target_colors.Contiguous(),
                   target_color_gradients.Contiguous(),
                   correspondence_indices.Contiguous(), pose, residual,
                   inlier_count, source_points.GetDtype(), device, kernel,
                   lambda_geometric);
     } else {
         utility::LogError("Unimplemented device.");
     }

     // Label the log line with this method's name so it cannot be mistaken
     // for output of ComputePosePointToPlane.
     utility::LogDebug("ColoredICP Transform: residual {}, inlier_count {}",
                       residual, inlier_count);

     return pose;
 }


 // Computes the pose for the DopplerICP registration method.
 //
 // Before dispatching to the CPU or CUDA kernel this function:
 //  - picks, per term, either the caller's robust kernel or a plain L2 loss
 //    depending on whether `iteration` has reached the matching
 //    *_robust_loss_min_iteration threshold;
 //  - enables outlier rejection only when reject_dynamic_outliers is set and
 //    `iteration` has reached outlier_rejection_min_iteration;
 //  - derives the rotation / translation terms from
 //    transform_vehicle_to_sensor and the velocity terms from
 //    current_transform and `period`.
 //
 // The device and dtype used for the derived tensors and forwarded to the
 // kernel are read from source_points. The returned tensor has shape {6} and
 // dtype Float64 and lives on the device of source_points.
 core::Tensor ComputePoseDopplerICP(
         const core::Tensor &source_points,
         const core::Tensor &source_dopplers,
         const core::Tensor &source_directions,
         const core::Tensor &target_points,
         const core::Tensor &target_normals,
         const core::Tensor &correspondence_indices,
         const core::Tensor &current_transform,
         const core::Tensor &transform_vehicle_to_sensor,
         const std::size_t iteration,
         const double period,
         const double lambda_doppler,
         const bool reject_dynamic_outliers,
         const double doppler_outlier_threshold,
         const std::size_t outlier_rejection_min_iteration,
         const std::size_t geometric_robust_loss_min_iteration,
         const std::size_t doppler_robust_loss_min_iteration,
         const registration::RobustKernel &geometric_kernel,
         const registration::RobustKernel &doppler_kernel) {
     const core::Device device = source_points.GetDevice();
     const core::Dtype dtype = source_points.GetDtype();

     // Pose {6,} tensor [output].
     core::Tensor output_pose =
             core::Tensor::Empty({6}, core::Dtype::Float64, device);

     // Written by the kernel; only used for the debug log below.
     float residual = 0;
     int inlier_count = 0;

     // Use robust kernels only after a specified minimum number of iterations.
     const auto kernel_default = registration::RobustKernel(
             registration::RobustKernelMethod::L2Loss, 1.0, 1.0);
     const auto kernel_geometric =
             (iteration >= geometric_robust_loss_min_iteration)
                     ? geometric_kernel
                     : kernel_default;
     const auto kernel_doppler = (iteration >= doppler_robust_loss_min_iteration)
                                         ? doppler_kernel
                                         : kernel_default;

     // Enable outlier rejection based on the current iteration count.
     const bool reject_outliers = reject_dynamic_outliers &&
                                  (iteration >= outlier_rejection_min_iteration);

     // Extract the rotation and translation parts from the matrix.
     // Rotation: inverse of the top-left 3x3 block, flattened.
     const core::Tensor R_S_to_V =
             transform_vehicle_to_sensor
                     .GetItem({core::TensorKey::Slice(0, 3, 1),
                               core::TensorKey::Slice(0, 3, 1)})
                     .Inverse()
                     .Flatten()
                     .To(device, dtype);
     // Translation: rows 0..2 of column 3, flattened.
     const core::Tensor r_v_to_s_in_V =
             transform_vehicle_to_sensor
                     .GetItem({core::TensorKey::Slice(0, 3, 1),
                               core::TensorKey::Slice(3, 4, 1)})
                     .Flatten()
                     .To(device, dtype);

     // Compute the pose (rotation + translation) vector.
     const core::Tensor state_vector =
             pipelines::kernel::TransformationToPose(current_transform)
                     .To(device, dtype);

     // Compute the linear and angular velocity from the pose vector:
     // the negated pose components divided by the period.
     const core::Tensor w_v_in_V =
             (state_vector.GetItem(core::TensorKey::Slice(0, 3, 1)).Neg() /
              period)
                     .To(device, dtype);
     const core::Tensor v_v_in_V =
             (state_vector.GetItem(core::TensorKey::Slice(3, 6, 1)).Neg() /
              period)
                     .To(device, dtype);

     core::Device::DeviceType device_type = device.GetType();
     if (device_type == core::Device::DeviceType::CPU) {
         ComputePoseDopplerICPCPU(
                 source_points.Contiguous(), source_dopplers.Contiguous(),
                 source_directions.Contiguous(), target_points.Contiguous(),
                 target_normals.Contiguous(),
                 correspondence_indices.Contiguous(), output_pose, residual,
                 inlier_count, dtype, device, R_S_to_V.Contiguous(),
                 r_v_to_s_in_V.Contiguous(), w_v_in_V.Contiguous(),
                 v_v_in_V.Contiguous(), period, reject_outliers,
                 doppler_outlier_threshold, kernel_geometric, kernel_doppler,
                 lambda_doppler);
     } else if (device_type == core::Device::DeviceType::CUDA) {
         // Select the device that owns the inputs for the duration of the
         // kernel call, as the other CUDA dispatches in this file do.
         core::CUDAScopedDevice scoped_device(device);
         CUDA_CALL(ComputePoseDopplerICPCUDA, source_points.Contiguous(),
                   source_dopplers.Contiguous(), source_directions.Contiguous(),
                   target_points.Contiguous(), target_normals.Contiguous(),
                   correspondence_indices.Contiguous(), output_pose, residual,
                   inlier_count, dtype, device, R_S_to_V.Contiguous(),
                   r_v_to_s_in_V.Contiguous(), w_v_in_V.Contiguous(),
                   v_v_in_V.Contiguous(), period, reject_outliers,
                   doppler_outlier_threshold, kernel_geometric, kernel_doppler,
                   lambda_doppler);
     } else {
         utility::LogError("Unimplemented device.");
     }

     utility::LogDebug(
             "DopplerPointToPlane Transform: residual {}, inlier_count {}",
             residual, inlier_count);

     return output_pose;
 }


 // Computes (R) Rotation {3,3} and (t) translation {3,} for the point-to-point
 // registration method.
 //
 // On CPU the work is delegated to ComputeRtPointToPointCPU. On CUDA the
 // correspondences are gathered with tensor operations on the device, and the
 // 3x3 system is then solved on CPU:0 in Float64 via SVD.
 //
 // An entry of -1 in correspondence_indices is treated as "no correspondence"
 // and skipped. An error is logged when no usable correspondence remains.
 std::tuple<core::Tensor, core::Tensor> ComputeRtPointToPoint(
         const core::Tensor &source_points,
         const core::Tensor &target_points,
         const core::Tensor &correspondence_indices) {
     const core::Device device = source_points.GetDevice();

     // [Output] Rotation and translation tensor of type Float64.
     core::Tensor R, t;

     int inlier_count = 0;

     if (source_points.IsCPU()) {
         // Pointer to point cloud data - indexed according to correspondences.
         ComputeRtPointToPointCPU(
                 source_points.Contiguous(), target_points.Contiguous(),
                 correspondence_indices.Contiguous(), R, t, inlier_count,
                 source_points.GetDtype(), device);
     } else if (source_points.IsCUDA()) {
 #ifdef BUILD_CUDA_MODULE
         core::CUDAScopedDevice scoped_device(source_points.GetDevice());
         // TODO: Implement optimized CUDA reduction kernel.
         // Flat boolean mask: true where a correspondence exists.
         core::Tensor valid = correspondence_indices.Ne(-1).Reshape({-1});
         // correspondence_set : (i, corres[i]).

         // The mask has one entry per input row, so this only catches an
         // empty correspondence tensor.
         if (valid.GetLength() == 0) {
             utility::LogError("No valid correspondence present.");
         }

         // source[i] and target[corres[i]] is a correspondence.
         core::Tensor source_indices =
                 core::Tensor::Arange(0, source_points.GetShape()[0], 1,
                                      core::Int64, device)
                         .IndexGet({valid});

         // Number of good correspondences (C).
         inlier_count = static_cast<int>(source_indices.GetLength());

         // A non-empty mask can still select nothing (every entry is -1).
         // Without this check the means below are taken over empty
         // selections and Sxy is divided by zero.
         if (inlier_count == 0) {
             utility::LogError("No valid correspondence present.");
         }

         // Only take valid indices.
         core::Tensor target_indices =
                 correspondence_indices.IndexGet({valid}).Reshape({-1});

         core::Tensor source_select = source_points.IndexGet({source_indices});
         core::Tensor target_select = target_points.IndexGet({target_indices});

         // https://ieeexplore.ieee.org/document/88573
         core::Tensor mean_s = source_select.Mean({0}, true);
         core::Tensor mean_t = target_select.Mean({0}, true);

         // Compute linear system on CPU as Float64.
         core::Device host("CPU:0");
         core::Tensor Sxy = (target_select - mean_t)
                                    .T()
                                    .Matmul(source_select - mean_s)
                                    .Div_(static_cast<float>(inlier_count))
                                    .To(host, core::Float64);

         mean_s = mean_s.To(host, core::Float64);
         mean_t = mean_t.To(host, core::Float64);

         core::Tensor U, D, VT;
         std::tie(U, D, VT) = Sxy.SVD();
         core::Tensor S = core::Tensor::Eye(3, core::Float64, host);
         // Flip the sign of the last diagonal entry when det(U) * det(V) is
         // negative, so that R = U * S * VT is built with the corrected S.
         if (U.Det() * (VT.T()).Det() < 0) {
             S[-1][-1] = -1;
         }
         R = U.Matmul(S.Matmul(VT));
         t = mean_t.Reshape({-1}) - R.Matmul(mean_s.T()).Reshape({-1});
 #else
         utility::LogError("Not compiled with CUDA, but CUDA device is used.");
 #endif
     } else {
         utility::LogError("Unimplemented device.");
     }
     return std::make_tuple(R, t);
 }


 // Computes the information matrix from the target points and the
 // correspondence indices by dispatching to the CPU or CUDA kernel that
 // matches the device of target_points.
 //
 // The result has shape {6, 6} and dtype Float64 and is always allocated on
 // CPU:0, whichever device the inputs live on. The dtype and device forwarded
 // to the kernel are those of target_points.
 core::Tensor ComputeInformationMatrix(
         const core::Tensor &target_points,
         const core::Tensor &correspondence_indices) {
     const core::Device device = target_points.GetDevice();

     // [Output] The result buffer stays on the host.
     const core::Device host("CPU:0");
     core::Tensor information_matrix =
             core::Tensor::Empty({6, 6}, core::Float64, host);

     if (target_points.IsCUDA()) {
         // Keep the device of the inputs selected while the kernel runs.
         core::CUDAScopedDevice scoped_device(device);
         CUDA_CALL(ComputeInformationMatrixCUDA, target_points.Contiguous(),
                   correspondence_indices.Contiguous(), information_matrix,
                   target_points.GetDtype(), device);
     } else if (target_points.IsCPU()) {
         const core::Tensor points = target_points.Contiguous();
         const core::Tensor correspondences =
                 correspondence_indices.Contiguous();
         ComputeInformationMatrixCPU(points, correspondences,
                                     information_matrix,
                                     target_points.GetDtype(), device);
     } else {
         utility::LogError("Unimplemented device.");
     }

     return information_matrix;
 }


 }  // namespace kernel

 }  // namespace pipelines

 }  // namespace t

 }  // namespace cloudViewer

CUDA_CALL
#define CUDA_CALL(cuda_function,...)
Definition: CUDAUtils.h:49

Dispatch.h

RegistrationImpl.h

TensorCheck.h

cloudViewer::core::CUDAScopedDevice
When CUDA is not enabled, this is a dummy class.
Definition: CUDAUtils.h:214

cloudViewer::core::Device
Definition: Device.h:18

cloudViewer::core::Device::GetType
DeviceType GetType() const
Returns type of the device, e.g. DeviceType::CPU, DeviceType::CUDA.
Definition: Device.h:58

cloudViewer::core::Device::DeviceType
DeviceType
Type for device.
Definition: Device.h:21

cloudViewer::core::Device::DeviceType::CPU
@ CPU

cloudViewer::core::Device::DeviceType::CUDA
@ CUDA

cloudViewer::core::Dtype
Definition: Dtype.h:21

cloudViewer::core::Dtype::Float64
static const Dtype Float64
Definition: Dtype.h:25

cloudViewer::core::IsDevice::IsCUDA
bool IsCUDA() const
Definition: Device.h:99

cloudViewer::core::IsDevice::IsCPU
bool IsCPU() const
Definition: Device.h:95

cloudViewer::core::TensorKey::Slice
static TensorKey Slice(utility::optional< int64_t > start, utility::optional< int64_t > stop, utility::optional< int64_t > step)
Definition: TensorKey.cpp:138

cloudViewer::core::Tensor
Definition: Tensor.h:32

cloudViewer::core::Tensor::Det
double Det() const
Compute the determinant of a 2D square tensor.
Definition: Tensor.cpp:1092

cloudViewer::core::Tensor::Contiguous
Tensor Contiguous() const
Definition: Tensor.cpp:772

cloudViewer::core::Tensor::Matmul
Tensor Matmul(const Tensor &rhs) const
Definition: Tensor.cpp:1919

cloudViewer::core::Tensor::Neg
Tensor Neg() const
Element-wise negation of a tensor, returning a new tensor.
Definition: Tensor.cpp:1329

cloudViewer::core::Tensor::Arange
static Tensor Arange(const Scalar start, const Scalar stop, const Scalar step=1, const Dtype dtype=core::Int64, const Device &device=core::Device("CPU:0"))
Create a 1D tensor with evenly spaced values in the given interval.
Definition: Tensor.cpp:436

cloudViewer::core::Tensor::GetLength
int64_t GetLength() const
Definition: Tensor.h:1125

cloudViewer::core::Tensor::Ne
Tensor Ne(const Tensor &value) const
Element-wise not-equals-to of tensors, returning a new boolean tensor.
Definition: Tensor.cpp:1714

cloudViewer::core::Tensor::GetDtype
Dtype GetDtype() const
Definition: Tensor.h:1164

cloudViewer::core::Tensor::GetItem
Tensor GetItem(const TensorKey &tk) const
Definition: Tensor.cpp:473

cloudViewer::core::Tensor::Eye
static Tensor Eye(int64_t n, Dtype dtype, const Device &device)
Create an identity matrix of size n x n.
Definition: Tensor.cpp:418

cloudViewer::core::Tensor::IndexGet
Tensor IndexGet(const std::vector< Tensor > &index_tensors) const
Advanced indexing getter. This will always allocate a new Tensor.
Definition: Tensor.cpp:905

cloudViewer::core::Tensor::GetDevice
Device GetDevice() const override
Definition: Tensor.cpp:1435

cloudViewer::core::Tensor::Reshape
Tensor Reshape(const SizeVector &dst_shape) const
Definition: Tensor.cpp:671

cloudViewer::core::Tensor::Mean
Tensor Mean(const SizeVector &dims, bool keepdim=false) const
Definition: Tensor.cpp:1247

cloudViewer::core::Tensor::Empty
static Tensor Empty(const SizeVector &shape, Dtype dtype, const Device &device=Device("CPU:0"))
Create a tensor with uninitialized values.
Definition: Tensor.cpp:400

cloudViewer::core::Tensor::Div_
Tensor Div_(const Tensor &value)
Definition: Tensor.cpp:1225

cloudViewer::core::Tensor::GetShape
SizeVector GetShape() const
Definition: Tensor.h:1127

cloudViewer::core::Tensor::SVD
std::tuple< Tensor, Tensor, Tensor > SVD() const
Definition: Tensor.cpp:1990

cloudViewer::core::Tensor::T
Tensor T() const
Expects input to be <= 2-D Tensor by swapping dimension 0 and 1.
Definition: Tensor.cpp:1079

cloudViewer::core::Tensor::To
Tensor To(Dtype dtype, bool copy=false) const
Definition: Tensor.cpp:739

cloudViewer::t::pipelines::registration::RobustKernel
Definition: RobustKernel.h:58

LogError
#define LogError(...)
Definition: Logging.h:60

LogDebug
#define LogDebug(...)
Definition: Logging.h:90

cloudViewer::core::Int64
const Dtype Int64
Definition: Dtype.cpp:47

cloudViewer::core::Inverse
void Inverse(const Tensor &A, Tensor &output)
Computes A^{-1} with LU factorization, where A is a N x N square matrix.
Definition: Inverse.cpp:18

cloudViewer::core::Float64
const Dtype Float64
Definition: Dtype.cpp:43

cloudViewer::t::geometry::kernel::image::To
void To(const core::Tensor &src, core::Tensor &dst, double scale, double offset)
Definition: Image.cpp:17

cloudViewer::t::pipelines::kernel::ComputePoseColoredICPCPU
void ComputePoseColoredICPCPU(const core::Tensor &source_points, const core::Tensor &source_colors, const core::Tensor &target_points, const core::Tensor &target_normals, const core::Tensor &target_colors, const core::Tensor &target_color_gradients, const core::Tensor &correspondence_indices, core::Tensor &pose, float &residual, int &inlier_count, const core::Dtype &dtype, const core::Device &device, const registration::RobustKernel &kernel, const double &lambda_geometric)
Definition: RegistrationCPU.cpp:211

cloudViewer::t::pipelines::kernel::ComputePosePointToPlaneCPU
void ComputePosePointToPlaneCPU(const core::Tensor &source_points, const core::Tensor &target_points, const core::Tensor &target_normals, const core::Tensor &correspondence_indices, core::Tensor &pose, float &residual, int &inlier_count, const core::Dtype &dtype, const core::Device &device, const registration::RobustKernel &kernel)
Definition: RegistrationCPU.cpp:99

cloudViewer::t::pipelines::kernel::ComputeRtPointToPointCPU
void ComputeRtPointToPointCPU(const core::Tensor &source_points, const core::Tensor &target_points, const core::Tensor &corres, core::Tensor &R, core::Tensor &t, int &inlier_count, const core::Dtype &dtype, const core::Device &device)
Definition: RegistrationCPU.cpp:547

cloudViewer::t::pipelines::kernel::ComputePoseDopplerICP
core::Tensor ComputePoseDopplerICP(const core::Tensor &source_points, const core::Tensor &source_dopplers, const core::Tensor &source_directions, const core::Tensor &target_points, const core::Tensor &target_normals, const core::Tensor &correspondence_indices, const core::Tensor &current_transform, const core::Tensor &transform_vehicle_to_sensor, const std::size_t iteration, const double period, const double lambda_doppler, const bool reject_dynamic_outliers, const double doppler_outlier_threshold, const std::size_t outlier_rejection_min_iteration, const std::size_t geometric_robust_loss_min_iteration, const std::size_t doppler_robust_loss_min_iteration, const registration::RobustKernel &geometric_kernel, const registration::RobustKernel &doppler_kernel)
Computes pose for DopplerICP registration method.
Definition: Registration.cpp:98

cloudViewer::t::pipelines::kernel::ComputeRtPointToPoint
std::tuple< core::Tensor, core::Tensor > ComputeRtPointToPoint(const core::Tensor &source_points, const core::Tensor &target_points, const core::Tensor &correspondence_indices)
Computes (R) Rotation {3,3} and (t) translation {3,} for point to point registration method.
Definition: Registration.cpp:205

cloudViewer::t::pipelines::kernel::ComputePosePointToPlane
core::Tensor ComputePosePointToPlane(const core::Tensor &source_points, const core::Tensor &target_points, const core::Tensor &target_normals, const core::Tensor &correspondence_indices, const registration::RobustKernel &kernel)
Computes pose for point to plane registration method.
Definition: Registration.cpp:19

cloudViewer::t::pipelines::kernel::ComputePoseDopplerICPCPU
void ComputePoseDopplerICPCPU(const core::Tensor &source_points, const core::Tensor &source_dopplers, const core::Tensor &source_directions, const core::Tensor &target_points, const core::Tensor &target_normals, const core::Tensor &correspondence_indices, core::Tensor &output_pose, float &residual, int &inlier_count, const core::Dtype &dtype, const core::Device &device, const core::Tensor &R_S_to_V, const core::Tensor &r_v_to_s_in_V, const core::Tensor &w_v_in_V, const core::Tensor &v_v_in_V, const double period, const bool reject_dynamic_outliers, const double doppler_outlier_threshold, const registration::RobustKernel &kernel_geometric, const registration::RobustKernel &kernel_doppler, const double lambda_doppler)
Definition: RegistrationCPU.cpp:354

cloudViewer::t::pipelines::kernel::ComputeInformationMatrixCPU
void ComputeInformationMatrixCPU(const core::Tensor &target_points, const core::Tensor &correspondence_indices, core::Tensor &information_matrix, const core::Dtype &dtype, const core::Device &device)
Definition: RegistrationCPU.cpp:640

cloudViewer::t::pipelines::kernel::ComputeInformationMatrix
core::Tensor ComputeInformationMatrix(const core::Tensor &target_points, const core::Tensor &correspondence_indices)
Computes Information Matrix of shape {6, 6}, of dtype Float64 on device CPU:0, from the target point ...
Definition: Registration.cpp:280

cloudViewer::t::pipelines::kernel::ComputePoseColoredICP
core::Tensor ComputePoseColoredICP(const core::Tensor &source_points, const core::Tensor &source_colors, const core::Tensor &target_points, const core::Tensor &target_normals, const core::Tensor &target_colors, const core::Tensor &target_color_gradients, const core::Tensor &correspondence_indices, const registration::RobustKernel &kernel, const double &lambda_geometric)
Computes pose for colored-icp registration method.
Definition: Registration.cpp:54

cloudViewer::t::pipelines::kernel::TransformationToPose
core::Tensor TransformationToPose(const core::Tensor &transformation)
Convert transformation matrix to pose.
Definition: TransformationConverter.cpp:119

cloudViewer::t::pipelines::registration::RobustKernelMethod::L2Loss
@ L2Loss

cloudViewer
Generic file read and write utility for python interface.
Definition: AutoSegmentationTools.h:16

Registration.h