cpp_api/api/LeastSquares_8cpp_source.html

 // ----------------------------------------------------------------------------

 // -                        CloudViewer: www.cloudViewer.org                  -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2024 www.cloudViewer.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #include "cloudViewer/core/linalg/LeastSquares.h"


 #include <unordered_map>


 #include "cloudViewer/core/CUDAUtils.h"


 namespace cloudViewer {
 namespace core {

 /// \brief Solves the least-squares problem A X = B.
 ///
 /// The actual solve is delegated to a device-specific backend
 /// (LeastSquaresCPU / LeastSquaresCUDA / LeastSquaresSYCL); this function only
 /// validates the inputs, prepares working copies and extracts the result.
 ///
 /// \param A Coefficient tensor. Must be 2D with shape (m, n), dtype Float32 or
 /// Float64, m >= n, and no zero-sized dimension.
 /// \param B Right-hand side. Must be 1D with shape (m) or 2D with shape (m, k),
 /// and share A's device and dtype.
 /// \param X Output tensor. Assigned a view of the first n rows of the solved
 /// right-hand side buffer; its previous contents are discarded.
 ///
 /// Every violated precondition is reported through utility::LogError.
 /// NOTE(review): the checks below assume utility::LogError does not return
 /// (e.g. it throws); otherwise later shape indexing would run on invalid
 /// shapes -- confirm against Logging.h.
 void LeastSquares(const Tensor &A, const Tensor &B, Tensor &X) {
     AssertTensorDtypes(A, {Float32, Float64});
     AssertTensorDevice(B, A.GetDevice());
     AssertTensorDtype(B, A.GetDtype());

     const Device device = A.GetDevice();
     const Dtype dtype = A.GetDtype();

     // Check dimensions
     SizeVector A_shape = A.GetShape();
     SizeVector B_shape = B.GetShape();
     if (A_shape.size() != 2) {
         utility::LogError("Tensor A must be 2D, but got {}D", A_shape.size());
     }
     if (B_shape.size() != 1 && B_shape.size() != 2) {
         utility::LogError(
                 "Tensor B must be 1D (vector) or 2D (matrix), but got {}D.",
                 B_shape.size());
     }
     if (B_shape[0] != A_shape[0]) {
         utility::LogError("Tensor A and B's first dimension mismatch.");
     }

     const int64_t m = A_shape[0];
     const int64_t n = A_shape[1];
     // A 1D right-hand side is treated as a single column.
     const int64_t k = B_shape.size() == 2 ? B_shape[1] : 1;
     if (m == 0 || n == 0 || k == 0) {
         utility::LogError(
                 "Tensor shapes should not contain dimensions with zero.");
     }

     // Square systems (m == n) are accepted; only m < n is rejected, so the
     // message states the requirement as rows >= cols.
     if (m < n) {
         utility::LogError("Tensor A shape must satisfy rows({}) >= cols({}).",
                           m, n);
     }

     // The backends modify their A and B buffers in-place, so work on copies
     // and leave the caller's tensors untouched.
     // NOTE(review): the copies are taken from the transposed tensors,
     // presumably to hand the backend a column-major layout -- confirm against
     // the LeastSquaresCPU/CUDA/SYCL implementations.
     Tensor A_copy = A.T().Clone();
     Tensor B_copy = B.T().Clone();

     void *A_data = A_copy.GetDataPtr();
     void *B_data = B_copy.GetDataPtr();

     if (device.IsCUDA()) {
 #ifdef BUILD_CUDA_MODULE
         CUDAScopedDevice scoped_device(device);
         LeastSquaresCUDA(A_data, B_data, m, n, k, dtype, device);
 #else
         utility::LogError("Unimplemented device.");
 #endif
     } else if (device.IsSYCL()) {
 #ifdef BUILD_SYCL_MODULE
         LeastSquaresSYCL(A_data, B_data, m, n, k, dtype, device);
 #else
         utility::LogError("Unimplemented device.");
 #endif
     } else {
         LeastSquaresCPU(A_data, B_data, m, n, k, dtype, device);
     }

     // Transpose the working buffer back and keep only its first n rows as
     // the result.
     X = B_copy.T().Slice(0, 0, n);
 }

 }  // namespace core
 }  // namespace cloudViewer

CUDAUtils.h
Common CUDA utilities.

LeastSquares.h

X
void * X
Definition: SmallVector.cpp:45

AssertTensorDevice
#define AssertTensorDevice(tensor,...)
Definition: TensorCheck.h:45

AssertTensorDtype
#define AssertTensorDtype(tensor,...)
Definition: TensorCheck.h:21

AssertTensorDtypes
#define AssertTensorDtypes(tensor,...)
Definition: TensorCheck.h:33

cloudViewer::core::CUDAScopedDevice
When CUDA is not enabled, this is a dummy class.
Definition: CUDAUtils.h:214

cloudViewer::core::Device
Definition: Device.h:18

cloudViewer::core::Device::IsCUDA
bool IsCUDA() const
Returns true iff device type is CUDA.
Definition: Device.h:49

cloudViewer::core::Device::IsSYCL
bool IsSYCL() const
Returns true iff device type is SYCL GPU.
Definition: Device.h:52

cloudViewer::core::Dtype
Definition: Dtype.h:21

cloudViewer::core::SizeVector
Definition: SizeVector.h:70

cloudViewer::core::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:119

cloudViewer::core::Tensor
Definition: Tensor.h:32

cloudViewer::core::Tensor::GetDtype
Dtype GetDtype() const
Definition: Tensor.h:1164

cloudViewer::core::Tensor::GetDataPtr
T * GetDataPtr()
Definition: Tensor.h:1144

cloudViewer::core::Tensor::GetDevice
Device GetDevice() const override
Definition: Tensor.cpp:1435

cloudViewer::core::Tensor::Clone
Tensor Clone() const
Copy Tensor to the same device.
Definition: Tensor.h:502

cloudViewer::core::Tensor::GetShape
SizeVector GetShape() const
Definition: Tensor.h:1127

cloudViewer::core::Tensor::T
Tensor T() const
Expects input to be a <= 2-D Tensor; transposes it by swapping dimensions 0 and 1.
Definition: Tensor.cpp:1079

cloudViewer::core::Tensor::Slice
Tensor Slice(int64_t dim, int64_t start, int64_t stop, int64_t step=1) const
Definition: Tensor.cpp:857

LogError
#define LogError(...)
Definition: Logging.h:60

cloudViewer::core::LeastSquaresCUDA
void LeastSquaresCUDA(void *A_data, void *B_data, int64_t m, int64_t n, int64_t k, Dtype dtype, const Device &device)
Definition: LeastSquaresCUDA.cpp:24

cloudViewer::core::LeastSquares
void LeastSquares(const Tensor &A, const Tensor &B, Tensor &X)
Solve AX = B with QR decomposition. A is a full-rank m x n matrix (m >= n).
Definition: LeastSquares.cpp:17

cloudViewer::core::Float64
const Dtype Float64
Definition: Dtype.cpp:43

cloudViewer::core::LeastSquaresSYCL
void LeastSquaresSYCL(void *A_data, void *B_data, int64_t m, int64_t n, int64_t k, Dtype dtype, const Device &device)
Definition: LeastSquaresSYCL.cpp:19

cloudViewer::core::LeastSquaresCPU
void LeastSquaresCPU(void *A_data, void *B_data, int64_t m, int64_t n, int64_t k, Dtype dtype, const Device &device)
Definition: LeastSquaresCPU.cpp:15

cloudViewer::core::Float32
const Dtype Float32
Definition: Dtype.cpp:42

cloudViewer
Generic file read and write utility for python interface.
Definition: AutoSegmentationTools.h:16