cpp_api/api/Matrix_8h_source.html

 // ----------------------------------------------------------------------------

 // -                        CloudViewer: www.cloudViewer.org                  -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2024 www.cloudViewer.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #pragma once

 #include "cloudViewer/core/CUDAUtils.h"


 namespace cloudViewer {

 namespace core {

 namespace linalg {

 namespace kernel {


 // ---- Matmul ----

 template <typename scalar_t>

 static CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void matmul3x3_3x1(

         const scalar_t& m00,

         const scalar_t& m01,

         const scalar_t& m02,

         const scalar_t& m10,

         const scalar_t& m11,

         const scalar_t& m12,

         const scalar_t& m20,

         const scalar_t& m21,

         const scalar_t& m22,

         const scalar_t& v0,

         const scalar_t& v1,

         const scalar_t& v2,

         scalar_t& o0,

         scalar_t& o1,

         scalar_t& o2) {

     o0 = m00 * v0 + m01 * v1 + m02 * v2;

     o1 = m10 * v0 + m11 * v1 + m12 * v2;

     o2 = m20 * v0 + m21 * v1 + m22 * v2;

 }


 template <typename scalar_t>

 CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE void matmul3x3_3x1(

         const scalar_t* A_3x3, const scalar_t* B_3x1, scalar_t* C_3x1) {

     C_3x1[0] = A_3x3[0] * B_3x1[0] + A_3x3[1] * B_3x1[1] + A_3x3[2] * B_3x1[2];

     C_3x1[1] = A_3x3[3] * B_3x1[0] + A_3x3[4] * B_3x1[1] + A_3x3[5] * B_3x1[2];

     C_3x1[2] = A_3x3[6] * B_3x1[0] + A_3x3[7] * B_3x1[1] + A_3x3[8] * B_3x1[2];

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void matmul3x3_3x3(

         const scalar_t* A_3x3, const scalar_t* B_3x3, scalar_t* C_3x3) {

     matmul3x3_3x1(A_3x3[0], A_3x3[1], A_3x3[2], A_3x3[3], A_3x3[4], A_3x3[5],

                   A_3x3[6], A_3x3[7], A_3x3[8], B_3x3[0], B_3x3[3], B_3x3[6],

                   C_3x3[0], C_3x3[3], C_3x3[6]);

     matmul3x3_3x1(A_3x3[0], A_3x3[1], A_3x3[2], A_3x3[3], A_3x3[4], A_3x3[5],

                   A_3x3[6], A_3x3[7], A_3x3[8], B_3x3[1], B_3x3[4], B_3x3[7],

                   C_3x3[1], C_3x3[4], C_3x3[7]);

     matmul3x3_3x1(A_3x3[0], A_3x3[1], A_3x3[2], A_3x3[3], A_3x3[4], A_3x3[5],

                   A_3x3[6], A_3x3[7], A_3x3[8], B_3x3[2], B_3x3[5], B_3x3[8],

                   C_3x3[2], C_3x3[5], C_3x3[8]);

 }


 template <typename scalar_t>

 CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE void cross_3x1(

         const scalar_t* A_3x1_input,

         const scalar_t* B_3x1_input,

         scalar_t* C_3x1_output) {

     C_3x1_output[0] =

             A_3x1_input[1] * B_3x1_input[2] - A_3x1_input[2] * B_3x1_input[1];

     C_3x1_output[1] =

             A_3x1_input[2] * B_3x1_input[0] - A_3x1_input[0] * B_3x1_input[2];

     C_3x1_output[2] =

             A_3x1_input[0] * B_3x1_input[1] - A_3x1_input[1] * B_3x1_input[0];

 }


 template <typename scalar_t>

 CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t

 cross_mag_3x1(const scalar_t* A_3x1_input, const scalar_t* B_3x1_input) {

     scalar_t temp_0 =

             A_3x1_input[1] * B_3x1_input[2] - A_3x1_input[2] * B_3x1_input[1];

     scalar_t temp_1 =

             A_3x1_input[2] * B_3x1_input[0] - A_3x1_input[0] * B_3x1_input[2];

     scalar_t temp_2 =

             A_3x1_input[0] * B_3x1_input[1] - A_3x1_input[1] * B_3x1_input[0];

     return sqrt(temp_0 * temp_0 + temp_1 * temp_1 + temp_2 * temp_2);

 }


 template <typename scalar_t>

 CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t

 dot_3x1(const scalar_t* A_3x1_input, const scalar_t* B_3x1_input) {

     return A_3x1_input[0] * B_3x1_input[0] + A_3x1_input[1] * B_3x1_input[1] +

            A_3x1_input[2] * B_3x1_input[2];

 }


 // ---- Determinant ----

 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t

 det2x2(const scalar_t* A_2x2) {

     return A_2x2[0] * A_2x2[3] - A_2x2[1] * A_2x2[2];

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t

 det3x3(const scalar_t* A_3x3) {

     return A_3x3[0] * (A_3x3[4] * A_3x3[8] - A_3x3[5] * A_3x3[7]) -

            A_3x3[3] * (A_3x3[1] * A_3x3[8] - A_3x3[2] * A_3x3[7]) +

            A_3x3[6] * (A_3x3[1] * A_3x3[5] - A_3x3[2] * A_3x3[4]);

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE bool inverse2x2(

         const scalar_t* A_2x2, scalar_t* output_2x2) {

     scalar_t det = det3x3(A_2x2);

     if (det < 1e-12) {

         return false;

     } else {

         scalar_t invdet = 1.0 / det;

         output_2x2[0] = A_2x2[3] * det;

         output_2x2[1] = -A_2x2[1] * det;

         output_2x2[2] = -A_2x2[2] * det;

         output_2x2[3] = A_2x2[0] * det;

     }

     return true;

 }


 // ---- Matrix Inverse ----

 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE bool inverse3x3(

         const scalar_t* A_3x3, scalar_t* output_3x3) {

     scalar_t det = det3x3(A_3x3);

     if (det < 1e-12) {

         return false;

     } else {

         scalar_t invdet = 1.0 / det;

         output_3x3[0] = (A_3x3[4] * A_3x3[8] - A_3x3[7] * A_3x3[5]) * invdet;

         output_3x3[1] = (A_3x3[2] * A_3x3[7] - A_3x3[1] * A_3x3[8]) * invdet;

         output_3x3[2] = (A_3x3[1] * A_3x3[5] - A_3x3[2] * A_3x3[4]) * invdet;

         output_3x3[3] = (A_3x3[5] * A_3x3[6] - A_3x3[3] * A_3x3[8]) * invdet;

         output_3x3[4] = (A_3x3[0] * A_3x3[8] - A_3x3[2] * A_3x3[6]) * invdet;

         output_3x3[5] = (A_3x3[3] * A_3x3[2] - A_3x3[0] * A_3x3[5]) * invdet;

         output_3x3[6] = (A_3x3[3] * A_3x3[7] - A_3x3[6] * A_3x3[4]) * invdet;

         output_3x3[7] = (A_3x3[6] * A_3x3[1] - A_3x3[0] * A_3x3[7]) * invdet;

         output_3x3[8] = (A_3x3[0] * A_3x3[4] - A_3x3[3] * A_3x3[1]) * invdet;

     }

     return true;

 }


 // ---- Matrix Transpose ----

 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose2x2_(

         scalar_t* A_2x2) {

     scalar_t temp_01 = A_2x2[1];

     A_2x2[1] = A_2x2[2];

     A_2x2[2] = temp_01;

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose2x2(

         const scalar_t* A_2x2, scalar_t* output_2x2) {

     output_2x2[0] = A_2x2[0];

     output_2x2[1] = A_2x2[2];

     output_2x2[2] = A_2x2[1];

     output_2x2[3] = A_2x2[3];

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose3x3_(

         scalar_t* A_3x3) {

     scalar_t temp_01 = A_3x3[1];

     scalar_t temp_02 = A_3x3[2];

     scalar_t temp_12 = A_3x3[5];

     A_3x3[1] = A_3x3[3];

     A_3x3[2] = A_3x3[6];

     A_3x3[5] = A_3x3[7];

     A_3x3[3] = temp_01;

     A_3x3[6] = temp_02;

     A_3x3[7] = temp_12;

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose3x3(

         const scalar_t* A_3x3, scalar_t* output_3x3) {

     output_3x3[0] = A_3x3[0];

     output_3x3[1] = A_3x3[3];

     output_3x3[2] = A_3x3[6];


     output_3x3[3] = A_3x3[1];

     output_3x3[4] = A_3x3[4];

     output_3x3[5] = A_3x3[7];


     output_3x3[6] = A_3x3[2];

     output_3x3[7] = A_3x3[5];

     output_3x3[8] = A_3x3[8];

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose4x4_(

         scalar_t* A_4x4) {

     scalar_t temp_01 = A_4x4[1];

     scalar_t temp_02 = A_4x4[2];

     scalar_t temp_03 = A_4x4[3];

     scalar_t temp_12 = A_4x4[6];

     scalar_t temp_13 = A_4x4[7];

     scalar_t temp_23 = A_4x4[11];

     A_4x4[1] = A_4x4[4];

     A_4x4[2] = A_4x4[8];

     A_4x4[3] = A_4x4[12];

     A_4x4[6] = A_4x4[9];

     A_4x4[7] = A_4x4[13];

     A_4x4[11] = A_4x4[14];

     A_4x4[4] = temp_01;

     A_4x4[8] = temp_02;

     A_4x4[12] = temp_03;

     A_4x4[9] = temp_12;

     A_4x4[13] = temp_13;

     A_4x4[14] = temp_23;

 }


 template <typename scalar_t>

 CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose4x4(

         const scalar_t* A_4x4, scalar_t* output_4x4) {

     output_4x4[0] = A_4x4[0];

     output_4x4[1] = A_4x4[4];

     output_4x4[2] = A_4x4[8];

     output_4x4[3] = A_4x4[12];


     output_4x4[4] = A_4x4[1];

     output_4x4[5] = A_4x4[5];

     output_4x4[6] = A_4x4[9];

     output_4x4[7] = A_4x4[13];


     output_4x4[8] = A_4x4[2];

     output_4x4[9] = A_4x4[6];

     output_4x4[10] = A_4x4[10];

     output_4x4[11] = A_4x4[14];


     output_4x4[12] = A_4x4[3];

     output_4x4[13] = A_4x4[7];

     output_4x4[14] = A_4x4[11];

     output_4x4[15] = A_4x4[15];

 }


 }  // namespace kernel

 }  // namespace linalg

 }  // namespace core

 }  // namespace cloudViewer

CUDAUtils.h
Common CUDA utilities.

CLOUDVIEWER_FORCE_INLINE
#define CLOUDVIEWER_FORCE_INLINE
Definition: CUDAUtils.h:43

CLOUDVIEWER_HOST_DEVICE
#define CLOUDVIEWER_HOST_DEVICE
Definition: CUDAUtils.h:44

CLOUDVIEWER_DEVICE
#define CLOUDVIEWER_DEVICE
Definition: CUDAUtils.h:45

cloudViewer::core::linalg::kernel::det3x3
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t det3x3(const scalar_t *A_3x3)
Definition: Matrix.h:102

cloudViewer::core::linalg::kernel::transpose3x3
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose3x3(const scalar_t *A_3x3, scalar_t *output_3x3)
Definition: Matrix.h:179

cloudViewer::core::linalg::kernel::transpose2x2
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose2x2(const scalar_t *A_2x2, scalar_t *output_2x2)
Definition: Matrix.h:156

cloudViewer::core::linalg::kernel::matmul3x3_3x1
static CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void matmul3x3_3x1(const scalar_t &m00, const scalar_t &m01, const scalar_t &m02, const scalar_t &m10, const scalar_t &m11, const scalar_t &m12, const scalar_t &m20, const scalar_t &m21, const scalar_t &m22, const scalar_t &v0, const scalar_t &v1, const scalar_t &v2, scalar_t &o0, scalar_t &o1, scalar_t &o2)
Definition: Matrix.h:18

cloudViewer::core::linalg::kernel::cross_3x1
CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE void cross_3x1(const scalar_t *A_3x1_input, const scalar_t *B_3x1_input, scalar_t *C_3x1_output)
Definition: Matrix.h:62

cloudViewer::core::linalg::kernel::cross_mag_3x1
CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t cross_mag_3x1(const scalar_t *A_3x1_input, const scalar_t *B_3x1_input)
Definition: Matrix.h:76

cloudViewer::core::linalg::kernel::transpose3x3_
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose3x3_(scalar_t *A_3x3)
Definition: Matrix.h:165

cloudViewer::core::linalg::kernel::transpose4x4
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose4x4(const scalar_t *A_4x4, scalar_t *output_4x4)
Definition: Matrix.h:218

cloudViewer::core::linalg::kernel::transpose4x4_
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose4x4_(scalar_t *A_4x4)
Definition: Matrix.h:195

cloudViewer::core::linalg::kernel::det2x2
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t det2x2(const scalar_t *A_2x2)
Definition: Matrix.h:96

cloudViewer::core::linalg::kernel::matmul3x3_3x3
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void matmul3x3_3x3(const scalar_t *A_3x3, const scalar_t *B_3x3, scalar_t *C_3x3)
Definition: Matrix.h:48

cloudViewer::core::linalg::kernel::inverse3x3
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE bool inverse3x3(const scalar_t *A_3x3, scalar_t *output_3x3)
Definition: Matrix.h:126

cloudViewer::core::linalg::kernel::dot_3x1
CLOUDVIEWER_HOST_DEVICE CLOUDVIEWER_FORCE_INLINE scalar_t dot_3x1(const scalar_t *A_3x1_input, const scalar_t *B_3x1_input)
Definition: Matrix.h:88

cloudViewer::core::linalg::kernel::inverse2x2
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE bool inverse2x2(const scalar_t *A_2x2, scalar_t *output_2x2)
Definition: Matrix.h:109

cloudViewer::core::linalg::kernel::transpose2x2_
CLOUDVIEWER_DEVICE CLOUDVIEWER_FORCE_INLINE void transpose2x2_(scalar_t *A_2x2)
Definition: Matrix.h:148

cloudViewer
Generic file read and write utility for python interface.
Definition: AutoSegmentationTools.h:16