cpp_api/api/NonZeroCPU_8cpp_source.html

 // ----------------------------------------------------------------------------

 // -                        CloudViewer: www.cloudViewer.org                  -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2024 www.cloudViewer.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #include <Logging.h>

 #include <Parallel.h>


 #include <numeric>


 #include "cloudViewer/core/Indexer.h"

 #include "cloudViewer/core/kernel/NonZero.h"


 namespace cloudViewer {

 namespace core {

 namespace kernel {


 /// Computes the coordinates of all non-zero elements of \p src on the CPU.
 ///
 /// \param src Input tensor. Its dtype must be one handled by
 /// DISPATCH_DTYPE_TO_TEMPLATE_WITH_BOOL.
 /// \return An Int64 tensor of shape {src.NumDims(), num_non_zeros}, allocated
 /// on src's device. Column i holds the per-dimension coordinates of the i-th
 /// non-zero element; columns are ordered by ascending flattened index.
 Tensor NonZeroCPU(const Tensor& src) {
     // Get flattened non-zero indices.
     TensorIterator src_iter(src);
     const int64_t num_elements = src.NumElements();

     // Upper bound: every element could be non-zero.
     std::vector<int64_t> non_zero_indices;
     non_zero_indices.reserve(static_cast<size_t>(num_elements));

     DISPATCH_DTYPE_TO_TEMPLATE_WITH_BOOL(src.GetDtype(), [&]() {
         for (int64_t index = 0; index < num_elements; ++index) {
             const void* src_ptr = src_iter.GetPtr(index);
             CLOUDVIEWER_ASSERT(src_ptr != nullptr && "Internal error.");
             // Compare in the element's own type. Converting to float first
             // would flush tiny non-zero doubles (below float's subnormal
             // range) to 0 and wrongly classify them as zero.
             // NOTE(review): assumes scalar_t is always an arithmetic type
             // (bool / integer / floating point) -- confirm against Dispatch.h.
             if (*static_cast<const scalar_t*>(src_ptr) !=
                 static_cast<scalar_t>(0)) {
                 non_zero_indices.push_back(index);
             }
         }
     });

     // Transform flattened indices to indices in each dimension.
     SizeVector shape = src.GetShape();
     const int64_t num_dims = src.NumDims();
     // Kept signed so the index arithmetic below does not mix int64_t and
     // size_t.
     const int64_t num_non_zeros =
             static_cast<int64_t>(non_zero_indices.size());

     SizeVector result_shape{num_dims, num_non_zeros};
     Tensor result(result_shape, core::Int64, src.GetDevice());
     TensorIterator result_iter(result);

     // Each iteration writes only to column i of the result, so iterations
     // are independent of one another.
 #pragma omp parallel for schedule(static) \
         num_threads(utility::EstimateMaxThreads())
     for (int64_t i = 0; i < num_non_zeros; i++) {
         int64_t non_zero_index = non_zero_indices[i];
         // Peel off coordinates from the last dimension to the first: the
         // remainder is the coordinate in `dim`, the quotient carries over to
         // the next (outer) dimension.
         for (int64_t dim = num_dims - 1; dim >= 0; dim--) {
             void* result_ptr = result_iter.GetPtr(dim * num_non_zeros + i);
             CLOUDVIEWER_ASSERT(result_ptr != nullptr && "Internal error.");
             *static_cast<int64_t*>(result_ptr) = non_zero_index % shape[dim];
             non_zero_index = non_zero_index / shape[dim];
         }
     }

     return result;
 }


 }  // namespace kernel

 }  // namespace core

 }  // namespace cloudViewer

DISPATCH_DTYPE_TO_TEMPLATE_WITH_BOOL
#define DISPATCH_DTYPE_TO_TEMPLATE_WITH_BOOL(DTYPE,...)
Definition: Dispatch.h:68

Indexer.h

CLOUDVIEWER_ASSERT
#define CLOUDVIEWER_ASSERT(...)
Definition: Macro.h:51

NonZero.h

Parallel.h

result
core::Tensor result
Definition: VtkUtils.cpp:76

cloudViewer::core::SizeVector
Definition: SizeVector.h:70

cloudViewer::core::SmallVectorBase::size
size_t size() const
Definition: SmallVector.h:119

cloudViewer::core::TensorIterator
Definition: Indexer.h:222

cloudViewer::core::Tensor
Definition: Tensor.h:32

cloudViewer::core::Tensor::GetDtype
Dtype GetDtype() const
Definition: Tensor.h:1164

cloudViewer::core::Tensor::NumElements
int64_t NumElements() const
Definition: Tensor.h:1170

Logging.h

cloudViewer::core::kernel::NonZeroCPU
Tensor NonZeroCPU(const Tensor &src)
Definition: NonZeroCPU.cpp:20

cloudViewer::core::Int64
const Dtype Int64
Definition: Dtype.cpp:47

cloudViewer
Generic file read and write utility for python interface.
Definition: AutoSegmentationTools.h:16