cpp_api/api/CVViewer_2benchmarks_2core_2UnaryEW_8cpp_source.html

 // ----------------------------------------------------------------------------

 // -                        CloudViewer: www.cloudViewer.org                  -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2024 www.cloudViewer.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #include <benchmark/benchmark.h>

 #include <functional>
 #include <random>
 #include <type_traits>

 #include "benchmarks/benchmark_utilities/Rand.h"
 #include "cloudViewer/core/CUDAUtils.h"
 #include "cloudViewer/core/Indexer.h"
 #include "cloudViewer/core/ParallelFor.h"
 #include "cloudViewer/core/Tensor.h"
 #include "cloudViewer/utility/Logging.h"


 namespace cloudViewer {

 namespace core {


 /// Selects which element-wise unary Tensor operation a benchmark case runs.
 /// MakeOperation() turns an enumerator into a call of the Tensor member
 /// function with the same name.
 enum class UnaryOpCode {
     // Enumerator values are implicit and consecutive, starting at 0.
     Sqrt = 0, Sin, Cos, Neg, Exp, Abs,  // 0 - 5
     IsNan, IsInf, IsFinite,             // 6 - 8
     Floor, Ceil, Round, Trunc,          // 9 - 12
     LogicalNot,                         // 13
 };


 /// Builds a callable that applies the unary element-wise operation selected
 /// by \p op to a tensor.
 ///
 /// \param op Operation to wrap.
 /// \return A function that takes a const Tensor& and returns the result of
 /// the Tensor member function named after \p op (for example
 /// UnaryOpCode::Sqrt calls Tensor::Sqrt()).
 ///
 /// A value of \p op without a matching case is reported through
 /// utility::LogError with the message "Unknown operation <int value>".
 std::function<Tensor(const Tensor&)> MakeOperation(UnaryOpCode op) {
     // No `default:` label on purpose: with every enumerator listed, the
     // compiler can warn (-Wswitch) when a new UnaryOpCode lacks a case.
     switch (op) {
         case UnaryOpCode::Sqrt:
             return [](const Tensor& arg) -> Tensor { return arg.Sqrt(); };

         case UnaryOpCode::Sin:
             return [](const Tensor& arg) -> Tensor { return arg.Sin(); };

         case UnaryOpCode::Cos:
             return [](const Tensor& arg) -> Tensor { return arg.Cos(); };

         case UnaryOpCode::Neg:
             return [](const Tensor& arg) -> Tensor { return arg.Neg(); };

         case UnaryOpCode::Exp:
             return [](const Tensor& arg) -> Tensor { return arg.Exp(); };

         case UnaryOpCode::Abs:
             return [](const Tensor& arg) -> Tensor { return arg.Abs(); };

         case UnaryOpCode::IsNan:
             return [](const Tensor& arg) -> Tensor { return arg.IsNan(); };

         case UnaryOpCode::IsInf:
             return [](const Tensor& arg) -> Tensor { return arg.IsInf(); };

         case UnaryOpCode::IsFinite:
             return [](const Tensor& arg) -> Tensor { return arg.IsFinite(); };

         case UnaryOpCode::Floor:
             return [](const Tensor& arg) -> Tensor { return arg.Floor(); };

         case UnaryOpCode::Ceil:
             return [](const Tensor& arg) -> Tensor { return arg.Ceil(); };

         case UnaryOpCode::Round:
             return [](const Tensor& arg) -> Tensor { return arg.Round(); };

         case UnaryOpCode::Trunc:
             return [](const Tensor& arg) -> Tensor { return arg.Trunc(); };

         case UnaryOpCode::LogicalNot:
             return [](const Tensor& arg) -> Tensor { return arg.LogicalNot(); };
     }

     // Only reached for a value that is not a declared enumerator.
     utility::LogError("Unknown operation {}", static_cast<int>(op));

     // NOTE(review): LogError presumably throws or aborts - confirm. The
     // explicit return guarantees that no path flows off the end of this
     // non-void function (undefined behaviour) should LogError ever return;
     // the returned std::function is empty in that case.
     return {};
 }


 /// Benchmark body: repeatedly applies one unary element-wise operation to a
 /// randomly filled tensor.
 ///
 /// \param state Google Benchmark state that drives the timed loop.
 /// \param size Second dimension of the {1, size} input tensor.
 /// \param op_code Operation to run, resolved through MakeOperation().
 /// \param dtype Element type of the input tensor.
 /// \param device Device the input tensor is created on.
 void UnaryEW(benchmark::State& state,
              int size,
              UnaryOpCode op_code,
              const Dtype& dtype,
              const Device& device) {
     // Input of shape {1, size}, generated with seed 1 and value range [1, 127].
     Tensor input = benchmarks::Rand({1, size}, 1, {1, 127}, dtype, device);
     auto apply = MakeOperation(op_code);

     // One untimed call before the measured loop starts.
     Tensor warmup_output = apply(input);
     benchmark::DoNotOptimize(warmup_output);

     for (auto _ : state) {
         Tensor timed_output = apply(input);
         benchmark::DoNotOptimize(timed_output);

         // NOTE(review): presumably waits for pending work on `device` so the
         // iteration time includes it - confirm against CUDAUtils.h.
         cuda::Synchronize(device);
     }
 }


 // Registers FN with BENCHMARK_CAPTURE three times for one
 // (OP, DEVICE, DTYPE) combination, once per input size: 100, 100000 and
 // 100000000. Each case is named OP__DEVICE_NAME_DTYPE__<size> and reports
 // its time in milliseconds.
 //   FN          - benchmark function; it receives (size, UnaryOpCode::OP,
 //                 DTYPE, DEVICE) after the benchmark state.
 //   OP          - UnaryOpCode enumerator name.
 //   DEVICE      - device expression forwarded to FN.
 //   DEVICE_NAME - identifier that stands for the device in the case name.
 //   DTYPE       - dtype identifier; part of the case name and forwarded to FN.
 // The expansion already ends with `;`, so invocations need no semicolon.
 #define ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, DTYPE)                   \
     BENCHMARK_CAPTURE(FN, OP##__##DEVICE_NAME##_##DTYPE##__100, 100,       \
                       UnaryOpCode::OP, DTYPE, DEVICE)                      \
             ->Unit(benchmark::kMillisecond);                               \
     BENCHMARK_CAPTURE(FN, OP##__##DEVICE_NAME##_##DTYPE##__100000, 100000, \
                       UnaryOpCode::OP, DTYPE, DEVICE)                      \
             ->Unit(benchmark::kMillisecond);                               \
     BENCHMARK_CAPTURE(FN, OP##__##DEVICE_NAME##_##DTYPE##__100000000,      \
                       100000000, UnaryOpCode::OP, DTYPE, DEVICE)           \
             ->Unit(benchmark::kMillisecond);


 // Expands ENUM_BM_SIZE for every non-bool dtype, in the order Int8, UInt8,
 // Int16, UInt16, Int32, UInt32, Int64, UInt64, Float32, Float64. The two
 // floating-point entries come from ENUM_BM_DTYPE_FLOAT.
 #define ENUM_BM_DTYPE(FN, OP, DEVICE, DEVICE_NAME)    \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Int8)   \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, UInt8)  \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Int16)  \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, UInt16) \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Int32)  \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, UInt32) \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Int64)  \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, UInt64) \
     ENUM_BM_DTYPE_FLOAT(FN, OP, DEVICE, DEVICE_NAME)


 // Expands ENUM_BM_SIZE for the floating-point dtypes only: Float32, then
 // Float64. Parameters are forwarded unchanged to ENUM_BM_SIZE.
 #define ENUM_BM_DTYPE_FLOAT(FN, OP, DEVICE, DEVICE_NAME) \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Float32)   \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Float64)


 // Expands ENUM_BM_SIZE for Bool first, then for every dtype covered by
 // ENUM_BM_DTYPE (Int8 ... UInt64, Float32, Float64) in that order.
 #define ENUM_BM_DTYPE_WITH_BOOL(FN, OP, DEVICE, DEVICE_NAME) \
     ENUM_BM_SIZE(FN, OP, DEVICE, DEVICE_NAME, Bool)          \
     ENUM_BM_DTYPE(FN, OP, DEVICE, DEVICE_NAME)


 // Registers FN/OP for every dtype listed in ENUM_BM_DTYPE on Device("CPU:0").
 // The CUDA-enabled variant below is commented out, so this macro registers
 // no CUDA:0 cases even when BUILD_CUDA_MODULE is defined.
 // #ifdef BUILD_CUDA_MODULE
 // #define ENUM_BM_TENSOR(FN, OP)
 //     ENUM_BM_DTYPE(FN, OP, Device("CPU:0"), CPU)
 //     ENUM_BM_DTYPE(FN, OP, Device("CUDA:0"), CUDA)
 // #else
 #define ENUM_BM_TENSOR(FN, OP) ENUM_BM_DTYPE(FN, OP, Device("CPU:0"), CPU)
 // #endif


 // Registers FN/OP for the floating-point dtypes (ENUM_BM_DTYPE_FLOAT) on
 // Device("CPU:0"). The CUDA-enabled variant below is commented out, so only
 // CPU cases are registered.
 // #ifdef BUILD_CUDA_MODULE
 // #define ENUM_BM_TENSOR_FLOAT(FN, OP)
 //     ENUM_BM_DTYPE_FLOAT(FN, OP, Device("CPU:0"), CPU)
 //     ENUM_BM_DTYPE_FLOAT(FN, OP, Device("CUDA:0"), CUDA)
 // #else
 #define ENUM_BM_TENSOR_FLOAT(FN, OP) \
     ENUM_BM_DTYPE_FLOAT(FN, OP, Device("CPU:0"), CPU)
 // #endif


 // Registers FN/OP for Bool plus all dtypes of ENUM_BM_DTYPE
 // (ENUM_BM_DTYPE_WITH_BOOL) on Device("CPU:0"). The CUDA-enabled variant
 // below is commented out, so only CPU cases are registered.
 // NOTE: "WTIH" in the macro name is a misspelling of "WITH"; it is kept
 // because the registration below uses the same spelling.
 // #ifdef BUILD_CUDA_MODULE
 // #define ENUM_BM_TENSOR_WTIH_BOOL(FN, OP)
 //     ENUM_BM_DTYPE_WITH_BOOL(FN, OP, Device("CPU:0"), CPU)
 //     ENUM_BM_DTYPE_WITH_BOOL(FN, OP, Device("CUDA:0"), CUDA)
 // #else
 #define ENUM_BM_TENSOR_WTIH_BOOL(FN, OP) \
     ENUM_BM_DTYPE_WITH_BOOL(FN, OP, Device("CPU:0"), CPU)
 // #endif


 // Benchmark registrations for UnaryEW. Every macro below expands to
 // BENCHMARK_CAPTURE cases on Device("CPU:0") for three input sizes.

 // Registered for Float32 and Float64 only.
 ENUM_BM_TENSOR_FLOAT(UnaryEW, Sqrt)
 ENUM_BM_TENSOR_FLOAT(UnaryEW, Sin)
 ENUM_BM_TENSOR_FLOAT(UnaryEW, Cos)
 ENUM_BM_TENSOR_FLOAT(UnaryEW, Exp)
 ENUM_BM_TENSOR_FLOAT(UnaryEW, IsNan)
 ENUM_BM_TENSOR_FLOAT(UnaryEW, IsInf)
 ENUM_BM_TENSOR_FLOAT(UnaryEW, IsFinite)

 // Registered for all integer and floating-point dtypes (no Bool).
 ENUM_BM_TENSOR(UnaryEW, Abs)
 ENUM_BM_TENSOR(UnaryEW, Neg)
 ENUM_BM_TENSOR(UnaryEW, Floor)
 ENUM_BM_TENSOR(UnaryEW, Ceil)
 ENUM_BM_TENSOR(UnaryEW, Round)
 ENUM_BM_TENSOR(UnaryEW, Trunc)

 // Registered for Bool in addition to the integer and floating-point dtypes.
 ENUM_BM_TENSOR_WTIH_BOOL(UnaryEW, LogicalNot)


 }  // namespace core

 }  // namespace cloudViewer

CUDAUtils.h
Common CUDA utilities.

ENUM_BM_TENSOR_FLOAT
#define ENUM_BM_TENSOR_FLOAT(FN, OP)
Definition: UnaryEW.cpp:161

ENUM_BM_TENSOR_WTIH_BOOL
#define ENUM_BM_TENSOR_WTIH_BOOL(FN, OP)
Definition: UnaryEW.cpp:170

ENUM_BM_TENSOR
#define ENUM_BM_TENSOR(FN, OP)
Definition: UnaryEW.cpp:153

size
int size
Definition: FileIOFactory.cpp:130

Indexer.h

ParallelFor.h

Rand.h

Tensor.h

result
core::Tensor result
Definition: VtkUtils.cpp:76

cloudViewer::core::Device
Definition: Device.h:18

cloudViewer::core::Dtype
Definition: Dtype.h:21

cloudViewer::core::Tensor
Definition: Tensor.h:32

cloudViewer::core::Tensor::Sqrt
Tensor Sqrt() const
Element-wise square root of a tensor, returns a new tensor.
Definition: Tensor.cpp:1296

cloudViewer::core::Tensor::Neg
Tensor Neg() const
Element-wise negation of a tensor, returning a new tensor.
Definition: Tensor.cpp:1329

cloudViewer::core::Tensor::Round
Tensor Round() const
Element-wise round value of a tensor, returning a new tensor.
Definition: Tensor.cpp:1423

cloudViewer::core::Tensor::Trunc
Tensor Trunc() const
Element-wise trunc value of a tensor, returning a new tensor.
Definition: Tensor.cpp:1429

cloudViewer::core::Tensor::LogicalNot
Tensor LogicalNot() const
Definition: Tensor.cpp:1442

cloudViewer::core::Tensor::Exp
Tensor Exp() const
Element-wise exponential of a tensor, returning a new tensor.
Definition: Tensor.cpp:1340

cloudViewer::core::Tensor::Cos
Tensor Cos() const
Element-wise cosine of a tensor, returning a new tensor.
Definition: Tensor.cpp:1318

cloudViewer::core::Tensor::IsFinite
Tensor IsFinite() const
Definition: Tensor.cpp:1382

cloudViewer::core::Tensor::Abs
Tensor Abs() const
Element-wise absolute value of a tensor, returning a new tensor.
Definition: Tensor.cpp:1351

cloudViewer::core::Tensor::Sin
Tensor Sin() const
Element-wise sine of a tensor, returning a new tensor.
Definition: Tensor.cpp:1307

cloudViewer::core::Tensor::Ceil
Tensor Ceil() const
Element-wise ceil value of a tensor, returning a new tensor.
Definition: Tensor.cpp:1417

cloudViewer::core::Tensor::IsInf
Tensor IsInf() const
Definition: Tensor.cpp:1372

cloudViewer::core::Tensor::IsNan
Tensor IsNan() const
Definition: Tensor.cpp:1362

cloudViewer::core::Tensor::Floor
Tensor Floor() const
Element-wise floor value of a tensor, returning a new tensor.
Definition: Tensor.cpp:1411

LogError
#define LogError(...)
Definition: Logging.h:60

Logging.h

cloudViewer::benchmarks::Rand
core::Tensor Rand(const core::SizeVector &shape, size_t seed, const std::pair< core::Scalar, core::Scalar > &range, core::Dtype dtype, const core::Device &device)
Returns a Tensor with random values within the range given by `range`.
Definition: Rand.cpp:23

cloudViewer::core::cuda::Synchronize
void Synchronize()
Definition: CUDAUtils.cpp:59

cloudViewer::core::UnaryEW
void UnaryEW(benchmark::State &state, int size, UnaryOpCode op_code, const Dtype &dtype, const Device &device)
Definition: UnaryEW.cpp:89

cloudViewer::core::UnaryOpCode
UnaryOpCode
Definition: UnaryEW.cpp:23

cloudViewer::core::UnaryOpCode::Sin
@ Sin

cloudViewer::core::UnaryOpCode::Abs
@ Abs

cloudViewer::core::UnaryOpCode::LogicalNot
@ LogicalNot

cloudViewer::core::UnaryOpCode::IsInf
@ IsInf

cloudViewer::core::UnaryOpCode::IsNan
@ IsNan

cloudViewer::core::UnaryOpCode::Sqrt
@ Sqrt

cloudViewer::core::UnaryOpCode::Round
@ Round

cloudViewer::core::UnaryOpCode::Ceil
@ Ceil

cloudViewer::core::UnaryOpCode::Exp
@ Exp

cloudViewer::core::UnaryOpCode::Trunc
@ Trunc

cloudViewer::core::UnaryOpCode::IsFinite
@ IsFinite

cloudViewer::core::UnaryOpCode::Floor
@ Floor

cloudViewer::core::UnaryOpCode::Neg
@ Neg

cloudViewer::core::UnaryOpCode::Cos
@ Cos

cloudViewer::core::MakeOperation
static std::function< Tensor(const Tensor &, const Tensor &)> MakeOperation(BinaryOpCode op)
Definition: BinaryEW.cpp:38

cloudViewer
Generic file read and write utility for python interface.
Definition: AutoSegmentationTools.h:16