cpp_api/api/Linalg_8cpp_source.html

 // ----------------------------------------------------------------------------

 // -                        CloudViewer: www.cloudViewer.org                  -

 // ----------------------------------------------------------------------------

 // Copyright (c) 2018-2024 www.cloudViewer.org

 // SPDX-License-Identifier: MIT

 // ----------------------------------------------------------------------------


 #include <benchmark/benchmark.h>


 #include "cloudViewer/core/CUDAUtils.h"

 #include "cloudViewer/core/Tensor.h"

 #include "cloudViewer/utility/Logging.h"


 namespace cloudViewer {

 namespace core {


 /// Benchmark body: times the matrix product of a {10000, 4} tensor with a
 /// {4, 10000} tensor, both Float32 and filled with ones, on \p device.
 ///
 /// \param state Google Benchmark state object that drives the timed loop.
 /// \param device Device on which the operands are created and multiplied.
 void MatmulAB(benchmark::State& state, const Device& device) {
     // Operands are only read by Matmul (a const member), so keep them const.
     const Tensor A = Tensor::Ones({10000, 4}, core::Float32, device);
     const Tensor B = Tensor::Ones({4, 10000}, core::Float32, device);

     // Warm-up run, executed once outside the timed region.
     Tensor output = A.Matmul(B);
     // Synchronize before timing starts so that warm-up / operand-creation
     // work is not charged to the first timed iteration.
     // NOTE(review): assumes device work may still be in flight when Matmul
     // returns, as the per-iteration Synchronize below implies - confirm.
     core::cuda::Synchronize(device);

     for (auto _ : state) {
         output = A.Matmul(B);
         // Synchronize inside the timed region so each iteration's measurement
         // covers the complete product rather than just its submission.
         core::cuda::Synchronize(device);
     }
 }


 // Register MatmulAB as a benchmark case named "CPU", passing Device("CPU:0")
 // as the captured `device` argument; results are reported in milliseconds.
 BENCHMARK_CAPTURE(MatmulAB, CPU, Device("CPU:0"))

         ->Unit(benchmark::kMillisecond);


 // The "CUDA" case (Device("CUDA:0")) is only registered when the build
 // defines BUILD_CUDA_MODULE; it is also reported in milliseconds.
 #ifdef BUILD_CUDA_MODULE

 BENCHMARK_CAPTURE(MatmulAB, CUDA, Device("CUDA:0"))

         ->Unit(benchmark::kMillisecond);

 #endif


 }  // namespace core

 }  // namespace cloudViewer

CUDAUtils.h
Common CUDA utilities.

Tensor.h

cloudViewer::core::Device
Definition: Device.h:18

cloudViewer::core::Tensor
Definition: Tensor.h:32

cloudViewer::core::Tensor::Matmul
Tensor Matmul(const Tensor &rhs) const
Definition: Tensor.cpp:1919

cloudViewer::core::Tensor::Ones
static Tensor Ones(const SizeVector &shape, Dtype dtype, const Device &device=Device("CPU:0"))
Create a tensor filled with ones.
Definition: Tensor.cpp:412

Logging.h

cloudViewer::core::cuda::Synchronize
void Synchronize()
Definition: CUDAUtils.cpp:59

cloudViewer::core::BENCHMARK_CAPTURE
BENCHMARK_CAPTURE(BinaryEW, Add__CPU_Int8__100, 100, BinaryOpCode::Add, Int8, Device("CPU:0")) -> Unit(benchmark::kMillisecond)

cloudViewer::core::MatmulAB
void MatmulAB(benchmark::State &state, const Device &device)
Definition: Linalg.cpp:17

cloudViewer::core::Float32
const Dtype Float32
Definition: Dtype.cpp:42

cloudViewer
Generic file read and write utility for python interface.
Definition: AutoSegmentationTools.h:16