8 #include <benchmark/benchmark.h>
22 for (
auto _ : state) {
29 ->Unit(benchmark::kMillisecond);
31 #ifdef BUILD_CUDA_MODULE
33 ->Unit(benchmark::kMillisecond);
Tensor Matmul(const Tensor &rhs) const
static Tensor Ones(const SizeVector &shape, Dtype dtype, const Device &device=Device("CPU:0"))
Create a tensor filled with ones.
BENCHMARK_CAPTURE(BinaryEW, Add__CPU_Int8__100, 100, BinaryOpCode::Add, Int8, Device("CPU:0")) -> Unit(benchmark::kMillisecond)
void MatmulAB(benchmark::State &state, const Device &device)
Generic file read and write utility for the Python interface.