1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37
|
// ----------------------------------------------------------------------------
// - Open3D: www.open3d.org -
// ----------------------------------------------------------------------------
// Copyright (c) 2018-2024 www.open3d.org
// SPDX-License-Identifier: MIT
// ----------------------------------------------------------------------------
#include <benchmark/benchmark.h>
#include "open3d/core/CUDAUtils.h"
#include "open3d/core/Tensor.h"
#include "open3d/utility/Logging.h"
namespace open3d {
namespace core {
void MatmulAB(benchmark::State& state, const Device& device) {
Tensor A = Tensor::Ones({10000, 4}, core::Float32, device);
Tensor B = Tensor::Ones({4, 10000}, core::Float32, device);
Tensor output = A.Matmul(B);
for (auto _ : state) {
output = A.Matmul(B);
core::cuda::Synchronize(device);
}
}
BENCHMARK_CAPTURE(MatmulAB, CPU, Device("CPU:0"))
->Unit(benchmark::kMillisecond);
#ifdef BUILD_CUDA_MODULE
BENCHMARK_CAPTURE(MatmulAB, CUDA, Device("CUDA:0"))
->Unit(benchmark::kMillisecond);
#endif
} // namespace core
} // namespace open3d
|