1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
|
// ----------------------------------------------------------------------------
// - Open3D: www.open3d.org -
// ----------------------------------------------------------------------------
// Copyright (c) 2018-2024 www.open3d.org
// SPDX-License-Identifier: MIT
// ----------------------------------------------------------------------------
#ifdef BUILD_CUDA_MODULE
#include "open3d/core/CUDAUtils.h"
#include <sstream>
#include <thread>
#include <vector>
#include "tests/Tests.h"
// #include <fmt/std.h> // fmt version >=9, else:
namespace {
// Use std::ostringstream to get string representation.
template <typename T>
std::string to_str(T var) {
std::ostringstream ss;
ss << var;
return ss.str();
}
} // namespace
namespace open3d {
namespace tests {
TEST(CUDAUtils, InitState) {
const int device_count = core::cuda::DeviceCount();
const core::CUDAState& cuda_state = core::CUDAState::GetInstance();
utility::LogInfo("Number of CUDA devices: {}", device_count);
for (int i = 0; i < device_count; ++i) {
for (int j = 0; j < device_count; ++j) {
utility::LogInfo("P2PEnabled {}->{}: {}", i, j,
cuda_state.IsP2PEnabled(i, j));
}
}
}
void CheckScopedStreamManually() {
int current_device = core::cuda::GetDevice();
ASSERT_EQ(core::cuda::GetStream(), core::cuda::GetDefaultStream());
ASSERT_EQ(core::cuda::GetDevice(), current_device);
cudaStream_t stream;
OPEN3D_CUDA_CHECK(cudaStreamCreate(&stream));
{
core::CUDAScopedStream scoped_stream(stream);
ASSERT_EQ(core::cuda::GetStream(), stream);
ASSERT_NE(core::cuda::GetStream(), core::cuda::GetDefaultStream());
ASSERT_EQ(core::cuda::GetDevice(), current_device);
}
OPEN3D_CUDA_CHECK(cudaStreamDestroy(stream));
ASSERT_EQ(core::cuda::GetStream(), core::cuda::GetDefaultStream());
ASSERT_EQ(core::cuda::GetDevice(), current_device);
}
void CheckScopedStreamAutomatically() {
int current_device = core::cuda::GetDevice();
ASSERT_EQ(core::cuda::GetStream(), core::cuda::GetDefaultStream());
ASSERT_EQ(core::cuda::GetDevice(), current_device);
{
core::CUDAScopedStream scoped_stream(
core::CUDAScopedStream::CreateNewStream);
ASSERT_NE(core::cuda::GetStream(), core::cuda::GetDefaultStream());
ASSERT_EQ(core::cuda::GetDevice(), current_device);
}
ASSERT_EQ(core::cuda::GetStream(), core::cuda::GetDefaultStream());
ASSERT_EQ(core::cuda::GetDevice(), current_device);
}
void CheckScopedStreamMultiThreaded(const std::function<void()>& func) {
std::vector<std::thread> threads;
// NVCC does not like capturing const int by reference on Windows, use int.
int kIterations = 100000;
int kThreads = 8;
for (int i = 0; i < kThreads; ++i) {
threads.emplace_back([&kIterations, &func]() {
utility::LogDebug("Starting thread with ID {}",
to_str(std::this_thread::get_id()));
for (int i = 0; i < kIterations; ++i) {
func();
}
});
}
for (auto& thread : threads) {
if (thread.joinable()) {
utility::LogDebug("Joining thread with ID {}",
to_str(thread.get_id()));
thread.join();
}
}
}
TEST(CUDAUtils, ScopedStreamManually) { CheckScopedStreamManually(); }
TEST(CUDAUtils, ScopedStreamManuallyMultiThreaded) {
CheckScopedStreamMultiThreaded(&CheckScopedStreamManually);
}
TEST(CUDAUtils, ScopedStreamAutomatically) { CheckScopedStreamAutomatically(); }
TEST(CUDAUtils, ScopedStreamAutomaticallyMultiThreaded) {
CheckScopedStreamMultiThreaded(&CheckScopedStreamAutomatically);
}
} // namespace tests
} // namespace open3d
#endif
|