utils.hpp
1 /*
2  * Copyright (c) 2021-2025, NVIDIA CORPORATION.
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  * http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 #pragma once
17 
18 #include <chrono>
19 #include <cstring>
20 #include <future>
21 #include <optional>
22 #include <stdexcept>
23 #include <tuple>
24 #include <type_traits>
25 
26 #include <kvikio/error.hpp>
27 #include <kvikio/shim/cuda.hpp>
28 
29 namespace kvikio {
30 
31 std::size_t get_page_size();
32 
33 [[nodiscard]] off_t convert_size2off(std::size_t x);
34 
35 [[nodiscard]] ssize_t convert_size2ssize(std::size_t x);
36 
37 [[nodiscard]] CUdeviceptr convert_void2deviceptr(void const* devPtr);
38 
42 template <typename T, std::enable_if_t<std::is_integral_v<T>>* = nullptr>
43 [[nodiscard]] std::int64_t convert_to_64bit(T value)
44 {
45  if constexpr (std::numeric_limits<T>::max() > std::numeric_limits<std::int64_t>::max()) {
46  KVIKIO_EXPECT(value <= std::numeric_limits<std::int64_t>::max(),
47  "convert_to_64bit(x): x too large to fit std::int64_t",
48  std::overflow_error);
49  }
50  return std::int64_t(value);
51 }
52 
57 [[nodiscard]] inline std::uint64_t convert_to_64bit(std::uint64_t value) { return value; }
58 
62 template <typename T, std::enable_if_t<std::is_floating_point_v<T>>* = nullptr>
63 [[nodiscard]] double convert_to_64bit(T value)
64 {
65  return double(value);
66 }
67 
76 #ifdef KVIKIO_CUDA_FOUND
77 bool is_host_memory(void const* ptr);
78 #else
79 constexpr bool is_host_memory(void const* ptr) { return true; }
80 #endif
81 
88 [[nodiscard]] int get_device_ordinal_from_pointer(CUdeviceptr dev_ptr);
89 
98 [[nodiscard]] KVIKIO_EXPORT CUcontext get_primary_cuda_context(int ordinal);
99 
106 [[nodiscard]] std::optional<CUcontext> get_context_associated_pointer(CUdeviceptr dev_ptr);
107 
114 [[nodiscard]] bool current_context_can_access_pointer(CUdeviceptr dev_ptr);
115 
132 [[nodiscard]] CUcontext get_context_from_pointer(void const* devPtr);
133 
138  private:
139  CUcontext _ctx;
140 
141  public:
142  PushAndPopContext(CUcontext ctx);
143  PushAndPopContext(PushAndPopContext const&) = delete;
144  PushAndPopContext& operator=(PushAndPopContext const&) = delete;
146  PushAndPopContext&& operator=(PushAndPopContext&&) = delete;
148 };
149 
150 // Find the base and offset of the memory allocation `devPtr` is in
151 std::tuple<void*, std::size_t, std::size_t> get_alloc_info(void const* devPtr,
152  CUcontext* ctx = nullptr);
153 
165 template <typename T>
166 std::future<std::decay_t<T>> make_ready_future(T&& t)
167 {
168  std::promise<std::decay_t<T>> p;
169  auto fut = p.get_future();
170  p.set_value(std::forward<T>(t));
171  return fut;
172 }
173 
185 template <typename T>
186 bool is_future_done(T const& future)
187 {
188  KVIKIO_EXPECT(future.valid(),
189  "The future object does not refer to a valid shared state.",
190  std::invalid_argument);
191  return future.wait_for(std::chrono::seconds(0)) != std::future_status::timeout;
192 }
193 
194 } // namespace kvikio
Push CUDA context on creation and pop it on destruction.
Definition: utils.hpp:137
#define KVIKIO_EXPECT(...)
Macro for checking pre-conditions or conditions that throws an exception when a condition is violated...
Definition: error.hpp:216
KvikIO namespace.
Definition: batch.hpp:27
CUcontext get_context_from_pointer(void const *devPtr)
Return a CUDA context that can be used with the given device pointer.
constexpr bool is_host_memory(void const *ptr)
Check if ptr points to host memory (as opposed to device memory)
Definition: utils.hpp:79
std::int64_t convert_to_64bit(T value)
Help function to convert value to 64 bit signed integer.
Definition: utils.hpp:43
bool current_context_can_access_pointer(CUdeviceptr dev_ptr)
Check if the current CUDA context can access the given device pointer.
bool is_future_done(T const &future)
Check the status of the future object. True indicates that the result is available in the future's sh...
Definition: utils.hpp:186
KVIKIO_EXPORT CUcontext get_primary_cuda_context(int ordinal)
Given a device ordinal, return the primary context of the device.
std::future< std::decay_t< T > > make_ready_future(T &&t)
Create a shared state in a future object that is immediately ready.
Definition: utils.hpp:166
std::optional< CUcontext > get_context_associated_pointer(CUdeviceptr dev_ptr)
Return the CUDA context associated the given device pointer, if any.
int get_device_ordinal_from_pointer(CUdeviceptr dev_ptr)
Return the device owning the pointer.