// RMM: prefetch_resource_adaptor.hpp source file

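/*
 * Copyright (c) 2024-2025, NVIDIA CORPORATION.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */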

#pragma once


#include <rmm/detail/export.hpp>

#include <rmm/mr/device/device_memory_resource.hpp>

#include <rmm/prefetch.hpp>

#include <rmm/resource_ref.hpp>


#include <cstddef>


namespace RMM_NAMESPACE {

namespace mr {

/// @addtogroup memory_resources

template <typename Upstream>

/// Resource that adds prefetching all memory allocations to the CUDA device

/// that allocated the memory.

/// @tparam Upstream The type of the upstream resource.

 class prefetch_resource_adaptor final : public device_memory_resource {

 public:
 /// @brief Construct a prefetch resource adaptor that forwards to `upstream`.
 ///
 /// @param upstream Reference to the resource used to satisfy allocation and
 /// deallocation requests; it is copied into `upstream_`.
 prefetch_resource_adaptor(device_async_resource_ref upstream) : upstream_{upstream} {}


 /// @brief Construct a prefetch resource adaptor from a raw pointer to the upstream resource.
 ///
 /// The pointer is converted with `to_device_async_resource_ref_checked()` and the
 /// resulting reference is stored in `upstream_`. This overload only participates in
 /// overload resolution when `Upstream` does not derive from `device_async_resource_ref`.
 ///
 /// @param upstream Pointer to the resource used to satisfy allocation requests.
 /// @throws Whatever `to_device_async_resource_ref_checked()` throws when it rejects
 /// `upstream` (e.g. a null pointer). NOTE(review): the exception type is not visible
 /// from this file -- confirm against the helper's declaration.
 /// @todo Consider removing this overload: storing a reference obtained from a raw
 /// pointer is unsafe when the pointed-to resource has a shorter lifetime than the
 /// adaptor. It is, however, convenient together with `get_default_resource()`.
 // NOTE(review): uses std::enable_if_t / std::is_base_of_v, but <type_traits> is not among
 // the includes visible in this file -- presumably pulled in transitively; confirm.
 template <typename U = Upstream,
           typename   = std::enable_if_t<!std::is_base_of_v<device_async_resource_ref, U>>>
 prefetch_resource_adaptor(Upstream* upstream)
   : upstream_{to_device_async_resource_ref_checked(upstream)}
 {
 }


 // An adaptor cannot exist without an upstream resource, so there is no default constructor.
 prefetch_resource_adaptor() = delete;
 ~prefetch_resource_adaptor() override = default;

 // Copying is disabled.
 prefetch_resource_adaptor(prefetch_resource_adaptor const&)            = delete;
 prefetch_resource_adaptor& operator=(prefetch_resource_adaptor const&) = delete;

 // Moving uses the compiler-generated operations, declared noexcept.
 prefetch_resource_adaptor(prefetch_resource_adaptor&&) noexcept            = default;
 prefetch_resource_adaptor& operator=(prefetch_resource_adaptor&&) noexcept = default;


 /// @brief Access the upstream resource this adaptor forwards to.
 ///
 /// @return A copy of the `device_async_resource_ref` held in `upstream_`.
 /// @todo Remove if no longer used outside testing.
 [[nodiscard]] rmm::device_async_resource_ref get_upstream_resource() const noexcept
 {
   return this->upstream_;
 }


 private:
 /// @brief Allocate memory from the upstream resource and prefetch it.
 ///
 /// The request is forwarded to the upstream resource via `allocate_async`; the
 /// returned range is then passed to `rmm::prefetch` with the device reported by
 /// `rmm::get_current_cuda_device()` at the time of the call.
 ///
 /// No exception is caught here, so anything thrown by the upstream allocation or by
 /// `rmm::prefetch` propagates to the caller.
 ///
 /// @param bytes The number of bytes to allocate.
 /// @param stream The stream on which both the allocation and the prefetch are issued.
 /// @return Pointer to the allocated memory.
 void* do_allocate(std::size_t bytes, cuda_stream_view stream) override
 {
   void* ptr = get_upstream_resource().allocate_async(bytes, stream);
   // NOTE(review): if rmm::prefetch can throw, `ptr` is not handed back to the
   // upstream resource on that path -- confirm whether that can happen in practice.
   rmm::prefetch(ptr, bytes, rmm::get_current_cuda_device(), stream);
   return ptr;
 }


 /// @brief Return memory to the upstream resource.
 ///
 /// The request is forwarded unchanged to the upstream resource's
 /// `deallocate_async`; no prefetch-related work is done on this path.
 ///
 /// @param ptr The pointer to the memory to deallocate.
 /// @param bytes The size, in bytes, of the memory to deallocate.
 /// @param stream The stream on which the deallocation is issued.
 void do_deallocate(void* ptr, std::size_t bytes, cuda_stream_view stream) override
 {
   auto upstream = get_upstream_resource();
   upstream.deallocate_async(ptr, bytes, stream);
 }


 /// @brief Test whether `other` is interchangeable with this adaptor.
 ///
 /// The result is true when `other` is this very object, or when `other` is also a
 /// `prefetch_resource_adaptor<Upstream>` whose upstream resource compares equal to
 /// this adaptor's upstream resource.
 ///
 /// @param other The resource to compare against.
 /// @return True if the two resources are equal, false otherwise.
 bool do_is_equal(device_memory_resource const& other) const noexcept override
 {
   // Identity short-circuit: an object always equals itself.
   if (this == &other) { return true; }

   // Any other resource type yields a null pointer here and is therefore unequal.
   auto const* other_adaptor = dynamic_cast<prefetch_resource_adaptor<Upstream> const*>(&other);
   return (other_adaptor != nullptr) &&
          (get_upstream_resource() == other_adaptor->get_upstream_resource());
 }


 /// Reference to the upstream resource; every allocation and deallocation request
 /// made through this adaptor is forwarded to it.
 device_async_resource_ref upstream_;