cuda-battery/unique__ptr_8hpp_source.html

// Copyright 2021 Pierre Talbot


#ifndef CUDA_BATTERY_UNIQUE_PTR_HPP

#define CUDA_BATTERY_UNIQUE_PTR_HPP


#include "utility.hpp"

#include "allocator.hpp"


/** \file unique_ptr.hpp
 * Similar to `std::unique_ptr` with small technical differences:
 *   - There is no specialization for arrays (e.g., `unique_ptr<T[]>`).
 *   - We rely on an allocator and provide a function `allocate_unique` to build the pointer in place.
 *   - Additional functions `make_unique_block` and `make_unique_grid` are provided.
 *
 * Similarly to `vector`, the allocator is scoped, meaning it is propagated to the constructor of the underlying type if it takes one.
 */


namespace battery {


template <class T, class Allocator = standard_allocator>


class unique_ptr {

public:

  using element_type = T;

  using pointer = T*;

  using allocator_type = Allocator;

  using this_type = unique_ptr<element_type, allocator_type>;

private:

  Allocator allocator;

  T* ptr;


  template<class U, class Alloc>

  friend class unique_ptr;

public:


  CUDA unique_ptr(const allocator_type& allocator = allocator_type())

   : allocator(allocator), ptr(nullptr) {}


  CUDA unique_ptr(std::nullptr_t, const allocator_type& allocator = allocator_type())

   : allocator(allocator), ptr(nullptr) {}


  // `ptr` must have been allocated using `allocator_type`.


  CUDA explicit unique_ptr(pointer ptr, const allocator_type& allocator = allocator_type())

   : allocator(allocator), ptr(ptr) {}


  CUDA unique_ptr(this_type&& from) : ptr(from.ptr), allocator(from.allocator) {

    from.ptr = nullptr;

  }


  template<class U>


  CUDA unique_ptr(unique_ptr<U, Allocator>&& from)

   : ptr(static_cast<T*>(from.ptr)), allocator(from.allocator)

  {

    from.ptr = nullptr;

  }


  CUDA unique_ptr(const this_type&) = delete;


  CUDA NI ~unique_ptr() {

    if(ptr != nullptr) {

      ptr->~T();

      allocator.deallocate(ptr);

      ptr = nullptr;

    }

  }


  CUDA void swap(unique_ptr& other) {

    ::battery::swap(ptr, other.ptr);

    ::battery::swap(allocator, other.allocator);

  }


  CUDA unique_ptr& operator=(unique_ptr&& r) {

    this_type(std::move(r)).swap(*this);

    return *this;

  }


  template<class U>


  CUDA unique_ptr& operator=(unique_ptr<U, Allocator>&& r) {

    this_type(std::move(r)).swap(*this);

    return *this;

  }


  CUDA unique_ptr& operator=(std::nullptr_t) {

    this_type(allocator).swap(*this);

    return *this;

  }


  CUDA pointer release() {

    pointer p = ptr;

    ptr = nullptr;

    return p;

  }


  CUDA void reset(pointer ptr = pointer()) {

    this_type(ptr, allocator).swap(*this);

  }


  CUDA pointer get() const {

    return ptr;

  }


  CUDA allocator_type get_allocator() const {

    return allocator;

  }


  CUDA explicit operator bool() const {

    return ptr != nullptr;

  }


  CUDA T& operator*() const {

    assert(bool(ptr));

    return *ptr;

  }


  CUDA pointer operator->() const {

    assert(bool(ptr));

    return ptr;

  }


};


template<class T, class Alloc, class... Args>


CUDA NI unique_ptr<T, Alloc> allocate_unique(const Alloc& alloc, Args&&... args) {

  Alloc allocator(alloc);

  T* ptr = static_cast<T*>(allocator.allocate(sizeof(T)));

  assert(ptr != nullptr);

  if constexpr(std::is_constructible<T, Args&&..., const Alloc&>{}) {

    new(ptr) T(std::forward<Args>(args)..., allocator);

  }

  else {

    new(ptr) T(std::forward<Args>(args)...);

  }

  return unique_ptr<T, Alloc>(ptr, allocator);

}


/** Similar to `allocate_unique` but with an default-constructed allocator. */

template<class T, class Alloc, class... Args>


CUDA unique_ptr<T, Alloc> make_unique(Args&&... args) {

  return allocate_unique<T>(Alloc(), std::forward<Args>(args)...);

}


#ifdef __CUDACC__


}


#include <cooperative_groups.h>


namespace battery {


/** We construct a `unique_ptr` in the style of `allocate_unique` but the function is allowed to be entered by all threads of a block.

 * Only one thread of the block will call the function `allocate_unique`.

 * The created pointer is stored in one of the `unique_ptr` passed as parameter to allow for RAII.

 * The function returns a reference to the object created.

 * Usage:

 * ```

 * battery::unique_ptr<int, battery::global_allocator> ptr;

 * int& block_int = battery::make_unique_block(ptr, 10);

 * // all threads can now use `block_int`.

 * // ...

 * // Don't forget to synchronize at the end of the function, to avoid deleting the unique_ptr before all threads are done using it.

 * auto block = cooperative_groups::this_thread_block();

 * block.sync(); // or __syncthreads();

 * ```

 *

 * NOTE: this function use the cooperative groups library.

 */

template<class T, class Alloc, class... Args>

__device__ NI T& make_unique_block(unique_ptr<T, Alloc>& ptr, Args&&... args) {

  __shared__ T* raw_ptr;

  auto block = cooperative_groups::this_thread_block();

  invoke_one(block, [&](){

    ptr = allocate_unique<T, Alloc>(ptr.get_allocator(), std::forward<Args>(args)...);

    raw_ptr = ptr.get();

  });

  block.sync();

  T* data_ptr = raw_ptr;

  // This extra synchronization is required in case a thread returns quickly and re-enter the function to allocate another pointer.

  // Indeed, it seems that shared variable (`raw_ptr` above) are static.

  block.sync();

  return *data_ptr;

}


namespace impl {

  __device__ void* raw_ptr;

}


/** Same as `make_unique_block` but for the grid (all blocks).

 * NOTE: a kernel using this function must be launched using `cudaLaunchCooperativeKernel` instead of the `<<<...>>>` syntax.

 */

template<class T, class Alloc, class... Args>

__device__ NI T& make_unique_grid(unique_ptr<T, Alloc>& ptr, Args&&... args) {

  auto grid = cooperative_groups::this_grid();

  invoke_one(grid, [&](){

    ptr = allocate_unique<T, Alloc>(ptr.get_allocator(), std::forward<Args>(args)...);

    impl::raw_ptr = static_cast<void*>(ptr.get());

  });

  grid.sync();

  T* data_ptr = static_cast<T*>(impl::raw_ptr);

  // See comment of make_unique_block for why this extra barrier is required.

  grid.sync();

  return *data_ptr;

}


#endif


} // namespace battery


#endif

allocator.hpp

battery::unique_ptr
Definition unique_ptr.hpp:20

battery::unique_ptr::operator=
CUDA unique_ptr & operator=(unique_ptr< U, Allocator > &&r)
Definition unique_ptr.hpp:74

battery::unique_ptr::allocator_type
Allocator allocator_type
Definition unique_ptr.hpp:24

battery::unique_ptr::operator=
CUDA unique_ptr & operator=(unique_ptr &&r)
Definition unique_ptr.hpp:68

battery::unique_ptr::pointer
T * pointer
Definition unique_ptr.hpp:23

battery::unique_ptr::operator->
CUDA pointer operator->() const
Definition unique_ptr.hpp:111

battery::unique_ptr::unique_ptr
CUDA unique_ptr(unique_ptr< U, Allocator > &&from)
Definition unique_ptr.hpp:47

battery::unique_ptr::unique_ptr
CUDA unique_ptr(this_type &&from)
Definition unique_ptr.hpp:42

battery::unique_ptr::unique_ptr
CUDA unique_ptr(const this_type &)=delete

battery::unique_ptr::operator=
CUDA unique_ptr & operator=(std::nullptr_t)
Definition unique_ptr.hpp:79

battery::unique_ptr::get
CUDA pointer get() const
Definition unique_ptr.hpp:94

battery::unique_ptr::reset
CUDA void reset(pointer ptr=pointer())
Definition unique_ptr.hpp:90

battery::unique_ptr::~unique_ptr
CUDA NI ~unique_ptr()
Definition unique_ptr.hpp:55

battery::unique_ptr::release
CUDA pointer release()
Definition unique_ptr.hpp:84

battery::unique_ptr::get_allocator
CUDA allocator_type get_allocator() const
Definition unique_ptr.hpp:98

battery::unique_ptr::element_type
T element_type
Definition unique_ptr.hpp:22

battery::unique_ptr::unique_ptr
CUDA unique_ptr(const allocator_type &allocator=allocator_type())
Definition unique_ptr.hpp:33

battery::unique_ptr::operator*
CUDA T & operator*() const
Definition unique_ptr.hpp:106

battery::unique_ptr::swap
CUDA void swap(unique_ptr &other)
Definition unique_ptr.hpp:63

battery::unique_ptr::unique_ptr
CUDA unique_ptr(std::nullptr_t, const allocator_type &allocator=allocator_type())
Definition unique_ptr.hpp:35

battery::unique_ptr::this_type
unique_ptr< element_type, allocator_type > this_type
Definition unique_ptr.hpp:25

battery::unique_ptr::unique_ptr
CUDA unique_ptr(pointer ptr, const allocator_type &allocator=allocator_type())
Definition unique_ptr.hpp:39

battery
Definition algorithm.hpp:10

battery::make_unique
CUDA unique_ptr< T, Alloc > make_unique(Args &&... args)
Definition unique_ptr.hpp:133

battery::allocate_unique
CUDA NI unique_ptr< T, Alloc > allocate_unique(const Alloc &alloc, Args &&... args)
Definition unique_ptr.hpp:118

battery::swap
CUDA constexpr void swap(T &a, T &b)
Definition utility.hpp:91

utility.hpp

CUDA
#define CUDA
Definition utility.hpp:59

NI
#define NI
Definition utility.hpp:62