column_device_view.cuh
Go to the documentation of this file.
1 /*
2  * SPDX-FileCopyrightText: Copyright (c) 2019-2025, NVIDIA CORPORATION.
3  * SPDX-License-Identifier: Apache-2.0
4  */
5 #pragma once
6 
9 #include <cudf/detail/utilities/alignment.hpp>
10 #include <cudf/lists/list_view.hpp>
14 #include <cudf/utilities/span.hpp>
16 
17 #include <rmm/cuda_stream_view.hpp>
18 
19 #include <thrust/iterator/counting_iterator.h>
20 #include <thrust/iterator/transform_iterator.h>
21 #include <thrust/pair.h>
22 
23 #include <functional>
24 
30 namespace CUDF_EXPORT cudf {
31 
38 class alignas(16) column_device_view : public column_device_view_core {
39  public:
41 
42  column_device_view() = delete;
43  ~column_device_view() = default;
58 
68  column_device_view(column_view column, void* h_ptr, void* d_ptr);
69 
87  size_type size) const noexcept
88  {
89  return column_device_view{this->type(),
90  size,
91  this->head(),
92  this->null_mask(),
93  this->offset() + offset,
94  static_cast<column_device_view*>(d_children),
95  this->num_child_columns()};
96  }
97 
/**
 * @brief Returns a copy of the element at the specified index.
 *
 * This overload is enabled only when `is_rep_layout_compatible<T>()` is true and
 * delegates the lookup to the `base` implementation.
 *
 * @tparam T The element type
 * @param element_index Position of the desired element
 * @return The value produced by `base::element<T>(element_index)`
 */
template <typename T, CUDF_ENABLE_IF(is_rep_layout_compatible<T>())>
[[nodiscard]] __device__ T element(size_type element_index) const noexcept
{
  return this->base::element<T>(element_index);
}
120 
/**
 * @brief Returns a copy of the `string_view` element at the specified index.
 *
 * This overload is enabled only when `T` is `string_view` and delegates the lookup
 * to the `base` implementation.
 *
 * @tparam T The element type (must be `string_view`)
 * @param element_index Position of the desired element
 * @return The value produced by `base::element<T>(element_index)`
 */
template <typename T, CUDF_ENABLE_IF(cuda::std::is_same_v<T, string_view>)>
[[nodiscard]] __device__ T element(size_type element_index) const noexcept
{
  auto const str = base::element<T>(element_index);
  return str;
}
137 
/**
 * @brief Returns a copy of the fixed-point element at the specified index.
 *
 * This overload is enabled only when `cudf::is_fixed_point<T>()` is true and
 * delegates the lookup to the `base` implementation.
 *
 * @tparam T The fixed-point element type
 * @param element_index Position of the desired element
 * @return The value produced by `base::element<T>(element_index)`
 */
template <typename T, CUDF_ENABLE_IF(cudf::is_fixed_point<T>())>
[[nodiscard]] __device__ T element(size_type element_index) const noexcept
{
  auto const fixed_value = base::element<T>(element_index);
  return fixed_value;
}
153 
154  private:
/**
 * @brief Type-dispatched functor that reads one entry of an indices column as a `size_type`.
 *
 * Invoked through `type_dispatcher` on the type of the indices column. Signed index
 * types are read and converted; every other type hits `CUDF_UNREACHABLE`.
 */
struct index_element_fn {
  /**
   * @brief Reads `indices[index]` as `IndexType` and converts it to `size_type`.
   *
   * @tparam IndexType Signed index type selected by the dispatcher
   * @param indices Column holding the index values
   * @param index Position within `indices` to read
   * @return The index value cast to `size_type`
   */
  template <typename IndexType,
            CUDF_ENABLE_IF(is_index_type<IndexType>() and cuda::std::is_signed_v<IndexType>)>
  __device__ size_type operator()(column_device_view const& indices, size_type index)
  {
    auto const raw_index = indices.element<IndexType>(index);
    return static_cast<size_type>(raw_index);
  }

  /**
   * @brief Fallback for any type that is not a signed index type; never expected to run.
   */
  template <typename IndexType,
            typename... Args,
            CUDF_ENABLE_IF(not(is_index_type<IndexType>() and cuda::std::is_signed_v<IndexType>))>
  __device__ size_type operator()(Args&&...)
  {
    CUDF_UNREACHABLE("dictionary indices must be a signed integral type");
  }
};
176 
177  public:
/**
 * @brief Returns the `dictionary32` element at the specified index.
 *
 * The index value is read from child column 0, at `element_index` shifted by this
 * view's `offset()`, using a type dispatch over the child's data type.
 *
 * @tparam T The element type (must be `dictionary32`)
 * @param element_index Position of the desired element
 * @return A `dictionary32` wrapping the index value stored for that element
 */
template <typename T, CUDF_ENABLE_IF(cuda::std::is_same_v<T, dictionary32>)>
[[nodiscard]] __device__ T element(size_type element_index) const noexcept
{
  auto const dict_indices = child(0);
  // The child is addressed in absolute terms, so apply this view's offset here.
  size_type row           = element_index + offset();
  auto const index_value =
    type_dispatcher(dict_indices.type(), index_element_fn{}, dict_indices, row);
  return dictionary32{index_value};
}
209 
/**
 * @brief For a given `T`, indicates if `column_device_view::element<T>()` has a valid overload.
 *
 * @tparam T The element type to query
 * @return The value of `has_element_accessor_impl<column_device_view, T>`
 */
template <typename T>
CUDF_HOST_DEVICE static constexpr bool has_element_accessor()
{
  using accessor_check = has_element_accessor_impl<column_device_view, T>;
  return accessor_check::value;
}
221 
223  using count_it = thrust::counting_iterator<size_type>;
227  template <typename T>
228  using const_iterator = thrust::transform_iterator<detail::value_accessor<T>, count_it>;
229 
245  template <typename T, CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
246  [[nodiscard]] const_iterator<T> begin() const
247  {
249  }
250 
/**
 * @brief Returns an iterator to the element following the last element of the column.
 *
 * The iterator pairs a counting iterator positioned at `size()` with a
 * `detail::value_accessor<T>` built from this view.
 *
 * @tparam T The element type
 * @return A `const_iterator<T>` positioned at `size()`
 */
template <typename T, CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
[[nodiscard]] const_iterator<T> end() const
{
  count_it const past_last{size()};
  detail::value_accessor<T> const accessor{*this};
  return const_iterator<T>{past_last, accessor};
}
270 
274  template <typename T, typename Nullate>
276  thrust::transform_iterator<detail::optional_accessor<T, Nullate>, count_it>;
277 
281  template <typename T, bool has_nulls>
283  thrust::transform_iterator<detail::pair_accessor<T, has_nulls>, count_it>;
284 
290  template <typename T, bool has_nulls>
292  thrust::transform_iterator<detail::pair_rep_accessor<T, has_nulls>, count_it>;
293 
348  template <typename T,
349  typename Nullate,
350  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
351  auto optional_begin(Nullate has_nulls) const
352  {
355  }
356 
378  template <typename T,
379  bool has_nulls,
380  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
382  {
385  }
386 
410  template <typename T,
411  bool has_nulls,
412  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
414  {
417  }
418 
435  template <typename T,
436  typename Nullate,
437  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
438  auto optional_end(Nullate has_nulls) const
439  {
442  }
443 
455  template <typename T,
456  bool has_nulls,
457  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
459  {
462  }
463 
476  template <typename T,
477  bool has_nulls,
478  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
480  {
483  }
484 
503  static std::unique_ptr<column_device_view, std::function<void(column_device_view*)>> create(
505 
512  void destroy();
513 
521  static std::size_t extent(column_view const& source_view);
522 
/**
 * @brief Returns the specified child.
 *
 * @param child_index Position of the desired child within `d_children`
 * @return A copy of the child view stored at `child_index`
 */
[[nodiscard]] __device__ column_device_view child(size_type child_index) const noexcept
{
  auto* const child_views = static_cast<column_device_view*>(d_children);
  return child_views[child_index];
}
533 
/**
 * @brief Returns a span containing the children of this column.
 *
 * @return A span starting at `d_children` and covering `_num_children` views
 */
[[nodiscard]] __device__ device_span<column_device_view const> children() const noexcept
{
  auto* const first_child = static_cast<column_device_view*>(d_children);
  auto const child_count  = static_cast<std::size_t>(_num_children);
  return {first_child, child_count};
}
543 
/**
 * @brief Returns the number of child columns.
 *
 * @return The stored `_num_children` value
 */
[[nodiscard]] CUDF_HOST_DEVICE size_type num_child_columns() const noexcept
{
  return this->_num_children;
}
553 
554  private:
568  size_type size,
569  void const* data,
570  bitmask_type const* null_mask,
571  size_type offset,
572  column_device_view* children,
573  size_type num_children)
574  : column_device_view_core{type, size, data, null_mask, offset, children, num_children}
575  {
576  }
577 
588  column_device_view(column_view source);
589 };
590 
598  public:
600 
601  mutable_column_device_view() = delete;
602  ~mutable_column_device_view() = default;
617 
628 
647  static std::unique_ptr<mutable_column_device_view,
648  std::function<void(mutable_column_device_view*)>>
651 
/**
 * @brief Returns a reference to the element at the specified index.
 *
 * This overload is enabled only when `is_rep_layout_compatible<T>()` is true and
 * delegates the lookup to the `base` implementation.
 *
 * @tparam T The element type
 * @param element_index Position of the desired element
 * @return The reference produced by `base::element<T>(element_index)`
 */
template <typename T, CUDF_ENABLE_IF(is_rep_layout_compatible<T>())>
[[nodiscard]] __device__ T& element(size_type element_index) const noexcept
{
  return this->base::element<T>(element_index);
}
674 
/**
 * @brief For a given `T`, indicates if `mutable_column_device_view::element<T>()` has a valid
 * overload.
 *
 * @tparam T The element type to query
 * @return The value of `has_element_accessor_impl<mutable_column_device_view, T>`
 */
template <typename T>
CUDF_HOST_DEVICE static constexpr bool has_element_accessor()
{
  using accessor_check = has_element_accessor_impl<mutable_column_device_view, T>;
  return accessor_check::value;
}
686 
688  using count_it = thrust::counting_iterator<size_type>;
692  template <typename T>
693  using iterator = thrust::transform_iterator<detail::mutable_value_accessor<T>, count_it>;
694 
705  template <typename T, CUDF_ENABLE_IF(mutable_column_device_view::has_element_accessor<T>())>
707  {
709  }
710 
721  template <typename T, CUDF_ENABLE_IF(mutable_column_device_view::has_element_accessor<T>())>
723  {
725  }
726 
/**
 * @brief Returns the specified child.
 *
 * @param child_index Position of the desired child within `d_children`
 * @return A copy of the child view stored at `child_index`
 */
[[nodiscard]] __device__ mutable_column_device_view child(size_type child_index) const noexcept
{
  auto* const child_views = static_cast<mutable_column_device_view*>(d_children);
  return child_views[child_index];
}
737 
746  static std::size_t extent(mutable_column_view source_view);
747 
754  void destroy();
755 
756  private:
766 };
767 
// column_device_view pointers are obtained from `d_children` via static_cast in this file,
// so the derived view must not be larger than (or differ in size from) its core base.
// The message names the type that is actually compared against.
static_assert(sizeof(column_device_view) == sizeof(column_device_view_core),
              "column_device_view and column_device_view_core must be bitwise-compatible");
770 
771 static_assert(
773  "mutable_column_device_view and raw_mutable_column_device_view must be bitwise-compatible");
774 
775 namespace detail {
776 
791 template <typename T>
794 
/**
 * @brief Constructor.
 *
 * Stores a copy of the column view and verifies that `T` matches the device storage
 * type of the column's type id.
 *
 * @throws via `CUDF_EXPECTS` with "the data type mismatch" when the check fails
 * @param _col Column on device
 */
value_accessor(column_device_view const& _col) : col{_col}
{
  auto const stored_id = col.type().id();
  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(stored_id), "the data type mismatch");
}
804 
/**
 * @brief Returns the value of the element at index `i`.
 *
 * @param i Index of the element
 * @return `col.element<T>(i)`
 */
__device__ T operator()(cudf::size_type i) const
{
  return col.element<T>(i);
}
811 };
812 
839 template <typename T, typename Nullate>
842 
/**
 * @brief Constructor.
 *
 * Stores a copy of the column view and the null-handling indicator, then validates them:
 * `T` must match the column's device storage type, and when `with_nulls` evaluates to
 * true the column must be nullable.
 *
 * @throws via `CUDF_EXPECTS` with "the data type mismatch" or
 *         "Unexpected non-nullable column." when a check fails
 * @param _col Column on device
 * @param with_nulls Indicates whether null checking is requested
 */
optional_accessor(column_device_view const& _col, Nullate with_nulls)
  : col{_col}, has_nulls{with_nulls}
{
  auto const stored_id = col.type().id();
  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(stored_id), "the data type mismatch");
  if (with_nulls) {
    bool const can_hold_nulls = _col.nullable();
    CUDF_EXPECTS(can_hold_nulls, "Unexpected non-nullable column.");
  }
}
855 
/**
 * @brief Returns a `cuda::std::optional` of `column[i]`.
 *
 * When `has_nulls` is true and element `i` is not valid, the result is disengaged;
 * otherwise it holds `col.element<T>(i)`.
 *
 * @param i Index of the element
 * @return The optional value for element `i`
 */
__device__ inline cuda::std::optional<T> operator()(cudf::size_type i) const
{
  using result_type = cuda::std::optional<T>;
  if (has_nulls) {
    // Only consult the validity of row i when null handling was requested.
    if (not col.is_valid_nocheck(i)) { return result_type{cuda::std::nullopt}; }
  }
  return result_type{col.element<T>(i)};
}
871 
872  Nullate has_nulls{};
873 };
874 
894 template <typename T, bool has_nulls = false>
897 
/**
 * @brief Constructor.
 *
 * Stores a copy of the column view and validates it: `T` must match the column's
 * device storage type, and when `has_nulls` is true the column must be nullable.
 *
 * @throws via `CUDF_EXPECTS` with "the data type mismatch" or
 *         "Unexpected non-nullable column." when a check fails
 * @param _col Column on device
 */
pair_accessor(column_device_view const& _col) : col{_col}
{
  auto const stored_id = col.type().id();
  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(stored_id), "the data type mismatch");
  if constexpr (has_nulls) {
    CUDF_EXPECTS(_col.nullable(), "Unexpected non-nullable column.");
  }
}
908 
/**
 * @brief Pair accessor.
 *
 * @param i Index of the element
 * @return A pair of `col.element<T>(i)` and a validity flag; the flag is always `true`
 *         when `has_nulls` is false, otherwise it is `col.is_valid_nocheck(i)`
 */
__device__ inline thrust::pair<T, bool> operator()(cudf::size_type i) const
{
  auto const value = col.element<T>(i);
  bool valid       = true;
  if constexpr (has_nulls) { valid = col.is_valid_nocheck(i); }
  return {value, valid};
}
919 };
920 
940 template <typename T, bool has_nulls = false>
943 
945 
/**
 * @brief Constructor.
 *
 * Stores a copy of the column view and validates it: `T` must match the column's
 * device storage type, and when `has_nulls` is true the column must be nullable.
 *
 * @throws via `CUDF_EXPECTS` with "the data type mismatch" or
 *         "Unexpected non-nullable column." when a check fails
 * @param _col Column on device
 */
pair_rep_accessor(column_device_view const& _col) : col{_col}
{
  auto const stored_id = col.type().id();
  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(stored_id), "the data type mismatch");
  if constexpr (has_nulls) {
    CUDF_EXPECTS(_col.nullable(), "Unexpected non-nullable column.");
  }
}
956 
/**
 * @brief Pair accessor.
 *
 * @param i Index of the element
 * @return A pair of the representation value from `get_rep<T>(i)` and a validity flag;
 *         the flag is always `true` when `has_nulls` is false, otherwise it is
 *         `col.is_valid_nocheck(i)`
 */
__device__ inline thrust::pair<rep_type, bool> operator()(cudf::size_type i) const
{
  auto const rep = get_rep<T>(i);
  bool valid     = true;
  if constexpr (has_nulls) { valid = col.is_valid_nocheck(i); }
  return {rep, valid};
}
967 
968  private:
/**
 * @brief Fetches element `i` in its representation form.
 *
 * When `R` is already `rep_type` the element is returned as read; otherwise the
 * element is read as `R` and its `.value()` is returned.
 *
 * @tparam R Type used to read the element from the column
 * @param i Index of the element
 * @return The representation value for element `i`
 */
template <typename R>
[[nodiscard]] __device__ inline auto get_rep(cudf::size_type i) const
{
  if constexpr (std::is_same_v<R, rep_type>) {
    return col.element<R>(i);
  } else {
    return col.element<R>(i).value();
  }
}
982 };
983 
995 template <typename T>
998 
1005  {
1006  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(col.type().id()), "the data type mismatch");
1007  }
1008 
/**
 * @brief Accessor.
 *
 * @param i Index of the element
 * @return The reference produced by `col.element<T>(i)`
 */
__device__ T& operator()(cudf::size_type i)
{
  return col.element<T>(i);
}
1016 };
1017 
/**
 * @brief Builds the host-side image of an array of child device views.
 *
 * Both `h_ptr` and `d_ptr` are first aligned for `ColumnDeviceView`. One
 * `ColumnDeviceView` per child is placement-constructed in host memory starting at the
 * aligned `h_ptr`; storage for each child's own nested data is handed out from the
 * region that follows the array, tracked in parallel for the host and device buffers.
 *
 * @tparam ColumnDeviceView Device view type to construct for every child
 * @tparam ColumnViewIterator Iterator over the child column views
 * @param child_begin Iterator to the first child view
 * @param child_end Iterator past the last child view
 * @param h_ptr Host memory in which the child views are constructed
 * @param d_ptr Device memory whose addresses are recorded for the child views
 * @return The aligned `d_ptr`, typed as `ColumnDeviceView*`
 */
template <typename ColumnDeviceView, typename ColumnViewIterator>
ColumnDeviceView* child_columns_to_device_array(ColumnViewIterator child_begin,
                                                ColumnViewIterator child_end,
                                                void* h_ptr,
                                                void* d_ptr)
{
  ColumnDeviceView* const d_array = detail::align_ptr_for_type<ColumnDeviceView>(d_ptr);
  auto const child_count          = std::distance(child_begin, child_end);

  // Nothing to construct: the aligned device pointer is still the result.
  if (child_count <= 0) { return d_array; }

  // The fixed-size view objects come first so that d_array can be indexed as an array.
  ColumnDeviceView* h_slot = detail::align_ptr_for_type<ColumnDeviceView>(h_ptr);

  // Nested child data lives just past the end of the array in each buffer.
  auto* h_tail = reinterpret_cast<int8_t*>(h_slot + child_count);
  auto* d_tail = reinterpret_cast<int8_t*>(d_array + child_count);

  for (auto it = child_begin; it != child_end; ++it) {
    auto const& child_view = *it;

    // Construct this child in place in host memory, then move on to the next slot.
    new (h_slot) ColumnDeviceView(child_view, h_tail, d_tail);
    ++h_slot;

    // Skip over the space used by this child's own nested data.
    auto const nested_bytes = ColumnDeviceView::extent(child_view) - sizeof(ColumnDeviceView);
    h_tail += nested_bytes;
    d_tail += nested_bytes;
  }
  return d_array;
}
1072 
1073 } // namespace detail
1074 } // namespace CUDF_EXPORT cudf
An immutable, non-owning view of device data as a column of elements that is trivially copyable and usable in CUDA device code.
An immutable, non-owning view of device data as a column of elements that is trivially copyable and usable in CUDA device code.
static std::unique_ptr< column_device_view, std::function< void(column_device_view *)> > create(column_view source_view, rmm::cuda_stream_view stream=cudf::get_default_stream())
Factory to construct a column view that is usable in device memory.
column_device_view child(size_type child_index) const noexcept
Returns the specified child.
void destroy()
Destroy the column_device_view object.
column_device_view & operator=(column_device_view &&)=default
Move assignment operator.
thrust::counting_iterator< size_type > count_it
Counting iterator.
static constexpr CUDF_HOST_DEVICE bool has_element_accessor()
For a given T, indicates if column_device_view::element<T>() has a valid overload.
const_pair_iterator< T, has_nulls > pair_end() const
Return a pair iterator to the element following the last element of the column.
const_pair_rep_iterator< T, has_nulls > pair_rep_end() const
Return a pair iterator to the element following the last element of the column.
const_pair_iterator< T, has_nulls > pair_begin() const
Return a pair iterator to the first element of the column.
T element(size_type element_index) const noexcept
Returns a copy of the element at the specified index.
column_device_view & operator=(column_device_view const &)=default
Copy assignment operator.
CUDF_HOST_DEVICE column_device_view slice(size_type offset, size_type size) const noexcept
Get a new column_device_view which is a slice of this column.
thrust::transform_iterator< detail::value_accessor< T >, count_it > const_iterator
Iterator for navigating this column.
auto optional_end(Nullate has_nulls) const
Return an optional iterator to the element following the last element of the column.
thrust::transform_iterator< detail::pair_accessor< T, has_nulls >, count_it > const_pair_iterator
Pair iterator for navigating this column.
const_pair_rep_iterator< T, has_nulls > pair_rep_begin() const
Return a pair iterator to the first element of the column.
thrust::transform_iterator< detail::optional_accessor< T, Nullate >, count_it > const_optional_iterator
Optional iterator for navigating this column.
CUDF_HOST_DEVICE size_type num_child_columns() const noexcept
Returns the number of child columns.
auto optional_begin(Nullate has_nulls) const
Return an optional iterator to the first element of the column.
column_device_view(column_device_view const &)=default
Copy constructor.
column_device_view(column_device_view &&)=default
Move constructor.
const_iterator< T > begin() const
Return an iterator to the first element of the column.
thrust::transform_iterator< detail::pair_rep_accessor< T, has_nulls >, count_it > const_pair_rep_iterator
Pair rep iterator for navigating this column.
static std::size_t extent(column_view const &source_view)
Return the size in bytes of the amount of memory needed to hold a device view of the specified column...
column_device_view(column_view column, void *h_ptr, void *d_ptr)
Creates an instance of this class using the specified host memory pointer (h_ptr) to store child obje...
const_iterator< T > end() const
Returns an iterator to the element following the last element of the column.
device_span< column_device_view const > children() const noexcept
Returns a span containing the children of this column.
A non-owning, immutable view of device data as a column of elements, some of which may be null as indicated by a bitmask.
A container of nullable device data as a column of elements.
Definition: column.hpp:36
Indicator for the logical data type of an element in a column.
Definition: types.hpp:238
constexpr CUDF_HOST_DEVICE type_id id() const noexcept
Returns the type identifier.
Definition: types.hpp:282
CUDF_HOST_DEVICE data_type type() const noexcept
Returns the element type.
bool is_valid_nocheck(size_type element_index) const noexcept
Returns whether the specified element holds a valid value (i.e., not null)
CUDF_HOST_DEVICE bool nullable() const noexcept
Indicates whether the column can contain null elements, i.e., if it has an allocated bitmask.
A mutable, non-owning view of device data as a column of elements that is trivially copyable and usable in CUDA device code.
A mutable, non-owning view of device data as a column of elements that is trivially copyable and usable in CUDA device code.
static constexpr CUDF_HOST_DEVICE bool has_element_accessor()
For a given T, indicates if mutable_column_device_view::element<T>() has a valid overload.
void destroy()
Destroy the mutable_column_device_view object.
mutable_column_device_view(mutable_column_view column, void *h_ptr, void *d_ptr)
Creates an instance of this class using the specified host memory pointer (h_ptr) to store child obje...
static std::size_t extent(mutable_column_view source_view)
Return the size in bytes of the amount of memory needed to hold a device view of the specified column...
thrust::counting_iterator< size_type > count_it
Counting iterator.
mutable_column_device_view child(size_type child_index) const noexcept
Returns the specified child.
mutable_column_device_view(mutable_column_device_view const &)=default
Copy constructor.
T & element(size_type element_index) const noexcept
Returns reference to element at the specified index.
iterator< T > end()
Return one past the last element after underlying data is cast to the specified type.
mutable_column_device_view & operator=(mutable_column_device_view &&)=default
Move assignment operator.
mutable_column_device_view(mutable_column_device_view &&)=default
Move constructor.
mutable_column_device_view & operator=(mutable_column_device_view const &)=default
Copy assignment operator.
static std::unique_ptr< mutable_column_device_view, std::function< void(mutable_column_device_view *)> > create(mutable_column_view source_view, rmm::cuda_stream_view stream=cudf::get_default_stream())
Factory to construct a column view that is usable in device memory.
thrust::transform_iterator< detail::mutable_value_accessor< T >, count_it > iterator
Iterator for navigating this column.
iterator< T > begin()
Return first element (accounting for offset) after underlying data is cast to the specified type.
A non-owning, mutable view of device data as a column of elements, some of which may be null as indicated by a bitmask.
ColumnDeviceView * child_columns_to_device_array(ColumnViewIterator child_begin, ColumnViewIterator child_end, void *h_ptr, void *d_ptr)
Helper function for use by column_device_view and mutable_column_device_view constructors to build de...
Column device view class definitions.
column view class definitions
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
CUDF_HOST_DEVICE constexpr decltype(auto) __forceinline__ type_dispatcher(cudf::data_type dtype, Functor f, Ts &&... args)
Invokes an operator() template with the type instantiation based on the specified cudf::data_type's id().
std::conditional_t< std::is_same_v< numeric::decimal32, T >, int32_t, std::conditional_t< std::is_same_v< numeric::decimal64, T >, int64_t, std::conditional_t< std::is_same_v< numeric::decimal128, T >, __int128_t, T > >> device_storage_type_t
"Returns" the corresponding type that is stored on the device when using cudf::column
#define CUDF_EXPECTS(...)
Macro for checking (pre-)conditions that throws an exception when a condition is violated.
Definition: error.hpp:143
int32_t size_type
Row index type for columns and tables.
Definition: types.hpp:84
uint32_t bitmask_type
Bitmask type stored as 32-bit unsigned integer.
Definition: types.hpp:85
size_type distance(T f, T l)
Similar to std::distance but returns cudf::size_type and performs static_cast
Definition: types.hpp:99
#define CUDF_ENABLE_IF(...)
Convenience macro for SFINAE as an unnamed template parameter.
Definition: traits.hpp:39
Class definition for cudf::list_view.
cuDF interfaces
Definition: host_udf.hpp:26
bool has_nulls(table_view const &view)
Returns True if the table has nulls in any of its columns.
APIs for spans.
Class definition for cudf::strings_column_view.
Class definition for cudf::struct_view.
Mutable value accessor of column without null bitmask.
T & operator()(cudf::size_type i)
Accessor.
mutable_value_accessor(mutable_column_device_view &_col)
Constructor.
mutable_column_device_view col
mutable column view of column in device
optional accessor of a column
cuda::std::optional< T > operator()(cudf::size_type i) const
Returns a cuda::std::optional of column[i].
column_device_view const col
column view of column in device
optional_accessor(column_device_view const &_col, Nullate with_nulls)
Constructor.
pair accessor of column with/without null bitmask
column_device_view const col
column view of column in device
thrust::pair< T, bool > operator()(cudf::size_type i) const
Pair accessor.
pair_accessor(column_device_view const &_col)
constructor
pair accessor of column with/without null bitmask
thrust::pair< rep_type, bool > operator()(cudf::size_type i) const
Pair accessor.
column_device_view const col
column view of column in device
device_storage_type_t< T > rep_type
representation type
pair_rep_accessor(column_device_view const &_col)
constructor
value accessor of column without null bitmask
column_device_view const col
column view of column in device
value_accessor(column_device_view const &_col)
constructor
T operator()(cudf::size_type i) const
Returns the value of element at index i
Device version of C++20 std::span with reduced feature set.
Definition: span.hpp:323
A strongly typed wrapper for indices in a DICTIONARY type column.
Definition: dictionary.hpp:38
Defines the mapping between cudf::type_id runtime type information and concrete C++ types.
#define CUDF_HOST_DEVICE
Indicates that the function or method is usable on host and device.
Definition: types.hpp:21