column_device_view.cuh
Go to the documentation of this file.
1 /*
2  * SPDX-FileCopyrightText: Copyright (c) 2019-2026, NVIDIA CORPORATION.
3  * SPDX-License-Identifier: Apache-2.0
4  */
5 #pragma once
6 
9 #include <cudf/detail/utilities/alignment.hpp>
10 #include <cudf/lists/list_view.hpp>
14 #include <cudf/utilities/span.hpp>
16 
17 #include <rmm/cuda_stream_view.hpp>
18 
19 #include <cuda/std/utility>
20 #include <thrust/iterator/counting_iterator.h>
21 #include <thrust/iterator/transform_iterator.h>
22 
23 #include <functional>
24 
30 namespace CUDF_EXPORT cudf {
31 
38 class alignas(16) column_device_view : public column_device_view_core {
39  public:
41 
42  column_device_view() = delete;
43  ~column_device_view() = default;
58 
68  column_device_view(column_view column, void* h_ptr, void* d_ptr);
69 
87  size_type size) const noexcept
88  {
89  return column_device_view{this->type(),
90  size,
91  this->head(),
92  this->null_count(),
93  this->null_mask(),
94  this->offset() + offset,
95  static_cast<column_device_view*>(d_children),
96  this->num_child_columns()};
97  }
98 
/**
 * @brief Returns a copy of the element at the specified index.
 *
 * This overload participates in overload resolution only when
 * `is_rep_layout_compatible<T>()` is true. The read itself is delegated to
 * `base::element<T>`.
 *
 * @tparam T The element type
 * @param element_index Position of the desired element
 * @return The element at `element_index`, as produced by `base::element<T>`
 */
116  template <typename T, CUDF_ENABLE_IF(is_rep_layout_compatible<T>())>
117  [[nodiscard]] __device__ T element(size_type element_index) const noexcept
118  {
119  return base::element<T>(element_index);
120  }
121 
/**
 * @brief Returns a copy of the `string_view` element at the specified index.
 *
 * This overload is selected only when `T` is exactly `string_view`. The read
 * itself is delegated to `base::element<T>`.
 *
 * @tparam T The element type; must be `string_view`
 * @param element_index Position of the desired element
 * @return The element at `element_index`, as produced by `base::element<T>`
 */
133  template <typename T, CUDF_ENABLE_IF(cuda::std::is_same_v<T, string_view>)>
134  [[nodiscard]] __device__ T element(size_type element_index) const noexcept
135  {
136  return base::element<T>(element_index);
137  }
138 
/**
 * @brief Returns a copy of the fixed-point element at the specified index.
 *
 * This overload is selected only when `cudf::is_fixed_point<T>()` is true. The
 * read itself is delegated to `base::element<T>`.
 *
 * @tparam T The element type; must satisfy `cudf::is_fixed_point<T>()`
 * @param element_index Position of the desired element
 * @return The element at `element_index`, as produced by `base::element<T>`
 */
149  template <typename T, CUDF_ENABLE_IF(cudf::is_fixed_point<T>())>
150  [[nodiscard]] __device__ T element(size_type element_index) const noexcept
151  {
152  return base::element<T>(element_index);
153  }
154 
155  private:
161  struct index_element_fn {
162  template <typename IndexType,
163  CUDF_ENABLE_IF(is_index_type<IndexType>() and cuda::std::is_signed_v<IndexType>)>
164  __device__ size_type operator()(column_device_view const& indices, size_type index)
165  {
166  return static_cast<size_type>(indices.element<IndexType>(index));
167  }
168 
169  template <typename IndexType,
170  typename... Args,
171  CUDF_ENABLE_IF(not(is_index_type<IndexType>() and cuda::std::is_signed_v<IndexType>))>
172  __device__ size_type operator()(Args&&... args)
173  {
174  CUDF_UNREACHABLE("dictionary indices must be a signed integral type");
175  }
176  };
177 
178  public:
203  template <typename T, CUDF_ENABLE_IF(cuda::std::is_same_v<T, dictionary32>)>
204  [[nodiscard]] __device__ T element(size_type element_index) const noexcept
205  {
206  size_type index = element_index + offset(); // account for this view's _offset
207  auto const indices = child(0);
208  return dictionary32{type_dispatcher(indices.type(), index_element_fn{}, indices, index)};
209  }
210 
/**
 * @brief For a given `T`, indicates if `column_device_view::element<T>()` has a
 * valid overload.
 *
 * The answer is taken from `has_element_accessor_impl<column_device_view, T>::value`.
 *
 * @tparam T The element type to query
 * @return The value of `has_element_accessor_impl<column_device_view, T>::value`
 */
217  template <typename T>
218  CUDF_HOST_DEVICE static constexpr bool has_element_accessor()
219  {
220  return has_element_accessor_impl<column_device_view, T>::value;
221  }
222 
224  using count_it = thrust::counting_iterator<size_type>;
228  template <typename T>
229  using const_iterator = thrust::transform_iterator<detail::value_accessor<T>, count_it>;
230 
246  template <typename T, CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
247  [[nodiscard]] const_iterator<T> begin() const
248  {
250  }
251 
266  template <typename T, CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
267  [[nodiscard]] const_iterator<T> end() const
268  {
269  return const_iterator<T>{count_it{size()}, detail::value_accessor<T>{*this}};
270  }
271 
275  template <typename T, typename Nullate>
277  thrust::transform_iterator<detail::optional_accessor<T, Nullate>, count_it>;
278 
282  template <typename T, bool has_nulls>
284  thrust::transform_iterator<detail::pair_accessor<T, has_nulls>, count_it>;
285 
291  template <typename T, bool has_nulls>
293  thrust::transform_iterator<detail::pair_rep_accessor<T, has_nulls>, count_it>;
294 
349  template <typename T,
350  typename Nullate,
351  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
352  auto optional_begin(Nullate has_nulls) const
353  {
356  }
357 
379  template <typename T,
380  bool has_nulls,
381  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
383  {
386  }
387 
411  template <typename T,
412  bool has_nulls,
413  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
415  {
418  }
419 
436  template <typename T,
437  typename Nullate,
438  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
439  auto optional_end(Nullate has_nulls) const
440  {
443  }
444 
456  template <typename T,
457  bool has_nulls,
458  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
460  {
463  }
464 
477  template <typename T,
478  bool has_nulls,
479  CUDF_ENABLE_IF(column_device_view::has_element_accessor<T>())>
481  {
484  }
485 
504  static std::unique_ptr<column_device_view, std::function<void(column_device_view*)>> create(
506 
513  void destroy();
514 
522  static std::size_t extent(column_view const& source_view);
523 
530  [[nodiscard]] __device__ column_device_view child(size_type child_index) const noexcept
531  {
532  return static_cast<column_device_view*>(d_children)[child_index];
533  }
534 
540  [[nodiscard]] __device__ device_span<column_device_view const> children() const noexcept
541  {
542  return {static_cast<column_device_view*>(d_children), static_cast<std::size_t>(_num_children)};
543  }
544 
/**
 * @brief Returns the number of child columns.
 *
 * @return The stored `_num_children` value
 */
550  [[nodiscard]] CUDF_HOST_DEVICE size_type num_child_columns() const noexcept
551  {
552  return _num_children;
553  }
554 
555  private:
570  size_type size,
571  void const* data,
573  bitmask_type const* null_mask,
574  size_type offset,
575  column_device_view* children,
576  size_type num_children)
578  type, size, data, null_count, null_mask, offset, children, num_children}
579  {
580  }
581 
592  column_device_view(column_view source);
593 };
594 
602  public:
604 
605  mutable_column_device_view() = delete;
606  ~mutable_column_device_view() = default;
621 
632 
651  static std::unique_ptr<mutable_column_device_view,
652  std::function<void(mutable_column_device_view*)>>
655 
/**
 * @brief Returns a reference to the element at the specified index.
 *
 * This overload participates in overload resolution only when
 * `is_rep_layout_compatible<T>()` is true. The access itself is delegated to
 * `base::element<T>`.
 *
 * @tparam T The element type
 * @param element_index Position of the desired element
 * @return Reference to the element at `element_index`
 */
673  template <typename T, CUDF_ENABLE_IF(is_rep_layout_compatible<T>())>
674  [[nodiscard]] __device__ T& element(size_type element_index) const noexcept
675  {
676  return base::element<T>(element_index);
677  }
678 
/**
 * @brief For a given `T`, indicates if `mutable_column_device_view::element<T>()`
 * has a valid overload.
 *
 * The answer is taken from
 * `has_element_accessor_impl<mutable_column_device_view, T>::value`.
 *
 * @tparam T The element type to query
 * @return The value of `has_element_accessor_impl<mutable_column_device_view, T>::value`
 */
685  template <typename T>
686  CUDF_HOST_DEVICE static constexpr bool has_element_accessor()
687  {
688  return has_element_accessor_impl<mutable_column_device_view, T>::value;
689  }
690 
692  using count_it = thrust::counting_iterator<size_type>;
696  template <typename T>
697  using iterator = thrust::transform_iterator<detail::mutable_value_accessor<T>, count_it>;
698 
709  template <typename T, CUDF_ENABLE_IF(mutable_column_device_view::has_element_accessor<T>())>
711  {
713  }
714 
725  template <typename T, CUDF_ENABLE_IF(mutable_column_device_view::has_element_accessor<T>())>
727  {
729  }
730 
737  [[nodiscard]] __device__ mutable_column_device_view child(size_type child_index) const noexcept
738  {
739  return static_cast<mutable_column_device_view*>(d_children)[child_index];
740  }
741 
750  static std::size_t extent(mutable_column_view source_view);
751 
758  void destroy();
759 
760  private:
770 };
771 
772 static_assert(sizeof(column_device_view) == sizeof(column_device_view_core),
773  "column_device_view and raw_column_device_view must be bitwise-compatible");
774 
775 static_assert(
777  "mutable_column_device_view and raw_mutable_column_device_view must be bitwise-compatible");
778 
779 namespace detail {
780 
795 template <typename T>
798 
/**
 * @brief Constructor.
 *
 * Stores a copy of `_col` and checks, via `CUDF_EXPECTS`, that the column's
 * type id matches the device storage type of `T`. `CUDF_EXPECTS` throws when
 * the condition is violated.
 *
 * @param _col Column on device that this accessor reads from
 */
804  value_accessor(column_device_view const& _col) : col{_col}
805  {
806  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(col.type().id()), "the data type mismatch");
807  }
808 
/**
 * @brief Returns the value of the element at index `i`.
 *
 * @param i Index of the element
 * @return Result of `col.element<T>(i)`
 */
814  __device__ T operator()(cudf::size_type i) const { return col.element<T>(i); }
815 };
816 
843 template <typename T, typename Nullate>
846 
/**
 * @brief Constructor.
 *
 * Stores a copy of `_col` and of `with_nulls`, then validates both through
 * `CUDF_EXPECTS`, which throws when a condition is violated:
 *  - the column's type id must match the device storage type of `T`;
 *  - when `with_nulls` evaluates to true, the column must be nullable.
 *
 * @param _col Column on device that this accessor reads from
 * @param with_nulls Indicates whether validity should be consulted on access
 */
853  optional_accessor(column_device_view const& _col, Nullate with_nulls)
854  : col{_col}, has_nulls{with_nulls}
855  {
856  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(col.type().id()), "the data type mismatch");
857  if (with_nulls) { CUDF_EXPECTS(_col.nullable(), "Unexpected non-nullable column."); }
858  }
859 
867  __device__ inline cuda::std::optional<T> operator()(cudf::size_type i) const
868  {
869  if (has_nulls) {
870  return (col.is_valid_nocheck(i)) ? cuda::std::optional<T>{col.element<T>(i)}
871  : cuda::std::optional<T>{cuda::std::nullopt};
872  }
873  return cuda::std::optional<T>{col.element<T>(i)};
874  }
875 
876  Nullate has_nulls{};
877 };
878 
898 template <typename T, bool has_nulls = false>
901 
/**
 * @brief Constructor.
 *
 * Stores a copy of `_col`, then validates through `CUDF_EXPECTS`, which throws
 * when a condition is violated:
 *  - the column's type id must match the device storage type of `T`;
 *  - when `has_nulls` is true, the column must be nullable.
 *
 * @param _col Column on device that this accessor reads from
 */
907  pair_accessor(column_device_view const& _col) : col{_col}
908  {
909  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(col.type().id()), "the data type mismatch");
910  if (has_nulls) { CUDF_EXPECTS(_col.nullable(), "Unexpected non-nullable column."); }
911  }
912 
919  __device__ inline cuda::std::pair<T, bool> operator()(cudf::size_type i) const
920  {
921  return {col.element<T>(i), (has_nulls ? col.is_valid_nocheck(i) : true)};
922  }
923 };
924 
944 template <typename T, bool has_nulls = false>
947 
949 
/**
 * @brief Constructor.
 *
 * Stores a copy of `_col`, then validates through `CUDF_EXPECTS`, which throws
 * when a condition is violated:
 *  - the column's type id must match the device storage type of `T`;
 *  - when `has_nulls` is true, the column must be nullable.
 *
 * @param _col Column on device that this accessor reads from
 */
955  pair_rep_accessor(column_device_view const& _col) : col{_col}
956  {
957  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(col.type().id()), "the data type mismatch");
958  if (has_nulls) { CUDF_EXPECTS(_col.nullable(), "Unexpected non-nullable column."); }
959  }
960 
967  __device__ inline cuda::std::pair<rep_type, bool> operator()(cudf::size_type i) const
968  {
969  return {get_rep<T>(i), (has_nulls ? col.is_valid_nocheck(i) : true)};
970  }
971 
972  private:
973  template <typename R>
974  [[nodiscard]] __device__ inline auto get_rep(cudf::size_type i) const
975  requires(std::is_same_v<R, rep_type>)
976  {
977  return col.element<R>(i);
978  }
979 
980  template <typename R>
981  [[nodiscard]] __device__ inline auto get_rep(cudf::size_type i) const
982  requires(not std::is_same_v<R, rep_type>)
983  {
984  return col.element<R>(i).value();
985  }
986 };
987 
999 template <typename T>
1002 
1009  {
1010  CUDF_EXPECTS(type_id_matches_device_storage_type<T>(col.type().id()), "the data type mismatch");
1011  }
1012 
/**
 * @brief Accessor.
 *
 * @param i Index of the element
 * @return Reference obtained from `col.element<T>(i)`
 */
1019  __device__ T& operator()(cudf::size_type i) { return col.element<T>(i); }
1020 };
1021 
1047 template <typename ColumnDeviceView, typename ColumnViewIterator>
1048 ColumnDeviceView* child_columns_to_device_array(ColumnViewIterator child_begin,
1049  ColumnViewIterator child_end,
1050  void* h_ptr,
1051  void* d_ptr)
1052 {
1053  ColumnDeviceView* d_children = detail::align_ptr_for_type<ColumnDeviceView>(d_ptr);
1054  auto num_children = std::distance(child_begin, child_end);
1055  if (num_children > 0) {
1056  // The beginning of the memory must be the fixed-sized ColumnDeviceView
1057  // struct objects in order for d_children to be used as an array.
1058  auto h_column = detail::align_ptr_for_type<ColumnDeviceView>(h_ptr);
1059  auto d_column = d_children;
1060 
1061  // Any child data is assigned past the end of this array: h_end and d_end.
1062  auto h_end = reinterpret_cast<int8_t*>(h_column + num_children);
1063  auto d_end = reinterpret_cast<int8_t*>(d_column + num_children);
1064  std::for_each(child_begin, child_end, [&](auto const& col) {
1065  // inplace-new each child into host memory
1066  new (h_column) ColumnDeviceView(col, h_end, d_end);
1067  h_column++; // advance to next child
1068  // update the pointers for holding this child column's child data
1069  auto col_child_data_size = ColumnDeviceView::extent(col) - sizeof(ColumnDeviceView);
1070  h_end += col_child_data_size;
1071  d_end += col_child_data_size;
1072  });
1073  }
1074  return d_children;
1075 }
1076 
1077 } // namespace detail
1078 } // namespace CUDF_EXPORT cudf
An immutable, non-owning view of device data as a column of elements that is trivially copyable and u...
An immutable, non-owning view of device data as a column of elements that is trivially copyable and u...
static std::unique_ptr< column_device_view, std::function< void(column_device_view *)> > create(column_view source_view, rmm::cuda_stream_view stream=cudf::get_default_stream())
Factory to construct a column view that is usable in device memory.
column_device_view child(size_type child_index) const noexcept
Returns the specified child.
void destroy()
Destroy the column_device_view object.
column_device_view & operator=(column_device_view &&)=default
Move assignment operator.
thrust::counting_iterator< size_type > count_it
Counting iterator.
static constexpr CUDF_HOST_DEVICE bool has_element_accessor()
For a given T, indicates if column_device_view::element<T>() has a valid overload.
const_pair_iterator< T, has_nulls > pair_end() const
Return a pair iterator to the element following the last element of the column.
const_pair_rep_iterator< T, has_nulls > pair_rep_end() const
Return a pair iterator to the element following the last element of the column.
const_pair_iterator< T, has_nulls > pair_begin() const
Return a pair iterator to the first element of the column.
T element(size_type element_index) const noexcept
Returns a copy of the element at the specified index.
column_device_view & operator=(column_device_view const &)=default
Copy assignment operator.
CUDF_HOST_DEVICE column_device_view slice(size_type offset, size_type size) const noexcept
Get a new column_device_view which is a slice of this column.
thrust::transform_iterator< detail::value_accessor< T >, count_it > const_iterator
Iterator for navigating this column.
auto optional_end(Nullate has_nulls) const
Return an optional iterator to the element following the last element of the column.
thrust::transform_iterator< detail::pair_accessor< T, has_nulls >, count_it > const_pair_iterator
Pair iterator for navigating this column.
const_pair_rep_iterator< T, has_nulls > pair_rep_begin() const
Return a pair iterator to the first element of the column.
thrust::transform_iterator< detail::optional_accessor< T, Nullate >, count_it > const_optional_iterator
Optional iterator for navigating this column.
CUDF_HOST_DEVICE size_type num_child_columns() const noexcept
Returns the number of child columns.
auto optional_begin(Nullate has_nulls) const
Return an optional iterator to the first element of the column.
column_device_view(column_device_view const &)=default
Copy constructor.
column_device_view(column_device_view &&)=default
Move constructor.
const_iterator< T > begin() const
Return an iterator to the first element of the column.
thrust::transform_iterator< detail::pair_rep_accessor< T, has_nulls >, count_it > const_pair_rep_iterator
Pair rep iterator for navigating this column.
static std::size_t extent(column_view const &source_view)
Return the size in bytes of the amount of memory needed to hold a device view of the specified column...
column_device_view(column_view column, void *h_ptr, void *d_ptr)
Creates an instance of this class using the specified host memory pointer (h_ptr) to store child obje...
const_iterator< T > end() const
Returns an iterator to the element following the last element of the column.
device_span< column_device_view const > children() const noexcept
Returns a span containing the children of this column.
A non-owning, immutable view of device data as a column of elements, some of which may be null as ind...
A container of nullable device data as a column of elements.
Definition: column.hpp:36
Indicator for the logical data type of an element in a column.
Definition: types.hpp:277
constexpr CUDF_HOST_DEVICE type_id id() const noexcept
Returns the type identifier.
Definition: types.hpp:321
CUDF_HOST_DEVICE data_type type() const noexcept
Returns the element type.
bool is_valid_nocheck(size_type element_index) const noexcept
Returns whether the specified element holds a valid value (i.e., not null)
CUDF_HOST_DEVICE bool nullable() const noexcept
Indicates whether the column can contain null elements, i.e., if it has an allocated bitmask.
A mutable, non-owning view of device data as a column of elements that is trivially copyable and usab...
A mutable, non-owning view of device data as a column of elements that is trivially copyable and usab...
static constexpr CUDF_HOST_DEVICE bool has_element_accessor()
For a given T, indicates if mutable_column_device_view::element<T>() has a valid overload.
void destroy()
Destroy the mutable_column_device_view object.
mutable_column_device_view(mutable_column_view column, void *h_ptr, void *d_ptr)
Creates an instance of this class using the specified host memory pointer (h_ptr) to store child obje...
static std::size_t extent(mutable_column_view source_view)
Return the size in bytes of the amount of memory needed to hold a device view of the specified column...
thrust::counting_iterator< size_type > count_it
Counting iterator.
mutable_column_device_view child(size_type child_index) const noexcept
Returns the specified child.
mutable_column_device_view(mutable_column_device_view const &)=default
Copy constructor.
T & element(size_type element_index) const noexcept
Returns reference to element at the specified index.
iterator< T > end()
Return one past the last element after underlying data is casted to the specified type.
mutable_column_device_view & operator=(mutable_column_device_view &&)=default
Move assignment operator.
mutable_column_device_view(mutable_column_device_view &&)=default
Move constructor.
mutable_column_device_view & operator=(mutable_column_device_view const &)=default
Copy assignment operator.
static std::unique_ptr< mutable_column_device_view, std::function< void(mutable_column_device_view *)> > create(mutable_column_view source_view, rmm::cuda_stream_view stream=cudf::get_default_stream())
Factory to construct a column view that is usable in device memory.
thrust::transform_iterator< detail::mutable_value_accessor< T >, count_it > iterator
Iterator for navigating this column.
iterator< T > begin()
Return first element (accounting for offset) after underlying data is casted to the specified type.
A non-owning, mutable view of device data as a column of elements, some of which may be null as indic...
ColumnDeviceView * child_columns_to_device_array(ColumnViewIterator child_begin, ColumnViewIterator child_end, void *h_ptr, void *d_ptr)
Helper function for use by column_device_view and mutable_column_device_view constructors to build de...
Column device view class definitions.
column view class definitions
size_type null_count(bitmask_type const *bitmask, size_type start, size_type stop, rmm::cuda_stream_view stream=cudf::get_default_stream())
Given a validity bitmask, counts the number of null elements (unset bits) in the range [start,...
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
CUDF_HOST_DEVICE constexpr decltype(auto) __forceinline__ type_dispatcher(cudf::data_type dtype, Functor f, Ts &&... args)
Invokes an operator() template with the type instantiation based on the specified cudf::data_type's i...
std::conditional_t< std::is_same_v< numeric::decimal32, T >, int32_t, std::conditional_t< std::is_same_v< numeric::decimal64, T >, int64_t, std::conditional_t< std::is_same_v< numeric::decimal128, T >, __int128_t, T > >> device_storage_type_t
"Returns" the corresponding type that is stored on the device when using cudf::column
#define CUDF_EXPECTS(...)
Macro for checking (pre-)conditions that throws an exception when a condition is violated.
Definition: error.hpp:143
cuda::std::span< T, Extent > device_span
Device span is an alias of cuda::std::span.
Definition: span.hpp:320
int32_t size_type
Row index type for columns and tables.
Definition: types.hpp:84
uint32_t bitmask_type
Bitmask type stored as 32-bit unsigned integer.
Definition: types.hpp:85
size_type distance(T f, T l)
Similar to std::distance but returns cudf::size_type and performs static_cast
Definition: types.hpp:99
#define CUDF_ENABLE_IF(...)
Convenience macro for SFINAE as an unnamed template parameter.
Definition: traits.hpp:39
Class definition for cudf::list_view.
cuDF interfaces
Definition: host_udf.hpp:26
bool has_nulls(table_view const &view)
Returns True if the table has nulls in any of its columns.
APIs for spans.
Class definition for cudf::strings_column_view.
Class definition for cudf::struct_view.
Mutable value accessor of column without null bitmask.
T & operator()(cudf::size_type i)
Accessor.
mutable_value_accessor(mutable_column_device_view &_col)
Constructor.
mutable_column_device_view col
mutable column view of column in device
optional accessor of a column
cuda::std::optional< T > operator()(cudf::size_type i) const
Returns a cuda::std::optional of column[i].
column_device_view const col
column view of column in device
optional_accessor(column_device_view const &_col, Nullate with_nulls)
Constructor.
pair accessor of column with/without null bitmask
cuda::std::pair< T, bool > operator()(cudf::size_type i) const
Pair accessor.
column_device_view const col
column view of column in device
pair_accessor(column_device_view const &_col)
constructor
pair accessor of column with/without null bitmask
cuda::std::pair< rep_type, bool > operator()(cudf::size_type i) const
Pair accessor.
column_device_view const col
column view of column in device
device_storage_type_t< T > rep_type
representation type
pair_rep_accessor(column_device_view const &_col)
constructor
value accessor of column without null bitmask
column_device_view const col
column view of column in device
value_accessor(column_device_view const &_col)
constructor
T operator()(cudf::size_type i) const
Returns the value of element at index i
A strongly typed wrapper for indices in a DICTIONARY type column.
Definition: dictionary.hpp:38
Defines the mapping between cudf::type_id runtime type information and concrete C++ types.
#define CUDF_HOST_DEVICE
Indicates that the function or method is usable on host and device.
Definition: types.hpp:21