19 #include <cudf_test/column_utilities.hpp>
20 #include <cudf_test/default_stream.hpp>
25 #include <cudf/detail/concatenate.hpp>
26 #include <cudf/detail/iterator.cuh>
27 #include <cudf/detail/utilities/vector_factories.hpp>
35 #include <cudf/utilities/export.hpp>
42 #include <thrust/copy.h>
43 #include <thrust/functional.h>
44 #include <thrust/host_vector.h>
45 #include <thrust/iterator/constant_iterator.h>
46 #include <thrust/iterator/counting_iterator.h>
47 #include <thrust/iterator/transform_iterator.h>
54 namespace CUDF_EXPORT
cudf {
90 std::unique_ptr<cudf::column>
release() {
return std::move(wrapped); }
93 std::unique_ptr<cudf::column> wrapped{};
99 template <
typename From,
typename To>
109 template <
typename FromT = From,
111 std::enable_if_t<std::is_same_v<FromT, ToT>,
void>* =
nullptr>
126 typename FromT = From,
129 std::is_constructible_v<ToT, FromT>),
131 constexpr ToT
operator()(FromT element)
const
133 return static_cast<ToT
>(element);
145 typename FromT = From,
147 std::enable_if_t<std::is_integral_v<FromT> && cudf::is_timestamp<ToT>(),
void>* =
nullptr>
150 return ToT{
typename ToT::duration{element}};
164 template <
typename ElementTo,
165 typename ElementFrom,
166 typename InputIterator,
167 std::enable_if_t<not cudf::is_fixed_point<ElementTo>()>* =
nullptr>
170 static_assert(cudf::is_fixed_width<ElementTo>(),
"Unexpected non-fixed width type.");
171 auto transformer = fixed_width_type_converter<ElementFrom, ElementTo>{};
172 auto transform_begin = thrust::make_transform_iterator(begin, transformer);
174 auto const elements = thrust::host_vector<ElementTo>(transform_begin, transform_begin + size);
193 template <
typename ElementTo,
194 typename ElementFrom,
195 typename InputIterator,
196 std::enable_if_t<not cudf::is_fixed_point<ElementFrom>() and
198 rmm::device_buffer make_elements(InputIterator begin, InputIterator end)
200 using RepType =
typename ElementTo::rep;
201 auto transformer = fixed_width_type_converter<ElementFrom, RepType>{};
202 auto transform_begin = thrust::make_transform_iterator(begin, transformer);
204 auto const elements = thrust::host_vector<RepType>(transform_begin, transform_begin + size);
219 template <
typename ElementTo,
220 typename ElementFrom,
221 typename InputIterator,
222 std::enable_if_t<cudf::is_fixed_point<ElementFrom>() and
224 rmm::device_buffer make_elements(InputIterator begin, InputIterator end)
227 using RepType =
typename ElementTo::rep;
229 CUDF_EXPECTS(std::all_of(begin, end, [](ElementFrom v) {
return v.scale() == 0; }),
230 "Only zero-scale fixed-point values are supported");
232 auto to_rep = [](ElementTo fp) {
return fp.value(); };
233 auto transformer_begin = thrust::make_transform_iterator(begin, to_rep);
235 auto const elements = thrust::host_vector<RepType>(transformer_begin, transformer_begin + size);
254 template <
typename Val
idityIterator>
255 std::pair<std::vector<bitmask_type>,
cudf::size_type> make_null_mask_vector(ValidityIterator begin,
256 ValidityIterator end)
261 auto null_mask = std::vector<bitmask_type>(num_words, 0);
263 for (
auto i = 0; i < size; ++i) {
287 template <
typename Val
idityIterator>
288 std::pair<rmm::device_buffer, cudf::size_type> make_null_mask(ValidityIterator begin,
289 ValidityIterator end)
291 auto [null_mask,
null_count] = make_null_mask_vector(begin, end);
312 template <
typename StringsIterator,
typename Val
idityIterator>
313 auto make_chars_and_offsets(StringsIterator begin, StringsIterator end, ValidityIterator v)
315 std::vector<char> chars{};
316 std::vector<cudf::size_type> offsets(1, 0);
317 for (
auto str = begin; str < end; ++str) {
318 std::string tmp = (*v++) ? std::string(*str) : std::string{};
319 chars.insert(chars.end(), std::cbegin(tmp), std::cend(tmp));
320 auto const last_offset =
static_cast<std::size_t
>(offsets.back());
321 auto const next_offset = last_offset + tmp.length();
323 next_offset <
static_cast<std::size_t
>(std::numeric_limits<cudf::size_type>::max()),
324 "Cannot use strings_column_wrapper to build a large strings column");
327 return std::pair(std::move(chars), std::move(offsets));
339 template <
typename ElementTo,
typename SourceElementT = ElementTo>
347 std::vector<ElementTo> empty;
351 detail::make_elements<ElementTo, SourceElementT>(empty.begin(), empty.end()),
374 template <
typename InputIterator>
380 detail::make_elements<ElementTo, SourceElementT>(begin, end),
408 template <
typename InputIterator,
typename Val
idityIterator>
413 auto [null_mask,
null_count] = detail::make_null_mask(v, v + size);
416 detail::make_elements<ElementTo, SourceElementT>(begin, end),
417 std::move(null_mask),
433 template <
typename ElementFrom>
456 template <
typename ElementFrom>
458 std::initializer_list<bool> validity)
480 template <
typename Val
idityIterator,
typename ElementFrom>
504 template <
typename InputIterator>
507 std::initializer_list<bool>
const& validity)
529 template <
typename ElementFrom>
533 thrust::make_transform_iterator(elements.begin(), [](
auto const& e) { return e.first; });
534 auto end = begin + elements.size();
536 thrust::make_transform_iterator(elements.begin(), [](
auto const& e) { return e.second; });
546 template <
typename Rep>
565 template <
typename FixedPo
intRepIterator>
567 FixedPointRepIterator end,
571 CUDF_EXPECTS(numeric::is_supported_representation_type<Rep>(),
"not valid representation type");
574 auto const elements = thrust::host_vector<Rep>(begin, end);
575 auto const id = type_to_id<numeric::fixed_point<Rep, numeric::Radix::BASE_10>>();
630 template <
typename FixedPo
intRepIterator,
typename Val
idityIterator>
632 FixedPointRepIterator end,
637 CUDF_EXPECTS(numeric::is_supported_representation_type<Rep>(),
"not valid representation type");
640 auto const elements = thrust::host_vector<Rep>(begin, end);
641 auto const id = type_to_id<numeric::fixed_point<Rep, numeric::Radix::BASE_10>>();
643 auto [null_mask,
null_count] = detail::make_null_mask(v, v + size);
648 std::move(null_mask),
670 std::initializer_list<bool> validity,
673 std::cbegin(elements), std::cend(elements), std::cbegin(validity), scale)
695 template <
typename Val
idityIterator>
723 template <
typename FixedPo
intRepIterator>
725 FixedPointRepIterator end,
726 std::initializer_list<bool>
const& validity,
763 template <
typename StringsIterator>
767 if (num_strings == 0) {
771 auto all_valid = thrust::make_constant_iterator(
true);
772 auto [chars, offsets] = detail::make_chars_and_offsets(begin, end, all_valid);
773 auto d_chars = cudf::detail::make_device_uvector_async(
775 auto d_offsets = std::make_unique<cudf::column>(
776 cudf::detail::make_device_uvector_sync(
812 template <
typename StringsIterator,
typename Val
idityIterator>
817 if (num_strings == 0) {
821 auto [chars, offsets] = detail::make_chars_and_offsets(begin, end, v);
822 auto [null_mask,
null_count] = detail::make_null_mask_vector(v, v + num_strings);
823 auto d_chars = cudf::detail::make_device_uvector_async(
825 auto d_offsets = std::make_unique<cudf::column>(
826 cudf::detail::make_device_uvector_async(
830 auto d_bitmask = cudf::detail::make_device_uvector_sync(
833 num_strings, std::move(d_offsets), d_chars.release(),
null_count, d_bitmask.release());
871 template <
typename Val
idityIterator>
893 std::initializer_list<bool> validity)
921 thrust::make_transform_iterator(strings.begin(), [](
auto const& s) { return s.first; });
922 auto end = begin + strings.size();
924 thrust::make_transform_iterator(strings.begin(), [](
auto const& s) { return s.second; });
937 template <
typename KeyElementTo,
typename SourceElementT = KeyElementTo>
972 template <
typename InputIterator>
1006 template <
typename InputIterator,
typename Val
idityIterator>
1029 template <
typename ElementFrom>
1053 template <
typename ElementFrom>
1055 std::initializer_list<bool> validity)
1078 template <
typename Val
idityIterator,
typename ElementFrom>
1104 template <
typename InputIterator>
1107 std::initializer_list<bool>
const& validity)
1172 template <
typename StringsIterator>
1208 template <
typename StringsIterator,
typename Val
idityIterator>
1252 template <
typename Val
idityIterator>
1274 std::initializer_list<bool> validity)
1315 template <
typename T,
typename SourceElementT = T>
1336 template <typename Element = T, std::enable_if_t<cudf::is_fixed_width<Element>()>* =
nullptr>
1339 build_from_non_nested(
1358 template <
typename Element = T,
1359 typename InputIterator,
1360 std::enable_if_t<cudf::is_fixed_width<Element>()>* =
nullptr>
1363 build_from_non_nested(
1382 template <
typename Element = T,
1383 typename ValidityIterator,
1384 std::enable_if_t<cudf::is_fixed_width<Element>()>* =
nullptr>
1388 build_from_non_nested(
1409 template <
typename Element = T,
1410 typename InputIterator,
1411 typename ValidityIterator,
1412 std::enable_if_t<cudf::is_fixed_width<Element>()>* =
nullptr>
1416 build_from_non_nested(
1433 template <
typename Element = T,
1434 std::enable_if_t<std::is_same_v<Element, cudf::string_view>>* =
nullptr>
1437 build_from_non_nested(
1456 template <
typename Element = T,
1457 typename ValidityIterator,
1458 std::enable_if_t<std::is_same_v<Element, cudf::string_view>>* =
nullptr>
1462 build_from_non_nested(
1490 std::vector<bool> valids;
1491 build_from_nested(elements, valids);
1535 template <
typename Val
idityIterator>
1540 std::vector<bool> validity;
1544 std::back_inserter(validity),
1546 build_from_nested(elements, validity);
1578 std::unique_ptr<cudf::column>&& offsets,
1579 std::unique_ptr<cudf::column>&& values,
1588 std::move(null_mask),
1608 void build_from_nested(std::initializer_list<lists_column_wrapper<T, SourceElementT>> elements,
1609 std::vector<bool>
const& v)
1611 auto valids = cudf::detail::make_counting_transform_iterator(
1612 0, [&v](
auto i) {
return v.empty() ?
true : v[i]; });
1615 auto const hierarchy_and_depth =
1616 std::accumulate(elements.begin(),
1618 std::pair<column_view, int32_t>{{}, -1},
1619 [](
auto acc, lists_column_wrapper
const& lcw) {
1620 return lcw.depth > acc.second ? std::pair(lcw.get_view(), lcw.depth) : acc;
1622 column_view expected_hierarchy = hierarchy_and_depth.first;
1623 int32_t
const expected_depth = hierarchy_and_depth.second;
1626 auto [cols, stubs] = preprocess_columns(elements, expected_hierarchy, expected_depth);
1630 std::vector<size_type> offsetv;
1634 std::back_inserter(offsetv),
1637 size_type ret = count;
1638 if (valid) { count += col.size(); }
1642 offsetv.push_back(count);
1647 std::vector<column_view> children;
1649 std::cbegin(cols), std::cend(cols), valids, std::back_inserter(children), thrust::identity{});
1657 depth = expected_depth + 1;
1661 return cudf::test::detail::make_null_mask(v.begin(), v.end());
1669 std::move(null_mask),
1680 void build_from_non_nested(std::unique_ptr<column> c)
1685 std::vector<size_type> offsetv;
1686 if (c->size() > 0) {
1687 offsetv.push_back(0);
1688 offsetv.push_back(c->size());
1697 size_type num_elements = offsets->size() == 0 ? 0 : offsets->size() - 1;
1740 std::unique_ptr<column> normalize_column(column_view
const& col,
1741 column_view
const& expected_hierarchy)
1744 if (col.type().id() != type_id::LIST) {
1745 CUDF_EXPECTS(col.is_empty(),
"Encountered mismatched column!");
1747 auto remainder =
empty_like(expected_hierarchy);
1751 lists_column_view lcv(col);
1754 std::make_unique<column>(lcv.offsets()),
1755 normalize_column(lists_column_view(col).child(),
1756 lists_column_view(expected_hierarchy).child()),
1763 std::pair<std::vector<column_view>, std::vector<std::unique_ptr<column>>> preprocess_columns(
1764 std::initializer_list<lists_column_wrapper<T, SourceElementT>>
const& elements,
1765 column_view& expected_hierarchy,
1768 std::vector<std::unique_ptr<column>> stubs;
1769 std::vector<column_view> cols;
1776 std::back_inserter(cols),
1777 [&](lists_column_wrapper
const& l) -> column_view {
1781 if (l.depth < expected_depth) {
1795 CUDF_EXPECTS(l.wrapped->size() == 0,
"Mismatch in column types!");
1796 stubs.push_back(empty_like(expected_hierarchy));
1798 stubs.push_back(normalize_column(l.get_view(), expected_hierarchy));
1800 return *(stubs.back());
1803 return l.get_view();
1806 return {std::move(cols), std::move(stubs)};
1809 [[nodiscard]] column_view get_view()
const
1811 return root ? lists_column_view(*wrapped).child() : *wrapped;
1851 std::vector<bool>
const& validity = {})
1853 init(std::move(child_columns), validity);
1877 std::initializer_list<std::reference_wrapper<detail::column_wrapper>> child_column_wrappers,
1878 std::vector<bool>
const& validity = {})
1880 std::vector<std::unique_ptr<cudf::column>> child_columns;
1881 child_columns.reserve(child_column_wrappers.size());
1883 child_column_wrappers.end(),
1884 std::back_inserter(child_columns),
1885 [&](
auto const& column_wrapper) {
1886 return std::make_unique<cudf::column>(column_wrapper.get(),
1887 cudf::test::get_default_stream());
1889 init(std::move(child_columns), validity);
1912 template <
typename V>
1914 std::initializer_list<std::reference_wrapper<detail::column_wrapper>> child_column_wrappers,
1917 std::vector<std::unique_ptr<cudf::column>> child_columns;
1918 child_columns.reserve(child_column_wrappers.size());
1920 child_column_wrappers.end(),
1921 std::back_inserter(child_columns),
1922 [&](
auto const& column_wrapper) {
1923 return std::make_unique<cudf::column>(column_wrapper.get(),
1924 cudf::test::get_default_stream());
1926 init(std::move(child_columns), validity_iter);
1930 void init(std::vector<std::unique_ptr<cudf::column>>&& child_columns,
1931 std::vector<bool>
const& validity)
1933 size_type num_rows = child_columns.empty() ? 0 : child_columns[0]->size();
1936 child_columns.end(),
1937 [&](
auto const& p_column) { return p_column->size() == num_rows; }),
1938 "All struct member columns must have the same row count.");
1941 "Validity buffer must have as many elements as rows in the struct column.");
1945 return cudf::test::detail::make_null_mask(validity.begin(), validity.end());
1949 std::move(child_columns),
1951 std::move(null_mask),
1955 template <
typename V>
1956 void init(std::vector<std::unique_ptr<cudf::column>>&& child_columns, V validity_iterator)
1958 size_type const num_rows = child_columns.empty() ? 0 : child_columns[0]->size();
1961 child_columns.end(),
1962 [&](
auto const& p_column) { return p_column->size() == num_rows; }),
1963 "All struct member columns must have the same row count.");
1965 std::vector<bool> validity(num_rows);
1966 std::copy(validity_iterator, validity_iterator + num_rows, validity.begin());
1968 init(std::move(child_columns), validity);
Utilities for bit and bitmask operations.
A non-owning, immutable view of device data as a column of elements, some of which may be null as ind...
A container of nullable device data as a column of elements.
Indicator for the logical data type of an element in a column.
A wrapper class for operations on a dictionary column.
column_view indices() const noexcept
Returns the column of indices.
column_view keys() const noexcept
Returns the column of keys.
Given a column-view of lists type, an instance of this class provides a wrapper on this compound colu...
A non-owning, mutable view of device data as a column of elements, some of which may be null as indic...
Base class for a wrapper around a cudf::column.
std::unique_ptr< cudf::column > release()
Releases internal unique_ptr to wrapped column.
dictionary_column_wrapper(StringsIterator begin, StringsIterator end, ValidityIterator v)
Construct a nullable dictionary column of strings from the range [begin,end) using the range [v,...
dictionary_column_wrapper(std::initializer_list< std::string > strings, std::initializer_list< bool > validity)
Construct a nullable dictionary column of strings from a list of strings and a list of booleans to in...
column_view indices() const
Access indices column view.
dictionary_column_wrapper(std::initializer_list< std::string > strings)
Construct a non-nullable dictionary column of strings from a list of strings.
dictionary_column_wrapper(StringsIterator begin, StringsIterator end)
Construct a non-nullable dictionary column of strings from the range [begin,end).
dictionary_column_wrapper(std::initializer_list< std::string > strings, ValidityIterator v)
Construct a nullable dictionary column of strings from a list of strings and the range [v,...
column_view keys() const
Access keys column view.
dictionary_column_wrapper()
Default constructor initializes an empty dictionary column of strings.
column_wrapper derived class for wrapping dictionary columns.
dictionary_column_wrapper(std::initializer_list< ElementFrom > elements)
Construct a non-nullable dictionary column of fixed-width elements from an initializer list.
dictionary_column_wrapper(std::initializer_list< ElementFrom > elements, std::initializer_list< bool > validity)
Construct a nullable dictionary column from a list of fixed-width elements using another list to indi...
dictionary_column_wrapper(std::initializer_list< ElementFrom > element_list, ValidityIterator v)
Construct a nullable dictionary column from a list of fixed-width elements and the range [v,...
dictionary_column_wrapper()
Default constructor initializes an empty column with dictionary type.
dictionary_column_wrapper(InputIterator begin, InputIterator end)
Construct a non-nullable dictionary column of the fixed-width elements in the range [begin,...
dictionary_column_wrapper(InputIterator begin, InputIterator end, ValidityIterator v)
Construct a nullable dictionary column of the fixed-width elements in the range [begin,...
dictionary_column_wrapper(InputIterator begin, InputIterator end, std::initializer_list< bool > const &validity)
Construct a nullable dictionary column of the fixed-width elements in the range [begin,...
A wrapper for a column of fixed-width elements.
fixed_point_column_wrapper(FixedPointRepIterator begin, FixedPointRepIterator end, std::initializer_list< bool > const &validity, numeric::scale_type scale)
Construct a nullable column of the decimal elements in the range [begin,end) using a validity initial...
fixed_point_column_wrapper(std::initializer_list< Rep > elements, std::initializer_list< bool > validity, numeric::scale_type scale)
Construct a nullable column from an initializer list of decimal elements using another list to indica...
fixed_point_column_wrapper(FixedPointRepIterator begin, FixedPointRepIterator end, numeric::scale_type scale)
Construct a non-nullable column of the decimal elements in the range [begin,end).
fixed_point_column_wrapper(std::initializer_list< Rep > element_list, ValidityIterator v, numeric::scale_type scale)
Construct a nullable column from an initializer list of decimal elements and the range [v,...
fixed_point_column_wrapper(std::initializer_list< Rep > values, numeric::scale_type scale)
Construct a non-nullable column of decimal elements from an initializer list.
fixed_point_column_wrapper(FixedPointRepIterator begin, FixedPointRepIterator end, ValidityIterator v, numeric::scale_type scale)
Construct a nullable column of the fixed-point elements from a range.
column_wrapper derived class for wrapping columns of fixed-width elements.
fixed_width_column_wrapper(InputIterator begin, InputIterator end, std::initializer_list< bool > const &validity)
Construct a nullable column of the fixed-width elements in the range [begin,end) using a validity ini...
fixed_width_column_wrapper(std::initializer_list< std::pair< ElementFrom, bool >> elements)
Construct a nullable column from a list of pairs of fixed-width elements and validity booleans of eac...
fixed_width_column_wrapper(std::initializer_list< ElementFrom > elements, std::initializer_list< bool > validity)
Construct a nullable column from a list of fixed-width elements using another list to indicate the va...
fixed_width_column_wrapper(std::initializer_list< ElementFrom > elements)
Construct a non-nullable column of fixed-width elements from an initializer list.
fixed_width_column_wrapper(InputIterator begin, InputIterator end, ValidityIterator v)
Construct a nullable column of the fixed-width elements in the range [begin,end) using the range [v,...
fixed_width_column_wrapper(std::initializer_list< ElementFrom > element_list, ValidityIterator v)
Construct a nullable column from a list of fixed-width elements and the range [v, v + element_list....
fixed_width_column_wrapper(InputIterator begin, InputIterator end)
Construct a non-nullable column of the fixed-width elements in the range [begin,end).
fixed_width_column_wrapper()
Default constructor initializes an empty column with proper dtype.
column_wrapper derived class for wrapping columns of lists.
lists_column_wrapper(InputIterator begin, InputIterator end)
Construct a lists column containing a single list of fixed-width type from an iterator range.
lists_column_wrapper(std::initializer_list< lists_column_wrapper< T, SourceElementT >> elements, ValidityIterator v)
Construct a lists column of nested lists from an initializer list of values and a validity iterator.
static lists_column_wrapper< T > make_one_empty_row_column(bool valid=true)
Construct a list column containing a single empty, optionally null row.
lists_column_wrapper(InputIterator begin, InputIterator end, ValidityIterator v)
Construct a lists column containing a single list of fixed-width type from an iterator range and a va...
lists_column_wrapper()
Construct am empty lists column.
lists_column_wrapper(std::initializer_list< lists_column_wrapper< T, SourceElementT >> elements)
Construct a lists column of nested lists from an initializer list of values.
lists_column_wrapper(std::initializer_list< SourceElementT > elements)
Construct a lists column containing a single list of fixed-width type from an initializer list of val...
lists_column_wrapper(std::initializer_list< std::string > elements, ValidityIterator v)
Construct a lists column containing a single list of strings from an initializer list of values and a...
lists_column_wrapper(std::initializer_list< std::string > elements)
Construct a lists column containing a single list of strings from an initializer list of values.
lists_column_wrapper(std::initializer_list< SourceElementT > elements, ValidityIterator v)
Construct a lists column containing a single list of fixed-width type from an initializer list of val...
column_wrapper derived class for wrapping columns of strings.
strings_column_wrapper(std::initializer_list< std::pair< std::string, bool >> strings)
Construct a nullable column from a list of pairs of strings and validity booleans of each string.
strings_column_wrapper()
Default constructor initializes an empty column of strings.
strings_column_wrapper(std::initializer_list< std::string > strings)
Construct a non-nullable column of strings from a list of strings.
strings_column_wrapper(std::initializer_list< std::string > strings, std::initializer_list< bool > validity)
Construct a nullable column of strings from a list of strings and a list of booleans to indicate the ...
strings_column_wrapper(std::initializer_list< std::string > strings, ValidityIterator v)
Construct a nullable column of strings from a list of strings and the range [v, v + strings....
strings_column_wrapper(StringsIterator begin, StringsIterator end)
Construct a non-nullable column of strings from the range [begin,end).
strings_column_wrapper(StringsIterator begin, StringsIterator end, ValidityIterator v)
Construct a nullable column of strings from the range [begin,end) using the range [v,...
column_wrapper derived class for wrapping columns of structs.
structs_column_wrapper(std::initializer_list< std::reference_wrapper< detail::column_wrapper >> child_column_wrappers, V validity_iter)
Constructs a struct column from the list of column wrappers for child columns.
structs_column_wrapper(std::initializer_list< std::reference_wrapper< detail::column_wrapper >> child_column_wrappers, std::vector< bool > const &validity={})
Constructs a struct column from the list of column wrappers for child columns.
structs_column_wrapper(std::vector< std::unique_ptr< cudf::column >> &&child_columns, std::vector< bool > const &validity={})
Constructs a struct column from the specified list of pre-constructed child columns.
void const * data() const noexcept
Class definition for cudf::column.
Column APIs for gather, scatter, split, slice, etc.
Dictionary column encode and decode APIs.
Class definition for fixed point data type.
std::unique_ptr< column > empty_like(column_view const &input)
Initializes and returns an empty column of the same type as the input.
std::unique_ptr< column > make_strings_column(cudf::device_span< thrust::pair< char const *, size_type > const > strings, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Construct a STRING type column given a device span of pointer/size pairs.
std::unique_ptr< cudf::column > make_structs_column(size_type num_rows, std::vector< std::unique_ptr< column >> &&child_columns, size_type null_count, rmm::device_buffer &&null_mask, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Construct a STRUCT column using specified child columns as members.
std::unique_ptr< column > make_empty_column(data_type type)
Creates an empty column of the specified type.
std::unique_ptr< cudf::column > make_lists_column(size_type num_rows, std::unique_ptr< column > offsets_column, std::unique_ptr< column > child_column, size_type null_count, rmm::device_buffer &&null_mask, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Construct a LIST type column given offsets column, child column, null mask and null count.
cudf::size_type null_count(bitmask_type const *bitmask, size_type start, size_type stop, rmm::cuda_stream_view stream=cudf::get_default_stream())
Given a validity bitmask, counts the number of null elements (unset bits) in the range [start,...
std::size_t bitmask_allocation_size_bytes(size_type number_of_bits, std::size_t padding_boundary=64)
Computes the required bytes necessary to represent the specified number of bits with a given padding ...
rmm::device_buffer copy_bitmask(bitmask_type const *mask, size_type begin_bit, size_type end_bit, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Creates a device_buffer from a slice of bitmask defined by a range of indices [begin_bit,...
rmm::device_buffer create_null_mask(size_type size, mask_state state, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Creates a device_buffer for use as a null value indicator bitmask of a column.
std::unique_ptr< column > concatenate(host_span< column_view const > columns_to_concat, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Concatenates multiple columns into a single column.
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
std::unique_ptr< column > encode(column_view const &column, data_type indices_type=data_type{type_id::UINT32}, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Construct a dictionary column by dictionary encoding an existing column.
scale_type
The scale type for fixed_point.
rmm::device_async_resource_ref get_current_device_resource_ref()
Get the current device memory resource reference.
device_async_resource_ref get_current_device_resource_ref()
std::unique_ptr< column > is_fixed_point(strings_column_view const &input, data_type decimal_type=data_type{type_id::DECIMAL64}, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=cudf::get_current_device_resource_ref())
Returns a boolean column identifying strings in which all characters are valid for conversion to fixe...
CUDF_HOST_DEVICE void set_bit_unsafe(bitmask_type *bitmask, size_type bit_index)
Sets the specified bit to 1
#define CUDF_EXPECTS(...)
Macro for checking (pre-)conditions that throws an exception when a condition is violated.
int32_t size_type
Row index type for columns and tables.
uint32_t bitmask_type
Bitmask type stored as 32-bit unsigned integer.
size_type distance(T f, T l)
Similar to std::distance but returns cudf::size_type and performs static_cast
constexpr bool is_nested()
Indicates whether T is a nested type.
@ ALL_NULL
Null mask allocated, initialized to all elements NULL.
@ DICTIONARY32
Dictionary type using int32 indices.
Class definition for cudf::lists_column_view.
fixed_point and supporting types
APIs for managing validity bitmasks.
Convert between source and target types when they differ and where possible.
constexpr ToT operator()(FromT element) const
No conversion necessary: Same type, simply copy element to output.
Defines the mapping between cudf::type_id runtime type information and concrete C++ types.
Type declarations for libcudf.