interop.hpp
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2020-2024, NVIDIA CORPORATION.
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  * http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #pragma once
18 
19 // We disable warning 611 because `arrow::TableBatchReader` only partially
20 // overrides the `ReadNext` method of `arrow::RecordBatchReader`,
21 // triggering warning 611-D from nvcc.
22 #ifdef __CUDACC__
23 #pragma nv_diag_suppress 611
24 #pragma nv_diag_suppress 2810
25 #endif
26 #include <rmm/resource_ref.hpp>
27 
28 #include <arrow/api.h>
29 #ifdef __CUDACC__
30 #pragma nv_diag_default 611
31 #pragma nv_diag_default 2810
32 #endif
33 
34 #include <cudf/column/column.hpp>
35 #include <cudf/detail/transform.hpp>
36 #include <cudf/table/table.hpp>
38 #include <cudf/types.hpp>
39 #include <cudf/utilities/span.hpp>
40 
41 #include <rmm/mr/device/per_device_resource.hpp>
42 
43 struct DLManagedTensor;
44 
45 struct ArrowDeviceArray;
46 
47 struct ArrowSchema;
48 
49 namespace cudf {
/**
 * @brief Convert a DLPack DLTensor into a cudf table.
 *
 * @param managed_tensor Pointer to the (const) DLPack managed tensor to convert
 * @param mr Device memory resource reference; defaults to the current device
 *           resource. NOTE(review): presumably used to allocate the returned
 *           table's device memory -- confirm against the implementation.
 * @return Owning pointer to the resulting cudf table
 */
73 std::unique_ptr<table> from_dlpack(
74  DLManagedTensor const* managed_tensor,
75  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
76 
/**
 * @brief Convert a cudf table into a DLPack DLTensor.
 *
 * @param input View of the cudf table to convert
 * @param mr Device memory resource reference; defaults to the current device
 *           resource. NOTE(review): presumably used for the device memory
 *           backing the returned tensor -- confirm against the implementation.
 * @return Raw pointer to a DLManagedTensor. NOTE(review): the ownership and
 *         release protocol for this pointer is not visible in this header --
 *         confirm before use.
 */
95 DLManagedTensor* to_dlpack(
96  table_view const& input,
97  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
98  // end of group
100 
114  std::string name;  ///< Name of the column.
115  std::vector<column_metadata> children_meta;  ///< Metadata of children of the column.
116 
/**
 * @brief Construct a new column metadata object.
 *
 * Copies `_name` into the `name` member; `children_meta` is left
 * default-constructed (empty).
 *
 * @param _name Name of the column
 */
122  column_metadata(std::string const& _name) : name(_name) {}
/// @brief Default constructor; `name` and `children_meta` start out empty.
123  column_metadata() = default;
124 };
125 
/**
 * @brief Create arrow::Table from cudf table input.
 *
 * @param input View of the cudf table to convert
 * @param metadata Vector of column_metadata (column name plus children
 *                 metadata); defaults to an empty vector.
 *                 NOTE(review): how entries are matched to columns is not
 *                 visible in this header -- confirm against the implementation.
 * @param stream CUDA stream view; defaults to cudf::get_default_stream()
 * @param ar_mr Arrow memory pool; defaults to arrow::default_memory_pool()
 * @return Shared pointer to the resulting arrow::Table
 */
146 std::shared_ptr<arrow::Table> to_arrow(table_view input,
147  std::vector<column_metadata> const& metadata = {},
148  rmm::cuda_stream_view stream = cudf::get_default_stream(),
149  arrow::MemoryPool* ar_mr = arrow::default_memory_pool());
150 
/**
 * @brief Overload of to_arrow taking a single cudf::scalar and returning an
 * arrow::Scalar.
 *
 * @param input The cudf scalar to convert
 * @param metadata A column_metadata object (name plus children metadata);
 *                 defaults to a default-constructed one
 * @param stream CUDA stream view; defaults to cudf::get_default_stream()
 * @param ar_mr Arrow memory pool; defaults to arrow::default_memory_pool()
 * @return Shared pointer to the resulting arrow::Scalar
 */
168 std::shared_ptr<arrow::Scalar> to_arrow(cudf::scalar const& input,
169  column_metadata const& metadata = {},
170  rmm::cuda_stream_view stream = cudf::get_default_stream(),
171  arrow::MemoryPool* ar_mr = arrow::default_memory_pool());
172 
/// @brief typedef for a unique_ptr to an ArrowSchema with custom deleter
/// (the deleter is a plain function pointer taking `ArrowSchema*`).
177 using unique_schema_t = std::unique_ptr<ArrowSchema, void (*)(ArrowSchema*)>;
178 
/// @brief typedef for a unique_ptr to an ArrowDeviceArray with a custom deleter
/// (the deleter is a plain function pointer taking `ArrowDeviceArray*`).
183 using unique_device_array_t = std::unique_ptr<ArrowDeviceArray, void (*)(ArrowDeviceArray*)>;
184 
202 
228  cudf::table&& table,
229  rmm::cuda_stream_view stream = cudf::get_default_stream(),
230  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
231 
257  cudf::column&& col,
258  rmm::cuda_stream_view stream = cudf::get_default_stream(),
259  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
260 
289  cudf::table_view const& table,
290  rmm::cuda_stream_view stream = cudf::get_default_stream(),
291  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
292 
321  cudf::column_view const& col,
322  rmm::cuda_stream_view stream = cudf::get_default_stream(),
323  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
324 
/**
 * @brief Create cudf::table from given arrow Table input.
 *
 * @param input The arrow::Table to convert
 * @param stream CUDA stream view; defaults to cudf::get_default_stream()
 * @param mr Device memory resource reference; defaults to the current device
 *           resource. NOTE(review): presumably used to allocate the returned
 *           table's device memory -- confirm against the implementation.
 * @return Owning pointer to the resulting cudf table
 */
333 std::unique_ptr<table> from_arrow(
334  arrow::Table const& input,
335  rmm::cuda_stream_view stream = cudf::get_default_stream(),
336  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
337 
/**
 * @brief Overload of from_arrow taking a single arrow::Scalar and returning a
 * cudf::scalar.
 *
 * @param input The arrow::Scalar to convert
 * @param stream CUDA stream view; defaults to cudf::get_default_stream()
 * @param mr Device memory resource reference; defaults to the current device
 *           resource. NOTE(review): presumably used to allocate the returned
 *           scalar's device memory -- confirm against the implementation.
 * @return Owning pointer to the resulting cudf scalar
 */
346 std::unique_ptr<cudf::scalar> from_arrow(
347  arrow::Scalar const& input,
348  rmm::cuda_stream_view stream = cudf::get_default_stream(),
349  rmm::device_async_resource_ref mr = rmm::mr::get_current_device_resource());
350 
/// @brief typedef for a vector of owning columns, used for conversion from
/// ArrowDeviceArray
355 using owned_columns_t = std::vector<std::unique_ptr<cudf::column>>;
356 
365 template <typename ViewType>
/**
 * @brief Construct a new custom view deleter object.
 *
 * @param owned Vector of owning columns; moved into the `owned_mem_` member
 */
372  explicit custom_view_deleter(owned_columns_t&& owned) : owned_mem_{std::move(owned)} {}
373 
/**
 * @brief Call operator used as the unique_ptr deleter: releases the view
 * object with `delete`.
 *
 * @param ptr Pointer to the view object to delete
 */
379  void operator()(ViewType* ptr) const { delete ptr; }
380 
382 };
383 
389  std::unique_ptr<cudf::table_view, custom_view_deleter<cudf::table_view>>;
390 
427  ArrowSchema const* schema,
428  ArrowDeviceArray const* input,
429  rmm::cuda_stream_view stream = cudf::get_default_stream(),
430  rmm::mr::device_memory_resource* mr = rmm::mr::get_current_device_resource());
431 
437  std::unique_ptr<cudf::column_view, custom_view_deleter<cudf::column_view>>;
438 
470  ArrowSchema const* schema,
471  ArrowDeviceArray const* input,
472  rmm::cuda_stream_view stream = cudf::get_default_stream(),
473  rmm::mr::device_memory_resource* mr = rmm::mr::get_current_device_resource());
474  // end of group
476 } // namespace cudf
A non-owning, immutable view of device data as a column of elements, some of which may be null as ind...
A container of nullable device data as a column of elements.
Definition: column.hpp:48
An owning class to represent a singular value.
Definition: scalar.hpp:49
A set of cudf::column_view's of the same size.
Definition: table_view.hpp:187
A set of cudf::column's of the same size.
Definition: table.hpp:41
Class definition for cudf::column.
rmm::cuda_stream_view const get_default_stream()
Get the current default stream.
std::unique_ptr< cudf::table_view, custom_view_deleter< cudf::table_view > > unique_table_view_t
typedef for a unique_ptr to a cudf::table_view with custom deleter
Definition: interop.hpp:389
std::vector< std::unique_ptr< cudf::column > > owned_columns_t
typedef for a vector of owning columns, used for conversion from ArrowDeviceArray
Definition: interop.hpp:355
unique_table_view_t from_arrow_device(ArrowSchema const *schema, ArrowDeviceArray const *input, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::mr::device_memory_resource *mr=rmm::mr::get_current_device_resource())
Create cudf::table_view from given ArrowDeviceArray and ArrowSchema
unique_schema_t to_arrow_schema(cudf::table_view const &input, cudf::host_span< column_metadata const > metadata)
Create ArrowSchema from cudf table and metadata.
std::unique_ptr< cudf::column_view, custom_view_deleter< cudf::column_view > > unique_column_view_t
typedef for a unique_ptr to a cudf::column_view with custom deleter
Definition: interop.hpp:437
std::unique_ptr< table > from_arrow(arrow::Table const &input, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Create cudf::table from given arrow Table input.
std::unique_ptr< ArrowSchema, void(*)(ArrowSchema *)> unique_schema_t
typedef for a unique_ptr to an ArrowSchema with custom deleter
Definition: interop.hpp:177
unique_column_view_t from_arrow_device_column(ArrowSchema const *schema, ArrowDeviceArray const *input, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::mr::device_memory_resource *mr=rmm::mr::get_current_device_resource())
Create cudf::column_view from given ArrowDeviceArray and ArrowSchema
std::unique_ptr< ArrowDeviceArray, void(*)(ArrowDeviceArray *)> unique_device_array_t
typedef for a unique_ptr to an ArrowDeviceArray with a custom deleter
Definition: interop.hpp:183
std::shared_ptr< arrow::Table > to_arrow(table_view input, std::vector< column_metadata > const &metadata={}, rmm::cuda_stream_view stream=cudf::get_default_stream(), arrow::MemoryPool *ar_mr=arrow::default_memory_pool())
Create arrow::Table from cudf table input
unique_device_array_t to_arrow_device(cudf::table &&table, rmm::cuda_stream_view stream=cudf::get_default_stream(), rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Create ArrowDeviceArray from cudf table and metadata.
DLManagedTensor * to_dlpack(table_view const &input, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Convert a cudf table into a DLPack DLTensor.
std::unique_ptr< table > from_dlpack(DLManagedTensor const *managed_tensor, rmm::device_async_resource_ref mr=rmm::mr::get_current_device_resource())
Convert a DLPack DLTensor into a cudf table.
cuDF interfaces
Definition: aggregation.hpp:34
APIs for spans.
Detailed metadata information for arrow array.
Definition: interop.hpp:113
std::vector< column_metadata > children_meta
Metadata of children of the column.
Definition: interop.hpp:115
std::string name
Name of the column.
Definition: interop.hpp:114
column_metadata(std::string const &_name)
Construct a new column metadata object.
Definition: interop.hpp:122
functor for a custom deleter to a unique_ptr of table_view
Definition: interop.hpp:366
void operator()(ViewType *ptr) const
operator to delete the unique_ptr
Definition: interop.hpp:379
owned_columns_t owned_mem_
Owned columns that must be deleted.
Definition: interop.hpp:381
custom_view_deleter(owned_columns_t &&owned)
Construct a new custom view deleter object.
Definition: interop.hpp:372
C++20 std::span with reduced feature set.
Definition: span.hpp:224
Class definition for cudf::table.
Class definitions for (mutable)_table_view
Type declarations for libcudf.