26 #include <cudf/utilities/export.hpp>
28 #include <string_view>
31 namespace CUDF_EXPORT
cudf {
63 std::vector<parquet_column_schema> children)
64 : _name{name}, _type{type}, _children{std::move(children)}
73 [[nodiscard]]
auto name()
const {
return _name; }
80 [[nodiscard]]
auto type()
const {
return _type; }
87 [[nodiscard]]
auto const&
children() const& {
return _children; }
93 [[nodiscard]]
auto children() && {
return std::move(_children); }
102 [[nodiscard]]
auto const&
child(
int idx)
const& {
return children().at(idx); }
108 [[nodiscard]]
auto child(
int idx) && {
return std::move(children().at(idx)); }
121 std::vector<parquet_column_schema> _children;
148 [[nodiscard]]
auto const&
root() const& {
return _root; }
154 [[nodiscard]]
auto root() && {
return std::move(_root); }
194 std::vector<size_type> num_rowgroups_per_file,
196 std::vector<row_group_metadata> rg_metadata,
198 : _schema{std::move(schema)},
200 _num_rowgroups{num_rowgroups},
201 _num_rowgroups_per_file{std::move(num_rowgroups_per_file)},
202 _file_metadata{std::move(file_metadata)},
203 _rowgroup_metadata{std::move(rg_metadata)},
213 [[nodiscard]]
auto const&
schema()
const {
return _schema; }
222 [[nodiscard]]
auto num_rows()
const {
return _num_rows; }
243 [[nodiscard]]
auto const&
metadata()
const {
return _file_metadata; }
265 std::vector<size_type> _num_rowgroups_per_file;
266 key_value_metadata _file_metadata;
267 std::vector<row_group_metadata> _rowgroup_metadata;
268 column_chunk_metadata _column_chunk_metadata;
parquet_metadata read_parquet_metadata(source_info const &src_info)
Reads metadata of parquet dataset.
Type
Basic data types in Parquet, determines how data is physically stored.
int32_t size_type
Row index type for columns and tables.
cuDF-IO API type definitions
Parquet footer schema structs.
Schema of a parquet column, including the nested columns.
auto const & child(int idx) const &
Returns schema of the child with the given index.
auto name() const
Returns parquet column name; can be empty.
auto const & children() const &
Returns schemas of all child columns.
auto type() const
Returns parquet physical type of the column.
auto children() &&
Returns schemas of all child columns.
auto num_children() const
Returns the number of child columns.
parquet_column_schema()=default
Default constructor.
parquet_column_schema(std::string_view name, Type type, std::vector< parquet_column_schema > children)
Constructs a column schema from a name, a physical type, and the schemas of its child columns.
auto child(int idx) &&
Returns schema of the child with the given index.
Schema of a parquet file.
parquet_schema()=default
Default constructor.
auto root() &&
Returns the schema of the struct column that contains all columns as fields.
auto const & root() const &
Returns the schema of the struct column that contains all columns as fields.
parquet_schema(parquet_column_schema root_column_schema)
Constructs a parquet schema from the schema of its root column.
Source information for read interfaces.