// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
#pragma once
#include "arrow/io/interfaces.h"
#include "parquet/encryption/type_fwd.h"
#include "parquet/types.h"
#include <optional>
#include <vector>
namespace parquet {
class EncodedStatistics;
struct PageIndexLocation;
/// \brief ColumnIndex is a proxy around format::ColumnIndex.
class PARQUET_EXPORT ColumnIndex {
public:
/// \brief Create a ColumnIndex from a serialized thrift message.
static std::unique_ptr<ColumnIndex> Make(const ColumnDescriptor& descr,
const void* serialized_index,
uint32_t index_len,
const ReaderProperties& properties,
Decryptor* decryptor = NULLPTR);
virtual ~ColumnIndex() = default;
/// \brief A bitmap with a bit set for each data page that has only null values.
///
/// The length of this vector is equal to the number of data pages in the column.
virtual const std::vector<bool>& null_pages() const = 0;
/// \brief A vector of encoded lower bounds for each data page in this column.
///
/// `null_pages` should be inspected first, as only pages with non-null values
/// may have their lower bounds populated.
virtual const std::vector<std::string>& encoded_min_values() const = 0;
/// \brief A vector of encoded upper bounds for each data page in this column.
///
/// `null_pages` should be inspected first, as only pages with non-null values
/// may have their upper bounds populated.
virtual const std::vector<std::string>& encoded_max_values() const = 0;
/// \brief The ordering of lower and upper bounds.
///
/// The boundary order applies across all lower bounds, and all upper bounds,
/// respectively. However, the order between lower bounds and upper bounds
/// cannot be derived from this.
virtual BoundaryOrder::type boundary_order() const = 0;
/// \brief Whether per-page null count information is available.
virtual bool has_null_counts() const = 0;
/// \brief An optional vector with the number of null values in each data page.
///
/// `has_null_counts` should be called first to determine if this information is
/// available.
virtual const std::vector<int64_t>& null_counts() const = 0;
/// \brief A vector of page indices for non-null pages.
virtual const std::vector<int32_t>& non_null_page_indices() const = 0;
};
/// \brief Typed implementation of ColumnIndex.
template <typename DType>
class PARQUET_EXPORT TypedColumnIndex : public ColumnIndex {
public:
using T = typename DType::c_type;
/// \brief A vector of lower bounds for each data page in this column.
///
/// This is like `encoded_min_values`, but with the values decoded according to
/// the column's physical type.
/// `min_values` and `max_values` can be used together with `boundary_order`
/// in order to prune some data pages when searching for specific values.
virtual const std::vector<T>& min_values() const = 0;
/// \brief A vector of upper bounds for each data page in this column.
///
/// Just like `min_values`, but for upper bounds instead of lower bounds.
virtual const std::vector<T>& max_values() const = 0;
};
using BoolColumnIndex = TypedColumnIndex<BooleanType>;
using Int32ColumnIndex = TypedColumnIndex<Int32Type>;
using Int64ColumnIndex = TypedColumnIndex<Int64Type>;
using FloatColumnIndex = TypedColumnIndex<FloatType>;
using DoubleColumnIndex = TypedColumnIndex<DoubleType>;
using ByteArrayColumnIndex = TypedColumnIndex<ByteArrayType>;
using FLBAColumnIndex = TypedColumnIndex<FLBAType>;
/// \brief PageLocation is a proxy around format::PageLocation.
struct PARQUET_EXPORT PageLocation {
/// File offset of the data page.
int64_t offset;
/// Total compressed size of the data page and header.
int32_t compressed_page_size;
/// Row id of the first row in the page within the row group.
int64_t first_row_index;
};
/// \brief OffsetIndex is a proxy around format::OffsetIndex.
class PARQUET_EXPORT OffsetIndex {
public:
/// \brief Create a OffsetIndex from a serialized thrift message.
static std::unique_ptr<OffsetIndex> Make(const void* serialized_index,
uint32_t index_len,
const ReaderProperties& properties,
Decryptor* decryptor = NULLPTR);
virtual ~OffsetIndex() = default;
/// \brief A vector of locations for each data page in this column.
virtual const std::vector<PageLocation>& page_locations() const = 0;
};
/// \brief Interface for reading the page index for a Parquet row group.
class PARQUET_EXPORT RowGroupPageIndexReader {
public:
virtual ~RowGroupPageIndexReader() = default;
/// \brief Read column index of a column chunk.
///
/// \param[in] i column ordinal of the column chunk.
/// \returns column index of the column or nullptr if it does not exist.
/// \throws ParquetException if the index is out of bound.
virtual std::shared_ptr<ColumnIndex> GetColumnIndex(int32_t i) = 0;
/// \brief Read offset index of a column chunk.
///
/// \param[in] i column ordinal of the column chunk.
/// \returns offset index of the column or nullptr if it does not exist.
/// \throws ParquetException if the index is out of bound.
virtual std::shared_ptr<OffsetIndex> GetOffsetIndex(int32_t i) = 0;
};
struct PageIndexSelection {
/// Specifies whether to read the column index.
bool column_index = false;
/// Specifies whether to read the offset index.
bool offset_index = false;
};
PARQUET_EXPORT
std::ostream& operator<<(std::ostream& out, const PageIndexSelection& params);
struct RowGroupIndexReadRange {
/// Base start and total size of column index of all column chunks in a row group.
/// If none of the column chunks have column index, it is set to std::nullopt.
std::optional<::arrow::io::ReadRange> column_index = std::nullopt;
/// Base start and total size of offset index of all column chunks in a row group.
/// If none of the column chunks have offset index, it is set to std::nullopt.
std::optional<::arrow::io::ReadRange> offset_index = std::nullopt;
};
/// \brief Interface for reading the page index for a Parquet file.
class PARQUET_EXPORT PageIndexReader {
public:
virtual ~PageIndexReader() = default;
/// \brief Create a PageIndexReader instance.
/// \returns a PageIndexReader instance.
/// WARNING: The returned PageIndexReader references to all the input parameters, so
/// it must not outlive all of the input parameters. Usually these input parameters
/// come from the same ParquetFileReader object, so it must not outlive the reader
/// that creates this PageIndexReader.
static std::shared_ptr<PageIndexReader> Make(
::arrow::io::RandomAccessFile* input, std::shared_ptr<FileMetaData> file_metadata,
const ReaderProperties& properties,
InternalFileDecryptor* file_decryptor = NULLPTR);
/// \brief Get the page index reader of a specific row group.
/// \param[in] i row group ordinal to get page index reader.
/// \returns RowGroupPageIndexReader of the specified row group. A nullptr may or may
/// not be returned if the page index for the row group is unavailable. It is
/// the caller's responsibility to check the return value of follow-up calls
/// to the RowGroupPageIndexReader.
/// \throws ParquetException if the index is out of bound.
virtual std::shared_ptr<RowGroupPageIndexReader> RowGroup(int i) = 0;
/// \brief Advise the reader which part of page index will be read later.
///
/// The PageIndexReader can optionally prefetch and cache page index that
/// may be read later to get better performance.
///
/// The contract of this function is as below:
/// 1) If WillNeed() has not been called for a specific row group and the page index
/// exists, follow-up calls to get column index or offset index of all columns in
/// this row group SHOULD NOT FAIL, but the performance may not be optimal.
/// 2) If WillNeed() has been called for a specific row group, follow-up calls to get
/// page index are limited to columns and index type requested by WillNeed().
/// So it MAY FAIL if columns that are not requested by WillNeed() are requested.
/// 3) Later calls to WillNeed() MAY OVERRIDE previous calls of same row groups.
/// For example,
/// 1) If WillNeed() is not called for row group 0, then follow-up calls to read
/// column index and/or offset index of all columns of row group 0 should not
/// fail if its page index exists.
/// 2) If WillNeed() is called for columns 0 and 1 for row group 0, then follow-up
/// call to read page index of column 2 for row group 0 MAY FAIL even if its
/// page index exists.
/// 3) If WillNeed() is called for row group 0 with offset index only, then
/// follow-up call to read column index of row group 0 MAY FAIL even if
/// the column index of this column exists.
/// 4) If WillNeed() is called for columns 0 and 1 for row group 0, then later
/// call to WillNeed() for columns 1 and 2 for row group 0. The later one
/// overrides previous call and only columns 1 and 2 of row group 0 are allowed
/// to access.
///
/// \param[in] row_group_indices list of row group ordinal to read page index later.
/// \param[in] column_indices list of column ordinal to read page index later. If it is
/// empty, it means all columns in the row group will be read.
/// \param[in] selection which kind of page index is required later.
virtual void WillNeed(const std::vector<int32_t>& row_group_indices,
const std::vector<int32_t>& column_indices,
const PageIndexSelection& selection) = 0;
/// \brief Advise the reader page index of these row groups will not be read anymore.
///
/// The PageIndexReader implementation has the opportunity to cancel any prefetch or
/// release resource that are related to these row groups.
///
/// \param[in] row_group_indices list of row group ordinal that whose page index will
/// not be accessed anymore.
virtual void WillNotNeed(const std::vector<int32_t>& row_group_indices) = 0;
/// \brief Determine the column index and offset index ranges for the given row group.
///
/// \param[in] row_group_metadata row group metadata to get column chunk metadata.
/// \param[in] columns list of column ordinals to get page index. If the list is empty,
/// it means all columns in the row group.
/// \returns RowGroupIndexReadRange of the specified row group. Throws ParquetException
/// if the selected column ordinal is out of bound or metadata of page index
/// is corrupted.
static RowGroupIndexReadRange DeterminePageIndexRangesInRowGroup(
const RowGroupMetaData& row_group_metadata, const std::vector<int32_t>& columns);
};
/// \brief Interface for collecting column index of data pages in a column chunk.
class PARQUET_EXPORT ColumnIndexBuilder {
public:
/// \brief API convenience to create a ColumnIndexBuilder.
static std::unique_ptr<ColumnIndexBuilder> Make(const ColumnDescriptor* descr);
virtual ~ColumnIndexBuilder() = default;
/// \brief Add statistics of a data page.
///
/// If the ColumnIndexBuilder has seen any corrupted statistics, it will
/// not update statistics anymore.
///
/// \param stats Page statistics in the encoded form.
virtual void AddPage(const EncodedStatistics& stats) = 0;
/// \brief Complete the column index.
///
/// Once called, AddPage() can no longer be called.
/// WriteTo() and Build() can only called after Finish() has been called.
virtual void Finish() = 0;
/// \brief Serialize the column index thrift message.
///
/// If the ColumnIndexBuilder has seen any corrupted statistics, it will
/// not write any data to the sink.
///
/// \param[out] sink output stream to write the serialized message.
/// \param[in] encryptor encryptor to encrypt the serialized column index.
virtual void WriteTo(::arrow::io::OutputStream* sink,
Encryptor* encryptor = NULLPTR) const = 0;
/// \brief Create a ColumnIndex directly.
///
/// \return If the ColumnIndexBuilder has seen any corrupted statistics, it simply
/// returns nullptr. Otherwise the column index is built and returned.
virtual std::unique_ptr<ColumnIndex> Build() const = 0;
};
/// \brief Interface for collecting offset index of data pages in a column chunk.
class PARQUET_EXPORT OffsetIndexBuilder {
public:
/// \brief API convenience to create a OffsetIndexBuilder.
static std::unique_ptr<OffsetIndexBuilder> Make();
virtual ~OffsetIndexBuilder() = default;
/// \brief Add page location of a data page.
virtual void AddPage(int64_t offset, int32_t compressed_page_size,
int64_t first_row_index) = 0;
/// \brief Add page location of a data page.
void AddPage(const PageLocation& page_location) {
AddPage(page_location.offset, page_location.compressed_page_size,
page_location.first_row_index);
}
/// \brief Complete the offset index.
///
/// In the buffered row group mode, data pages are flushed into memory
/// sink and the OffsetIndexBuilder has only collected the relative offset
/// which requires adjustment once they are flushed to the file.
///
/// \param final_position Final stream offset to add for page offset adjustment.
virtual void Finish(int64_t final_position) = 0;
/// \brief Serialize the offset index thrift message.
///
/// \param[out] sink output stream to write the serialized message.
/// \param[in] encryptor encryptor to encrypt the serialized offset index.
virtual void WriteTo(::arrow::io::OutputStream* sink,
Encryptor* encryptor = NULLPTR) const = 0;
/// \brief Create an OffsetIndex directly.
virtual std::unique_ptr<OffsetIndex> Build() const = 0;
};
/// \brief Interface for collecting page index of a parquet file.
class PARQUET_EXPORT PageIndexBuilder {
public:
/// \brief API convenience to create a PageIndexBuilder.
static std::unique_ptr<PageIndexBuilder> Make(
const SchemaDescriptor* schema, InternalFileEncryptor* file_encryptor = NULLPTR);
virtual ~PageIndexBuilder() = default;
/// \brief Start a new row group.
virtual void AppendRowGroup() = 0;
/// \brief Get the ColumnIndexBuilder from column ordinal.
///
Loading ...