pub struct ColumnChunkMetaData {
column_descr: ColumnDescPtr,
encodings: Vec<Encoding>,
file_path: Option<String>,
file_offset: i64,
num_values: i64,
compression: Compression,
total_compressed_size: i64,
total_uncompressed_size: i64,
data_page_offset: i64,
index_page_offset: Option<i64>,
dictionary_page_offset: Option<i64>,
statistics: Option<Statistics>,
encoding_stats: Option<Vec<PageEncodingStats>>,
bloom_filter_offset: Option<i64>,
bloom_filter_length: Option<i32>,
offset_index_offset: Option<i64>,
offset_index_length: Option<i32>,
column_index_offset: Option<i64>,
column_index_length: Option<i32>,
unencoded_byte_array_data_bytes: Option<i64>,
repetition_level_histogram: Option<LevelHistogram>,
definition_level_histogram: Option<LevelHistogram>,
}
Expand description
Metadata for a column chunk.
Fields§
§column_descr: ColumnDescPtr
§encodings: Vec<Encoding>
§file_path: Option<String>
§file_offset: i64
§num_values: i64
§compression: Compression
§total_compressed_size: i64
§total_uncompressed_size: i64
§data_page_offset: i64
§index_page_offset: Option<i64>
§dictionary_page_offset: Option<i64>
§statistics: Option<Statistics>
§encoding_stats: Option<Vec<PageEncodingStats>>
§bloom_filter_offset: Option<i64>
§bloom_filter_length: Option<i32>
§offset_index_offset: Option<i64>
§offset_index_length: Option<i32>
§column_index_offset: Option<i64>
§column_index_length: Option<i32>
§unencoded_byte_array_data_bytes: Option<i64>
§repetition_level_histogram: Option<LevelHistogram>
§definition_level_histogram: Option<LevelHistogram>
Implementations§
Source§impl ColumnChunkMetaData
Represents common operations for a column chunk.
impl ColumnChunkMetaData
Represents common operations for a column chunk.
Sourcepub fn builder(column_descr: ColumnDescPtr) -> ColumnChunkMetaDataBuilder
pub fn builder(column_descr: ColumnDescPtr) -> ColumnChunkMetaDataBuilder
Returns builder for column chunk metadata.
Sourcepub fn file_path(&self) -> Option<&str>
pub fn file_path(&self) -> Option<&str>
File where the column chunk is stored.
If not set, assumed to belong to the same file as the metadata. This path is relative to the current file.
Sourcepub fn file_offset(&self) -> i64
pub fn file_offset(&self) -> i64
Byte offset of `ColumnMetaData` in `file_path()`.
Note that the meaning of this field has been inconsistent between implementations, so its use has since been deprecated in the Parquet specification. Modern implementations will set this to `0` to indicate that the `ColumnMetaData` is solely contained in the `ColumnChunk` struct.
Sourcepub fn column_type(&self) -> Type
pub fn column_type(&self) -> Type
Type of this column. Must be primitive.
Sourcepub fn column_path(&self) -> &ColumnPath
pub fn column_path(&self) -> &ColumnPath
Path (or identifier) of this column.
Sourcepub fn column_descr(&self) -> &ColumnDescriptor
pub fn column_descr(&self) -> &ColumnDescriptor
Descriptor for this column.
Sourcepub fn column_descr_ptr(&self) -> ColumnDescPtr
pub fn column_descr_ptr(&self) -> ColumnDescPtr
Reference counted clone of descriptor for this column.
Sourcepub fn num_values(&self) -> i64
pub fn num_values(&self) -> i64
Total number of values in this column chunk.
Sourcepub fn compression(&self) -> Compression
pub fn compression(&self) -> Compression
Compression for this column.
Sourcepub fn compressed_size(&self) -> i64
pub fn compressed_size(&self) -> i64
Returns the total compressed data size of this column chunk.
Sourcepub fn uncompressed_size(&self) -> i64
pub fn uncompressed_size(&self) -> i64
Returns the total uncompressed data size of this column chunk.
Sourcepub fn data_page_offset(&self) -> i64
pub fn data_page_offset(&self) -> i64
Returns the offset for the column data.
Sourcepub fn index_page_offset(&self) -> Option<i64>
pub fn index_page_offset(&self) -> Option<i64>
Returns the offset for the index page.
Sourcepub fn dictionary_page_offset(&self) -> Option<i64>
pub fn dictionary_page_offset(&self) -> Option<i64>
Returns the offset for the dictionary page, if any.
Sourcepub fn byte_range(&self) -> (u64, u64)
pub fn byte_range(&self) -> (u64, u64)
Returns the offset and length in bytes of the column chunk within the file
Sourcepub fn statistics(&self) -> Option<&Statistics>
pub fn statistics(&self) -> Option<&Statistics>
Returns statistics that are set for this column chunk, or `None` if no statistics are available.
Sourcepub fn page_encoding_stats(&self) -> Option<&Vec<PageEncodingStats>>
pub fn page_encoding_stats(&self) -> Option<&Vec<PageEncodingStats>>
Returns the page encoding stats, or `None` if no page encoding stats are available.
Sourcepub fn bloom_filter_offset(&self) -> Option<i64>
pub fn bloom_filter_offset(&self) -> Option<i64>
Returns the offset for the bloom filter.
Sourcepub fn bloom_filter_length(&self) -> Option<i32>
pub fn bloom_filter_length(&self) -> Option<i32>
Returns the length of the bloom filter.
Sourcepub fn column_index_offset(&self) -> Option<i64>
pub fn column_index_offset(&self) -> Option<i64>
Returns the offset for the column index.
Sourcepub fn column_index_length(&self) -> Option<i32>
pub fn column_index_length(&self) -> Option<i32>
Returns the length of the column index.
Sourcepub(crate) fn column_index_range(&self) -> Option<Range<usize>>
pub(crate) fn column_index_range(&self) -> Option<Range<usize>>
Returns the range for the column index, if any.
Sourcepub fn offset_index_offset(&self) -> Option<i64>
pub fn offset_index_offset(&self) -> Option<i64>
Returns the offset for the offset index.
Sourcepub fn offset_index_length(&self) -> Option<i32>
pub fn offset_index_length(&self) -> Option<i32>
Returns the length of the offset index.
Sourcepub(crate) fn offset_index_range(&self) -> Option<Range<usize>>
pub(crate) fn offset_index_range(&self) -> Option<Range<usize>>
Returns the range for the offset index if any
Sourcepub fn unencoded_byte_array_data_bytes(&self) -> Option<i64>
pub fn unencoded_byte_array_data_bytes(&self) -> Option<i64>
Returns the number of bytes of variable length data after decoding.
Only set for BYTE_ARRAY columns. This field may not be set by older writers.
Sourcepub fn repetition_level_histogram(&self) -> Option<&LevelHistogram>
pub fn repetition_level_histogram(&self) -> Option<&LevelHistogram>
Returns the repetition level histogram.
The returned value `vec[i]` is how many values are at repetition level `i`. For example, `vec[0]` indicates how many rows the page contains.
This field may not be set by older writers.
Sourcepub fn definition_level_histogram(&self) -> Option<&LevelHistogram>
pub fn definition_level_histogram(&self) -> Option<&LevelHistogram>
Returns the definition level histogram.
The returned value `vec[i]` is how many values are at definition level `i`. For example, `vec[max_definition_level]` indicates how many non-null values are present in the page.
This field may not be set by older writers.
Sourcepub fn from_thrift(column_descr: ColumnDescPtr, cc: ColumnChunk) -> Result<Self>
pub fn from_thrift(column_descr: ColumnDescPtr, cc: ColumnChunk) -> Result<Self>
Method to convert from Thrift.
Sourcepub fn to_thrift(&self) -> ColumnChunk
pub fn to_thrift(&self) -> ColumnChunk
Method to convert to Thrift.
Sourcepub fn to_column_metadata_thrift(&self) -> ColumnMetaData
pub fn to_column_metadata_thrift(&self) -> ColumnMetaData
Method to convert to Thrift ColumnMetaData
Sourcepub fn into_builder(self) -> ColumnChunkMetaDataBuilder
pub fn into_builder(self) -> ColumnChunkMetaDataBuilder
Converts this `ColumnChunkMetaData` into a `ColumnChunkMetaDataBuilder`.
Trait Implementations§
Source§impl Clone for ColumnChunkMetaData
impl Clone for ColumnChunkMetaData
Source§fn clone(&self) -> ColumnChunkMetaData
fn clone(&self) -> ColumnChunkMetaData
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from `source`. Read more
Source§impl Debug for ColumnChunkMetaData
impl Debug for ColumnChunkMetaData
Source§impl From<ColumnChunkMetaData> for ColumnChunkMetaDataBuilder
impl From<ColumnChunkMetaData> for ColumnChunkMetaDataBuilder
Source§fn from(value: ColumnChunkMetaData) -> Self
fn from(value: ColumnChunkMetaData) -> Self
Source§impl HeapSize for ColumnChunkMetaData
impl HeapSize for ColumnChunkMetaData
Source§impl PartialEq for ColumnChunkMetaData
impl PartialEq for ColumnChunkMetaData
impl StructuralPartialEq for ColumnChunkMetaData
Auto Trait Implementations§
impl !Freeze for ColumnChunkMetaData
impl RefUnwindSafe for ColumnChunkMetaData
impl Send for ColumnChunkMetaData
impl Sync for ColumnChunkMetaData
impl Unpin for ColumnChunkMetaData
impl UnwindSafe for ColumnChunkMetaData
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left` is `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left(&self)` returns `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more