parquet::file::metadata

Struct ColumnChunkMetaData

Source
pub struct ColumnChunkMetaData {
Show 22 fields column_descr: ColumnDescPtr, encodings: Vec<Encoding>, file_path: Option<String>, file_offset: i64, num_values: i64, compression: Compression, total_compressed_size: i64, total_uncompressed_size: i64, data_page_offset: i64, index_page_offset: Option<i64>, dictionary_page_offset: Option<i64>, statistics: Option<Statistics>, encoding_stats: Option<Vec<PageEncodingStats>>, bloom_filter_offset: Option<i64>, bloom_filter_length: Option<i32>, offset_index_offset: Option<i64>, offset_index_length: Option<i32>, column_index_offset: Option<i64>, column_index_length: Option<i32>, unencoded_byte_array_data_bytes: Option<i64>, repetition_level_histogram: Option<LevelHistogram>, definition_level_histogram: Option<LevelHistogram>,
}
Expand description

Metadata for a column chunk.

Fields§

§column_descr: ColumnDescPtr§encodings: Vec<Encoding>§file_path: Option<String>§file_offset: i64§num_values: i64§compression: Compression§total_compressed_size: i64§total_uncompressed_size: i64§data_page_offset: i64§index_page_offset: Option<i64>§dictionary_page_offset: Option<i64>§statistics: Option<Statistics>§encoding_stats: Option<Vec<PageEncodingStats>>§bloom_filter_offset: Option<i64>§bloom_filter_length: Option<i32>§offset_index_offset: Option<i64>§offset_index_length: Option<i32>§column_index_offset: Option<i64>§column_index_length: Option<i32>§unencoded_byte_array_data_bytes: Option<i64>§repetition_level_histogram: Option<LevelHistogram>§definition_level_histogram: Option<LevelHistogram>

Implementations§

Source§

impl ColumnChunkMetaData

Represents common operations for a column chunk.

Source

pub fn builder(column_descr: ColumnDescPtr) -> ColumnChunkMetaDataBuilder

Returns builder for column chunk metadata.

Source

pub fn file_path(&self) -> Option<&str>

File where the column chunk is stored.

If not set, assumed to belong to the same file as the metadata. This path is relative to the current file.

Source

pub fn file_offset(&self) -> i64

Byte offset of ColumnMetaData in file_path().

Note that the meaning of this field has been inconsistent between implementations so its use has since been deprecated in the Parquet specification. Modern implementations will set this to 0 to indicate that the ColumnMetaData is solely contained in the ColumnChunk struct.

Source

pub fn column_type(&self) -> Type

Type of this column. Must be primitive.

Source

pub fn column_path(&self) -> &ColumnPath

Path (or identifier) of this column.

Source

pub fn column_descr(&self) -> &ColumnDescriptor

Descriptor for this column.

Source

pub fn column_descr_ptr(&self) -> ColumnDescPtr

Reference counted clone of descriptor for this column.

Source

pub fn encodings(&self) -> &Vec<Encoding>

All encodings used for this column.

Source

pub fn num_values(&self) -> i64

Total number of values in this column chunk.

Source

pub fn compression(&self) -> Compression

Compression for this column.

Source

pub fn compressed_size(&self) -> i64

Returns the total compressed data size of this column chunk.

Source

pub fn uncompressed_size(&self) -> i64

Returns the total uncompressed data size of this column chunk.

Source

pub fn data_page_offset(&self) -> i64

Returns the offset for the column data.

Source

pub fn index_page_offset(&self) -> Option<i64>

Returns the offset for the index page.

Source

pub fn dictionary_page_offset(&self) -> Option<i64>

Returns the offset for the dictionary page, if any.

Source

pub fn byte_range(&self) -> (u64, u64)

Returns the offset and length in bytes of the column chunk within the file.

Source

pub fn statistics(&self) -> Option<&Statistics>

Returns statistics that are set for this column chunk, or None if no statistics are available.

Source

pub fn page_encoding_stats(&self) -> Option<&Vec<PageEncodingStats>>

Returns the page encoding stats, or None if no page encoding stats are available.

Source

pub fn bloom_filter_offset(&self) -> Option<i64>

Returns the offset for the bloom filter.

Source

pub fn bloom_filter_length(&self) -> Option<i32>

Returns the length of the bloom filter.

Source

pub fn column_index_offset(&self) -> Option<i64>

Returns the offset for the column index.

Source

pub fn column_index_length(&self) -> Option<i32>

Returns the length of the column index.

Source

pub(crate) fn column_index_range(&self) -> Option<Range<usize>>

Returns the range for the column index, if any.

Source

pub fn offset_index_offset(&self) -> Option<i64>

Returns the offset for the offset index.

Source

pub fn offset_index_length(&self) -> Option<i32>

Returns the length of the offset index.

Source

pub(crate) fn offset_index_range(&self) -> Option<Range<usize>>

Returns the range for the offset index if any

Source

pub fn unencoded_byte_array_data_bytes(&self) -> Option<i64>

Returns the number of bytes of variable length data after decoding.

Only set for BYTE_ARRAY columns. This field may not be set by older writers.

Source

pub fn repetition_level_histogram(&self) -> Option<&LevelHistogram>

Returns the repetition level histogram.

The returned value vec[i] is how many values are at repetition level i. For example, vec[0] indicates how many rows the page contains. This field may not be set by older writers.

Source

pub fn definition_level_histogram(&self) -> Option<&LevelHistogram>

Returns the definition level histogram.

The returned value vec[i] is how many values are at definition level i. For example, vec[max_definition_level] indicates how many non-null values are present in the page. This field may not be set by older writers.

Source

pub fn from_thrift(column_descr: ColumnDescPtr, cc: ColumnChunk) -> Result<Self>

Method to convert from Thrift.

Source

pub fn to_thrift(&self) -> ColumnChunk

Method to convert to Thrift.

Source

pub fn to_column_metadata_thrift(&self) -> ColumnMetaData

Method to convert to Thrift ColumnMetaData

Source

pub fn into_builder(self) -> ColumnChunkMetaDataBuilder

Trait Implementations§

Source§

impl Clone for ColumnChunkMetaData

Source§

fn clone(&self) -> ColumnChunkMetaData

Returns a copy of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl Debug for ColumnChunkMetaData

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
Source§

impl From<ColumnChunkMetaData> for ColumnChunkMetaDataBuilder

Source§

fn from(value: ColumnChunkMetaData) -> Self

Converts to this type from the input type.
Source§

impl HeapSize for ColumnChunkMetaData

Source§

fn heap_size(&self) -> usize

Return the size of any bytes allocated on the heap by this object, including heap memory in those structures Read more
Source§

impl PartialEq for ColumnChunkMetaData

Source§

fn eq(&self, other: &ColumnChunkMetaData) -> bool

Tests for self and other values to be equal, and is used by ==.
1.0.0 · Source§

fn ne(&self, other: &Rhs) -> bool

Tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
Source§

impl StructuralPartialEq for ColumnChunkMetaData

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dst: *mut T)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dst. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
§

impl<T> Allocation for T
where T: RefUnwindSafe + Send + Sync,

§

impl<T> ErasedDestructor for T
where T: 'static,

§

impl<T> MaybeSendSync for T