Struct parquet::encoding::DictEncoder[][src]

pub struct DictEncoder<T: DataType> { /* fields omitted */ }
Expand description

Dictionary encoder. The dictionary encoding builds a dictionary of values encountered in a given column. The dictionary page is written first, before the data pages of the column chunk.

Dictionary page format: the entries in the dictionary - in dictionary order - using the plain encoding.

Data page format: the bit width used to encode the entry ids, stored as 1 byte (max bit width = 32), followed by the entry ids encoded using the RLE/bit-packing hybrid encoding (with the given bit width).

Implementations

impl<T: DataType> DictEncoder<T>[src]

pub fn new(desc: ColumnDescPtr, mem_tracker: MemTrackerPtr) -> Self[src]

Creates a new dictionary encoder.

pub fn is_sorted(&self) -> bool[src]

Returns true if dictionary entries are sorted, false otherwise.

pub fn num_entries(&self) -> usize[src]

Returns number of unique values (keys) in the dictionary.

pub fn dict_encoded_size(&self) -> usize[src]

Returns the total size of the unique values (keys) in the dictionary, in bytes.

pub fn write_dict(&self) -> Result<ByteBufferPtr>[src]

Writes out the dictionary values with PLAIN encoding into a byte buffer, and returns the result.

pub fn write_indices(&mut self) -> Result<ByteBufferPtr>[src]

Writes out the dictionary indices with RLE encoding into a byte buffer, and returns the result.

Trait Implementations

impl<T: DataType> Encoder<T> for DictEncoder<T>[src]

fn put(&mut self, values: &[T::T]) -> Result<()>[src]

Encodes data from values.

fn encoding(&self) -> Encoding[src]

Returns the encoding type of this encoder.

fn estimated_data_encoded_size(&self) -> usize[src]

Returns an estimate of the size of the encoded data, in bytes. Method call must be O(1). Read more

fn flush_buffer(&mut self) -> Result<ByteBufferPtr>[src]

Flushes the underlying byte buffer that’s being processed by this encoder, and returns an immutable copy of it. This will also reset the internal state. Read more

fn put_spaced(&mut self, values: &[T::T], valid_bits: &[u8]) -> Result<usize>[src]

Encodes data from values, which contains spaces for null values; the null positions are identified by valid_bits. Read more

Auto Trait Implementations

impl<T> RefUnwindSafe for DictEncoder<T> where
    <T as DataType>::T: RefUnwindSafe

impl<T> Send for DictEncoder<T> where
    <T as DataType>::T: Send

impl<T> Sync for DictEncoder<T> where
    <T as DataType>::T: Sync

impl<T> Unpin for DictEncoder<T> where
    <T as DataType>::T: Unpin

impl<T> UnwindSafe for DictEncoder<T> where
    <T as DataType>::T: UnwindSafe

Blanket Implementations

impl<T> Any for T where
    T: 'static + ?Sized
[src]

pub fn type_id(&self) -> TypeId[src]

Gets the TypeId of self. Read more

impl<T> Borrow<T> for T where
    T: ?Sized
[src]

pub fn borrow(&self) -> &T[src]

Immutably borrows from an owned value. Read more

impl<T> BorrowMut<T> for T where
    T: ?Sized
[src]

pub fn borrow_mut(&mut self) -> &mut T[src]

Mutably borrows from an owned value. Read more

impl<T> From<T> for T[src]

pub fn from(t: T) -> T[src]

Performs the conversion.

impl<T, U> Into<U> for T where
    U: From<T>, 
[src]

pub fn into(self) -> U[src]

Performs the conversion.

impl<T, U> TryFrom<U> for T where
    U: Into<T>, 
[src]

type Error = Infallible

The type returned in the event of a conversion error.

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>[src]

Performs the conversion.

impl<T, U> TryInto<U> for T where
    U: TryFrom<T>, 
[src]

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>[src]

Performs the conversion.

impl<V, T> VZip<V> for T where
    V: MultiLane<T>, 

pub fn vzip(self) -> V