pub struct BinaryArray<O>where
    O: Offset,{ /* private fields */ }
Expand description

A BinaryArray is Arrow’s semantic equivalent of an immutable Vec<Option<Vec<u8>>>. It implements Array.

The size of this struct is O(1), as all data is stored behind an std::sync::Arc.

Example

use arrow2::array::BinaryArray;
use arrow2::bitmap::Bitmap;
use arrow2::buffer::Buffer;

let array = BinaryArray::<i32>::from([Some([1, 2].as_ref()), None, Some([3].as_ref())]);
assert_eq!(array.value(0), &[1, 2]);
assert_eq!(array.iter().collect::<Vec<_>>(), vec![Some([1, 2].as_ref()), None, Some([3].as_ref())]);
assert_eq!(array.values_iter().collect::<Vec<_>>(), vec![[1, 2].as_ref(), &[], &[3]]);
// the underlying representation:
assert_eq!(array.values(), &Buffer::from(vec![1, 2, 3]));
assert_eq!(array.offsets().buffer(), &Buffer::from(vec![0, 2, 2, 3]));
assert_eq!(array.validity(), Some(&Bitmap::from([true, false, true])));

Generic parameter

The generic parameter Offset can only be i32 or i64 and trades off maximum array length against memory usage:

  • the sum of lengths of all elements cannot exceed Offset::MAX
  • the total size of the underlying data is array.len() * size_of::<Offset>() + sum of lengths of all elements

Safety

The following invariants hold:

  • Any two consecutive offsets, cast (as) to usize, delimit a valid slice of values.
  • len is equal to validity.len(), when defined.

Implementations§

§

impl<O> BinaryArray<O>where O: Offset,

pub fn try_new( data_type: DataType, offsets: OffsetsBuffer<O>, values: Buffer<u8>, validity: Option<Bitmap> ) -> Result<BinaryArray<O>, Error>

Returns a BinaryArray created from its internal representation.

Errors

This function returns an error iff:

  • The last offset is not equal to the values’ length.
  • The validity’s length is not equal to offsets.len().
  • The data_type’s crate::datatypes::PhysicalType is not equal to either Binary or LargeBinary.
Implementation

This function is O(1)

pub fn from_slice<T, P>(slice: P) -> BinaryArray<O>where T: AsRef<[u8]>, P: AsRef<[T]>,

Creates a new BinaryArray from slices of &[u8].

pub fn from<T, P>(slice: P) -> BinaryArray<O>where T: AsRef<[u8]>, P: AsRef<[Option<T>]>,

Creates a new BinaryArray from a slice of optional &[u8].

pub fn iter( &self ) -> ZipValidity<&[u8], ArrayValuesIter<'_, BinaryArray<O>>, BitmapIter<'_>>

Returns an iterator of Option<&[u8]> over every element of this array.

pub fn values_iter(&self) -> ArrayValuesIter<'_, BinaryArray<O>>

Returns an iterator of &[u8] over every element of this array, ignoring the validity

pub fn len(&self) -> usize

Returns the length of this array

pub fn value(&self, i: usize) -> &[u8]

Returns the element at index i

Panics

iff i >= self.len()

pub unsafe fn value_unchecked(&self, i: usize) -> &[u8]

Returns the element at index i

Safety

Assumes that i < self.len().

pub fn get(&self, i: usize) -> Option<&[u8]>

Returns the element at index i or None if it is null

Panics

iff i >= self.len()

pub fn data_type(&self) -> &DataType

Returns the DataType of this array.

pub fn values(&self) -> &Buffer<u8>

Returns the values of this BinaryArray.

pub fn offsets(&self) -> &OffsetsBuffer<O>

Returns the offsets of this BinaryArray.

pub fn validity(&self) -> Option<&Bitmap>

The optional validity.

pub fn slice(&mut self, offset: usize, length: usize)

Slices this BinaryArray.

Implementation

This function is O(1).

Panics

iff offset + length > self.len().

pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize)

Slices this BinaryArray.

Implementation

This function is O(1).

Safety

The caller must ensure that offset + length <= self.len().

pub fn sliced(self, offset: usize, length: usize) -> BinaryArray<O>

Returns this array sliced.

Implementation

This function is O(1).

Panics

iff offset + length > self.len().

pub fn sliced_unchecked(self, offset: usize, length: usize) -> BinaryArray<O>

Returns this array sliced.

Implementation

This function is O(1).

Safety

The caller must ensure that offset + length <= self.len().

pub fn with_validity(self, validity: Option<Bitmap>) -> BinaryArray<O>

Returns this array with a new validity.

Panics

Panics iff validity.len() != self.len().

pub fn set_validity(&mut self, validity: Option<Bitmap>)

Sets the validity of this array.

Panics

This function panics iff validity.len() != self.len().

pub fn boxed(self) -> Box<dyn Array + 'static, Global>

Boxes this array into a Box<dyn Array>.

pub fn arced(self) -> Arc<dyn Array + 'static>

Arcs this array into a std::sync::Arc<dyn Array>.

pub fn into_mut(self) -> Either<BinaryArray<O>, MutableBinaryArray<O>>

Try to convert this BinaryArray to a MutableBinaryArray

pub fn new_empty(data_type: DataType) -> BinaryArray<O>

Creates an empty BinaryArray, i.e. whose .len is zero.

pub fn new_null(data_type: DataType, length: usize) -> BinaryArray<O>

Creates a null BinaryArray, i.e. whose .null_count() == .len().

pub fn default_data_type() -> DataType

Returns the default DataType, DataType::Binary or DataType::LargeBinary

pub fn new( data_type: DataType, offsets: OffsetsBuffer<O>, values: Buffer<u8>, validity: Option<Bitmap> ) -> BinaryArray<O>

Alias for unwrapping Self::try_new

pub fn from_trusted_len_values_iter<T, I>(iterator: I) -> BinaryArray<O>where T: AsRef<[u8]>, I: TrustedLen<Item = T>,

Returns a BinaryArray from an iterator of trusted length.

The BinaryArray is guaranteed to not have a validity

pub fn from_iter_values<T, I>(iterator: I) -> BinaryArray<O>where T: AsRef<[u8]>, I: Iterator<Item = T>,

Returns a new BinaryArray from an Iterator of &[u8].

The BinaryArray is guaranteed to not have a validity

pub unsafe fn from_trusted_len_iter_unchecked<I, P>( iterator: I ) -> BinaryArray<O>where P: AsRef<[u8]>, I: Iterator<Item = Option<P>>,

Creates a BinaryArray from an iterator of trusted length.

Safety

The iterator must be TrustedLen, i.e. size_hint().1 must correctly report its length.

pub fn from_trusted_len_iter<I, P>(iterator: I) -> BinaryArray<O>where P: AsRef<[u8]>, I: TrustedLen<Item = Option<P>>,

Creates a BinaryArray from a TrustedLen iterator.

pub unsafe fn try_from_trusted_len_iter_unchecked<E, I, P>( iterator: I ) -> Result<BinaryArray<O>, E>where P: AsRef<[u8]>, I: IntoIterator<Item = Result<Option<P>, E>>,

Creates a BinaryArray from a fallible iterator of trusted length.

Safety

The iterator must be TrustedLen, i.e. size_hint().1 must correctly report its length.

pub fn try_from_trusted_len_iter<E, I, P>(iter: I) -> Result<BinaryArray<O>, E>where P: AsRef<[u8]>, I: TrustedLen<Item = Result<Option<P>, E>>,

Creates a BinaryArray from a fallible iterator of trusted length.

Trait Implementations§

§

impl<O> Array for BinaryArray<O>where O: Offset,

§

fn as_any(&self) -> &(dyn Any + 'static)

Converts itself to a reference of Any, which enables downcasting to concrete types.
§

fn as_any_mut(&mut self) -> &mut (dyn Any + 'static)

Converts itself to a mutable reference of Any, which enables mutable downcasting to concrete types.
§

fn len(&self) -> usize

The length of the Array. Every array has a length corresponding to the number of elements (slots).
§

fn data_type(&self) -> &DataType

The DataType of the Array. In combination with Array::as_any, this can be used to downcast trait objects (dyn Array) to concrete arrays.
§

fn slice(&mut self, offset: usize, length: usize)

Slices this Array. Read more
§

unsafe fn slice_unchecked(&mut self, offset: usize, length: usize)

Slices the Array. Read more
§

fn to_boxed(&self) -> Box<dyn Array + 'static, Global>

Clone a &dyn Array to an owned Box<dyn Array>.
§

fn validity(&self) -> Option<&Bitmap>

The validity of the Array: every array has an optional Bitmap that, when available specifies whether the array slot is valid or not (null). When the validity is None, all slots are valid.
§

fn with_validity( &self, validity: Option<Bitmap> ) -> Box<dyn Array + 'static, Global>

Clones this Array with a newly assigned bitmap. Read more
§

fn is_empty(&self) -> bool

whether the array is empty
§

fn null_count(&self) -> usize

The number of null slots on this Array. Read more
§

fn is_null(&self, i: usize) -> bool

Returns whether slot i is null. Read more
§

fn is_valid(&self, i: usize) -> bool

Returns whether slot i is valid. Read more
§

fn sliced( &self, offset: usize, length: usize ) -> Box<dyn Array + 'static, Global>

Returns a slice of this Array. Read more
§

unsafe fn sliced_unchecked( &self, offset: usize, length: usize ) -> Box<dyn Array + 'static, Global>

Returns a slice of this Array. Read more
§

impl<'a> ArrowGetItem for &'a BinaryArray<i64>

§

type Item = &'a [u8]

§

fn get( &self, item: usize ) -> Option<<&'a BinaryArray<i64> as ArrowGetItem>::Item>

§

unsafe fn get_unchecked( &self, item: usize ) -> Option<<&'a BinaryArray<i64> as ArrowGetItem>::Item>

Safety Read more
source§

impl ChunkApplyKernel<BinaryArray<i64>> for ChunkedArray<BinaryType>

source§

fn apply_kernel( &self, f: &dyn Fn(&BinaryArray<i64>) -> Box<dyn Array + 'static, Global> ) -> ChunkedArray<BinaryType>

Apply kernel and return result as a new ChunkedArray.
source§

fn apply_kernel_cast<S>( &self, f: &dyn Fn(&BinaryArray<i64>) -> Box<dyn Array + 'static, Global> ) -> ChunkedArray<S>where S: PolarsDataType,

Apply a kernel that outputs an array of different type.
§

impl<O> Clone for BinaryArray<O>where O: Clone + Offset,

§

fn clone(&self) -> BinaryArray<O>

Returns a copy of the value. Read more
1.0.0 · source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
§

impl<O> Debug for BinaryArray<O>where O: Offset,

§

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

Formats the value using the given formatter. Read more
§

impl<'a, O> From<GrowableBinary<'a, O>> for BinaryArray<O>where O: Offset,

§

fn from(val: GrowableBinary<'a, O>) -> BinaryArray<O>

Converts to this type from the input type.
§

impl<O> From<MutableBinaryArray<O>> for BinaryArray<O>where O: Offset,

§

fn from(other: MutableBinaryArray<O>) -> BinaryArray<O>

Converts to this type from the input type.
§

impl<O> From<MutableBinaryValuesArray<O>> for BinaryArray<O>where O: Offset,

§

fn from(other: MutableBinaryValuesArray<O>) -> BinaryArray<O>

Converts to this type from the input type.
§

impl FromDataBinary for BinaryArray<i64>

§

unsafe fn from_data_unchecked_default( offsets: Buffer<i64>, values: Buffer<u8>, validity: Option<Bitmap> ) -> BinaryArray<i64>

Safety Read more
§

impl<O, P> FromIterator<Option<P>> for BinaryArray<O>where O: Offset, P: AsRef<[u8]>,

§

fn from_iter<I>(iter: I) -> BinaryArray<O>where I: IntoIterator<Item = Option<P>>,

Creates a value from an iterator. Read more
§

impl<O> GenericBinaryArray<O> for BinaryArray<O>where O: Offset,

§

fn values(&self) -> &[u8]

The values of the array
§

fn offsets(&self) -> &[O]

The offsets of the array
§

impl<'a, O> IntoIterator for &'a BinaryArray<O>where O: Offset,

§

type Item = Option<&'a [u8]>

The type of the elements being iterated over.
§

type IntoIter = ZipValidity<&'a [u8], ArrayValuesIter<'a, BinaryArray<O>>, BitmapIter<'a>>

Which kind of iterator are we turning this into?
§

fn into_iter(self) -> <&'a BinaryArray<O> as IntoIterator>::IntoIter

Creates an iterator from a value. Read more
§

impl<O> PartialEq<&(dyn Array + 'static)> for BinaryArray<O>where O: Offset,

§

fn eq(&self, other: &&(dyn Array + 'static)) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
§

impl<O> PartialEq<BinaryArray<O>> for &(dyn Array + 'static)where O: Offset,

§

fn eq(&self, other: &BinaryArray<O>) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
§

impl<O> PartialEq<BinaryArray<O>> for BinaryArray<O>where O: Offset,

§

fn eq(&self, other: &BinaryArray<O>) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
§

impl ValueSize for BinaryArray<i64>

§

fn get_values_size(&self) -> usize

Useful for a Utf8 or a List to get underlying value size. During a rechunk this is handy
§

impl ArrowArray for BinaryArray<i64>

Auto Trait Implementations§

§

impl<O> RefUnwindSafe for BinaryArray<O>

§

impl<O> Send for BinaryArray<O>

§

impl<O> Sync for BinaryArray<O>

§

impl<O> Unpin for BinaryArray<O>

§

impl<O> UnwindSafe for BinaryArray<O>

Blanket Implementations§

source§

impl<T> Any for Twhere T: 'static + ?Sized,

source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
source§

impl<T> Borrow<T> for Twhere T: ?Sized,

source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
source§

impl<T> BorrowMut<T> for Twhere T: ?Sized,

source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
source§

impl<T> DynClone for Twhere T: Clone,

source§

fn __clone_box(&self, _: Private) -> *mut ()

source§

impl<T> From<T> for T

source§

fn from(t: T) -> T

Returns the argument unchanged.

source§

impl<T, U> Into<U> for Twhere U: From<T>,

source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

§

impl<A> IsValid for Awhere A: ArrowArray,

§

unsafe fn is_valid_unchecked(&self, i: usize) -> bool

Safety Read more
§

unsafe fn is_null_unchecked(&self, i: usize) -> bool

Safety Read more
§

impl<T> Pointable for T

§

const ALIGN: usize = mem::align_of::<T>()

The alignment of pointer.
§

type Init = T

The type for initializers.
§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a with the given initializer. Read more
§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
§

impl<A> PolarsArray for Awhere A: Array + ?Sized,

§

fn has_validity(&self) -> bool

§

impl<T> SlicedArray for Twhere T: Array + Clone,

§

fn slice_typed(&self, offset: usize, length: usize) -> T

Slices this Array. Read more
§

unsafe fn slice_typed_unchecked(&self, offset: usize, length: usize) -> T

Slices the Array. Read more
source§

impl<T> ToOwned for Twhere T: Clone,

§

type Owned = T

The resulting type after obtaining ownership.
source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
source§

impl<T, U> TryFrom<U> for Twhere U: Into<T>,

§

type Error = Infallible

The type returned in the event of a conversion error.
source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
source§

impl<T, U> TryInto<U> for Twhere U: TryFrom<T>,

§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
§

impl<V, T> VZip<V> for Twhere V: MultiLane<T>,

§

fn vzip(self) -> V