use super::{Array, Splitable};
use crate::bitmap::Bitmap;
use crate::buffer::Buffer;
use crate::datatypes::ArrowDataType;
#[cfg(feature = "arrow_rs")]
mod data;
mod ffi;
pub(super) mod fmt;
mod iterator;
mod mutable;
pub use mutable::*;
use polars_error::{polars_bail, polars_ensure, PolarsResult};
#[derive(Clone)]
pub struct FixedSizeBinaryArray {
size: usize, data_type: ArrowDataType,
values: Buffer<u8>,
validity: Option<Bitmap>,
}
impl FixedSizeBinaryArray {
pub fn try_new(
data_type: ArrowDataType,
values: Buffer<u8>,
validity: Option<Bitmap>,
) -> PolarsResult<Self> {
let size = Self::maybe_get_size(&data_type)?;
if values.len() % size != 0 {
polars_bail!(ComputeError:
"values (of len {}) must be a multiple of size ({}) in FixedSizeBinaryArray.",
values.len(),
size
)
}
let len = values.len() / size;
if validity
.as_ref()
.map_or(false, |validity| validity.len() != len)
{
polars_bail!(ComputeError: "validity mask length must be equal to the number of values divided by size")
}
Ok(Self {
size,
data_type,
values,
validity,
})
}
pub fn new(data_type: ArrowDataType, values: Buffer<u8>, validity: Option<Bitmap>) -> Self {
Self::try_new(data_type, values, validity).unwrap()
}
pub fn new_empty(data_type: ArrowDataType) -> Self {
Self::new(data_type, Buffer::new(), None)
}
pub fn new_null(data_type: ArrowDataType, length: usize) -> Self {
let size = Self::maybe_get_size(&data_type).unwrap();
Self::new(
data_type,
vec![0u8; length * size].into(),
Some(Bitmap::new_zeroed(length)),
)
}
}
impl FixedSizeBinaryArray {
pub fn slice(&mut self, offset: usize, length: usize) {
assert!(
offset + length <= self.len(),
"the offset of the new Buffer cannot exceed the existing length"
);
unsafe { self.slice_unchecked(offset, length) }
}
pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) {
self.validity = self
.validity
.take()
.map(|bitmap| bitmap.sliced_unchecked(offset, length))
.filter(|bitmap| bitmap.unset_bits() > 0);
self.values
.slice_unchecked(offset * self.size, length * self.size);
}
impl_sliced!();
impl_mut_validity!();
impl_into_array!();
}
impl FixedSizeBinaryArray {
#[inline]
pub fn len(&self) -> usize {
self.values.len() / self.size
}
#[inline]
pub fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
pub fn values(&self) -> &Buffer<u8> {
&self.values
}
#[inline]
pub fn value(&self, i: usize) -> &[u8] {
assert!(i < self.len());
unsafe { self.value_unchecked(i) }
}
#[inline]
pub unsafe fn value_unchecked(&self, i: usize) -> &[u8] {
self.values
.get_unchecked(i * self.size..(i + 1) * self.size)
}
#[inline]
pub fn get(&self, i: usize) -> Option<&[u8]> {
if !self.is_null(i) {
unsafe { Some(self.value_unchecked(i)) }
} else {
None
}
}
#[inline]
pub fn to(self, data_type: ArrowDataType) -> Self {
match (
data_type.to_logical_type(),
self.data_type().to_logical_type(),
) {
(ArrowDataType::FixedSizeBinary(size_a), ArrowDataType::FixedSizeBinary(size_b))
if size_a == size_b => {},
_ => panic!("Wrong DataType"),
}
Self {
size: self.size,
data_type,
values: self.values,
validity: self.validity,
}
}
pub fn size(&self) -> usize {
self.size
}
}
impl FixedSizeBinaryArray {
pub(crate) fn maybe_get_size(data_type: &ArrowDataType) -> PolarsResult<usize> {
match data_type.to_logical_type() {
ArrowDataType::FixedSizeBinary(size) => {
polars_ensure!(*size != 0, ComputeError: "FixedSizeBinaryArray expects a positive size");
Ok(*size)
},
other => {
polars_bail!(ComputeError: "FixedSizeBinaryArray expects DataType::FixedSizeBinary. found {other:?}")
},
}
}
pub fn get_size(data_type: &ArrowDataType) -> usize {
Self::maybe_get_size(data_type).unwrap()
}
}
impl Array for FixedSizeBinaryArray {
impl_common_array!();
fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
#[inline]
fn with_validity(&self, validity: Option<Bitmap>) -> Box<dyn Array> {
Box::new(self.clone().with_validity(validity))
}
}
impl Splitable for FixedSizeBinaryArray {
fn check_bound(&self, offset: usize) -> bool {
offset < self.len()
}
unsafe fn _split_at_unchecked(&self, offset: usize) -> (Self, Self) {
let (lhs_values, rhs_values) = unsafe { self.values.split_at_unchecked(offset) };
let (lhs_validity, rhs_validity) = unsafe { self.validity.split_at_unchecked(offset) };
let size = self.size;
(
Self {
data_type: self.data_type.clone(),
values: lhs_values,
validity: lhs_validity,
size,
},
Self {
data_type: self.data_type.clone(),
values: rhs_values,
validity: rhs_validity,
size,
},
)
}
}
impl FixedSizeBinaryArray {
pub fn try_from_iter<P: AsRef<[u8]>, I: IntoIterator<Item = Option<P>>>(
iter: I,
size: usize,
) -> PolarsResult<Self> {
MutableFixedSizeBinaryArray::try_from_iter(iter, size).map(|x| x.into())
}
pub fn from_iter<P: AsRef<[u8]>, I: IntoIterator<Item = Option<P>>>(
iter: I,
size: usize,
) -> Self {
MutableFixedSizeBinaryArray::try_from_iter(iter, size)
.unwrap()
.into()
}
pub fn from_slice<const N: usize, P: AsRef<[[u8; N]]>>(a: P) -> Self {
let values = a.as_ref().iter().flatten().copied().collect::<Vec<_>>();
Self::new(ArrowDataType::FixedSizeBinary(N), values.into(), None)
}
pub fn from<const N: usize, P: AsRef<[Option<[u8; N]>]>>(slice: P) -> Self {
MutableFixedSizeBinaryArray::from(slice).into()
}
}