use either::Either;
use polars_error::{PolarsResult, polars_bail};
use super::{Array, Splitable};
use crate::array::iterator::NonNullValuesIter;
use crate::bitmap::utils::{BitmapIter, ZipValidity};
use crate::bitmap::{Bitmap, MutableBitmap};
use crate::compute::utils::{combine_validities_and, combine_validities_or};
use crate::datatypes::{ArrowDataType, PhysicalType};
use crate::trusted_len::TrustedLen;
mod ffi;
pub(super) mod fmt;
mod from;
mod iterator;
mod mutable;
pub use mutable::*;
mod builder;
pub use builder::*;
#[cfg(feature = "proptest")]
pub mod proptest;
#[derive(Clone)]
pub struct BooleanArray {
dtype: ArrowDataType,
values: Bitmap,
validity: Option<Bitmap>,
}
impl BooleanArray {
pub fn try_new(
dtype: ArrowDataType,
values: Bitmap,
validity: Option<Bitmap>,
) -> PolarsResult<Self> {
if validity
.as_ref()
.is_some_and(|validity| validity.len() != values.len())
{
polars_bail!(ComputeError: "validity mask length must match the number of values")
}
if dtype.to_physical_type() != PhysicalType::Boolean {
polars_bail!(ComputeError: "BooleanArray can only be initialized with a DataType whose physical type is Boolean")
}
Ok(Self {
dtype,
values,
validity,
})
}
pub fn new(dtype: ArrowDataType, values: Bitmap, validity: Option<Bitmap>) -> Self {
Self::try_new(dtype, values, validity).unwrap()
}
#[inline]
pub fn iter(&self) -> ZipValidity<bool, BitmapIter<'_>, BitmapIter<'_>> {
ZipValidity::new_with_validity(self.values().iter(), self.validity())
}
#[inline]
pub fn values_iter(&self) -> BitmapIter<'_> {
self.values().iter()
}
#[inline]
pub fn non_null_values_iter(&self) -> NonNullValuesIter<'_, BooleanArray> {
NonNullValuesIter::new(self, self.validity())
}
#[inline]
pub fn len(&self) -> usize {
self.values.len()
}
#[inline]
pub fn values(&self) -> &Bitmap {
&self.values
}
#[inline]
pub fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
#[inline]
pub fn dtype(&self) -> &ArrowDataType {
&self.dtype
}
#[inline]
pub fn value(&self, i: usize) -> bool {
self.values.get_bit(i)
}
#[inline]
pub unsafe fn value_unchecked(&self, i: usize) -> bool {
self.values.get_bit_unchecked(i)
}
#[inline]
pub fn get(&self, i: usize) -> Option<bool> {
if !self.is_null(i) {
unsafe { Some(self.value_unchecked(i)) }
} else {
None
}
}
#[inline]
pub fn slice(&mut self, offset: usize, length: usize) {
assert!(
offset + length <= self.len(),
"the offset of the new Buffer cannot exceed the existing length"
);
unsafe { self.slice_unchecked(offset, length) }
}
#[inline]
pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) {
self.validity = self
.validity
.take()
.map(|bitmap| bitmap.sliced_unchecked(offset, length))
.filter(|bitmap| bitmap.unset_bits() > 0);
self.values.slice_unchecked(offset, length);
}
impl_sliced!();
impl_mut_validity!();
impl_into_array!();
#[must_use]
pub fn with_values(&self, values: Bitmap) -> Self {
let mut out = self.clone();
out.set_values(values);
out
}
pub fn set_values(&mut self, values: Bitmap) {
assert_eq!(
values.len(),
self.len(),
"values length must be equal to this arrays length"
);
self.values = values;
}
pub fn apply_values_mut<F: FnOnce(&mut MutableBitmap)>(&mut self, f: F) {
let values = std::mem::take(&mut self.values);
let mut values = values.make_mut();
f(&mut values);
if let Some(validity) = &self.validity {
assert_eq!(validity.len(), values.len());
}
self.values = values.into();
}
pub fn into_mut(self) -> Either<Self, MutableBooleanArray> {
use Either::*;
if let Some(bitmap) = self.validity {
match bitmap.into_mut() {
Left(bitmap) => Left(BooleanArray::new(self.dtype, self.values, Some(bitmap))),
Right(mutable_bitmap) => match self.values.into_mut() {
Left(immutable) => Left(BooleanArray::new(
self.dtype,
immutable,
Some(mutable_bitmap.into()),
)),
Right(mutable) => Right(
MutableBooleanArray::try_new(self.dtype, mutable, Some(mutable_bitmap))
.unwrap(),
),
},
}
} else {
match self.values.into_mut() {
Left(immutable) => Left(BooleanArray::new(self.dtype, immutable, None)),
Right(mutable) => {
Right(MutableBooleanArray::try_new(self.dtype, mutable, None).unwrap())
},
}
}
}
pub fn new_empty(dtype: ArrowDataType) -> Self {
Self::new(dtype, Bitmap::new(), None)
}
pub fn new_null(dtype: ArrowDataType, length: usize) -> Self {
let bitmap = Bitmap::new_zeroed(length);
Self::new(dtype, bitmap.clone(), Some(bitmap))
}
#[inline]
pub fn from_trusted_len_values_iter<I: TrustedLen<Item = bool>>(iterator: I) -> Self {
MutableBooleanArray::from_trusted_len_values_iter(iterator).into()
}
#[inline]
pub unsafe fn from_trusted_len_values_iter_unchecked<I: Iterator<Item = bool>>(
iterator: I,
) -> Self {
MutableBooleanArray::from_trusted_len_values_iter_unchecked(iterator).into()
}
#[inline]
pub fn from_slice<P: AsRef<[bool]>>(slice: P) -> Self {
MutableBooleanArray::from_slice(slice).into()
}
#[inline]
pub unsafe fn from_trusted_len_iter_unchecked<I, P>(iterator: I) -> Self
where
P: std::borrow::Borrow<bool>,
I: Iterator<Item = Option<P>>,
{
MutableBooleanArray::from_trusted_len_iter_unchecked(iterator).into()
}
#[inline]
pub fn from_trusted_len_iter<I, P>(iterator: I) -> Self
where
P: std::borrow::Borrow<bool>,
I: TrustedLen<Item = Option<P>>,
{
MutableBooleanArray::from_trusted_len_iter(iterator).into()
}
#[inline]
pub unsafe fn try_from_trusted_len_iter_unchecked<E, I, P>(iterator: I) -> Result<Self, E>
where
P: std::borrow::Borrow<bool>,
I: Iterator<Item = Result<Option<P>, E>>,
{
Ok(MutableBooleanArray::try_from_trusted_len_iter_unchecked(iterator)?.into())
}
#[inline]
pub fn try_from_trusted_len_iter<E, I, P>(iterator: I) -> Result<Self, E>
where
P: std::borrow::Borrow<bool>,
I: TrustedLen<Item = Result<Option<P>, E>>,
{
Ok(MutableBooleanArray::try_from_trusted_len_iter(iterator)?.into())
}
pub fn true_and_valid(&self) -> Bitmap {
match &self.validity {
None => self.values.clone(),
Some(validity) => combine_validities_and(Some(&self.values), Some(validity)).unwrap(),
}
}
pub fn true_or_valid(&self) -> Bitmap {
match &self.validity {
None => self.values.clone(),
Some(validity) => combine_validities_or(Some(&self.values), Some(validity)).unwrap(),
}
}
#[must_use]
pub fn into_inner(self) -> (ArrowDataType, Bitmap, Option<Bitmap>) {
let Self {
dtype,
values,
validity,
} = self;
(dtype, values, validity)
}
pub unsafe fn from_inner_unchecked(
dtype: ArrowDataType,
values: Bitmap,
validity: Option<Bitmap>,
) -> Self {
Self {
dtype,
values,
validity,
}
}
}
impl Array for BooleanArray {
impl_common_array!();
fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
#[inline]
fn with_validity(&self, validity: Option<Bitmap>) -> Box<dyn Array> {
Box::new(self.clone().with_validity(validity))
}
}
impl Splitable for BooleanArray {
fn check_bound(&self, offset: usize) -> bool {
offset <= self.len()
}
unsafe fn _split_at_unchecked(&self, offset: usize) -> (Self, Self) {
let (lhs_values, rhs_values) = unsafe { self.values.split_at_unchecked(offset) };
let (lhs_validity, rhs_validity) = unsafe { self.validity.split_at_unchecked(offset) };
(
Self {
dtype: self.dtype.clone(),
values: lhs_values,
validity: lhs_validity,
},
Self {
dtype: self.dtype.clone(),
values: rhs_values,
validity: rhs_validity,
},
)
}
}
impl From<Bitmap> for BooleanArray {
fn from(values: Bitmap) -> Self {
Self {
dtype: ArrowDataType::Boolean,
values,
validity: None,
}
}
}