use crate::{
bitmap::Bitmap,
datatypes::{DataType, Field},
error::Error,
};
use super::{new_empty_array, new_null_array, Array};
mod ffi;
pub(super) mod fmt;
mod iterator;
mod mutable;
pub use mutable::*;
#[derive(Clone)]
pub struct StructArray {
data_type: DataType,
values: Vec<Box<dyn Array>>,
validity: Option<Bitmap>,
}
impl StructArray {
pub fn try_new(
data_type: DataType,
values: Vec<Box<dyn Array>>,
validity: Option<Bitmap>,
) -> Result<Self, Error> {
let fields = Self::try_get_fields(&data_type)?;
if fields.is_empty() {
return Err(Error::oos("A StructArray must contain at least one field"));
}
if fields.len() != values.len() {
return Err(Error::oos(
"A StructArray must have a number of fields in its DataType equal to the number of child values",
));
}
fields
.iter().map(|a| &a.data_type)
.zip(values.iter().map(|a| a.data_type()))
.enumerate()
.try_for_each(|(index, (data_type, child))| {
if data_type != child {
Err(Error::oos(format!(
"The children DataTypes of a StructArray must equal the children data types.
However, the field {index} has data type {data_type:?} but the value has data type {child:?}"
)))
} else {
Ok(())
}
})?;
let len = values[0].len();
values
.iter()
.map(|a| a.len())
.enumerate()
.try_for_each(|(index, a_len)| {
if a_len != len {
Err(Error::oos(format!(
"The children must have an equal number of values.
However, the values at index {index} have a length of {a_len}, which is different from values at index 0, {len}."
)))
} else {
Ok(())
}
})?;
if validity
.as_ref()
.map_or(false, |validity| validity.len() != len)
{
return Err(Error::oos(
"The validity length of a StructArray must match its number of elements",
));
}
Ok(Self {
data_type,
values,
validity,
})
}
pub fn new(data_type: DataType, values: Vec<Box<dyn Array>>, validity: Option<Bitmap>) -> Self {
Self::try_new(data_type, values, validity).unwrap()
}
pub fn new_empty(data_type: DataType) -> Self {
if let DataType::Struct(fields) = &data_type {
let values = fields
.iter()
.map(|field| new_empty_array(field.data_type().clone()))
.collect();
Self::new(data_type, values, None)
} else {
panic!("StructArray must be initialized with DataType::Struct");
}
}
pub fn new_null(data_type: DataType, length: usize) -> Self {
if let DataType::Struct(fields) = &data_type {
let values = fields
.iter()
.map(|field| new_null_array(field.data_type().clone(), length))
.collect();
Self::new(data_type, values, Some(Bitmap::new_zeroed(length)))
} else {
panic!("StructArray must be initialized with DataType::Struct");
}
}
}
impl StructArray {
#[must_use]
pub fn into_data(self) -> (Vec<Field>, Vec<Box<dyn Array>>, Option<Bitmap>) {
let Self {
data_type,
values,
validity,
} = self;
let fields = if let DataType::Struct(fields) = data_type {
fields
} else {
unreachable!()
};
(fields, values, validity)
}
#[must_use]
pub fn slice(&self, offset: usize, length: usize) -> Self {
assert!(
offset + length <= self.len(),
"offset + length may not exceed length of array"
);
unsafe { self.slice_unchecked(offset, length) }
}
#[must_use]
pub unsafe fn slice_unchecked(&self, offset: usize, length: usize) -> Self {
let validity = self
.validity
.clone()
.map(|bitmap| bitmap.slice_unchecked(offset, length))
.and_then(|bitmap| (bitmap.unset_bits() > 0).then(|| bitmap));
Self {
data_type: self.data_type.clone(),
values: self
.values
.iter()
.map(|x| x.slice_unchecked(offset, length))
.collect(),
validity,
}
}
#[must_use]
pub fn with_validity(mut self, validity: Option<Bitmap>) -> Self {
self.set_validity(validity);
self
}
pub fn set_validity(&mut self, validity: Option<Bitmap>) {
if matches!(&validity, Some(bitmap) if bitmap.len() != self.len()) {
panic!("validity's length must be equal to the array's length")
}
self.validity = validity;
}
pub fn boxed(self) -> Box<dyn Array> {
Box::new(self)
}
pub fn arced(self) -> std::sync::Arc<dyn Array> {
std::sync::Arc::new(self)
}
}
impl StructArray {
#[inline]
fn len(&self) -> usize {
self.values[0].len()
}
#[inline]
pub fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
pub fn values(&self) -> &[Box<dyn Array>] {
&self.values
}
pub fn fields(&self) -> &[Field] {
Self::get_fields(&self.data_type)
}
}
impl StructArray {
pub(crate) fn try_get_fields(data_type: &DataType) -> Result<&[Field], Error> {
match data_type.to_logical_type() {
DataType::Struct(fields) => Ok(fields),
_ => Err(Error::oos(
"Struct array must be created with a DataType whose physical type is Struct",
)),
}
}
pub fn get_fields(data_type: &DataType) -> &[Field] {
Self::try_get_fields(data_type).unwrap()
}
}
impl Array for StructArray {
#[inline]
fn as_any(&self) -> &dyn std::any::Any {
self
}
#[inline]
fn as_any_mut(&mut self) -> &mut dyn std::any::Any {
self
}
#[inline]
fn len(&self) -> usize {
self.len()
}
#[inline]
fn data_type(&self) -> &DataType {
&self.data_type
}
#[inline]
fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
fn slice(&self, offset: usize, length: usize) -> Box<dyn Array> {
Box::new(self.slice(offset, length))
}
unsafe fn slice_unchecked(&self, offset: usize, length: usize) -> Box<dyn Array> {
Box::new(self.slice_unchecked(offset, length))
}
fn with_validity(&self, validity: Option<Bitmap>) -> Box<dyn Array> {
Box::new(self.clone().with_validity(validity))
}
fn to_boxed(&self) -> Box<dyn Array> {
Box::new(self.clone())
}
}