use crate::{
bitmap::Bitmap,
buffer::Buffer,
datatypes::*,
error::ArrowError,
types::{days_ms, months_days_ns, NativeType},
};
use super::Array;
use either::Either;
mod ffi;
pub(super) mod fmt;
mod from_natural;
mod iterator;
pub use iterator::*;
mod mutable;
pub use mutable::*;
#[derive(Clone)]
pub struct PrimitiveArray<T: NativeType> {
data_type: DataType,
values: Buffer<T>,
validity: Option<Bitmap>,
}
impl<T: NativeType> PrimitiveArray<T> {
pub fn try_new(
data_type: DataType,
values: Buffer<T>,
validity: Option<Bitmap>,
) -> Result<Self, ArrowError> {
if validity
.as_ref()
.map_or(false, |validity| validity.len() != values.len())
{
return Err(ArrowError::oos(
"validity mask length must match the number of values",
));
}
if data_type.to_physical_type() != PhysicalType::Primitive(T::PRIMITIVE) {
return Err(ArrowError::oos(
"BooleanArray can only be initialized with a DataType whose physical type is Primitive",
));
}
Ok(Self {
data_type,
values,
validity,
})
}
pub fn new(data_type: DataType, values: Buffer<T>, validity: Option<Bitmap>) -> Self {
Self::try_new(data_type, values, validity).unwrap()
}
pub fn from_data(data_type: DataType, values: Buffer<T>, validity: Option<Bitmap>) -> Self {
Self::new(data_type, values, validity)
}
pub fn new_empty(data_type: DataType) -> Self {
Self::new(data_type, Buffer::new(), None)
}
#[inline]
pub fn new_null(data_type: DataType, length: usize) -> Self {
Self::new(
data_type,
Buffer::new_zeroed(length),
Some(Bitmap::new_zeroed(length)),
)
}
}
impl<T: NativeType> PrimitiveArray<T> {
#[inline]
#[must_use]
pub fn slice(&self, offset: usize, length: usize) -> Self {
assert!(
offset + length <= self.len(),
"offset + length may not exceed length of array"
);
unsafe { self.slice_unchecked(offset, length) }
}
#[inline]
#[must_use]
pub unsafe fn slice_unchecked(&self, offset: usize, length: usize) -> Self {
let validity = self
.validity
.clone()
.map(|x| x.slice_unchecked(offset, length));
Self {
data_type: self.data_type.clone(),
values: self.values.clone().slice_unchecked(offset, length),
validity,
}
}
#[must_use]
pub fn with_validity(&self, validity: Option<Bitmap>) -> Self {
if matches!(&validity, Some(bitmap) if bitmap.len() != self.len()) {
panic!("validity should be as least as large as the array")
}
let mut arr = self.clone();
arr.validity = validity;
arr
}
}
impl<T: NativeType> PrimitiveArray<T> {
#[inline]
pub fn len(&self) -> usize {
self.values.len()
}
#[inline]
pub fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
#[inline]
pub fn data_type(&self) -> &DataType {
&self.data_type
}
#[inline]
pub fn values(&self) -> &Buffer<T> {
&self.values
}
#[inline]
pub fn value(&self, i: usize) -> T {
self.values()[i]
}
#[inline]
pub unsafe fn value_unchecked(&self, i: usize) -> T {
*self.values.get_unchecked(i)
}
#[inline]
pub fn to(self, data_type: DataType) -> Self {
if !data_type.to_physical_type().eq_primitive(T::PRIMITIVE) {
Err(ArrowError::InvalidArgumentError(format!(
"Type {} does not support logical type {:?}",
std::any::type_name::<T>(),
data_type
)))
.unwrap()
}
Self {
data_type,
values: self.values,
validity: self.validity,
}
}
pub fn into_mut(self) -> Either<Self, MutablePrimitiveArray<T>> {
use Either::*;
if let Some(bitmap) = self.validity {
match bitmap.into_mut() {
Left(bitmap) => Left(PrimitiveArray::new(
self.data_type,
self.values,
Some(bitmap),
)),
Right(mutable_bitmap) => match self.values.into_mut() {
Left(buffer) => Left(PrimitiveArray::new(
self.data_type,
buffer,
Some(mutable_bitmap.into()),
)),
Right(values) => Right(MutablePrimitiveArray::from_data(
self.data_type,
values,
Some(mutable_bitmap),
)),
},
}
} else {
match self.values.into_mut() {
Left(values) => Left(PrimitiveArray::new(self.data_type, values, None)),
Right(values) => Right(MutablePrimitiveArray::from_data(
self.data_type,
values,
None,
)),
}
}
}
}
impl<T: NativeType> Array for PrimitiveArray<T> {
#[inline]
fn as_any(&self) -> &dyn std::any::Any {
self
}
#[inline]
fn len(&self) -> usize {
self.values.len()
}
#[inline]
fn data_type(&self) -> &DataType {
self.data_type()
}
fn validity(&self) -> Option<&Bitmap> {
self.validity.as_ref()
}
fn slice(&self, offset: usize, length: usize) -> Box<dyn Array> {
Box::new(self.slice(offset, length))
}
unsafe fn slice_unchecked(&self, offset: usize, length: usize) -> Box<dyn Array> {
Box::new(self.slice_unchecked(offset, length))
}
fn with_validity(&self, validity: Option<Bitmap>) -> Box<dyn Array> {
Box::new(self.with_validity(validity))
}
}
pub type Int8Array = PrimitiveArray<i8>;
pub type Int16Array = PrimitiveArray<i16>;
pub type Int32Array = PrimitiveArray<i32>;
pub type Int64Array = PrimitiveArray<i64>;
pub type Int128Array = PrimitiveArray<i128>;
pub type DaysMsArray = PrimitiveArray<days_ms>;
pub type MonthsDaysNsArray = PrimitiveArray<months_days_ns>;
pub type Float32Array = PrimitiveArray<f32>;
pub type Float64Array = PrimitiveArray<f64>;
pub type UInt8Array = PrimitiveArray<u8>;
pub type UInt16Array = PrimitiveArray<u16>;
pub type UInt32Array = PrimitiveArray<u32>;
pub type UInt64Array = PrimitiveArray<u64>;
pub type Int8Vec = MutablePrimitiveArray<i8>;
pub type Int16Vec = MutablePrimitiveArray<i16>;
pub type Int32Vec = MutablePrimitiveArray<i32>;
pub type Int64Vec = MutablePrimitiveArray<i64>;
pub type Int128Vec = MutablePrimitiveArray<i128>;
pub type DaysMsVec = MutablePrimitiveArray<days_ms>;
pub type MonthsDaysNsVec = MutablePrimitiveArray<months_days_ns>;
pub type Float32Vec = MutablePrimitiveArray<f32>;
pub type Float64Vec = MutablePrimitiveArray<f64>;
pub type UInt8Vec = MutablePrimitiveArray<u8>;
pub type UInt16Vec = MutablePrimitiveArray<u16>;
pub type UInt32Vec = MutablePrimitiveArray<u32>;
pub type UInt64Vec = MutablePrimitiveArray<u64>;