use std::sync::Arc;
use arrow_array::builder::GenericByteBuilder;
use arrow_array::cast::AsArray;
use arrow_array::{
Array, ArrayRef, BinaryArray, GenericBinaryArray, LargeBinaryArray, OffsetSizeTrait,
};
use arrow_buffer::NullBuffer;
use arrow_schema::{DataType, Field};
use geoarrow_schema::error::{GeoArrowError, GeoArrowResult};
use geoarrow_schema::{GeoArrowType, Metadata, WkbType};
use wkb::reader::Wkb;
use crate::array::WkbViewArray;
use crate::capacity::WkbCapacity;
use crate::trait_::{GeoArrowArray, GeoArrowArrayAccessor, IntoArrow};
use crate::util::{offsets_buffer_i32_to_i64, offsets_buffer_i64_to_i32};
/// An array of geometries stored as WKB byte strings inside an Arrow binary array.
///
/// The offset type `O` selects the offset width of the wrapped
/// [`GenericBinaryArray`].
#[derive(Debug, Clone, PartialEq)]
pub struct GenericWkbArray<O: OffsetSizeTrait> {
/// Extension type for this array; it is built from the metadata given to `new`.
pub(crate) data_type: WkbType,
/// The underlying binary array; each value is handed to the WKB reader on access.
pub(crate) array: GenericBinaryArray<O>,
}
impl<O: OffsetSizeTrait> GenericWkbArray<O> {
    /// Wraps `array` as a WKB array whose extension type carries `metadata`.
    ///
    /// The binary values are not inspected here; they are only parsed when an
    /// element is accessed.
    pub fn new(array: GenericBinaryArray<O>, metadata: Arc<Metadata>) -> Self {
        Self {
            data_type: WkbType::new(metadata),
            array,
        }
    }

    /// Returns `true` if the array contains no elements.
    pub fn is_empty(&self) -> bool {
        self.len() == 0
    }

    /// Borrows the underlying binary array.
    pub fn inner(&self) -> &GenericBinaryArray<O> {
        &self.array
    }

    /// Builds a [`WkbCapacity`] from the final value offset and the element count.
    ///
    /// NOTE(review): the final offset is used as-is, without subtracting the
    /// first offset, so for a sliced array this is presumably an upper bound
    /// on the bytes referenced rather than an exact figure — confirm.
    ///
    /// # Panics
    ///
    /// Panics if the offsets buffer is empty or the final offset does not fit
    /// in a `usize`.
    pub fn buffer_lengths(&self) -> WkbCapacity {
        let last_offset = self
            .array
            .offsets()
            .last()
            .expect("offsets buffer must hold at least one entry")
            .to_usize()
            .expect("final offset must be representable as usize");
        WkbCapacity::new(last_offset, self.len())
    }

    /// Returns the byte length of the validity buffer (zero when there is
    /// none) plus the byte count reported by [`Self::buffer_lengths`].
    pub fn num_bytes(&self) -> usize {
        // `nulls()` already yields a borrowed option, so no `as_ref` is needed.
        let validity_len = self
            .array
            .nulls()
            .map_or(0, |nulls| nulls.buffer().len());
        validity_len + self.buffer_lengths().num_bytes::<O>()
    }

    /// Returns a slice of this array covering `length` elements starting at
    /// `offset`, keeping the same extension type.
    ///
    /// # Panics
    ///
    /// Panics if `offset + length` exceeds the length of the array.
    #[inline]
    pub fn slice(&self, offset: usize, length: usize) -> Self {
        // A saturating add keeps the bounds check meaningful even when
        // `offset + length` would wrap around in a release build.
        assert!(
            offset.saturating_add(length) <= self.len(),
            "offset + length may not exceed length of array"
        );
        Self {
            array: self.array.slice(offset, length),
            data_type: self.data_type.clone(),
        }
    }

    /// Returns a copy of this array whose extension type carries `metadata`.
    pub fn with_metadata(&self, metadata: Arc<Metadata>) -> Self {
        // Clone each field exactly once instead of cloning the whole array
        // and then overwriting its freshly cloned type.
        Self {
            data_type: self.data_type.clone().with_metadata(metadata),
            array: self.array.clone(),
        }
    }
}
impl<O: OffsetSizeTrait> GeoArrowArray for GenericWkbArray<O> {
    /// Exposes this array as `Any` so callers can downcast it.
    fn as_any(&self) -> &dyn std::any::Any {
        self
    }

    /// Consumes the array and returns the underlying binary array as an `ArrayRef`.
    fn into_array_ref(self) -> ArrayRef {
        let binary = self.into_arrow();
        Arc::new(binary)
    }

    /// Returns a clone of the underlying binary array as an `ArrayRef`.
    fn to_array_ref(&self) -> ArrayRef {
        Arc::new(self.array.clone())
    }

    /// Number of elements, as reported by the underlying binary array.
    #[inline]
    fn len(&self) -> usize {
        let binary = &self.array;
        binary.len()
    }

    /// Logical null buffer of the underlying binary array, if any.
    #[inline]
    fn logical_nulls(&self) -> Option<NullBuffer> {
        let binary = &self.array;
        binary.logical_nulls()
    }

    /// Logical null count of the underlying binary array.
    #[inline]
    fn logical_null_count(&self) -> usize {
        let binary = &self.array;
        binary.logical_null_count()
    }

    /// Whether the element at index `i` is null in the underlying binary array.
    #[inline]
    fn is_null(&self, i: usize) -> bool {
        let binary = &self.array;
        binary.is_null(i)
    }

    /// Returns the `LargeWkb` variant when `O::IS_LARGE` is set and the `Wkb`
    /// variant otherwise, each wrapping a clone of the extension type.
    fn data_type(&self) -> GeoArrowType {
        let wkb_type = self.data_type.clone();
        if O::IS_LARGE {
            GeoArrowType::LargeWkb(wkb_type)
        } else {
            GeoArrowType::Wkb(wkb_type)
        }
    }

    /// Slices via the inherent `slice` method and returns the result as a
    /// trait object.
    fn slice(&self, offset: usize, length: usize) -> Arc<dyn GeoArrowArray> {
        let window: Self = self.slice(offset, length);
        Arc::new(window)
    }

    /// Replaces the metadata via the inherent `with_metadata` method and
    /// returns the result as a trait object.
    fn with_metadata(self, metadata: Arc<Metadata>) -> Arc<dyn GeoArrowArray> {
        // The explicit path with `&self` selects the inherent method; a plain
        // method call on the by-value receiver would recurse into this one.
        let updated: Self = Self::with_metadata(&self, metadata);
        Arc::new(updated)
    }
}
impl<'a, O: OffsetSizeTrait> GeoArrowArrayAccessor<'a> for GenericWkbArray<O> {
    type Item = Wkb<'a>;

    /// Parses the bytes stored at `index` into a [`Wkb`] value.
    ///
    /// # Errors
    ///
    /// Returns `GeoArrowError::External` wrapping the reader's error when the
    /// bytes cannot be parsed.
    ///
    /// # Safety
    ///
    /// NOTE(review): the bytes are fetched with the binary array's `value`
    /// accessor rather than an unchecked one; callers should presumably still
    /// pass an in-bounds `index` — confirm against the trait's contract.
    unsafe fn value_unchecked(&'a self, index: usize) -> GeoArrowResult<Self::Item> {
        let bytes = self.array.value(index);
        match Wkb::try_new(bytes) {
            Ok(geometry) => Ok(geometry),
            Err(err) => Err(GeoArrowError::External(Box::new(err))),
        }
    }
}
impl<O: OffsetSizeTrait> IntoArrow for GenericWkbArray<O> {
    type ArrowArray = GenericBinaryArray<O>;
    type ExtensionType = WkbType;

    /// Consumes the array and returns the underlying binary array; the
    /// extension type is dropped.
    fn into_arrow(self) -> Self::ArrowArray {
        let Self { array, .. } = self;
        array
    }

    /// Borrows the extension type of this array.
    fn extension_type(&self) -> &Self::ExtensionType {
        let wkb_type = &self.data_type;
        wkb_type
    }
}
impl<O: OffsetSizeTrait> From<(GenericBinaryArray<O>, WkbType)> for GenericWkbArray<O> {
    /// Pairs a binary array with an already constructed extension type; the
    /// binary values are not inspected.
    fn from(parts: (GenericBinaryArray<O>, WkbType)) -> Self {
        let (array, data_type) = parts;
        Self { data_type, array }
    }
}
impl TryFrom<(&dyn Array, WkbType)> for GenericWkbArray<i32> {
type Error = GeoArrowError;
fn try_from((value, typ): (&dyn Array, WkbType)) -> GeoArrowResult<Self> {
match value.data_type() {
DataType::Binary => Ok((value.as_binary::<i32>().clone(), typ).into()),
DataType::LargeBinary => {
let geom_array: GenericWkbArray<i64> =
(value.as_binary::<i64>().clone(), typ).into();
geom_array.try_into()
}
dt => Err(GeoArrowError::InvalidGeoArrow(format!(
"Unexpected GenericWkbArray DataType: {dt:?}",
))),
}
}
}
impl TryFrom<(&dyn Array, WkbType)> for GenericWkbArray<i64> {
type Error = GeoArrowError;
fn try_from((value, typ): (&dyn Array, WkbType)) -> GeoArrowResult<Self> {
match value.data_type() {
DataType::Binary => {
let geom_array: GenericWkbArray<i32> =
(value.as_binary::<i32>().clone(), typ).into();
Ok(geom_array.into())
}
DataType::LargeBinary => Ok((value.as_binary::<i64>().clone(), typ).into()),
dt => Err(GeoArrowError::InvalidGeoArrow(format!(
"Unexpected GenericWkbArray DataType: {dt:?}",
))),
}
}
}
impl TryFrom<(&dyn Array, &Field)> for GenericWkbArray<i32> {
    type Error = GeoArrowError;

    /// Builds an `i32`-offset WKB array from an Arrow array and its field.
    ///
    /// The extension type is read from `field`; if that lookup fails for any
    /// reason, the default `WkbType` is used instead of returning an error.
    ///
    /// # Errors
    ///
    /// Propagates the error of the `(array, WkbType)` conversion.
    fn try_from((arr, field): (&dyn Array, &Field)) -> GeoArrowResult<Self> {
        // Any lookup failure is deliberately replaced by the default type.
        let wkb_type = field.try_extension_type::<WkbType>().unwrap_or_default();
        Self::try_from((arr, wkb_type))
    }
}
impl TryFrom<(&dyn Array, &Field)> for GenericWkbArray<i64> {
    type Error = GeoArrowError;

    /// Builds an `i64`-offset WKB array from an Arrow array and its field.
    ///
    /// The extension type is read from `field`; if that lookup fails for any
    /// reason, the default `WkbType` is used instead of returning an error.
    ///
    /// # Errors
    ///
    /// Propagates the error of the `(array, WkbType)` conversion.
    fn try_from((arr, field): (&dyn Array, &Field)) -> GeoArrowResult<Self> {
        // Any lookup failure is deliberately replaced by the default type.
        let wkb_type = field.try_extension_type::<WkbType>().unwrap_or_default();
        Self::try_from((arr, wkb_type))
    }
}
impl From<GenericWkbArray<i32>> for GenericWkbArray<i64> {
fn from(value: GenericWkbArray<i32>) -> Self {
let binary_array = value.array;
let (offsets, values, nulls) = binary_array.into_parts();
let array = LargeBinaryArray::new(offsets_buffer_i32_to_i64(&offsets), values, nulls);
Self {
data_type: value.data_type,
array,
}
}
}
impl TryFrom<GenericWkbArray<i64>> for GenericWkbArray<i32> {
type Error = GeoArrowError;
fn try_from(value: GenericWkbArray<i64>) -> GeoArrowResult<Self> {
let binary_array = value.array;
let (offsets, values, nulls) = binary_array.into_parts();
let array = BinaryArray::new(offsets_buffer_i64_to_i32(&offsets)?, values, nulls);
Ok(Self {
data_type: value.data_type,
array,
})
}
}
impl<O: OffsetSizeTrait> From<WkbViewArray> for GenericWkbArray<O> {
    /// Converts a view-based WKB array by appending every element, null or
    /// not, to a fresh byte builder. The extension type is carried over.
    fn from(value: WkbViewArray) -> Self {
        let mut builder = GenericByteBuilder::new();
        for element in value.array.iter() {
            builder.append_option(element);
        }
        Self {
            data_type: value.data_type,
            array: builder.finish(),
        }
    }
}
/// A [`GenericWkbArray`] using `i32` offsets.
pub type WkbArray = GenericWkbArray<i32>;
/// A [`GenericWkbArray`] using `i64` offsets.
pub type LargeWkbArray = GenericWkbArray<i64>;
#[cfg(test)]
mod test {
    use arrow_array::builder::{BinaryBuilder, LargeBinaryBuilder};

    use super::*;
    use crate::GeoArrowArray;
    use crate::builder::WkbBuilder;
    use crate::test::point;

    /// Builds a three-element WKB array from the shared point fixtures.
    fn wkb_data<O: OffsetSizeTrait>() -> GenericWkbArray<O> {
        let mut wkb_builder = WkbBuilder::new(WkbType::new(Default::default()));
        wkb_builder.push_geometry(Some(&point::p0())).unwrap();
        wkb_builder.push_geometry(Some(&point::p1())).unwrap();
        wkb_builder.push_geometry(Some(&point::p2())).unwrap();
        wkb_builder.finish()
    }

    /// An `i32` array survives a round trip through `ArrayRef` plus `Field`.
    #[test]
    fn parse_dyn_array_i32() {
        let expected = wkb_data::<i32>();
        let array = expected.to_array_ref();
        let field = Field::new("geometry", array.data_type().clone(), true)
            .with_extension_type(expected.data_type.clone());
        let round_tripped = GenericWkbArray::<i32>::try_from((array.as_ref(), &field)).unwrap();
        assert_eq!(expected, round_tripped);
    }

    /// An `i64` array survives a round trip through `ArrayRef` plus `Field`.
    #[test]
    fn parse_dyn_array_i64() {
        let expected = wkb_data::<i64>();
        let array = expected.to_array_ref();
        let field = Field::new("geometry", array.data_type().clone(), true)
            .with_extension_type(expected.data_type.clone());
        let round_tripped = GenericWkbArray::<i64>::try_from((array.as_ref(), &field)).unwrap();
        assert_eq!(expected, round_tripped);
    }

    /// Widening to `i64` offsets and narrowing back yields the original array.
    #[test]
    fn convert_i32_to_i64() {
        let original = wkb_data::<i32>();
        let widened = GenericWkbArray::<i64>::from(original.clone());
        let narrowed = GenericWkbArray::<i32>::try_from(widened).unwrap();
        assert_eq!(original, narrowed);
    }

    /// Narrowing to `i32` offsets and widening back yields the original array.
    #[test]
    fn convert_i64_to_i32_to_i64() {
        let original = wkb_data::<i64>();
        let narrowed = GenericWkbArray::<i32>::try_from(original.clone()).unwrap();
        let widened = GenericWkbArray::<i64>::from(narrowed);
        assert_eq!(original, widened);
    }

    /// A field without any extension type is still accepted for both offset
    /// widths.
    #[test]
    fn allow_field_without_extension_name() {
        let mut small_builder = BinaryBuilder::new();
        small_builder.append_value(b"a");
        let small = Arc::new(small_builder.finish()) as ArrayRef;
        let small_field = Field::new("geometry", small.data_type().clone(), true);
        let _wkb_arr = GenericWkbArray::<i32>::try_from((small.as_ref(), &small_field)).unwrap();

        let mut large_builder = LargeBinaryBuilder::new();
        large_builder.append_value(b"a");
        let large = Arc::new(large_builder.finish()) as ArrayRef;
        let large_field = Field::new("geometry", large.data_type().clone(), true);
        let _wkb_arr = GenericWkbArray::<i64>::try_from((large.as_ref(), &large_field)).unwrap();
    }
}