vortex_scalar/arrow/
mod.rs1use std::sync::Arc;
5
6use arrow_array::*;
7use vortex_dtype::datetime::{TemporalMetadata, TimeUnit, is_temporal_ext_type};
8use vortex_dtype::{DType, PType};
9use vortex_error::{VortexError, vortex_bail, vortex_err};
10
11use crate::Scalar;
12use crate::decimal::DecimalValue;
13
/// Builds an `Ok(Arc<..>)` holding a one-element Arrow scalar of array type `$AR`.
///
/// `$V` must evaluate to an `Option`:
/// * `Some(v)` is turned into a scalar via `<$AR>::new_scalar(v)`;
/// * `None` is turned into a one-element null array from `<$AR>::new_null(1)`,
///   wrapped in `arrow_array::Scalar::new` so both cases produce the same type.
///
/// The error type of the resulting `Result` is inferred from the call site.
macro_rules! value_to_arrow_scalar {
    ($V:expr, $AR:ty) => {
        Ok(std::sync::Arc::new(match $V {
            Some(present) => <$AR>::new_scalar(present),
            None => arrow_array::Scalar::new(<$AR>::new_null(1)),
        }))
    };
}
22
23impl TryFrom<&Scalar> for Arc<dyn Datum> {
24 type Error = VortexError;
25
26 fn try_from(value: &Scalar) -> Result<Arc<dyn Datum>, Self::Error> {
27 match value.dtype() {
28 DType::Null => Ok(Arc::new(NullArray::new(1))),
29 DType::Bool(_) => value_to_arrow_scalar!(value.as_bool().value(), BooleanArray),
30 DType::Primitive(ptype, ..) => {
31 let scalar = value.as_primitive();
32 Ok(match ptype {
33 PType::U8 => scalar
34 .typed_value()
35 .map(|i| Arc::new(UInt8Array::new_scalar(i)) as Arc<dyn Datum>)
36 .unwrap_or_else(|| Arc::new(UInt8Array::new_null(1))),
37 PType::U16 => scalar
38 .typed_value()
39 .map(|i| Arc::new(UInt16Array::new_scalar(i)) as Arc<dyn Datum>)
40 .unwrap_or_else(|| Arc::new(UInt16Array::new_null(1))),
41 PType::U32 => scalar
42 .typed_value()
43 .map(|i| Arc::new(UInt32Array::new_scalar(i)) as Arc<dyn Datum>)
44 .unwrap_or_else(|| Arc::new(UInt32Array::new_null(1))),
45 PType::U64 => scalar
46 .typed_value()
47 .map(|i| Arc::new(UInt64Array::new_scalar(i)) as Arc<dyn Datum>)
48 .unwrap_or_else(|| Arc::new(UInt64Array::new_null(1))),
49 PType::I8 => scalar
50 .typed_value()
51 .map(|i| Arc::new(Int8Array::new_scalar(i)) as Arc<dyn Datum>)
52 .unwrap_or_else(|| Arc::new(Int8Array::new_null(1))),
53 PType::I16 => scalar
54 .typed_value()
55 .map(|i| Arc::new(Int16Array::new_scalar(i)) as Arc<dyn Datum>)
56 .unwrap_or_else(|| Arc::new(Int16Array::new_null(1))),
57 PType::I32 => scalar
58 .typed_value()
59 .map(|i| Arc::new(Int32Array::new_scalar(i)) as Arc<dyn Datum>)
60 .unwrap_or_else(|| Arc::new(Int32Array::new_null(1))),
61 PType::I64 => scalar
62 .typed_value()
63 .map(|i| Arc::new(Int64Array::new_scalar(i)) as Arc<dyn Datum>)
64 .unwrap_or_else(|| Arc::new(Int64Array::new_null(1))),
65 PType::F16 => scalar
66 .typed_value()
67 .map(|i| Arc::new(Float16Array::new_scalar(i)) as Arc<dyn Datum>)
68 .unwrap_or_else(|| Arc::new(Float16Array::new_null(1))),
69 PType::F32 => scalar
70 .typed_value()
71 .map(|i| Arc::new(Float32Array::new_scalar(i)) as Arc<dyn Datum>)
72 .unwrap_or_else(|| Arc::new(Float32Array::new_null(1))),
73 PType::F64 => scalar
74 .typed_value()
75 .map(|i| Arc::new(Float64Array::new_scalar(i)) as Arc<dyn Datum>)
76 .unwrap_or_else(|| Arc::new(Float64Array::new_null(1))),
77 })
78 }
79 DType::Decimal(..) => match value.as_decimal().decimal_value() {
80 Some(DecimalValue::I8(v)) => Ok(Arc::new(Decimal128Array::new_scalar(v as i128))),
82 Some(DecimalValue::I16(v)) => Ok(Arc::new(Decimal128Array::new_scalar(v as i128))),
83 Some(DecimalValue::I32(v)) => Ok(Arc::new(Decimal128Array::new_scalar(v as i128))),
84 Some(DecimalValue::I64(v)) => Ok(Arc::new(Decimal128Array::new_scalar(v as i128))),
85 Some(DecimalValue::I128(v128)) => Ok(Arc::new(Decimal128Array::new_scalar(v128))),
86 Some(DecimalValue::I256(v256)) => {
87 Ok(Arc::new(Decimal256Array::new_scalar(v256.into())))
88 }
89 None => Ok(Arc::new(arrow_array::Scalar::new(
90 Decimal128Array::new_null(1),
91 ))),
92 },
93 DType::Utf8(_) => {
94 value_to_arrow_scalar!(value.as_utf8().value(), StringViewArray)
95 }
96 DType::Binary(_) => {
97 value_to_arrow_scalar!(value.as_binary().value(), BinaryViewArray)
98 }
99 DType::Struct(..) => {
100 todo!("struct scalar conversion")
101 }
102 DType::List(..) => {
103 todo!("list scalar conversion")
104 }
105 DType::Extension(ext) => {
106 if is_temporal_ext_type(ext.id()) {
107 let metadata = TemporalMetadata::try_from(ext.as_ref())?;
108 let storage_scalar = value.as_extension().storage();
109 let primitive = storage_scalar
110 .as_primitive_opt()
111 .ok_or_else(|| vortex_err!("Expected primitive scalar"))?;
112
113 return match metadata {
114 TemporalMetadata::Time(u) => match u {
115 TimeUnit::Ns => value_to_arrow_scalar!(
116 primitive.as_::<i64>()?,
117 Time64NanosecondArray
118 ),
119 TimeUnit::Us => value_to_arrow_scalar!(
120 primitive.as_::<i64>()?,
121 Time64MicrosecondArray
122 ),
123 TimeUnit::Ms => value_to_arrow_scalar!(
124 primitive.as_::<i32>()?,
125 Time32MillisecondArray
126 ),
127 TimeUnit::S => {
128 value_to_arrow_scalar!(primitive.as_::<i32>()?, Time32SecondArray)
129 }
130 TimeUnit::D => {
131 vortex_bail!("Unsupported TimeUnit {u} for {}", ext.id())
132 }
133 },
134 TemporalMetadata::Date(u) => match u {
135 TimeUnit::Ms => {
136 value_to_arrow_scalar!(primitive.as_::<i64>()?, Date64Array)
137 }
138 TimeUnit::D => {
139 value_to_arrow_scalar!(primitive.as_::<i32>()?, Date32Array)
140 }
141 _ => vortex_bail!("Unsupported TimeUnit {u} for {}", ext.id()),
142 },
143 TemporalMetadata::Timestamp(u, _) => match u {
144 TimeUnit::Ns => value_to_arrow_scalar!(
145 primitive.as_::<i64>()?,
146 TimestampNanosecondArray
147 ),
148 TimeUnit::Us => value_to_arrow_scalar!(
149 primitive.as_::<i64>()?,
150 TimestampMicrosecondArray
151 ),
152 TimeUnit::Ms => value_to_arrow_scalar!(
153 primitive.as_::<i64>()?,
154 TimestampMillisecondArray
155 ),
156 TimeUnit::S => value_to_arrow_scalar!(
157 primitive.as_::<i64>()?,
158 TimestampSecondArray
159 ),
160 TimeUnit::D => {
161 vortex_bail!("Unsupported TimeUnit {u} for {}", ext.id())
162 }
163 },
164 };
165 }
166
167 todo!("Non temporal extension scalar conversion")
168 }
169 }
170 }
171}
172
173#[cfg(test)]
174mod tests;