datafusion_functions/datetime/
make_date.rs1use std::any::Any;
19use std::sync::Arc;
20
21use arrow::array::builder::PrimitiveBuilder;
22use arrow::array::cast::AsArray;
23use arrow::array::types::{Date32Type, Int32Type};
24use arrow::array::PrimitiveArray;
25use arrow::datatypes::DataType;
26use arrow::datatypes::DataType::{Date32, Int32, Int64, UInt32, UInt64, Utf8, Utf8View};
27use chrono::prelude::*;
28
29use datafusion_common::{exec_err, utils::take_function_args, Result, ScalarValue};
30use datafusion_expr::{
31 ColumnarValue, Documentation, ScalarUDFImpl, Signature, Volatility,
32};
33use datafusion_macros::user_doc;
34
35#[user_doc(
36 doc_section(label = "Time and Date Functions"),
37 description = "Make a date from year/month/day component parts.",
38 syntax_example = "make_date(year, month, day)",
39 sql_example = r#"```sql
40> select make_date(2023, 1, 31);
41+-------------------------------------------+
42| make_date(Int64(2023),Int64(1),Int64(31)) |
43+-------------------------------------------+
44| 2023-01-31 |
45+-------------------------------------------+
46> select make_date('2023', '01', '31');
47+-----------------------------------------------+
48| make_date(Utf8("2023"),Utf8("01"),Utf8("31")) |
49+-----------------------------------------------+
50| 2023-01-31 |
51+-----------------------------------------------+
52```
53
54Additional examples can be found [here](https://github.com/apache/datafusion/blob/main/datafusion-examples/examples/make_date.rs)
55"#,
56 argument(
57 name = "year",
58 description = "Year to use when making the date. Can be a constant, column or function, and any combination of arithmetic operators."
59 ),
60 argument(
61 name = "month",
62 description = "Month to use when making the date. Can be a constant, column or function, and any combination of arithmetic operators."
63 ),
64 argument(
65 name = "day",
66 description = "Day to use when making the date. Can be a constant, column or function, and any combination of arithmetic operators."
67 )
68)]
69#[derive(Debug)]
70pub struct MakeDateFunc {
71 signature: Signature,
72}
73
74impl Default for MakeDateFunc {
75 fn default() -> Self {
76 Self::new()
77 }
78}
79
80impl MakeDateFunc {
81 pub fn new() -> Self {
82 Self {
83 signature: Signature::uniform(
84 3,
85 vec![Int32, Int64, UInt32, UInt64, Utf8, Utf8View],
86 Volatility::Immutable,
87 ),
88 }
89 }
90}
91
92impl ScalarUDFImpl for MakeDateFunc {
93 fn as_any(&self) -> &dyn Any {
94 self
95 }
96
97 fn name(&self) -> &str {
98 "make_date"
99 }
100
101 fn signature(&self) -> &Signature {
102 &self.signature
103 }
104
105 fn return_type(&self, _arg_types: &[DataType]) -> Result<DataType> {
106 Ok(Date32)
107 }
108
109 fn invoke_with_args(
110 &self,
111 args: datafusion_expr::ScalarFunctionArgs,
112 ) -> Result<ColumnarValue> {
113 let args = args.args;
116 let len = args
117 .iter()
118 .fold(Option::<usize>::None, |acc, arg| match arg {
119 ColumnarValue::Scalar(_) => acc,
120 ColumnarValue::Array(a) => Some(a.len()),
121 });
122
123 let [years, months, days] = take_function_args(self.name(), args)?;
124
125 let years = years.cast_to(&Int32, None)?;
126 let months = months.cast_to(&Int32, None)?;
127 let days = days.cast_to(&Int32, None)?;
128
129 let scalar_value_fn = |col: &ColumnarValue| -> Result<i32> {
130 let ColumnarValue::Scalar(s) = col else {
131 return exec_err!("Expected scalar value");
132 };
133 let ScalarValue::Int32(Some(i)) = s else {
134 return exec_err!("Unable to parse date from null/empty value");
135 };
136 Ok(*i)
137 };
138
139 let value = if let Some(array_size) = len {
140 let to_primitive_array_fn =
141 |col: &ColumnarValue| -> PrimitiveArray<Int32Type> {
142 match col {
143 ColumnarValue::Array(a) => {
144 a.as_primitive::<Int32Type>().to_owned()
145 }
146 _ => {
147 let v = scalar_value_fn(col).unwrap();
148 PrimitiveArray::<Int32Type>::from_value(v, array_size)
149 }
150 }
151 };
152
153 let years = to_primitive_array_fn(&years);
154 let months = to_primitive_array_fn(&months);
155 let days = to_primitive_array_fn(&days);
156
157 let mut builder: PrimitiveBuilder<Date32Type> =
158 PrimitiveArray::builder(array_size);
159 for i in 0..array_size {
160 make_date_inner(
161 years.value(i),
162 months.value(i),
163 days.value(i),
164 |days: i32| builder.append_value(days),
165 )?;
166 }
167
168 let arr = builder.finish();
169
170 ColumnarValue::Array(Arc::new(arr))
171 } else {
172 let mut value = 0;
175 make_date_inner(
176 scalar_value_fn(&years)?,
177 scalar_value_fn(&months)?,
178 scalar_value_fn(&days)?,
179 |days: i32| value = days,
180 )?;
181
182 ColumnarValue::Scalar(ScalarValue::Date32(Some(value)))
183 };
184
185 Ok(value)
186 }
187 fn documentation(&self) -> Option<&Documentation> {
188 self.doc()
189 }
190}
191
192fn make_date_inner<F: FnMut(i32)>(
195 year: i32,
196 month: i32,
197 day: i32,
198 mut date_consumer_fn: F,
199) -> Result<()> {
200 let Ok(m) = u32::try_from(month) else {
201 return exec_err!("Month value '{month:?}' is out of range");
202 };
203 let Ok(d) = u32::try_from(day) else {
204 return exec_err!("Day value '{day:?}' is out of range");
205 };
206
207 if let Some(date) = NaiveDate::from_ymd_opt(year, m, d) {
208 const UNIX_DAYS_FROM_CE: i32 = 719_163;
211
212 date_consumer_fn(date.num_days_from_ce() - UNIX_DAYS_FROM_CE);
216 Ok(())
217 } else {
218 exec_err!("Unable to parse date from {year}, {month}, {day}")
219 }
220}
221
#[cfg(test)]
mod tests {
    use crate::datetime::make_date::MakeDateFunc;
    use arrow::array::{Array, Date32Array, Int32Array, Int64Array, UInt32Array};
    use arrow::datatypes::{DataType, Field};
    use datafusion_common::{DataFusionError, ScalarValue};
    use datafusion_expr::{ColumnarValue, ScalarUDFImpl};
    use std::sync::Arc;

    /// Calls `make_date` directly with `args`, deriving one nullable field
    /// per argument and declaring a nullable `Date32` return field.
    fn invoke_make_date_with_args(
        args: Vec<ColumnarValue>,
        number_rows: usize,
    ) -> Result<ColumnarValue, DataFusionError> {
        let arg_fields = args
            .iter()
            .map(|arg| Field::new("a", arg.data_type(), true).into())
            .collect::<Vec<_>>();
        let return_field = Field::new("f", DataType::Date32, true).into();

        MakeDateFunc::new().invoke_with_args(datafusion_expr::ScalarFunctionArgs {
            args,
            arg_fields,
            number_rows,
            return_field,
        })
    }

    /// Asserts that `result` is a non-null `Date32` scalar holding
    /// `expected_days`.
    fn assert_scalar_date(result: ColumnarValue, expected_days: i32) {
        match result {
            ColumnarValue::Scalar(ScalarValue::Date32(date)) => {
                assert_eq!(expected_days, date.unwrap());
            }
            _ => panic!("Expected a scalar value"),
        }
    }

    #[test]
    fn test_make_date() {
        // Scalar inputs of mixed integer and string types all yield 2024-01-14.
        let scalar_cases = [
            [
                ScalarValue::Int32(Some(2024)),
                ScalarValue::Int64(Some(1)),
                ScalarValue::UInt32(Some(14)),
            ],
            [
                ScalarValue::Int64(Some(2024)),
                ScalarValue::UInt64(Some(1)),
                ScalarValue::UInt32(Some(14)),
            ],
            [
                ScalarValue::Utf8(Some("2024".to_string())),
                ScalarValue::LargeUtf8(Some("1".to_string())),
                ScalarValue::Utf8(Some("14".to_string())),
            ],
        ];
        for components in scalar_cases {
            let args = components.into_iter().map(ColumnarValue::Scalar).collect();
            let res = invoke_make_date_with_args(args, 1)
                .expect("that make_date parsed values without error");
            assert_scalar_date(res, 19736);
        }

        // Array inputs produce one date per row.
        let years = Arc::new((2021..2025).map(Some).collect::<Int64Array>());
        let months = Arc::new((1..5).map(Some).collect::<Int32Array>());
        let days = Arc::new((11..15).map(Some).collect::<UInt32Array>());
        let batch_len = years.len();
        let res = invoke_make_date_with_args(
            vec![
                ColumnarValue::Array(years),
                ColumnarValue::Array(months),
                ColumnarValue::Array(days),
            ],
            batch_len,
        )
        .unwrap();

        match res {
            ColumnarValue::Array(array) => {
                assert_eq!(array.len(), 4);
                let expected = Date32Array::from(vec![18_638, 19_035, 19_429, 19_827]);
                assert_eq!(&expected as &dyn Array, array.as_ref());
            }
            _ => panic!("Expected a columnar array"),
        }

        // Invalid calls: wrong argument count, uncastable types, and values
        // that overflow Int32.
        let error_cases = [
            (
                vec![ScalarValue::Int32(Some(1))],
                "Execution error: make_date function requires 3 arguments, got 1",
            ),
            (
                vec![
                    ScalarValue::IntervalYearMonth(Some(1)),
                    ScalarValue::TimestampNanosecond(Some(1), None),
                    ScalarValue::TimestampNanosecond(Some(1), None),
                ],
                "Arrow error: Cast error: Casting from Interval(YearMonth) to Int32 not supported",
            ),
            (
                vec![
                    ScalarValue::Int32(Some(2023)),
                    ScalarValue::UInt64(Some(u64::MAX)),
                    ScalarValue::Int32(Some(22)),
                ],
                "Arrow error: Cast error: Can't cast value 18446744073709551615 to type Int32",
            ),
            (
                vec![
                    ScalarValue::Int32(Some(2023)),
                    ScalarValue::Int32(Some(22)),
                    ScalarValue::UInt32(Some(u32::MAX)),
                ],
                "Arrow error: Cast error: Can't cast value 4294967295 to type Int32",
            ),
        ];
        for (components, expected_message) in error_cases {
            let args = components.into_iter().map(ColumnarValue::Scalar).collect();
            let res = invoke_make_date_with_args(args, 1);
            assert_eq!(res.err().unwrap().strip_backtrace(), expected_message);
        }
    }
}