use arrow::array::ArrayRef;
use arrow::compute::ilike;
use arrow::datatypes::{DataType, Field};
use datafusion_common::{Result, exec_err, internal_err};
use datafusion_expr::ColumnarValue;
use datafusion_expr::{
ReturnFieldArgs, ScalarFunctionArgs, ScalarUDFImpl, Signature, Volatility,
};
use datafusion_functions::utils::make_scalar_function;
use std::any::Any;
use std::sync::Arc;
#[derive(Debug, PartialEq, Eq, Hash)]
pub struct SparkILike {
signature: Signature,
}
impl Default for SparkILike {
fn default() -> Self {
Self::new()
}
}
impl SparkILike {
pub fn new() -> Self {
Self {
signature: Signature::string(2, Volatility::Immutable),
}
}
}
impl ScalarUDFImpl for SparkILike {
fn as_any(&self) -> &dyn Any {
self
}
fn name(&self) -> &str {
"ilike"
}
fn signature(&self) -> &Signature {
&self.signature
}
fn return_type(&self, _arg_types: &[DataType]) -> Result<DataType> {
internal_err!("return_field_from_args should be used instead")
}
fn return_field_from_args(&self, args: ReturnFieldArgs) -> Result<Arc<Field>> {
let nullable = args.arg_fields.iter().any(|f| f.is_nullable());
Ok(Arc::new(Field::new("ilike", DataType::Boolean, nullable)))
}
fn invoke_with_args(&self, args: ScalarFunctionArgs) -> Result<ColumnarValue> {
make_scalar_function(spark_ilike, vec![])(&args.args)
}
}
pub fn spark_ilike(args: &[ArrayRef]) -> Result<ArrayRef> {
if args.len() != 2 {
return exec_err!("ilike function requires exactly 2 arguments");
}
let result = ilike(&args[0], &args[1])?;
Ok(Arc::new(result))
}
#[cfg(test)]
mod tests {
use super::*;
use crate::function::utils::test::test_scalar_function;
use arrow::array::{Array, BooleanArray};
use arrow::datatypes::{DataType::Boolean, Field};
use datafusion_common::{Result, ScalarValue};
use datafusion_expr::{ColumnarValue, ReturnFieldArgs, ScalarUDFImpl};
macro_rules! test_ilike_string_invoke {
($INPUT1:expr, $INPUT2:expr, $EXPECTED:expr) => {
test_scalar_function!(
SparkILike::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8($INPUT1)),
ColumnarValue::Scalar(ScalarValue::Utf8($INPUT2))
],
$EXPECTED,
bool,
Boolean,
BooleanArray
);
test_scalar_function!(
SparkILike::new(),
vec![
ColumnarValue::Scalar(ScalarValue::LargeUtf8($INPUT1)),
ColumnarValue::Scalar(ScalarValue::LargeUtf8($INPUT2))
],
$EXPECTED,
bool,
Boolean,
BooleanArray
);
test_scalar_function!(
SparkILike::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8View($INPUT1)),
ColumnarValue::Scalar(ScalarValue::Utf8View($INPUT2))
],
$EXPECTED,
bool,
Boolean,
BooleanArray
);
};
}
#[test]
fn test_ilike_invoke() -> Result<()> {
test_ilike_string_invoke!(
Some(String::from("Spark")),
Some(String::from("_park")),
Ok(Some(true))
);
test_ilike_string_invoke!(
Some(String::from("Spark")),
Some(String::from("_PARK")),
Ok(Some(true))
);
test_ilike_string_invoke!(
Some(String::from("SPARK")),
Some(String::from("_park")),
Ok(Some(true))
);
test_ilike_string_invoke!(
Some(String::from("Spark")),
Some(String::from("sp%")),
Ok(Some(true))
);
test_ilike_string_invoke!(
Some(String::from("Spark")),
Some(String::from("SP%")),
Ok(Some(true))
);
test_ilike_string_invoke!(
Some(String::from("Spark")),
Some(String::from("%ARK")),
Ok(Some(true))
);
test_ilike_string_invoke!(
Some(String::from("Spark")),
Some(String::from("xyz")),
Ok(Some(false))
);
test_ilike_string_invoke!(None, Some(String::from("_park")), Ok(None));
test_ilike_string_invoke!(Some(String::from("Spark")), None, Ok(None));
test_ilike_string_invoke!(None, None, Ok(None));
Ok(())
}
#[test]
fn test_ilike_nullability() {
let ilike = SparkILike::new();
let non_nullable_field1 = Arc::new(Field::new("str", DataType::Utf8, false));
let non_nullable_field2 = Arc::new(Field::new("pattern", DataType::Utf8, false));
let result = ilike
.return_field_from_args(ReturnFieldArgs {
arg_fields: &[
Arc::clone(&non_nullable_field1),
Arc::clone(&non_nullable_field2),
],
scalar_arguments: &[None, None],
})
.unwrap();
assert!(!result.is_nullable());
assert_eq!(result.data_type(), &Boolean);
let nullable_field1 = Arc::new(Field::new("str", DataType::Utf8, true));
let result = ilike
.return_field_from_args(ReturnFieldArgs {
arg_fields: &[
Arc::clone(&nullable_field1),
Arc::clone(&non_nullable_field2),
],
scalar_arguments: &[None, None],
})
.unwrap();
assert!(result.is_nullable());
assert_eq!(result.data_type(), &Boolean);
let nullable_field2 = Arc::new(Field::new("pattern", DataType::Utf8, true));
let result = ilike
.return_field_from_args(ReturnFieldArgs {
arg_fields: &[
Arc::clone(&non_nullable_field1),
Arc::clone(&nullable_field2),
],
scalar_arguments: &[None, None],
})
.unwrap();
assert!(result.is_nullable());
assert_eq!(result.data_type(), &Boolean);
let result = ilike
.return_field_from_args(ReturnFieldArgs {
arg_fields: &[Arc::clone(&nullable_field1), Arc::clone(&nullable_field2)],
scalar_arguments: &[None, None],
})
.unwrap();
assert!(result.is_nullable());
assert_eq!(result.data_type(), &Boolean);
}
}