use std::any::Any;
use crate::unicode::common::{RightSlicer, general_left_right};
use crate::utils::make_scalar_function;
use arrow::datatypes::DataType;
use datafusion_common::Result;
use datafusion_common::exec_err;
use datafusion_expr::TypeSignature::Exact;
use datafusion_expr::{
ColumnarValue, Documentation, ScalarUDFImpl, Signature, Volatility,
};
use datafusion_macros::user_doc;
#[user_doc(
doc_section(label = "String Functions"),
description = "Returns a specified number of characters from the right side of a string.",
syntax_example = "right(str, n)",
sql_example = r#"```sql
> select right('datafusion', 6);
+------------------------------------+
| right(Utf8("datafusion"),Int64(6)) |
+------------------------------------+
| fusion |
+------------------------------------+
```"#,
standard_argument(name = "str", prefix = "String"),
argument(name = "n", description = "Number of characters to return."),
related_udf(name = "left")
)]
#[derive(Debug, PartialEq, Eq, Hash)]
pub struct RightFunc {
signature: Signature,
}
impl Default for RightFunc {
fn default() -> Self {
Self::new()
}
}
impl RightFunc {
pub fn new() -> Self {
use DataType::*;
Self {
signature: Signature::one_of(
vec![
Exact(vec![Utf8View, Int64]),
Exact(vec![Utf8, Int64]),
Exact(vec![LargeUtf8, Int64]),
],
Volatility::Immutable,
),
}
}
}
impl ScalarUDFImpl for RightFunc {
fn as_any(&self) -> &dyn Any {
self
}
fn name(&self) -> &str {
"right"
}
fn signature(&self) -> &Signature {
&self.signature
}
fn return_type(&self, arg_types: &[DataType]) -> Result<DataType> {
Ok(arg_types[0].clone())
}
fn invoke_with_args(
&self,
args: datafusion_expr::ScalarFunctionArgs,
) -> Result<ColumnarValue> {
let args = &args.args;
match args[0].data_type() {
DataType::Utf8 | DataType::Utf8View | DataType::LargeUtf8 => {
make_scalar_function(general_left_right::<RightSlicer>, vec![])(args)
}
other => exec_err!(
"Unsupported data type {other:?} for function {},\
expected Utf8View, Utf8 or LargeUtf8.",
self.name()
),
}
}
fn documentation(&self) -> Option<&Documentation> {
self.doc()
}
}
#[cfg(test)]
mod tests {
use arrow::array::{Array, StringArray, StringViewArray};
use arrow::datatypes::DataType::{Utf8, Utf8View};
use datafusion_common::{Result, ScalarValue};
use datafusion_expr::{ColumnarValue, ScalarUDFImpl};
use crate::unicode::right::RightFunc;
use crate::utils::test::test_function;
#[test]
fn test_functions() -> Result<()> {
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(2i64)),
],
Ok(Some("de")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(200i64)),
],
Ok(Some("abcde")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(-2i64)),
],
Ok(Some("cde")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(i64::MIN)),
],
Ok(Some("")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(-200i64)),
],
Ok(Some("")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(0i64)),
],
Ok(Some("")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8(None)),
ColumnarValue::Scalar(ScalarValue::from(2i64)),
],
Ok(None),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::Int64(None)),
],
Ok(None),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("joséérend")),
ColumnarValue::Scalar(ScalarValue::from(5i64)),
],
Ok(Some("érend")),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from("joséérend")),
ColumnarValue::Scalar(ScalarValue::from(-3i64)),
],
Ok(Some("éérend")),
&str,
Utf8,
StringArray
);
#[cfg(not(feature = "unicode_expressions"))]
test_function!(
RightFunc::new(),
&[
ColumnarValue::Scalar(ScalarValue::from("abcde")),
ColumnarValue::Scalar(ScalarValue::from(2i64)),
],
internal_err!(
"function right requires compilation with feature flag: unicode_expressions."
),
&str,
Utf8,
StringArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8View(Some("abcde".to_string()))),
ColumnarValue::Scalar(ScalarValue::from(2i64)),
],
Ok(Some("de")),
&str,
Utf8View,
StringViewArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8View(Some("abcde".to_string()))),
ColumnarValue::Scalar(ScalarValue::from(200i64)),
],
Ok(Some("abcde")),
&str,
Utf8View,
StringViewArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8View(Some("".to_string()))),
ColumnarValue::Scalar(ScalarValue::from(200i64)),
],
Ok(Some("")),
&str,
Utf8View,
StringViewArray
);
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::Utf8View(Some(
"joséérend".to_string()
))),
ColumnarValue::Scalar(ScalarValue::from(-3i64)),
],
Ok(Some("éérend")),
&str,
Utf8View,
StringViewArray
);
let input = "joé楽s𐀀so↓j";
for n in 1..=input.chars().count() {
let expected = input.chars().skip(n).collect::<String>();
test_function!(
RightFunc::new(),
vec![
ColumnarValue::Scalar(ScalarValue::from(input)),
ColumnarValue::Scalar(ScalarValue::from(-(n as i64))),
],
Ok(Some(expected.as_str())),
&str,
Utf8,
StringArray
);
}
Ok(())
}
}