datafusion_functions/string/
uuid.rs

1// Licensed to the Apache Software Foundation (ASF) under one
2// or more contributor license agreements.  See the NOTICE file
3// distributed with this work for additional information
4// regarding copyright ownership.  The ASF licenses this file
5// to you under the Apache License, Version 2.0 (the
6// "License"); you may not use this file except in compliance
7// with the License.  You may obtain a copy of the License at
8//
9//   http://www.apache.org/licenses/LICENSE-2.0
10//
11// Unless required by applicable law or agreed to in writing,
12// software distributed under the License is distributed on an
13// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14// KIND, either express or implied.  See the License for the
15// specific language governing permissions and limitations
16// under the License.
17
18use std::any::Any;
19use std::sync::Arc;
20
21use arrow::array::GenericStringBuilder;
22use arrow::datatypes::DataType;
23use arrow::datatypes::DataType::Utf8;
24use rand::Rng;
25use uuid::Uuid;
26
27use datafusion_common::{Result, assert_or_internal_err};
28use datafusion_expr::{ColumnarValue, Documentation, Volatility};
29use datafusion_expr::{ScalarFunctionArgs, ScalarUDFImpl, Signature};
30use datafusion_macros::user_doc;
31
32#[user_doc(
33    doc_section(label = "String Functions"),
34    description = "Returns [`UUID v4`](https://en.wikipedia.org/wiki/Universally_unique_identifier#Version_4_%28random%29) string value which is unique per row.",
35    syntax_example = "uuid()",
36    sql_example = r#"```sql
37> select uuid();
38+--------------------------------------+
39| uuid()                               |
40+--------------------------------------+
41| 6ec17ef8-1934-41cc-8d59-d0c8f9eea1f0 |
42+--------------------------------------+
43```"#
44)]
45#[derive(Debug, PartialEq, Eq, Hash)]
46pub struct UuidFunc {
47    signature: Signature,
48}
49
50impl Default for UuidFunc {
51    fn default() -> Self {
52        Self::new()
53    }
54}
55
56impl UuidFunc {
57    pub fn new() -> Self {
58        Self {
59            signature: Signature::nullary(Volatility::Volatile),
60        }
61    }
62}
63
64impl ScalarUDFImpl for UuidFunc {
65    fn as_any(&self) -> &dyn Any {
66        self
67    }
68
69    fn name(&self) -> &str {
70        "uuid"
71    }
72
73    fn signature(&self) -> &Signature {
74        &self.signature
75    }
76
77    fn return_type(&self, _arg_types: &[DataType]) -> Result<DataType> {
78        Ok(Utf8)
79    }
80
81    /// Prints random (v4) uuid values per row
82    /// uuid() = 'a0eebc99-9c0b-4ef8-bb6d-6bb9bd380a11'
83    fn invoke_with_args(&self, args: ScalarFunctionArgs) -> Result<ColumnarValue> {
84        assert_or_internal_err!(
85            args.args.is_empty(),
86            "{} function does not accept arguments",
87            self.name()
88        );
89
90        // Generate random u128 values
91        let mut rng = rand::rng();
92        let mut randoms = vec![0u128; args.number_rows];
93        rng.fill(&mut randoms[..]);
94
95        let mut builder = GenericStringBuilder::<i32>::with_capacity(
96            args.number_rows,
97            args.number_rows * 36,
98        );
99
100        let mut buffer = [0u8; 36];
101        for x in &mut randoms {
102            // From Uuid::new_v4(): Mask out the version and variant bits
103            *x = *x & 0xFFFFFFFFFFFF4FFFBFFFFFFFFFFFFFFF | 0x40008000000000000000;
104            let uuid = Uuid::from_u128(*x);
105            let fmt = uuid::fmt::Hyphenated::from_uuid(uuid);
106            builder.append_value(fmt.encode_lower(&mut buffer));
107        }
108
109        Ok(ColumnarValue::Array(Arc::new(builder.finish())))
110    }
111
112    fn documentation(&self) -> Option<&Documentation> {
113        self.doc()
114    }
115}