Skip to main content

arrow_array/array/
null_array.rs

1// Licensed to the Apache Software Foundation (ASF) under one
2// or more contributor license agreements.  See the NOTICE file
3// distributed with this work for additional information
4// regarding copyright ownership.  The ASF licenses this file
5// to you under the Apache License, Version 2.0 (the
6// "License"); you may not use this file except in compliance
7// with the License.  You may obtain a copy of the License at
8//
9//   http://www.apache.org/licenses/LICENSE-2.0
10//
11// Unless required by applicable law or agreed to in writing,
12// software distributed under the License is distributed on an
13// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14// KIND, either express or implied.  See the License for the
15// specific language governing permissions and limitations
16// under the License.
17
18//! Contains the `NullArray` type.
19
20use crate::builder::NullBuilder;
21use crate::{Array, ArrayRef};
22use arrow_buffer::buffer::NullBuffer;
23use arrow_data::{ArrayData, ArrayDataBuilder};
24use arrow_schema::DataType;
25use std::any::Any;
26use std::sync::Arc;
27
28/// An array of [null values](https://arrow.apache.org/docs/format/Columnar.html#null-layout)
29///
30/// A `NullArray` is a simplified array where all values are null.
31///
32/// # Example: Create an array
33///
34/// ```
35/// use arrow_array::{Array, NullArray};
36///
37/// let array = NullArray::new(10);
38///
39/// assert!(array.is_nullable());
40/// assert_eq!(array.len(), 10);
41/// assert_eq!(array.null_count(), 0);
42/// assert_eq!(array.logical_null_count(), 10);
43/// assert_eq!(array.logical_nulls().unwrap().null_count(), 10);
44/// ```
45#[derive(Clone)]
46pub struct NullArray {
47    len: usize,
48}
49
50impl NullArray {
51    /// Create a new [`NullArray`] of the specified length
52    ///
53    /// *Note*: Use [`crate::array::new_null_array`] if you need an array of some
54    /// other [`DataType`].
55    ///
56    pub fn new(length: usize) -> Self {
57        Self { len: length }
58    }
59
60    /// Returns a zero-copy slice of this array with the indicated offset and length.
61    pub fn slice(&self, offset: usize, len: usize) -> Self {
62        assert!(
63            offset.saturating_add(len) <= self.len,
64            "the length + offset of the sliced BooleanBuffer cannot exceed the existing length"
65        );
66
67        Self { len }
68    }
69
70    /// Returns a new null array builder
71    ///
72    /// Note that the `capacity` parameter to this function is _deprecated_. It
73    /// now does nothing, and will be removed in a future version.
74    pub fn builder(_capacity: usize) -> NullBuilder {
75        NullBuilder::new()
76    }
77}
78
79/// SAFETY: Correctly implements the contract of Arrow Arrays
80unsafe impl Array for NullArray {
81    fn as_any(&self) -> &dyn Any {
82        self
83    }
84
85    fn to_data(&self) -> ArrayData {
86        self.clone().into()
87    }
88
89    fn into_data(self) -> ArrayData {
90        self.into()
91    }
92
93    fn data_type(&self) -> &DataType {
94        &DataType::Null
95    }
96
97    fn slice(&self, offset: usize, length: usize) -> ArrayRef {
98        Arc::new(self.slice(offset, length))
99    }
100
101    fn len(&self) -> usize {
102        self.len
103    }
104
105    fn is_empty(&self) -> bool {
106        self.len == 0
107    }
108
109    fn offset(&self) -> usize {
110        0
111    }
112
113    fn nulls(&self) -> Option<&NullBuffer> {
114        None
115    }
116
117    fn logical_nulls(&self) -> Option<NullBuffer> {
118        (self.len != 0).then(|| NullBuffer::new_null(self.len))
119    }
120
121    fn is_nullable(&self) -> bool {
122        !self.is_empty()
123    }
124
125    fn logical_null_count(&self) -> usize {
126        self.len
127    }
128
129    fn get_buffer_memory_size(&self) -> usize {
130        0
131    }
132
133    fn get_array_memory_size(&self) -> usize {
134        std::mem::size_of::<Self>()
135    }
136}
137
138impl From<ArrayData> for NullArray {
139    fn from(data: ArrayData) -> Self {
140        assert_eq!(
141            data.data_type(),
142            &DataType::Null,
143            "NullArray data type should be Null"
144        );
145        assert_eq!(
146            data.buffers().len(),
147            0,
148            "NullArray data should contain 0 buffers"
149        );
150        assert!(
151            data.nulls().is_none(),
152            "NullArray data should not contain a null buffer, as no buffers are required"
153        );
154        Self { len: data.len() }
155    }
156}
157
158impl From<NullArray> for ArrayData {
159    fn from(array: NullArray) -> Self {
160        let builder = ArrayDataBuilder::new(DataType::Null).len(array.len);
161        unsafe { builder.build_unchecked() }
162    }
163}
164
165impl std::fmt::Debug for NullArray {
166    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
167        write!(f, "NullArray({})", self.len())
168    }
169}
170
171#[cfg(test)]
172mod tests {
173    use super::*;
174    use crate::{Int64Array, StructArray, make_array};
175    use arrow_data::transform::MutableArrayData;
176    use arrow_schema::Field;
177
178    #[test]
179    fn test_null_array() {
180        let null_arr = NullArray::new(32);
181
182        assert_eq!(null_arr.len(), 32);
183        assert_eq!(null_arr.null_count(), 0);
184        assert_eq!(null_arr.logical_null_count(), 32);
185        assert_eq!(null_arr.logical_nulls().unwrap().null_count(), 32);
186        assert!(null_arr.is_valid(0));
187        assert!(null_arr.is_nullable());
188    }
189
190    #[test]
191    fn test_null_array_slice() {
192        let array1 = NullArray::new(32);
193
194        let array2 = array1.slice(8, 16);
195        assert_eq!(array2.len(), 16);
196        assert_eq!(array2.null_count(), 0);
197        assert_eq!(array2.logical_null_count(), 16);
198        assert_eq!(array2.logical_nulls().unwrap().null_count(), 16);
199        assert!(array2.is_valid(0));
200        assert!(array2.is_nullable());
201    }
202
203    #[test]
204    fn test_debug_null_array() {
205        let array = NullArray::new(1024 * 1024);
206        assert_eq!(format!("{array:?}"), "NullArray(1048576)");
207    }
208
209    #[test]
210    fn test_null_array_with_parent_null_buffer() {
211        let null_array = NullArray::new(1);
212        let int_array = Int64Array::from(vec![42]);
213
214        let fields = vec![
215            Field::new("a", DataType::Int64, true),
216            Field::new("b", DataType::Null, true),
217        ];
218
219        let struct_array_data = ArrayData::builder(DataType::Struct(fields.into()))
220            .len(1)
221            .add_child_data(int_array.to_data())
222            .add_child_data(null_array.to_data())
223            .build()
224            .unwrap();
225
226        let mut mutable = MutableArrayData::new(vec![&struct_array_data], true, 1);
227
228        // Simulate a NULL value in the parent array, for instance, if array being queried by
229        // invalid index
230        mutable.extend_nulls(1);
231        let data = mutable.freeze();
232
233        let struct_array = Arc::new(StructArray::from(data.clone()));
234        assert!(make_array(data) == struct_array);
235    }
236}