vortex_array/arrays/bool/compute/
take.rs

1// SPDX-License-Identifier: Apache-2.0
2// SPDX-FileCopyrightText: Copyright the Vortex contributors
3
4use arrow_buffer::BooleanBuffer;
5use itertools::Itertools as _;
6use num_traits::AsPrimitive;
7use vortex_dtype::match_each_integer_ptype;
8use vortex_error::VortexResult;
9use vortex_mask::Mask;
10use vortex_scalar::Scalar;
11
12use crate::arrays::{BoolArray, BoolVTable, ConstantArray};
13use crate::compute::{TakeKernel, TakeKernelAdapter, fill_null};
14use crate::vtable::ValidityHelper;
15use crate::{Array, ArrayRef, IntoArray, ToCanonical, register_kernel};
16
17impl TakeKernel for BoolVTable {
18    fn take(&self, array: &BoolArray, indices: &dyn Array) -> VortexResult<ArrayRef> {
19        let indices_nulls_zeroed = match indices.validity_mask() {
20            Mask::AllTrue(_) => indices.to_array(),
21            Mask::AllFalse(_) => {
22                return Ok(ConstantArray::new(
23                    Scalar::null(array.dtype().as_nullable()),
24                    indices.len(),
25                )
26                .into_array());
27            }
28            Mask::Values(_) => fill_null(indices, &Scalar::from(0).cast(indices.dtype())?)?,
29        };
30        let indices_nulls_zeroed = indices_nulls_zeroed.to_primitive();
31        let buffer = match_each_integer_ptype!(indices_nulls_zeroed.ptype(), |I| {
32            take_valid_indices(array.boolean_buffer(), indices_nulls_zeroed.as_slice::<I>())
33        });
34
35        Ok(BoolArray::new(buffer, array.validity().take(indices)?).to_array())
36    }
37}
38
39register_kernel!(TakeKernelAdapter(BoolVTable).lift());
40
41fn take_valid_indices<I: AsPrimitive<usize>>(
42    bools: &BooleanBuffer,
43    indices: &[I],
44) -> BooleanBuffer {
45    // For boolean arrays that roughly fit into a single page (at least, on Linux), it's worth
46    // the overhead to convert to a Vec<bool>.
47    if bools.len() <= 4096 {
48        let bools = bools.into_iter().collect_vec();
49        take_byte_bool(bools, indices)
50    } else {
51        take_bool(bools, indices)
52    }
53}
54
55fn take_byte_bool<I: AsPrimitive<usize>>(bools: Vec<bool>, indices: &[I]) -> BooleanBuffer {
56    BooleanBuffer::collect_bool(indices.len(), |idx| {
57        bools[unsafe { indices.get_unchecked(idx).as_() }]
58    })
59}
60
61fn take_bool<I: AsPrimitive<usize>>(bools: &BooleanBuffer, indices: &[I]) -> BooleanBuffer {
62    BooleanBuffer::collect_bool(indices.len(), |idx| {
63        // We can always take from the indices unchecked since collect_bool just iterates len.
64        bools.value(unsafe { indices.get_unchecked(idx).as_() })
65    })
66}
67
#[cfg(test)]
mod test {
    use rstest::rstest;
    use vortex_buffer::buffer;
    use vortex_dtype::{DType, Nullability};
    use vortex_scalar::Scalar;

    use crate::arrays::BoolArray;
    use crate::arrays::primitive::PrimitiveArray;
    use crate::compute::conformance::take::test_take_conformance;
    use crate::compute::take;
    use crate::validity::Validity;
    use crate::{Array, ToCanonical};

    /// Builds the index array `[0, 3, 100]` whose per-position validity is `valid`.
    ///
    /// Index 100 is out of bounds for the five-element arrays used in these tests, so it must
    /// only ever appear at a null position.
    fn indices_with_validity(valid: [bool; 3]) -> PrimitiveArray {
        PrimitiveArray::new(
            buffer![0, 3, 100],
            Validity::Array(BoolArray::from_iter(valid).to_array()),
        )
    }

    /// Taking from a nullable array, first with valid indices and then with all-null indices.
    #[test]
    fn take_nullable() {
        let source = BoolArray::from_iter([
            Some(false),
            Some(true),
            Some(false),
            None,
            Some(false),
        ]);

        let picked = PrimitiveArray::from_iter([0, 3, 4]);
        let taken = take(source.as_ref(), picked.as_ref())
            .unwrap()
            .to_bool();
        let expected = BoolArray::from_iter([Some(false), None, Some(false)]);
        assert_eq!(taken.boolean_buffer(), expected.boolean_buffer());

        let nullable_bool = DType::Bool(Nullability::Nullable);
        let null_indices = PrimitiveArray::from_option_iter([None::<u32>, None, None]);
        let all_null = take(source.as_ref(), null_indices.as_ref()).unwrap();
        assert_eq!(all_null.dtype(), &nullable_bool);
        for position in 0..3 {
            assert_eq!(
                all_null.scalar_at(position),
                Scalar::null(nullable_bool.clone())
            );
        }
    }

    /// A null index may hold an out-of-bounds value when the source is nullable.
    #[test]
    fn test_bool_array_take_with_null_out_of_bounds_indices() {
        let source = BoolArray::from_iter([Some(false), Some(true), None, None, Some(false)]);
        let picked = indices_with_validity([true, true, false]);

        let taken = take(source.as_ref(), picked.as_ref()).unwrap();

        assert_eq!(taken.scalar_at(0), Scalar::from(Some(false)));
        // Source position 3 holds a null.
        assert_eq!(taken.scalar_at(1), Scalar::null_typed::<bool>());
        // The third index itself is null.
        assert_eq!(taken.scalar_at(2), Scalar::null_typed::<bool>());
    }

    /// A null index may hold an out-of-bounds value when the source is non-nullable.
    #[test]
    fn test_non_null_bool_array_take_with_null_out_of_bounds_indices() {
        let source = BoolArray::from_iter([false, true, false, true, false]);
        let picked = indices_with_validity([true, true, false]);

        let taken = take(source.as_ref(), picked.as_ref()).unwrap();

        assert_eq!(taken.scalar_at(0), Scalar::from(Some(false)));
        assert_eq!(taken.scalar_at(1), Scalar::from(Some(true)));
        // The third index itself is null.
        assert_eq!(taken.scalar_at(2), Scalar::null_typed::<bool>());
    }

    /// All-null indices (given as an explicit validity array) over a nullable source.
    #[test]
    fn test_bool_array_take_all_null_indices() {
        let source = BoolArray::from_iter([Some(false), Some(true), None, None, Some(false)]);
        let picked = indices_with_validity([false, false, false]);

        let taken = take(source.as_ref(), picked.as_ref()).unwrap();

        for position in 0..3 {
            assert_eq!(taken.scalar_at(position), Scalar::null_typed::<bool>());
        }
    }

    /// All-null indices (given as an explicit validity array) over a non-nullable source.
    #[test]
    fn test_non_null_bool_array_take_all_null_indices() {
        let source = BoolArray::from_iter([false, true, false, true, false]);
        let picked = indices_with_validity([false, false, false]);

        let taken = take(source.as_ref(), picked.as_ref()).unwrap();

        for position in 0..3 {
            assert_eq!(taken.scalar_at(position), Scalar::null_typed::<bool>());
        }
    }

    /// Runs the shared take conformance suite over a few representative bool arrays.
    #[rstest]
    #[case(BoolArray::from_iter([true, false, true, true, false]))]
    #[case(BoolArray::from_iter([Some(true), None, Some(false), Some(true), None]))]
    #[case(BoolArray::from_iter([true, false]))]
    #[case(BoolArray::from_iter([true]))]
    fn test_take_bool_conformance(#[case] input: BoolArray) {
        test_take_conformance(input.as_ref());
    }
}
175}