vortex_zigzag/
compress.rs

1// SPDX-License-Identifier: Apache-2.0
2// SPDX-FileCopyrightText: Copyright the Vortex contributors
3
4use vortex_array::arrays::PrimitiveArray;
5use vortex_array::validity::Validity;
6use vortex_array::vtable::ValidityHelper;
7use vortex_buffer::BufferMut;
8use vortex_dtype::{NativePType, PType};
9use vortex_error::{VortexResult, vortex_bail, vortex_panic};
10use zigzag::ZigZag as ExternalZigZag;
11
12use crate::ZigZagArray;
13
14pub fn zigzag_encode(parray: PrimitiveArray) -> VortexResult<ZigZagArray> {
15    let validity = parray.validity().clone();
16    let encoded = match parray.ptype() {
17        PType::I8 => zigzag_encode_primitive::<i8>(parray.into_buffer_mut(), validity),
18        PType::I16 => zigzag_encode_primitive::<i16>(parray.into_buffer_mut(), validity),
19        PType::I32 => zigzag_encode_primitive::<i32>(parray.into_buffer_mut(), validity),
20        PType::I64 => zigzag_encode_primitive::<i64>(parray.into_buffer_mut(), validity),
21        _ => vortex_bail!(
22            "ZigZag can only encode signed integers, got {}",
23            parray.ptype()
24        ),
25    };
26    ZigZagArray::try_new(encoded.to_array())
27}
28
29fn zigzag_encode_primitive<T: ExternalZigZag + NativePType>(
30    values: BufferMut<T>,
31    validity: Validity,
32) -> PrimitiveArray
33where
34    <T as ExternalZigZag>::UInt: NativePType,
35{
36    PrimitiveArray::new(values.map_each(|v| T::encode(v)).freeze(), validity)
37}
38
39pub fn zigzag_decode(parray: PrimitiveArray) -> PrimitiveArray {
40    let validity = parray.validity().clone();
41    match parray.ptype() {
42        PType::U8 => zigzag_decode_primitive::<i8>(parray.into_buffer_mut(), validity),
43        PType::U16 => zigzag_decode_primitive::<i16>(parray.into_buffer_mut(), validity),
44        PType::U32 => zigzag_decode_primitive::<i32>(parray.into_buffer_mut(), validity),
45        PType::U64 => zigzag_decode_primitive::<i64>(parray.into_buffer_mut(), validity),
46        _ => vortex_panic!(
47            "ZigZag can only decode unsigned integers, got {}",
48            parray.ptype()
49        ),
50    }
51}
52
53fn zigzag_decode_primitive<T: ExternalZigZag + NativePType>(
54    values: BufferMut<T::UInt>,
55    validity: Validity,
56) -> PrimitiveArray
57where
58    <T as ExternalZigZag>::UInt: NativePType,
59{
60    PrimitiveArray::new(values.map_each(|v| T::decode(v)).freeze(), validity)
61}
62
#[cfg(test)]
mod test {
    use vortex_array::ToCanonical;

    use super::*;
    use crate::ZigZagEncoding;

    /// Generates one test per signed integer width. Each test encodes the range
    /// `-100..100`, checks that the result reports the ZigZag encoding id, and checks
    /// that `to_primitive` yields the original values again.
    macro_rules! compress_roundtrip_test {
        ($test_name:ident, $int:ty) => {
            #[test]
            fn $test_name() {
                let lower: $int = -100;
                let upper: $int = 100;

                let compressed = zigzag_encode(PrimitiveArray::from_iter(lower..upper)).unwrap();
                assert_eq!(compressed.encoding_id(), ZigZagEncoding.id());

                let expected = (lower..upper).collect::<Vec<_>>();
                let decoded = compressed.to_primitive();
                assert_eq!(decoded.as_slice::<$int>(), expected);
            }
        };
    }

    compress_roundtrip_test!(test_compress_i8, i8);
    compress_roundtrip_test!(test_compress_i16, i16);
    compress_roundtrip_test!(test_compress_i32, i32);
    compress_roundtrip_test!(test_compress_i64, i64);
}