1use std::collections::HashSet;
5use std::io::Write;
6use std::ops::{Range, RangeBounds};
7use std::{collections::BTreeMap, io::Read};
8
9use arrow_array::{Array, BinaryArray, GenericBinaryArray};
10use arrow_buffer::{Buffer, NullBuffer, OffsetBuffer};
11use byteorder::{ReadBytesExt, WriteBytesExt};
12use deepsize::DeepSizeOf;
13use roaring::{MultiOps, RoaringBitmap, RoaringTreemap};
14
15use crate::Result;
16
17use super::address::RowAddress;
18
/// A row filter made of an optional allow list and an optional block list.
///
/// A row id is selected when it is contained in `allow_list` (or `allow_list`
/// is `None`) and is not contained in `block_list` (or `block_list` is `None`).
#[derive(Clone, Debug, Default, DeepSizeOf)]
pub struct RowIdMask {
    /// When `Some`, only row ids contained in this set can be selected.
    pub allow_list: Option<RowIdTreeMap>,
    /// When `Some`, row ids contained in this set are never selected.
    pub block_list: Option<RowIdTreeMap>,
}
34
35impl RowIdMask {
36 pub fn all_rows() -> Self {
38 Self::default()
39 }
40
41 pub fn allow_nothing() -> Self {
43 Self {
44 allow_list: Some(RowIdTreeMap::new()),
45 block_list: None,
46 }
47 }
48
49 pub fn from_allowed(allow_list: RowIdTreeMap) -> Self {
51 Self {
52 allow_list: Some(allow_list),
53 block_list: None,
54 }
55 }
56
57 pub fn from_block(block_list: RowIdTreeMap) -> Self {
59 Self {
60 allow_list: None,
61 block_list: Some(block_list),
62 }
63 }
64
65 pub fn selected(&self, row_id: u64) -> bool {
67 match (&self.allow_list, &self.block_list) {
68 (None, None) => true,
69 (Some(allow_list), None) => allow_list.contains(row_id),
70 (None, Some(block_list)) => !block_list.contains(row_id),
71 (Some(allow_list), Some(block_list)) => {
72 allow_list.contains(row_id) && !block_list.contains(row_id)
73 }
74 }
75 }
76
77 pub fn selected_indices<'a>(&self, row_ids: impl Iterator<Item = &'a u64> + 'a) -> Vec<u64> {
79 let enumerated_ids = row_ids.enumerate();
80 match (&self.block_list, &self.allow_list) {
81 (Some(block_list), Some(allow_list)) => {
82 enumerated_ids
84 .filter(|(_, row_id)| {
85 !block_list.contains(**row_id) && allow_list.contains(**row_id)
86 })
87 .map(|(idx, _)| idx as u64)
88 .collect()
89 }
90 (Some(block_list), None) => {
91 enumerated_ids
93 .filter(|(_, row_id)| !block_list.contains(**row_id))
94 .map(|(idx, _)| idx as u64)
95 .collect()
96 }
97 (None, Some(allow_list)) => {
98 enumerated_ids
100 .filter(|(_, row_id)| allow_list.contains(**row_id))
101 .map(|(idx, _)| idx as u64)
102 .collect()
103 }
104 (None, None) => {
105 panic!("selected_indices called but prefilter has nothing to filter with")
108 }
109 }
110 }
111
112 pub fn also_block(self, block_list: RowIdTreeMap) -> Self {
114 if block_list.is_empty() {
115 return self;
116 }
117 if let Some(existing) = self.block_list {
118 Self {
119 block_list: Some(existing | block_list),
120 allow_list: self.allow_list,
121 }
122 } else {
123 Self {
124 block_list: Some(block_list),
125 allow_list: self.allow_list,
126 }
127 }
128 }
129
130 pub fn also_allow(self, allow_list: RowIdTreeMap) -> Self {
132 if let Some(existing) = self.allow_list {
133 Self {
134 block_list: self.block_list,
135 allow_list: Some(existing | allow_list),
136 }
137 } else {
138 Self {
139 block_list: self.block_list,
140 allow_list: None,
143 }
144 }
145 }
146
147 pub fn into_arrow(&self) -> Result<BinaryArray> {
160 let block_list_length = self
161 .block_list
162 .as_ref()
163 .map(|bl| bl.serialized_size())
164 .unwrap_or(0);
165 let allow_list_length = self
166 .allow_list
167 .as_ref()
168 .map(|al| al.serialized_size())
169 .unwrap_or(0);
170 let lengths = vec![block_list_length, allow_list_length];
171 let offsets = OffsetBuffer::from_lengths(lengths);
172 let mut value_bytes = vec![0; block_list_length + allow_list_length];
173 let mut validity = vec![false, false];
174 if let Some(block_list) = &self.block_list {
175 validity[0] = true;
176 block_list.serialize_into(&mut value_bytes[0..])?;
177 }
178 if let Some(allow_list) = &self.allow_list {
179 validity[1] = true;
180 allow_list.serialize_into(&mut value_bytes[block_list_length..])?;
181 }
182 let values = Buffer::from(value_bytes);
183 let nulls = NullBuffer::from(validity);
184 Ok(BinaryArray::try_new(offsets, values, Some(nulls))?)
185 }
186
187 pub fn from_arrow(array: &GenericBinaryArray<i32>) -> Result<Self> {
189 let block_list = if array.is_null(0) {
190 None
191 } else {
192 Some(RowIdTreeMap::deserialize_from(array.value(0)))
193 }
194 .transpose()?;
195
196 let allow_list = if array.is_null(1) {
197 None
198 } else {
199 Some(RowIdTreeMap::deserialize_from(array.value(1)))
200 }
201 .transpose()?;
202 Ok(Self {
203 block_list,
204 allow_list,
205 })
206 }
207}
208
209impl std::ops::Not for RowIdMask {
210 type Output = Self;
211
212 fn not(self) -> Self::Output {
213 Self {
214 block_list: self.allow_list,
215 allow_list: self.block_list,
216 }
217 }
218}
219
220impl std::ops::BitAnd for RowIdMask {
221 type Output = Self;
222
223 fn bitand(self, rhs: Self) -> Self::Output {
224 let block_list = match (self.block_list, rhs.block_list) {
225 (None, None) => None,
226 (Some(lhs), None) => Some(lhs),
227 (None, Some(rhs)) => Some(rhs),
228 (Some(lhs), Some(rhs)) => Some(lhs | rhs),
229 };
230 let allow_list = match (self.allow_list, rhs.allow_list) {
231 (None, None) => None,
232 (Some(lhs), None) => Some(lhs),
233 (None, Some(rhs)) => Some(rhs),
234 (Some(lhs), Some(rhs)) => Some(lhs & rhs),
235 };
236 Self {
237 block_list,
238 allow_list,
239 }
240 }
241}
242
243impl std::ops::BitOr for RowIdMask {
244 type Output = Self;
245
246 fn bitor(self, rhs: Self) -> Self::Output {
247 let block_list = match (self.block_list, rhs.block_list) {
248 (None, None) => None,
249 (Some(lhs), None) => Some(lhs),
250 (None, Some(rhs)) => Some(rhs),
251 (Some(lhs), Some(rhs)) => Some(lhs & rhs),
252 };
253 let allow_list = match (self.allow_list, rhs.allow_list) {
254 (None, None) => None,
255 (Some(_), None) => None,
258 (None, Some(_)) => None,
259 (Some(lhs), Some(rhs)) => Some(lhs | rhs),
260 };
261 Self {
262 block_list,
263 allow_list,
264 }
265 }
266}
267
/// A set of 64-bit row ids, stored per fragment.
///
/// The upper 32 bits of a row id pick the fragment and the lower 32 bits are
/// the value looked up in that fragment's [`RowIdSelection`].
#[derive(Clone, Debug, Default, PartialEq, DeepSizeOf)]
pub struct RowIdTreeMap {
    /// Selection for each fragment, keyed by the upper 32 bits of the row id.
    inner: BTreeMap<u32, RowIdSelection>,
}
284
/// Which rows of a single fragment are part of a [`RowIdTreeMap`].
#[derive(Clone, Debug, PartialEq)]
enum RowIdSelection {
    /// Every row of the fragment is selected.
    Full,
    /// Only the rows whose lower 32 bits are in the bitmap are selected.
    Partial(RoaringBitmap),
}
290
291impl DeepSizeOf for RowIdSelection {
292 fn deep_size_of_children(&self, _context: &mut deepsize::Context) -> usize {
293 match self {
294 Self::Full => 0,
295 Self::Partial(bitmap) => bitmap.serialized_size(),
296 }
297 }
298}
299
300impl RowIdSelection {
301 fn union_all(selections: &[&Self]) -> Self {
302 let mut is_full = false;
303
304 let res = Self::Partial(
305 selections
306 .iter()
307 .filter_map(|selection| match selection {
308 Self::Full => {
309 is_full = true;
310 None
311 }
312 Self::Partial(bitmap) => Some(bitmap),
313 })
314 .union(),
315 );
316
317 if is_full {
318 Self::Full
319 } else {
320 res
321 }
322 }
323}
324
325impl RowIdTreeMap {
326 pub fn new() -> Self {
328 Self::default()
329 }
330
331 pub fn is_empty(&self) -> bool {
332 self.inner.is_empty()
333 }
334
335 pub fn len(&self) -> Option<u64> {
339 self.inner
340 .values()
341 .map(|row_id_selection| match row_id_selection {
342 RowIdSelection::Full => None,
343 RowIdSelection::Partial(indices) => Some(indices.len()),
344 })
345 .try_fold(0_u64, |acc, next| next.map(|next| next + acc))
346 }
347
348 pub fn row_ids(&self) -> Option<impl Iterator<Item = RowAddress> + '_> {
353 let inner_iters = self
354 .inner
355 .iter()
356 .filter_map(|(frag_id, row_id_selection)| match row_id_selection {
357 RowIdSelection::Full => None,
358 RowIdSelection::Partial(bitmap) => Some(
359 bitmap
360 .iter()
361 .map(|row_offset| RowAddress::new_from_parts(*frag_id, row_offset)),
362 ),
363 })
364 .collect::<Vec<_>>();
365 if inner_iters.len() != self.inner.len() {
366 None
367 } else {
368 Some(inner_iters.into_iter().flatten())
369 }
370 }
371
372 pub fn insert(&mut self, value: u64) -> bool {
385 let fragment = (value >> 32) as u32;
386 let row_addr = value as u32;
387 match self.inner.get_mut(&fragment) {
388 None => {
389 let mut set = RoaringBitmap::new();
390 set.insert(row_addr);
391 self.inner.insert(fragment, RowIdSelection::Partial(set));
392 true
393 }
394 Some(RowIdSelection::Full) => false,
395 Some(RowIdSelection::Partial(set)) => set.insert(row_addr),
396 }
397 }
398
399 pub fn insert_range<R: RangeBounds<u64>>(&mut self, range: R) -> u64 {
401 let (mut start_high, mut start_low) = match range.start_bound() {
403 std::ops::Bound::Included(&start) => ((start >> 32) as u32, start as u32),
404 std::ops::Bound::Excluded(&start) => {
405 let start = start.saturating_add(1);
406 ((start >> 32) as u32, start as u32)
407 }
408 std::ops::Bound::Unbounded => (0, 0),
409 };
410
411 let (end_high, end_low) = match range.end_bound() {
412 std::ops::Bound::Included(&end) => ((end >> 32) as u32, end as u32),
413 std::ops::Bound::Excluded(&end) => {
414 let end = end.saturating_sub(1);
415 ((end >> 32) as u32, end as u32)
416 }
417 std::ops::Bound::Unbounded => (u32::MAX, u32::MAX),
418 };
419
420 let mut count = 0;
421
422 while start_high <= end_high {
423 let start = start_low;
424 let end = if start_high == end_high {
425 end_low
426 } else {
427 u32::MAX
428 };
429 let fragment = start_high;
430 match self.inner.get_mut(&fragment) {
431 None => {
432 let mut set = RoaringBitmap::new();
433 count += set.insert_range(start..=end);
434 self.inner.insert(fragment, RowIdSelection::Partial(set));
435 }
436 Some(RowIdSelection::Full) => {}
437 Some(RowIdSelection::Partial(set)) => {
438 count += set.insert_range(start..=end);
439 }
440 }
441 start_high += 1;
442 start_low = 0;
443 }
444
445 count
446 }
447
448 pub fn insert_bitmap(&mut self, fragment: u32, bitmap: RoaringBitmap) {
450 self.inner.insert(fragment, RowIdSelection::Partial(bitmap));
451 }
452
453 pub fn insert_fragment(&mut self, fragment_id: u32) {
455 self.inner.insert(fragment_id, RowIdSelection::Full);
456 }
457
458 pub fn contains(&self, value: u64) -> bool {
460 let upper = (value >> 32) as u32;
461 let lower = value as u32;
462 match self.inner.get(&upper) {
463 None => false,
464 Some(RowIdSelection::Full) => true,
465 Some(RowIdSelection::Partial(fragment_set)) => fragment_set.contains(lower),
466 }
467 }
468
469 pub fn remove(&mut self, value: u64) -> bool {
470 let upper = (value >> 32) as u32;
471 let lower = value as u32;
472 match self.inner.get_mut(&upper) {
473 None => false,
474 Some(RowIdSelection::Full) => {
475 let mut set = RoaringBitmap::full();
476 set.remove(lower);
477 self.inner.insert(upper, RowIdSelection::Partial(set));
478 true
479 }
480 Some(RowIdSelection::Partial(lower_set)) => {
481 let removed = lower_set.remove(lower);
482 if lower_set.is_empty() {
483 self.inner.remove(&upper);
484 }
485 removed
486 }
487 }
488 }
489
490 pub fn retain_fragments(&mut self, frag_ids: impl IntoIterator<Item = u32>) {
491 let frag_id_set = frag_ids.into_iter().collect::<HashSet<_>>();
492 self.inner
493 .retain(|frag_id, _| frag_id_set.contains(frag_id));
494 }
495
496 pub fn serialized_size(&self) -> usize {
498 let mut size = 4;
500 for set in self.inner.values() {
501 size += 8;
503 if let RowIdSelection::Partial(set) = set {
504 size += set.serialized_size();
505 }
506 }
507 size
508 }
509
510 pub fn serialize_into<W: Write>(&self, mut writer: W) -> Result<()> {
524 writer.write_u32::<byteorder::LittleEndian>(self.inner.len() as u32)?;
525 for (fragment, set) in &self.inner {
526 writer.write_u32::<byteorder::LittleEndian>(*fragment)?;
527 if let RowIdSelection::Partial(set) = set {
528 writer.write_u32::<byteorder::LittleEndian>(set.serialized_size() as u32)?;
529 set.serialize_into(&mut writer)?;
530 } else {
531 writer.write_u32::<byteorder::LittleEndian>(0)?;
532 }
533 }
534 Ok(())
535 }
536
537 pub fn deserialize_from<R: Read>(mut reader: R) -> Result<Self> {
539 let num_entries = reader.read_u32::<byteorder::LittleEndian>()?;
540 let mut inner = BTreeMap::new();
541 for _ in 0..num_entries {
542 let fragment = reader.read_u32::<byteorder::LittleEndian>()?;
543 let bitmap_size = reader.read_u32::<byteorder::LittleEndian>()?;
544 if bitmap_size == 0 {
545 inner.insert(fragment, RowIdSelection::Full);
546 } else {
547 let mut buffer = vec![0; bitmap_size as usize];
548 reader.read_exact(&mut buffer)?;
549 let set = RoaringBitmap::deserialize_from(&buffer[..])?;
550 inner.insert(fragment, RowIdSelection::Partial(set));
551 }
552 }
553 Ok(Self { inner })
554 }
555
556 pub fn union_all(maps: &[&Self]) -> Self {
557 let mut new_map = BTreeMap::new();
558
559 for map in maps {
560 for (fragment, selection) in &map.inner {
561 new_map
562 .entry(fragment)
563 .or_insert_with(|| Vec::with_capacity(maps.len()))
565 .push(selection);
566 }
567 }
568
569 let new_map = new_map
570 .into_iter()
571 .map(|(&fragment, selections)| (fragment, RowIdSelection::union_all(&selections)))
572 .collect();
573
574 Self { inner: new_map }
575 }
576
577 pub fn mask(&mut self, mask: &RowIdMask) {
582 if let Some(allow_list) = &mask.allow_list {
583 *self &= allow_list;
584 }
585 if let Some(block_list) = &mask.block_list {
586 *self -= block_list;
587 }
588 }
589
590 pub unsafe fn into_id_iter(self) -> impl Iterator<Item = u64> {
598 self.inner
599 .into_iter()
600 .flat_map(|(fragment, selection)| match selection {
601 RowIdSelection::Full => panic!("Size of full fragment is unknown"),
602 RowIdSelection::Partial(bitmap) => bitmap.into_iter().map(move |val| {
603 let fragment = fragment as u64;
604 let row_offset = val as u64;
605 (fragment << 32) | row_offset
606 }),
607 })
608 }
609}
610
611impl std::ops::BitOr<Self> for RowIdTreeMap {
612 type Output = Self;
613
614 fn bitor(mut self, rhs: Self) -> Self::Output {
615 self |= rhs;
616 self
617 }
618}
619
620impl std::ops::BitOrAssign<Self> for RowIdTreeMap {
621 fn bitor_assign(&mut self, rhs: Self) {
622 for (fragment, rhs_set) in &rhs.inner {
623 let lhs_set = self.inner.get_mut(fragment);
624 if let Some(lhs_set) = lhs_set {
625 match lhs_set {
626 RowIdSelection::Full => {
627 }
629 RowIdSelection::Partial(lhs_bitmap) => match rhs_set {
630 RowIdSelection::Full => {
631 *lhs_set = RowIdSelection::Full;
632 }
633 RowIdSelection::Partial(rhs_set) => {
634 *lhs_bitmap |= rhs_set;
635 }
636 },
637 }
638 } else {
639 self.inner.insert(*fragment, rhs_set.clone());
640 }
641 }
642 }
643}
644
645impl std::ops::BitAnd<Self> for RowIdTreeMap {
646 type Output = Self;
647
648 fn bitand(mut self, rhs: Self) -> Self::Output {
649 self &= &rhs;
650 self
651 }
652}
653
654impl std::ops::BitAndAssign<&Self> for RowIdTreeMap {
655 fn bitand_assign(&mut self, rhs: &Self) {
656 self.inner
658 .retain(|fragment, _| rhs.inner.contains_key(fragment));
659
660 for (fragment, mut lhs_set) in &mut self.inner {
662 match (&mut lhs_set, rhs.inner.get(fragment)) {
663 (_, None) => {} (_, Some(RowIdSelection::Full)) => {
665 }
667 (RowIdSelection::Partial(lhs_set), Some(RowIdSelection::Partial(rhs_set))) => {
668 *lhs_set &= rhs_set;
669 }
670 (RowIdSelection::Full, Some(RowIdSelection::Partial(rhs_set))) => {
671 *lhs_set = RowIdSelection::Partial(rhs_set.clone());
672 }
673 }
674 }
675 self.inner.retain(|_, set| match set {
677 RowIdSelection::Partial(set) => !set.is_empty(),
678 RowIdSelection::Full => true,
679 });
680 }
681}
682
683impl std::ops::SubAssign<&Self> for RowIdTreeMap {
684 fn sub_assign(&mut self, rhs: &Self) {
685 for (fragment, rhs_set) in &rhs.inner {
686 match self.inner.get_mut(fragment) {
687 None => {}
688 Some(RowIdSelection::Full) => {
689 match rhs_set {
691 RowIdSelection::Full => {
692 self.inner.remove(fragment);
693 }
694 RowIdSelection::Partial(rhs_set) => {
695 let mut set = RoaringBitmap::full();
697 set -= rhs_set;
698 self.inner.insert(*fragment, RowIdSelection::Partial(set));
699 }
700 }
701 }
702 Some(RowIdSelection::Partial(lhs_set)) => match rhs_set {
703 RowIdSelection::Full => {
704 self.inner.remove(fragment);
705 }
706 RowIdSelection::Partial(rhs_set) => {
707 *lhs_set -= rhs_set;
708 if lhs_set.is_empty() {
709 self.inner.remove(fragment);
710 }
711 }
712 },
713 }
714 }
715 }
716}
717
718impl FromIterator<u64> for RowIdTreeMap {
719 fn from_iter<T: IntoIterator<Item = u64>>(iter: T) -> Self {
720 let mut inner = BTreeMap::new();
721 for row_id in iter {
722 let upper = (row_id >> 32) as u32;
723 let lower = row_id as u32;
724 match inner.get_mut(&upper) {
725 None => {
726 let mut set = RoaringBitmap::new();
727 set.insert(lower);
728 inner.insert(upper, RowIdSelection::Partial(set));
729 }
730 Some(RowIdSelection::Full) => {
731 }
733 Some(RowIdSelection::Partial(set)) => {
734 set.insert(lower);
735 }
736 }
737 }
738 Self { inner }
739 }
740}
741
742impl<'a> FromIterator<&'a u64> for RowIdTreeMap {
743 fn from_iter<T: IntoIterator<Item = &'a u64>>(iter: T) -> Self {
744 Self::from_iter(iter.into_iter().copied())
745 }
746}
747
748impl From<Range<u64>> for RowIdTreeMap {
749 fn from(range: Range<u64>) -> Self {
750 let mut map = Self::default();
751 map.insert_range(range);
752 map
753 }
754}
755
756impl From<RoaringTreemap> for RowIdTreeMap {
757 fn from(roaring: RoaringTreemap) -> Self {
758 let mut inner = BTreeMap::new();
759 for (fragment, set) in roaring.bitmaps() {
760 inner.insert(fragment, RowIdSelection::Partial(set.clone()));
761 }
762 Self { inner }
763 }
764}
765
766impl Extend<u64> for RowIdTreeMap {
767 fn extend<T: IntoIterator<Item = u64>>(&mut self, iter: T) {
768 for row_id in iter {
769 let upper = (row_id >> 32) as u32;
770 let lower = row_id as u32;
771 match self.inner.get_mut(&upper) {
772 None => {
773 let mut set = RoaringBitmap::new();
774 set.insert(lower);
775 self.inner.insert(upper, RowIdSelection::Partial(set));
776 }
777 Some(RowIdSelection::Full) => {
778 }
780 Some(RowIdSelection::Partial(set)) => {
781 set.insert(lower);
782 }
783 }
784 }
785 }
786}
787
788impl<'a> Extend<&'a u64> for RowIdTreeMap {
789 fn extend<T: IntoIterator<Item = &'a u64>>(&mut self, iter: T) {
790 self.extend(iter.into_iter().copied())
791 }
792}
793
794impl Extend<Self> for RowIdTreeMap {
796 fn extend<T: IntoIterator<Item = Self>>(&mut self, iter: T) {
797 for other in iter {
798 for (fragment, set) in other.inner {
799 match self.inner.get_mut(&fragment) {
800 None => {
801 self.inner.insert(fragment, set);
802 }
803 Some(RowIdSelection::Full) => {
804 }
806 Some(RowIdSelection::Partial(lhs_set)) => match set {
807 RowIdSelection::Full => {
808 self.inner.insert(fragment, RowIdSelection::Full);
809 }
810 RowIdSelection::Partial(rhs_set) => {
811 *lhs_set |= rhs_set;
812 }
813 },
814 }
815 }
816 }
817 }
818}
819
#[cfg(test)]
mod tests {
    use super::*;
    use proptest::prop_assert_eq;

    /// Builds a map in which every fragment of `full_fragments` is fully
    /// selected and every id of `rows` is then added individually.
    fn build_map(full_fragments: &[u32], rows: &[u64]) -> RowIdTreeMap {
        let mut map = RowIdTreeMap::default();
        for &fragment in full_fragments {
            map.insert_fragment(fragment);
        }
        map.extend(rows.iter().copied());
        map
    }

    #[test]
    fn test_ops() {
        let everything = RowIdMask::default();
        assert!(everything.selected(1));
        assert!(everything.selected(5));

        let blocked = everything.also_block(RowIdTreeMap::from_iter(&[0, 5, 15]));
        assert!(blocked.selected(1));
        assert!(!blocked.selected(5));

        let allowed = RowIdMask::from_allowed(RowIdTreeMap::from_iter(&[0, 2, 5]));
        assert!(!allowed.selected(1));
        assert!(allowed.selected(5));

        let both = blocked & allowed;
        assert!(both.selected(2));
        assert!(!both.selected(0));
        assert!(!both.selected(5));

        let extra = RowIdMask::from_allowed(RowIdTreeMap::from_iter(&[3]));
        let either = both | extra;
        assert!(either.selected(2));
        assert!(either.selected(3));
        assert!(!either.selected(0));
        assert!(!either.selected(5));

        let blocked = RowIdMask::from_block(RowIdTreeMap::from_iter(&[0]));
        let allowed = RowIdMask::from_allowed(RowIdTreeMap::from_iter(&[3]));
        let either = blocked | allowed;
        assert!(either.selected(1));
    }

    #[test]
    fn test_map_insert_range() {
        let ranges = &[
            (0..10),
            (40..500),
            ((u32::MAX as u64 - 10)..(u32::MAX as u64 + 20)),
        ];

        for range in ranges {
            let mut map = RowIdTreeMap::default();

            // First insertion adds every value of the range.
            let inserted = map.insert_range(range.clone());
            assert_eq!(inserted, range.end - range.start);

            // Inserting the same range again adds nothing.
            let inserted = map.insert_range(range.clone());
            assert_eq!(inserted, 0);

            // A range shifted by five only adds the five new values.
            let shifted = range.start + 5..range.end + 5;
            let inserted = map.insert_range(shifted.clone());
            assert_eq!(inserted, 5);
        }

        let mut map = RowIdTreeMap::default();
        let inserted = map.insert_range(..10);
        assert_eq!(inserted, 10);
        assert!(map.contains(0));

        let inserted = map.insert_range(20..=24);
        assert_eq!(inserted, 5);

        // Once the fragment is fully selected, ranges inside it add nothing.
        map.insert_fragment(0);
        let inserted = map.insert_range(100..200);
        assert_eq!(inserted, 0);
    }

    #[test]
    fn test_map_remove() {
        let mut map = RowIdTreeMap::default();

        assert!(!map.remove(20));

        map.insert(20);
        assert!(map.contains(20));
        assert!(map.remove(20));
        assert!(!map.contains(20));

        map.insert_range(10..=20);
        assert!(map.contains(15));
        assert!(map.remove(15));
        assert!(!map.contains(15));
    }

    proptest::proptest! {
        #[test]
        fn test_map_serialization_roundtrip(
            values in proptest::collection::vec(
                (0..u32::MAX, proptest::option::of(proptest::collection::vec(0..u32::MAX, 0..1000))),
                0..10
            )
        ) {
            let mut map = RowIdTreeMap::default();
            for (fragment, rows) in values {
                match rows {
                    Some(rows) => map.insert_bitmap(fragment, RoaringBitmap::from_iter(rows)),
                    None => map.insert_fragment(fragment),
                }
            }

            let mut bytes = Vec::new();
            map.serialize_into(&mut bytes).unwrap();
            let roundtripped = RowIdTreeMap::deserialize_from(bytes.as_slice()).unwrap();
            prop_assert_eq!(map, roundtripped);
        }

        #[test]
        fn test_map_intersect(
            left_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            left_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
            right_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            right_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
        ) {
            let left = build_map(&left_full_fragments, &left_rows);
            let right = build_map(&right_full_fragments, &right_rows);

            // Fragments that are full on both sides stay full.
            let shared_fragments: Vec<u32> = left_full_fragments
                .iter()
                .copied()
                .filter(|fragment| right_full_fragments.contains(fragment))
                .collect();
            let mut expected = build_map(&shared_fragments, &[]);

            // Individual rows survive when the other side has the row itself
            // or the whole fragment.
            let left_in_right = left_rows.iter().filter(|row| {
                right_rows.contains(row)
                    || right_full_fragments.contains(&((*row >> 32) as u32))
            });
            expected.extend(left_in_right);
            let right_in_left = right_rows.iter().filter(|row| {
                left_rows.contains(row)
                    || left_full_fragments.contains(&((*row >> 32) as u32))
            });
            expected.extend(right_in_left);

            let actual = left & right;
            prop_assert_eq!(expected, actual);
        }

        #[test]
        fn test_map_union(
            left_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            left_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
            right_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            right_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
        ) {
            let left = build_map(&left_full_fragments, &left_rows);
            let right = build_map(&right_full_fragments, &right_rows);

            // The expected union holds every full fragment and every row of both sides.
            let all_fragments =
                [left_full_fragments.as_slice(), right_full_fragments.as_slice()].concat();
            let all_rows = [left_rows.as_slice(), right_rows.as_slice()].concat();
            let expected = build_map(&all_fragments, &all_rows);

            let actual = left | right;
            for (fragment, actual_selection) in &actual.inner {
                proptest::prop_assert!(expected.inner.contains_key(fragment));
                let expected_selection = expected.inner.get(fragment).unwrap();
                prop_assert_eq!(
                    actual_selection,
                    expected_selection,
                    "error on key {}",
                    fragment
                );
            }
            prop_assert_eq!(expected, actual);
        }

        #[test]
        fn test_map_subassign_rows(
            left_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            left_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
            right_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
        ) {
            let mut left = build_map(&left_full_fragments, &left_rows);
            let right = build_map(&[], &right_rows);

            // Removing the rows one at a time must match the bulk subtraction.
            let mut expected = left.clone();
            for row in right_rows {
                expected.remove(row);
            }

            left -= &right;
            prop_assert_eq!(expected, left);
        }

        #[test]
        fn test_map_subassign_frags(
            left_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            right_full_fragments in proptest::collection::vec(0..u32::MAX, 0..10),
            left_rows in proptest::collection::vec(0..u64::MAX, 0..1000),
        ) {
            let mut left = build_map(&left_full_fragments, &left_rows);
            let right = build_map(&right_full_fragments, &[]);

            // Subtracting a full fragment removes that fragment entirely.
            let mut expected = left.clone();
            for fragment in right_full_fragments {
                expected.inner.remove(&fragment);
            }

            left -= &right;
            prop_assert_eq!(expected, left);
        }
    }
}