1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
pub mod boolean;
use crate::utils::TrustMyLength;
use crate::vec::AlignedVec;
use arrow::buffer::MutableBuffer;
use arrow::datatypes::{ArrowNativeType, ArrowPrimitiveType};
use arrow::util::bit_util;
use std::slice::Iter;
/// Marker for iterators whose reported length may be relied upon by unsafe code.
///
/// Consumers in this module (for example `PushUnchecked::extend_trusted_len`)
/// read the upper bound of [`Iterator::size_hint`] and then write that many
/// items through raw pointers without any per-item capacity check.
///
/// # Safety
/// An implementor must make sure that, whenever `size_hint` returns an upper
/// bound of `Some(n)`, the iterator yields exactly `n` items.
pub unsafe trait TrustedLen: Iterator {}

// Sources that know their own length (or, for the `Repeat*` family, that
// never report an upper bound at all).
unsafe impl<T> TrustedLen for Iter<'_, T> {}
unsafe impl<T> TrustedLen for std::slice::Windows<'_, T> {}
unsafe impl<T> TrustedLen for std::vec::IntoIter<T> {}
unsafe impl<T> TrustedLen for std::iter::Once<T> {}
unsafe impl<A> TrustedLen for std::iter::Repeat<A> where A: Clone {}
unsafe impl<A, F> TrustedLen for std::iter::RepeatWith<F> where F: FnMut() -> A {}

// Adapters around a single trusted iterator.
unsafe impl<I, F, B> TrustedLen for std::iter::Map<I, F>
where
    I: TrustedLen,
    F: FnMut(I::Item) -> B,
{
}
unsafe impl<'a, I, T> TrustedLen for std::iter::Copied<I>
where
    I: TrustedLen<Item = &'a T>,
    T: Copy + 'a,
{
}
unsafe impl<I: TrustedLen> TrustedLen for std::iter::Enumerate<I> {}
unsafe impl<I: TrustedLen> TrustedLen for std::iter::Take<I> {}
unsafe impl<I> TrustedLen for std::iter::Rev<I> where I: TrustedLen + DoubleEndedIterator {}

// Adapters that combine two trusted iterators.
unsafe impl<L, R> TrustedLen for std::iter::Zip<L, R>
where
    L: TrustedLen,
    R: TrustedLen,
{
}
unsafe impl<L, R> TrustedLen for std::iter::Chain<L, R>
where
    L: TrustedLen,
    R: TrustedLen<Item = L::Item>,
{
}
// `TrustedLen` for the crate's own length-asserting wrapper. The wrapper's
// definition is not visible here; presumably whoever builds it vouches for
// the reported length -- confirm against `crate::utils::TrustMyLength`.
unsafe impl<I, J> TrustedLen for TrustMyLength<I, J> where I: Iterator<Item = J> {}

// Every `Range<Idx>` that is itself an iterator.
unsafe impl<Idx> TrustedLen for std::ops::Range<Idx> where std::ops::Range<Idx>: Iterator {}

// Arrow array iterators. Note that only the `i64`-offset string iterator is
// covered.
unsafe impl<P> TrustedLen for arrow::array::PrimitiveIter<'_, P> where P: ArrowPrimitiveType {}
unsafe impl TrustedLen for arrow::array::GenericStringIter<'_, i64> {}
unsafe impl TrustedLen for arrow::array::BooleanIter<'_> {}
/// Appends the items of `iterator` to `values`, recording which of them were
/// `Some` in the `validity` bitmap.
///
/// Each `Some(v)` writes `v` into the next value slot and sets the validity
/// bit at the same logical index (counted from the start of `values`). Each
/// `None` writes `T::default()` into the slot and leaves the bit untouched.
/// The length of `values` grows by the iterator's reported upper bound.
///
/// # Safety
/// * `iterator` must yield exactly as many items as the upper bound of its
///   `size_hint`.
/// * This function does not reserve: `values` must already have capacity for
///   `values.len() + upper` elements.
/// * `validity` must already be large enough to address bit
///   `values.len() + upper - 1`. Bits for `None` slots are never cleared
///   here, so they must already hold the intended "null" value.
///
/// # Panics
/// Panics if the iterator reports no upper bound, or if the number of items
/// produced differs from that bound. The latter check only runs after all
/// writes have been performed.
#[inline]
pub unsafe fn trusted_len_unzip_extend<I, P, T>(
    iterator: I,
    values: &mut AlignedVec<T>,
    validity: &mut MutableBuffer,
) where
    T: ArrowNativeType,
    P: std::borrow::Borrow<Option<T>>,
    I: Iterator<Item = P>,
{
    let expected = iterator
        .size_hint()
        .1
        .expect("trusted_len_unzip requires an upper limit");
    let base_len = values.len();
    let validity_ptr = validity.as_mut_ptr();

    // First free value slot; `cursor` walks forward from here, one slot per item.
    let first = (values.as_mut_ptr() as *mut T).add(base_len);
    let mut cursor = first;

    for (idx, entry) in iterator.enumerate() {
        match entry.borrow() {
            Some(value) => {
                std::ptr::write(cursor, *value);
                bit_util::set_bit_raw(validity_ptr, base_len + idx);
            }
            // Null slots still get a defined value so the buffer is fully initialised.
            None => std::ptr::write(cursor, T::default()),
        }
        cursor = cursor.add(1);
    }

    assert_eq!(
        cursor.offset_from(first) as usize,
        expected,
        "Trusted iterator length was not accurately reported"
    );
    values.set_len(base_len + expected)
}
/// Capacity-unchecked append operations for growable buffers.
pub trait PushUnchecked<T> {
    /// Writes `value` into the slot just past the current length and then
    /// increases the length by one, without checking capacity.
    ///
    /// # Safety
    /// The caller must ensure there is spare capacity for one more element.
    unsafe fn push_unchecked(&mut self, value: T);

    /// Writes `value` into the slot just past the current length but leaves
    /// the length as it was.
    ///
    /// # Safety
    /// The caller must ensure there is spare capacity for one more element,
    /// and is responsible for fixing up the length afterwards.
    unsafe fn push_unchecked_no_len_set(&mut self, value: T);

    /// Appends every item of `iter`, relying on its `TrustedLen` guarantee to
    /// size the destination up front.
    fn extend_trusted_len<I>(&mut self, iter: I)
    where
        I: IntoIterator<Item = T> + TrustedLen;
}
impl<T> PushUnchecked<T> for Vec<T> {
    /// Writes `value` at index `len` and bumps the length by one, without
    /// checking or growing the capacity.
    ///
    /// # Safety
    /// The caller must guarantee `self.len() < self.capacity()`.
    #[inline]
    unsafe fn push_unchecked(&mut self, value: T) {
        let end = self.as_mut_ptr().add(self.len());
        std::ptr::write(end, value);
        self.set_len(self.len() + 1);
    }

    /// Writes `value` at index `len` but does NOT change the length, so
    /// repeated calls overwrite the same slot until the caller adjusts `len`.
    ///
    /// # Safety
    /// The caller must guarantee `self.len() < self.capacity()` and must
    /// update the length itself (e.g. via `set_len`) for the value to become
    /// part of the vector.
    #[inline]
    unsafe fn push_unchecked_no_len_set(&mut self, value: T) {
        let end = self.as_mut_ptr().add(self.len());
        std::ptr::write(end, value);
    }

    /// Appends all items of `iter`, reserving once from the iterator's
    /// reported upper bound and writing the items without per-item capacity
    /// checks.
    ///
    /// The new length is derived from the number of items actually written,
    /// so an iterator that stops early never exposes uninitialised slots.
    ///
    /// # Panics
    /// Panics if the iterator has no upper bound, or (after the items have
    /// been written) if the number of items produced differs from the
    /// reported upper bound.
    #[inline]
    fn extend_trusted_len<I: IntoIterator<Item = T> + TrustedLen>(&mut self, iter: I) {
        let iter = iter.into_iter();
        let upper = iter.size_hint().1.expect("must have an upper bound");
        self.reserve(upper);

        let old_len = self.len();
        // Counting (rather than pointer subtraction) also works for zero-sized `T`.
        let mut written = 0usize;
        // SAFETY: `reserve(upper)` guarantees room for `upper` items past
        // `old_len`, and `TrustedLen` promises the iterator yields exactly
        // `upper` items, so every write lands in allocated spare capacity.
        // The length is set to cover only slots that were really written.
        unsafe {
            let base = self.as_mut_ptr().add(old_len);
            for value in iter {
                std::ptr::write(base.add(written), value);
                written += 1;
            }
            self.set_len(old_len + written);
        }

        // Same contract check (and message) as `trusted_len_unzip_extend`.
        assert_eq!(
            written, upper,
            "Trusted iterator length was not accurately reported"
        );
    }
}