1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
use rand::random;
/// Streaming sampler that keeps a bounded set of items from a sequence
/// offered one element at a time.
///
/// The trait itself only fixes the signatures; the notes below describe how
/// the `Reservoir` implementation in this file interprets them.
pub trait ReservoirSampler {
    /// Type of the elements being sampled.
    type Item;

    /// Offers one item to the sampler.
    ///
    /// Returns a `(usize, usize, Option<Item>)` triple. For `Reservoir` this
    /// is the 1-based random draw, the number of items offered so far
    /// (including this one), and the item that was evicted, if any.
    fn sample(&mut self, it: Self::Item) -> (usize, usize, Option<Self::Item>);

    /// Borrows the current sample slots; `None` marks a slot without an item.
    fn samples(&self) -> &[Option<Self::Item>];

    /// Consumes the sampler and hands back its slots as an owned vector.
    fn lock(self) -> Vec<Option<Self::Item>>;
}
/// Fixed-size pool of sample slots together with a running count of how many
/// items have been offered to it.
pub struct Reservoir<T> {
    /// Number of items offered to the reservoir so far.
    total: usize,
    /// The sample slots; `None` marks a slot that currently holds no item.
    pool: Vec<Option<T>>,
}

impl<T> Reservoir<T> {
    /// Creates a reservoir with `n` sample slots, all initially empty.
    ///
    /// The slots are produced one by one instead of cloning a template value,
    /// so `T` does not have to implement `Clone`. `n == 0` yields a reservoir
    /// with no slots.
    pub fn with_capacity(n: usize) -> Self {
        Self {
            total: 0,
            pool: (0..n).map(|_| None).collect(),
        }
    }
}
impl<T> ReservoirSampler for Reservoir<T> {
    type Item = T;

    /// Offers `it` to the reservoir.
    ///
    /// A 1-based position `r` is drawn from `1..=total` (after `total` has
    /// been incremented for this item):
    ///
    /// * While the pool is still filling (`total <= slots`), `it` is placed in
    ///   slot `r` and whatever occupied that slot moves to the first unused
    ///   slot, so nothing is lost and the filled prefix stays shuffled.
    /// * Once the pool is full, `it` replaces the occupant of slot `r` when
    ///   `r` falls inside the pool; otherwise `it` is dropped.
    ///
    /// Returns `(r, total, replaced)`, where `replaced` is the item evicted
    /// from a full pool, or `None` if nothing was evicted.
    fn sample(&mut self, it: Self::Item) -> (usize, usize, Option<Self::Item>) {
        // The number of usable slots is `len()`. `capacity()` is only
        // guaranteed to be *at least* that large, so using it as an index
        // bound could reach past the end of the pool and panic.
        let slots = self.pool.len();
        self.total += 1;
        let r = random::<usize>() % self.total + 1;

        let mut replaced = None;
        if r <= slots {
            // Put the new item in slot `r`, keeping the previous occupant.
            replaced = self.pool[r - 1].replace(it);
        }
        if self.total <= slots && r < self.total {
            // Fill phase: relocate the displaced item to the next free slot
            // instead of evicting it.
            self.pool[self.total - 1] = replaced.take();
        }
        (r, self.total, replaced)
    }

    /// Borrows every slot of the pool, including the ones still empty.
    fn samples(&self) -> &[Option<Self::Item>] {
        &self.pool
    }

    /// Consumes the reservoir and returns its slots.
    ///
    /// If fewer items than slots were offered, the remaining empty slots are
    /// shuffled in using the same random-position step as the fill phase of
    /// `sample`, so the `None` entries are spread across the result instead
    /// of all sitting at the tail.
    fn lock(mut self) -> Vec<Option<Self::Item>> {
        let slots = self.pool.len();
        // `idx` is the 0-based index of the next untouched (still `None`)
        // slot; `pick` is drawn from `0..=idx`, so both are always in bounds.
        for idx in self.total..slots {
            let pick = random::<usize>() % (idx + 1);
            // Slot `idx` is empty, so swapping moves the picked occupant
            // there and leaves the picked slot empty.
            self.pool.swap(idx, pick);
        }
        self.pool
    }
}
#[cfg(test)]
mod tests {
    use super::*;

    /// Offers fewer items than the reservoir has slots and checks that every
    /// item is retained, both while sampling and after `lock`.
    ///
    /// The positions are random, so only order-independent properties are
    /// asserted.
    #[test]
    fn fill_phase_keeps_every_item() {
        let list = [1, 2, 3, 4, 5, 6, 7, 8, 9, 10];
        let mut reservoir = Reservoir::<i32>::with_capacity(15);

        for (seen, &it) in list.iter().enumerate() {
            let (r, total, replaced) = reservoir.sample(it);
            println!("current: {:?}", reservoir.samples());

            assert_eq!(total, seen + 1);
            assert!((1..=total).contains(&r));
            // Nothing may be evicted while there are still free slots.
            assert_eq!(replaced, None);
            assert_eq!(reservoir.samples().len(), 15);
            assert_eq!(reservoir.samples().iter().flatten().count(), total);
        }

        let mut kept: Vec<i32> = reservoir.samples().iter().flatten().copied().collect();
        kept.sort_unstable();
        assert_eq!(kept, list);

        let locked = reservoir.lock();
        println!("result: {:?}", locked);
        assert_eq!(locked.len(), 15);

        let mut kept: Vec<i32> = locked.into_iter().flatten().collect();
        kept.sort_unstable();
        assert_eq!(kept, list);
    }
}