1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
extern crate rand;
use rand::Rng;
#[derive(Clone, Debug, PartialEq)]
struct AliasEntry{
val: usize,
alias: usize,
prob_of_val: f64,
}
impl AliasEntry{
pub fn new(val: usize, alias: usize, prob_of_val: f64) -> Self {
return AliasEntry{val, alias, prob_of_val}
}
}
#[derive(Clone, Debug, PartialEq)]
pub struct LoadedDiceSampler<R: Rng> {
entries: Vec<AliasEntry>,
rng: R,
}
impl<R: Rng> LoadedDiceSampler<R> {
pub fn new(probs: Vec<f64>, rng: R) -> Self{
let entries = LoadedDiceSampler::<R>::construct_table(probs);
Self{entries, rng}
}
pub fn sample(&mut self) -> usize{
let index = self.rng.gen_range(0,self.entries.len());
let coin = self.rng.gen::<f64>();
let entry = &self.entries[index];
if coin > entry.prob_of_val {
return entry.alias;
}
return entry.val;
}
fn construct_table(probs: Vec<f64>) -> Vec<AliasEntry>{
let mut res = vec!();
let n = probs.len() as f64;
let inv_n = 1.0 / probs.len() as f64;
let mut tmp = {probs.clone().into_iter().enumerate().collect::<Vec<_>>()};
while tmp.len() > 1{
tmp.sort_by(|&(_,p1), &(_,p2)| p2.partial_cmp(&p1).unwrap());
let (min_i, min_p) = tmp.pop().unwrap();
let &mut (ref max_i, ref mut max_p) = tmp.get_mut(0).unwrap();
res.push(AliasEntry::new(min_i, *max_i, min_p*n));
let used_prob = inv_n - min_p;
*max_p -= used_prob;
}
let (last_i, last_p) = tmp.pop().unwrap();
assert!(0.999 < last_p*n && last_p*n < 1.001);
res.push(AliasEntry::new(last_i, std::usize::MAX, 1.0));
return res;
}
}
#[cfg(test)]
mod tests {
use ::LoadedDiceSampler;
use rand::{thread_rng, Rng};
#[test]
fn it_works() {
let len = thread_rng().gen_range(3,10);
let base = (0..len).map(|_| thread_rng().gen::<f64>()).collect::<Vec<_>>();
let sum : f64 = base.iter().sum();
let base = base.iter().map(|v| v / sum).collect::<Vec<_>>();
let mut s = LoadedDiceSampler::new(base.clone(), thread_rng());
let mut res: Vec<usize> = vec!(0; len);
let iter: usize = 1000000;
for i in (0..iter) {
let i = s.sample();
res[i] += 1;
}
let res_p = res.iter().map(|&f| f as f64 / iter as f64).collect::<Vec<_>>();
println!("{:?}", res_p);
for (i,c) in res.iter().enumerate(){
let p_i = *c as f64 / iter as f64;
assert!(base[i] *0.99 < p_i && base[i] * 1.01 > p_i);
}
}
}