1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
#[cfg(feature = "parallel")]
use rayon::{
Scope,
{self},
};
/// Describes how much parallelism is available when work is split into chunks.
// NOTE(review): `dead_code` is presumably allowed because some feature
// configurations never read `cpus` — confirm before removing.
#[derive(Clone, Copy)]
#[allow(dead_code)]
pub(crate) struct Worker {
    /// Number of CPUs (threads) that work is divided across.
    cpus: usize,
}
impl Worker {
#[cfg(not(feature = "parallel"))]
pub(crate) fn new() -> Worker {
Self { cpus: 1 }
}
#[cfg(feature = "parallel")]
pub(crate) fn new() -> Worker {
Self {
cpus: rayon::current_num_threads(),
}
}
#[allow(dead_code)]
pub(crate) fn log_num_cpus(&self) -> u32 {
log2_floor(self.cpus)
}
#[cfg(not(feature = "parallel"))]
pub(crate) fn scope<'a, F: 'a + Send + FnOnce(&SerialScope, usize) -> R, R: Send>(
&self,
elements: usize,
f: F,
) -> R {
f(&SerialScope {}, elements)
}
#[cfg(feature = "parallel")]
pub(crate) fn scope<'a, F: 'a + Send + FnOnce(&Scope<'a>, usize) -> R, R: Send>(&self, elements: usize, f: F) -> R {
let chunk_size = match elements < self.cpus {
true => 1,
false => elements / self.cpus,
};
rayon::scope(move |scope| f(scope, chunk_size))
}
}
/// Single-threaded stand-in for a parallel scope, compiled only when the
/// `parallel` feature is disabled.
#[cfg(not(feature = "parallel"))]
pub struct SerialScope {}

#[cfg(not(feature = "parallel"))]
impl SerialScope {
    /// Runs `body` immediately on the calling thread, passing this scope to it.
    ///
    /// Nothing is deferred: `body` has finished by the time `spawn` returns.
    pub fn spawn<Task>(&self, body: Task)
    where
        Task: FnOnce(&SerialScope),
    {
        body(self);
    }
}
/// Returns `floor(log2(num))`, i.e. the index of the highest set bit of `num`.
///
/// # Panics
///
/// Panics if `num` is zero, for which the logarithm is undefined.
pub(crate) fn log2_floor(num: usize) -> u32 {
    assert!(num > 0);
    // Counting leading zeros never shifts past the word width. Probing with
    // `1 << (pow + 1)` overflows once the top bit of `num` is set.
    usize::BITS - 1 - num.leading_zeros()
}
/// Checks `log2_floor` against hand-computed values for every input from 1
/// through 8.
#[test]
fn test_log2_floor() {
    // Entry `i` holds the expected result for input `i + 1`.
    let expected: [u32; 8] = [0, 1, 1, 2, 2, 2, 2, 3];
    for (offset, &want) in expected.iter().enumerate() {
        assert_eq!(log2_floor(offset + 1), want);
    }
}