1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#[cfg(test)]
#[path = "../../../tests/unit/algorithms/clustering/dbscan_test.rs"]
mod dbscan_test;
use hashbrown::{HashMap, HashSet};
use std::hash::Hash;
/// A single cluster: borrowed references to the input points that were grouped together.
pub type Cluster<'a, T> = Vec<&'a T>;
/// A boxed neighbourhood query: given a point and an `f64` threshold, returns an iterator over
/// borrowed points. `create_clusters` passes its `epsilon` argument as the threshold and counts
/// the yielded items against `min_points`.
pub type NeighborhoodFn<'a, T> = Box<dyn Fn(&'a T, f64) -> Box<dyn Iterator<Item = &'a T> + 'a> + 'a>;
/// Groups `points` into density-based clusters (DBSCAN).
///
/// A point is a *core* point when `neighborhood_fn` yields at least `min_points` items for it.
/// Every unvisited core point seeds a new cluster, which is then grown by visiting the seed's
/// neighbours and, transitively, the neighbours of every core point reached along the way.
/// Points previously marked as noise are absorbed into a cluster once reached from it.
///
/// # Arguments
///
/// * `points` - the points to cluster; returned clusters borrow from this slice.
/// * `epsilon` - threshold forwarded unchanged to `neighborhood_fn`.
/// * `min_points` - minimum number of items `neighborhood_fn` must yield for a point to be core.
/// * `neighborhood_fn` - returns the neighbourhood of a point for the given threshold.
///
/// # Returns
///
/// Clusters in the order their seed points appear in `points`. Each cluster starts with its seed,
/// followed by members in the order they were reached. Points that are never reached from a core
/// point do not appear in any cluster.
pub fn create_clusters<'a, T>(
    points: &'a [T],
    epsilon: f64,
    min_points: usize,
    neighborhood_fn: &NeighborhoodFn<'a, T>,
) -> Vec<Cluster<'a, T>>
where
    T: Hash + Eq,
{
    let mut point_types = HashMap::<&T, PointType>::new();
    let mut clusters = Vec::new();

    for point in points {
        // Already classified while processing an earlier seed.
        if point_types.contains_key(point) {
            continue;
        }

        let mut neighbors = neighborhood_fn(point, epsilon).collect::<Vec<_>>();
        if neighbors.len() < min_points {
            // Provisional: may still be absorbed by a cluster discovered later.
            point_types.insert(point, PointType::Noise);
            continue;
        }

        // Every point ever queued in `neighbors` for this cluster. Maintained incrementally so
        // the work list is never re-hashed from scratch when a core point is expanded.
        let mut seen = neighbors.iter().copied().collect::<HashSet<_>>();

        let mut cluster = vec![point];
        point_types.insert(point, PointType::Clustered);

        // `neighbors` doubles as a work list which grows while it is being walked, hence the
        // explicit cursor rather than an iterator.
        let mut cursor = 0;
        while let Some(&candidate) = neighbors.get(cursor) {
            cursor += 1;

            match point_types.get(candidate) {
                // Belongs to this or an earlier cluster: nothing to do.
                Some(PointType::Clustered) => continue,
                // Former noise becomes a border point; it is known not to be core, so it is
                // not expanded.
                Some(PointType::Noise) => {}
                // First visit: expand the frontier if the candidate is itself a core point.
                None => {
                    let reachable = neighborhood_fn(candidate, epsilon).collect::<Vec<_>>();
                    if reachable.len() >= min_points {
                        // `insert` returns `true` only for points not queued before.
                        neighbors.extend(reachable.into_iter().filter(|neighbor| seen.insert(*neighbor)));
                    }
                }
            }

            point_types.insert(candidate, PointType::Clustered);
            cluster.push(candidate);
        }

        clusters.push(cluster);
    }

    clusters
}
/// Classification recorded for a point once `create_clusters` has visited it.
#[derive(Clone, Eq, PartialEq)]
enum PointType {
/// The point had fewer than `min_points` neighbours when it was visited as a potential seed.
/// It is re-labelled as `Clustered` if it is later reached while a cluster is being grown.
Noise,
/// The point has been assigned to a cluster.
Clustered,
}