1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
use crate::algo::graph::eulerian_path::*;
use crate::algo::graph::UnweightedAdjacencyList;
pub fn reconstruct_string(lmers: &[&[u8]]) -> Result<Vec<u8>, EulerianPathError> {
let l = lmers[0].len();
let mut g = UnweightedAdjacencyList::with_size(lmers.len());
let suffixes: Vec<_> = lmers.iter().map(|lmer| &lmer[1..]).collect();
let prefixes: Vec<_> = lmers.iter().map(|lmer| &lmer[..l - 1]).collect();
for (i, suffix) in suffixes.iter().enumerate() {
for (j, prefix) in prefixes.iter().enumerate() {
if suffix == prefix {
g.add_directed_edge(i, j);
}
}
}
let path = g.eulerian_path()?;
let mut res = lmers[path[0]].to_owned();
for &i in &path[1..] {
res.push(lmers[i][l - 1]);
}
Ok(res)
}
#[cfg(test)]
mod tests {
use super::*;
use rand::seq::SliceRandom;
use rand::thread_rng;
fn _test(s: &[u8]) {
let mut lmers: Vec<_> = s.windows(5).collect();
let mut rng = thread_rng();
lmers.shuffle(&mut rng);
let reconstructed = reconstruct_string(&lmers).unwrap();
assert_eq!(&reconstructed, &s);
}
#[test]
fn test_reconstruct_string_from_lmers() {
_test(b"The quick brown fox jumps over the lazy dog");
_test(b"ATGGCGTGCA")
}
}