1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
use crate::Dataset;
use rand::{prelude::SliceRandom, rngs::StdRng, SeedableRng};
use std::sync::Arc;
pub struct ShuffledDataset<I> {
dataset: Arc<dyn Dataset<I>>,
indexes: Vec<usize>,
}
impl<I> ShuffledDataset<I> {
pub fn new(dataset: Arc<dyn Dataset<I>>, rng: &mut StdRng) -> Self {
let mut indexes = Vec::with_capacity(dataset.len());
for i in 0..dataset.len() {
indexes.push(i);
}
indexes.shuffle(rng);
Self { dataset, indexes }
}
pub fn with_seed(dataset: Arc<dyn Dataset<I>>, seed: u64) -> Self {
let mut rng = StdRng::seed_from_u64(seed);
Self::new(dataset, &mut rng)
}
}
impl<I> Dataset<I> for ShuffledDataset<I>
where
I: Clone,
{
fn get(&self, index: usize) -> Option<I> {
let index = match self.indexes.get(index) {
Some(index) => index,
None => return None,
};
self.dataset.get(*index)
}
fn len(&self) -> usize {
self.dataset.len()
}
}