parallel_processor/buckets/
concurrent.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
use crate::buckets::bucket_writer::BucketItemSerializer;
use crate::buckets::{LockFreeBucket, MultiThreadBuckets};
use crate::memory_data_size::MemoryDataSize;
use crate::utils::panic_on_drop::PanicOnDrop;
use std::sync::Arc;

/// Set of byte buffers used to stage serialized data, one buffer per bucket.
///
/// A value of this type is passed to [`BucketsThreadDispatcher::new`] and is
/// handed back to the caller by [`BucketsThreadDispatcher::finalize`].
pub struct BucketsThreadBuffer {
    /// Staging buffers, indexed by bucket number.
    buffers: Vec<Vec<u8>>,
}

impl BucketsThreadBuffer {
    /// A buffer set that contains no per-bucket buffers at all.
    pub const EMPTY: Self = Self {
        buffers: Vec::new(),
    };

    /// Creates `buckets_count` empty byte buffers, each allocated up front
    /// with room for `max_buffer_size` bytes.
    pub fn new(max_buffer_size: MemoryDataSize, buckets_count: usize) -> Self {
        let bytes_per_bucket = max_buffer_size.as_bytes();
        let buffers = (0..buckets_count)
            .map(|_| Vec::with_capacity(bytes_per_bucket))
            .collect();

        Self { buffers }
    }
}

/// Dispatcher that stages serialized items in per-bucket byte buffers and
/// forwards a buffer's contents to the shared [`MultiThreadBuckets`] when the
/// next item would not fit in it.
///
/// The dispatcher is meant to be consumed with `finalize`, which flushes the
/// remaining data and disengages the `drop_panic` guard.
pub struct BucketsThreadDispatcher<B: LockFreeBucket, S: BucketItemSerializer> {
    /// Shared bucket set that receives the flushed bytes via `add_data`.
    mtb: Arc<MultiThreadBuckets<B>>,
    /// Staging buffers, one per bucket of `mtb` (checked in `new`).
    thread_data: BucketsThreadBuffer,
    /// Guard built with the message "buckets thread dispatcher not finalized".
    /// NOTE(review): presumably panics if dropped while still engaged —
    /// confirm against `PanicOnDrop`.
    drop_panic: PanicOnDrop,
    /// One serializer per bucket; a bucket's serializer is reset whenever that
    /// bucket's buffer is flushed from `add_element_extended`.
    serializers: Vec<S>,
}

impl<B: LockFreeBucket, S: BucketItemSerializer> BucketsThreadDispatcher<B, S> {
    /// Builds a dispatcher that writes into `mtb`, staging data in `thread_data`.
    ///
    /// One serializer is created for every bucket of `mtb`.
    ///
    /// # Panics
    ///
    /// Panics if `thread_data` does not hold exactly one buffer per bucket.
    pub fn new(mtb: &Arc<MultiThreadBuckets<B>>, thread_data: BucketsThreadBuffer) -> Self {
        let buckets_count = mtb.buckets.len();
        assert_eq!(buckets_count, thread_data.buffers.len());

        let mtb = Arc::clone(mtb);
        let drop_panic = PanicOnDrop::new("buckets thread dispatcher not finalized");
        let serializers = (0..buckets_count).map(|_| S::new()).collect();

        Self {
            mtb,
            thread_data,
            drop_panic,
            serializers,
        }
    }

    /// Serializes `element` into the staging buffer of `bucket`.
    ///
    /// If the buffer already holds data and the element would push it past its
    /// current capacity, the staged bytes are first sent to the shared buckets,
    /// the buffer is cleared and the bucket's serializer is reset. An element
    /// written into an empty buffer is never preceded by a flush, whatever its
    /// size.
    ///
    /// # Panics
    ///
    /// Panics if `bucket` is not a valid bucket index.
    #[inline]
    pub fn add_element_extended(
        &mut self,
        bucket: u16,
        extra_data: &S::ExtraData,
        extra_data_buffer: &S::ExtraDataBuffer,
        element: &S::InputElementType<'_>,
    ) {
        let slot = usize::from(bucket);
        let staged = &mut self.thread_data.buffers[slot];
        let serializer = &mut self.serializers[slot];

        // The size is queried before anything else, exactly once per element.
        let required = serializer.get_size(element, extra_data) + staged.len();
        if required > staged.capacity() && !staged.is_empty() {
            self.mtb.add_data(bucket, staged.as_slice());
            staged.clear();
            serializer.reset();
        }

        serializer.write_to(element, staged, extra_data, extra_data_buffer);
    }

    /// Same as [`Self::add_element_extended`] for serializers whose extra data
    /// buffer type is `()`.
    #[inline]
    pub fn add_element(
        &mut self,
        bucket: u16,
        extra_data: &S::ExtraData,
        element: &S::InputElementType<'_>,
    ) where
        S: BucketItemSerializer<ExtraDataBuffer = ()>,
    {
        let no_extra_buffer = ();
        self.add_element_extended(bucket, extra_data, &no_extra_buffer, element);
    }

    /// Sends every non-empty staging buffer to the shared buckets, clears it,
    /// disengages the drop guard and returns the buffers together with the
    /// shared bucket handle.
    pub fn finalize(mut self) -> (BucketsThreadBuffer, Arc<MultiThreadBuckets<B>>) {
        let pending = self
            .thread_data
            .buffers
            .iter_mut()
            .enumerate()
            .filter(|(_, staged)| !staged.is_empty());

        for (index, staged) in pending {
            self.mtb.add_data(index as u16, staged.as_slice());
            staged.clear();
        }

        self.drop_panic.disengage();
        (self.thread_data, self.mtb)
    }
}