use std::fmt::Display;
use crate::block::{BlockStructure, OperatorKind, OperatorStructure};
use crate::operator::sink::{Sink, StreamOutputRef};
use crate::operator::{ExchangeData, Operator, StreamElement};
use crate::scheduler::ExecutionMetadata;
#[derive(Debug)]
pub struct CollectVecSink<Out: ExchangeData, PreviousOperators>
where
PreviousOperators: Operator<Out = Out>,
{
prev: PreviousOperators,
result: Option<Vec<Out>>,
output: StreamOutputRef<Vec<Out>>,
}
impl<Out: ExchangeData, PreviousOperators> CollectVecSink<Out, PreviousOperators>
where
PreviousOperators: Operator<Out = Out>,
{
pub(crate) fn new(prev: PreviousOperators, output: StreamOutputRef<Vec<Out>>) -> Self {
Self {
prev,
result: Some(Vec::new()),
output,
}
}
}
impl<Out: ExchangeData, PreviousOperators> Display for CollectVecSink<Out, PreviousOperators>
where
PreviousOperators: Operator<Out = Out>,
{
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
write!(f, "{} -> CollectVecSink", self.prev)
}
}
impl<Out: ExchangeData, PreviousOperators> Operator for CollectVecSink<Out, PreviousOperators>
where
PreviousOperators: Operator<Out = Out>,
{
type Out = ();
fn setup(&mut self, metadata: &mut ExecutionMetadata) {
self.prev.setup(metadata);
}
fn next(&mut self) -> StreamElement<()> {
match self.prev.next() {
StreamElement::Item(t) | StreamElement::Timestamped(t, _) => {
if let Some(result) = self.result.as_mut() {
result.push(t);
}
StreamElement::Item(())
}
StreamElement::Watermark(w) => StreamElement::Watermark(w),
StreamElement::Terminate => {
if let Some(result) = self.result.take() {
*self.output.lock().unwrap() = Some(result);
}
StreamElement::Terminate
}
StreamElement::FlushBatch => StreamElement::FlushBatch,
StreamElement::FlushAndRestart => StreamElement::FlushAndRestart,
}
}
fn structure(&self) -> BlockStructure {
let mut operator = OperatorStructure::new::<Out, _>("CollectVecSink");
operator.kind = OperatorKind::Sink;
self.prev.structure().add_operator(operator)
}
}
impl<Out: ExchangeData, PreviousOperators> Sink for CollectVecSink<Out, PreviousOperators> where
PreviousOperators: Operator<Out = Out>
{
}
impl<Out: ExchangeData, PreviousOperators> Clone for CollectVecSink<Out, PreviousOperators>
where
PreviousOperators: Operator<Out = Out>,
{
fn clone(&self) -> Self {
panic!("CollectVecSink cannot be cloned, replication should be 1");
}
}
#[cfg(test)]
mod tests {
use itertools::Itertools;
use crate::config::RuntimeConfig;
use crate::environment::StreamContext;
use crate::operator::source;
#[test]
fn collect_vec() {
let env = StreamContext::new(RuntimeConfig::local(4));
let source = source::IteratorSource::new(0..10u8);
let res = env.stream(source).collect_vec();
env.execute_blocking();
assert_eq!(res.get().unwrap(), (0..10).collect_vec());
}
}