1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
use timely::dataflow::scopes::child::Iterative;
use timely::dataflow::Scope;
use timely::order::TotalOrder;
use timely::progress::Timestamp;
use differential_dataflow::lattice::Lattice;
use differential_dataflow::operators::JoinCore;
use crate::binding::{AsBinding, Binding};
use crate::plan::{next_id, Dependencies, ImplContext, Implementable};
use crate::{Aid, Eid, Value, Var};
use crate::{CollectionRelation, Relation, ShutdownHandle, VariableMap};
/// A plan stage joining two source relations on the specified
/// variables.
#[derive(Hash, PartialEq, Eq, PartialOrd, Ord, Clone, Debug, Serialize, Deserialize)]
pub struct Join<P1: Implementable, P2: Implementable> {
/// Variables both sides are arranged by before being joined; they
/// come first in the variables of the resulting relation.
pub variables: Vec<Var>,
/// Plan producing the left-hand input of the join.
pub left_plan: Box<P1>,
/// Plan producing the right-hand input of the join.
pub right_plan: Box<P2>,
}
impl<P1: Implementable, P2: Implementable> Implementable for Join<P1, P2> {
fn dependencies(&self) -> Dependencies {
Dependencies::merge(
self.left_plan.dependencies(),
self.right_plan.dependencies(),
)
}
fn into_bindings(&self) -> Vec<Binding> {
let mut left_bindings = self.left_plan.into_bindings();
let mut right_bindings = self.right_plan.into_bindings();
let mut bindings = Vec::with_capacity(left_bindings.len() + right_bindings.len());
bindings.append(&mut left_bindings);
bindings.append(&mut right_bindings);
bindings
}
fn datafy(&self) -> Vec<(Eid, Aid, Value)> {
let eid = next_id();
let mut left_data = self.left_plan.datafy();
let mut right_data = self.right_plan.datafy();
let mut left_eids: Vec<(Eid, Aid, Value)> = left_data
.iter()
.map(|(e, _, _)| (eid, "df.join/binding".to_string(), Value::Eid(*e)))
.collect();
let mut right_eids: Vec<(Eid, Aid, Value)> = right_data
.iter()
.map(|(e, _, _)| (eid, "df.join/binding".to_string(), Value::Eid(*e)))
.collect();
let mut data = Vec::with_capacity(
left_data.len() + right_data.len() + left_eids.len() + right_eids.len(),
);
data.append(&mut left_data);
data.append(&mut right_data);
data.append(&mut left_eids);
data.append(&mut right_eids);
data
}
fn implement<'b, T, I, S>(
&self,
nested: &mut Iterative<'b, S, u64>,
local_arrangements: &VariableMap<Iterative<'b, S, u64>>,
context: &mut I,
) -> (CollectionRelation<'b, S>, ShutdownHandle)
where
T: Timestamp + Lattice + TotalOrder,
I: ImplContext<T>,
S: Scope<Timestamp = T>,
{
let (left, shutdown_left) = self
.left_plan
.implement(nested, local_arrangements, context);
let (right, shutdown_right) =
self.right_plan
.implement(nested, local_arrangements, context);
let variables = self
.variables
.iter()
.cloned()
.chain(
left.variables()
.drain(..)
.filter(|x| !self.variables.contains(x)),
)
.chain(
right
.variables()
.drain(..)
.filter(|x| !self.variables.contains(x)),
)
.collect();
let tuples = left.arrange_by_variables(&self.variables).join_core(
&right.arrange_by_variables(&self.variables),
|key, v1, v2| {
Some(
key.iter()
.cloned()
.chain(v1.iter().cloned())
.chain(v2.iter().cloned())
.collect(),
)
},
);
let shutdown_handle = ShutdownHandle::merge(shutdown_left, shutdown_right);
(CollectionRelation { variables, tuples }, shutdown_handle)
}
}