forked from TimelyDataflow/timely-dataflow
-
Notifications
You must be signed in to change notification settings - Fork 10
Expand file tree
/
Copy pathexchange.rs
More file actions
107 lines (98 loc) · 3.46 KB
/
exchange.rs
File metadata and controls
107 lines (98 loc) · 3.46 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
//! The exchange pattern distributes pushed data between many target pushees.
use crate::communication::Push;
use crate::container::PushPartitioned;
use crate::dataflow::channels::Message;
use crate::{Container, Data};
// TODO: Implement software write combining.
/// Distributes records among target pushees according to a distribution function.
///
/// Each incoming record is passed to `hash_func`; the resulting `u64` is reduced
/// to an index into `pushers` (by mask or modulo, see the `Push` implementation),
/// and the record is staged in the buffer at that same index.
pub struct Exchange<T, C, P, H>
where
    C: PushPartitioned,
    P: Push<Message<T, C>>,
    for<'a> H: FnMut(&C::Item<'a>) -> u64,
{
    /// The downstream targets, one per destination.
    pushers: Vec<P>,
    /// Staging containers; `new` creates exactly one per entry of `pushers`.
    buffers: Vec<C>,
    /// Time of the most recently received message, or `None` before the first one.
    current: Option<T>,
    /// Maps a record to the `u64` from which its target index is derived.
    hash_func: H,
}
impl<T, C, P, H> Exchange<T, C, P, H>
where
    T: Clone,
    C: PushPartitioned,
    P: Push<Message<T, C>>,
    for<'a> H: FnMut(&C::Item<'a>) -> u64,
{
    /// Allocates a new `Exchange` from a supplied set of pushers and a distribution function.
    ///
    /// One default-constructed buffer is created for every pusher, and no time is
    /// recorded as current until the first message arrives.
    pub fn new(pushers: Vec<P>, key: H) -> Self {
        // One staging buffer per target, paired with the pusher at the same index.
        let buffers: Vec<C> = pushers.iter().map(|_| Default::default()).collect();

        Self {
            pushers,
            buffers,
            current: None,
            hash_func: key,
        }
    }

    /// Hands the buffer at `index` to the pusher at `index` via `Message::push_at`,
    /// stamped with a clone of the current time.
    ///
    /// Does nothing when the buffer is empty or when no time has been recorded yet.
    #[inline]
    fn flush(&mut self, index: usize) {
        if self.buffers[index].is_empty() {
            return;
        }

        if let Some(time) = self.current.as_ref() {
            Message::push_at(&mut self.buffers[index], time.clone(), &mut self.pushers[index]);
        }
    }
}
impl<T, C, P, H> Push<Message<T, C>> for Exchange<T, C, P, H>
where
    T: Eq + Data,
    C: Container + PushPartitioned,
    P: Push<Message<T, C>>,
    for<'a> H: FnMut(&C::Item<'a>) -> u64,
{
    /// Routes `message` to the target pushers.
    ///
    /// * With exactly one pusher the message (including `None`) is forwarded untouched.
    /// * A `Some` message is partitioned record by record into the per-target buffers,
    ///   after first flushing every buffer if its time differs from the current one.
    /// * A `None` message flushes every buffer and then forwards `None` to every pusher.
    #[inline(never)]
    fn push(&mut self, message: &mut Option<Message<T, C>>) {
        let fan_out = self.pushers.len();

        // A single target needs no exchange: pass the message straight through.
        if fan_out == 1 {
            self.pushers[0].push(message);
            return;
        }

        match message {
            Some(incoming) => {
                let stamp = &incoming.time;
                let records = &mut incoming.data;

                // Buffered records belong to the previous time; send them out
                // before staging anything for a different time.
                if matches!(self.current.as_ref(), Some(held) if held != stamp) {
                    for index in 0..fan_out {
                        self.flush(index);
                    }
                }
                self.current = Some(stamp.clone());

                let hash_func = &mut self.hash_func;
                let pushers = &mut self.pushers;

                if fan_out.is_power_of_two() {
                    // For a power-of-two count, masking the low bits selects the target.
                    let mask = (fan_out - 1) as u64;
                    records.push_partitioned(
                        &mut self.buffers,
                        move |datum| ((hash_func)(datum) & mask) as usize,
                        |index, buffer| {
                            Message::push_at(buffer, stamp.clone(), &mut pushers[index]);
                        },
                    );
                } else {
                    // Otherwise fall back to the remainder (%).
                    let num_pushers = fan_out as u64;
                    records.push_partitioned(
                        &mut self.buffers,
                        move |datum| ((hash_func)(datum) % num_pushers) as usize,
                        |index, buffer| {
                            Message::push_at(buffer, stamp.clone(), &mut pushers[index]);
                        },
                    );
                }
            }
            None => {
                // No message: drain each buffer, then forward the `None` downstream.
                for index in 0..fan_out {
                    self.flush(index);
                    self.pushers[index].push(&mut None);
                }
            }
        }
    }
}