//! Broadcasts progress information among workers.
use std::rc::Rc;
use crate::progress::{ChangeBatch, Timestamp};
use crate::progress::{Location, Port};
use crate::communication::{Push, Pull};
use crate::logging::TimelyLogger as Logger;
use crate::logging::TimelyProgressLogger as ProgressLogger;
use crate::Bincode;
/// A list of progress updates, each of the form `((location, timestamp), delta)`.
///
/// The `Location` names a node (child scope) together with one of its target or
/// source ports; `delta` is the signed change in the count for that pointstamp.
pub type ProgressVec<T> = Vec<((Location, T), i64)>;
/// A progress update message consisting of the source worker id, a sequence number,
/// and a single list of progress updates, in that order, wrapped in `Bincode`.
pub type ProgressMsg<T> = Bincode<(usize, usize, ProgressVec<T>)>;
/// Manages broadcasting of progress updates to and receiving updates from workers.
pub struct Progcaster<T:Timestamp> {
/// Message buffer kept between pushes so that `send` can reuse its allocation
/// when the pusher hands it back; `None` until the first message is built.
to_push: Option<ProgressMsg<T>>,
/// Pushers obtained from the worker's channel allocation; `send` pushes every
/// message through each of them.
pushers: Vec<Box<dyn Push<ProgressMsg<T>>>>,
/// Puller from which `recv` drains incoming progress messages.
puller: Box<dyn Pull<ProgressMsg<T>>>,
/// Source worker index
source: usize,
/// Sequence number counter
counter: usize,
/// Sequence of nested scope identifiers indicating the path from the root to this subgraph
addr: Rc<[usize]>,
/// Communication channel identifier
channel_identifier: usize,
/// Optional logger for progress events; when present, each sent and received
/// message is reported to it.
progress_logging: Option<ProgressLogger>,
}
impl<T:Timestamp+Send> Progcaster<T> {
/// Creates a new `Progcaster` using a channel from the supplied worker.
pub fn new<A: crate::worker::AsWorker>(worker: &mut A, addr: Rc<[usize]>, mut logging: Option<Logger>, progress_logging: Option<ProgressLogger>) -> Progcaster<T> {
let channel_identifier = worker.new_identifier();
let (pushers, puller) = worker.allocate(channel_identifier, addr.clone());
logging.as_mut().map(|l| l.log(crate::logging::CommChannelsEvent {
identifier: channel_identifier,
kind: crate::logging::CommChannelKind::Progress,
}));
let worker_index = worker.index();
Progcaster {
to_push: None,
pushers,
puller,
source: worker_index,
counter: 0,
addr,
channel_identifier,
progress_logging,
}
}
/// Sends pointstamp changes to all workers.
///
/// `changes` is compacted first. If nothing remains, the call is a no-op: no
/// message is sent and the sequence counter does not advance. Otherwise a
/// `(source, sequence number, updates)` message is pushed through every pusher,
/// the sequence counter is incremented once, and `changes` is cleared.
///
/// When progress logging is enabled, a `TimelyProgressEvent` with
/// `is_send: true` is logged before the message is pushed.
pub fn send(&mut self, changes: &mut ChangeBatch<(Location, T)>) {
    changes.compact();
    if changes.is_empty() {
        return;
    }

    if let Some(logger) = self.progress_logging.as_ref() {
        // Pre-allocate enough space; we transfer ownership, so there is not
        // an opportunity to re-use allocations (w/o changing the logging
        // interface to accept references).
        let capacity = changes.len();
        let mut messages = Box::new(Vec::with_capacity(capacity));
        let mut internal = Box::new(Vec::with_capacity(capacity));
        // Split the updates by port kind: target-port updates are logged as
        // `messages`, source-port updates as `internal`.
        for ((location, time), diff) in changes.iter() {
            match location.port {
                Port::Target(port) => messages.push((location.node, port, time.clone(), *diff)),
                Port::Source(port) => internal.push((location.node, port, time.clone(), *diff)),
            }
        }
        logger.log(crate::logging::TimelyProgressEvent {
            is_send: true,
            source: self.source,
            channel: self.channel_identifier,
            seq_no: self.counter,
            addr: self.addr.to_vec(),
            messages,
            internal,
        });
    }

    for pusher in self.pushers.iter_mut() {
        // The pusher may or may not take the message out of `to_push`, so the
        // buffer is (re)populated before every push.
        match &mut self.to_push {
            // Attempt to reuse allocations, if possible.
            Some(message) => {
                message.payload.0 = self.source;
                message.payload.1 = self.counter;
                message.payload.2.clear();
                message.payload.2.extend(changes.iter().cloned());
            }
            // If we don't have an allocation, build the message directly from
            // the compacted updates rather than cloning the whole batch first.
            None => {
                self.to_push = Some(Bincode::from((
                    self.source,
                    self.counter,
                    changes.iter().cloned().collect::<Vec<_>>(),
                )));
            }
        }

        // TODO: This should probably use a broadcast channel.
        pusher.push(&mut self.to_push);
        pusher.done();
    }

    self.counter += 1;
    changes.clear();
}
/// Receives pointstamp changes from all workers.
pub fn recv(&mut self, changes: &mut ChangeBatch<(Location, T)>) {
while let Some(message) = self.puller.pull() {
let source = message.0;
let counter = message.1;
let recv_changes = &message.2;
let addr = &mut self.addr;
let channel = self.channel_identifier;
// See comments above about the relatively high cost of this logging, and our
// options for improving it if performance limits users who want other logging.
self.progress_logging.as_ref().map(|l| {
let mut messages = Box::new(Vec::with_capacity(changes.len()));
let mut internal = Box::new(Vec::with_capacity(changes.len()));
for ((location, time), diff) in recv_changes.iter() {
match location.port {
Port::Target(port) => {
messages.push((location.node, port, time.clone(), *diff))
},
Port::Source(port) => {
internal.push((location.node, port, time.clone(), *diff))
}
}
}
l.log(crate::logging::TimelyProgressEvent {
is_send: false,
source,
seq_no: counter,
channel,
addr: addr.to_vec(),
messages,
internal,
});
});
// We clone rather than drain to avoid deserialization.
for &(ref update, delta) in recv_changes.iter() {
changes.update(update.clone(), delta);
}
}
}
}