Skip to content

Commit 4e20406

Browse files
committed
Reorganized Activator as Scheduler
1 parent d8d4d42 commit 4e20406

File tree

3 files changed

+62
-41
lines changed

3 files changed

+62
-41
lines changed

timely/src/progress/subgraph.rs

+2-1
Original file line numberDiff line numberDiff line change
@@ -299,10 +299,11 @@ where
299299
self.propagate_pointstamps();
300300

301301
{ // Enqueue active children; scoped to let borrow drop.
302+
use crate::scheduling::activate::Scheduler;
302303
let temp_active = &mut self.temp_active;
303304
self.activations
304305
.borrow_mut()
305-
.for_extensions(&self.path[..], |index| temp_active.push(Reverse(index)));
306+
.extensions(&self.path[..], temp_active);
306307
}
307308

308309
// Schedule child operators.

timely/src/scheduling/activate.rs

+41-25
Original file line numberDiff line numberDiff line change
@@ -8,30 +8,45 @@ use std::time::{Duration, Instant};
88
use std::cmp::Reverse;
99
use crossbeam_channel::{Sender, Receiver};
1010

11-
/// Methods required to act as a timely scheduler.
11+
/// Methods required to act as a scheduler for timely operators.
1212
///
13-
/// The core methods are the activation of "paths", sequences of integers, and
14-
/// the enumeration of active paths by prefix. A scheduler may delay the report
15-
/// of a path indefinitely, but it should report at least one extension for the
16-
/// empty path `&[]` or risk parking the worker thread without a certain unpark.
13+
/// Operators are described by "paths" of integers, indicating the path along
14+
/// a tree of regions, arriving at the operator. Each path is either "idle"
15+
/// or "active", where the latter indicates that someone has requested that the
16+
/// operator be scheduled by the worker. Operators go from idle to active when
17+
/// the `activate(path)` method is called, and from active to idle when the path
18+
/// is returned through a call to `extensions(path, _)`.
1719
///
18-
/// There is no known harm to "spurious wake-ups" where a not-active path is
19-
/// returned through `extensions()`.
20+
/// The worker will continually probe for extensions to the root empty path `[]`,
21+
/// and then follow all returned addresses, recursively. A scheduler need not
22+
/// schedule all active paths, but it should return *some* active path when the
23+
/// worker probes the empty path, or the worker may put the thread to sleep.
24+
///
25+
/// There is no known harm to scheduling an idle path.
26+
/// The worker may speculatively schedule paths of its own accord.
2027
pub trait Scheduler {
2128
/// Mark a path as immediately schedulable.
29+
///
30+
/// The scheduler is not required to immediately schedule the path, but it
31+
/// should not signal that it has no work until the path has been scheduled.
2232
fn activate(&mut self, path: &[usize]);
2333
/// Populates `dest` with next identifiers on active extensions of `path`.
2434
///
2535
/// This method is where a scheduler is allowed to exercise some discretion,
2636
/// in that it does not need to present *all* extensions, but it can instead
27-
/// present only those that the runtime should schedule.
28-
fn extensions(&mut self, path: &[usize], dest: &mut Vec<usize>);
37+
/// present only those that the runtime should immediately schedule.
38+
///
39+
/// The worker *will* schedule all extensions before probing new prefixes.
40+
/// The scheduler is invited to rely on this, and to schedule in "batches",
41+
/// where the next time the worker probes for extensions to the empty path
42+
/// then all addresses in the batch have certainly been scheduled.
43+
fn extensions(&mut self, path: &[usize], dest: &mut BinaryHeap<Reverse<usize>>);
2944
}
3045

3146
// Trait objects can be schedulers too.
3247
impl Scheduler for Box<dyn Scheduler> {
3348
fn activate(&mut self, path: &[usize]) { (**self).activate(path) }
34-
fn extensions(&mut self, path: &[usize], dest: &mut Vec<usize>) { (**self).extensions(path, dest) }
49+
fn extensions(&mut self, path: &[usize], dest: &mut BinaryHeap<Reverse<usize>>) { (**self).extensions(path, dest) }
3550
}
3651

3752
/// Allocation-free activation tracker.
@@ -93,7 +108,7 @@ impl Activations {
93108
}
94109

95110
/// Discards the current active set and presents the next active set.
96-
pub fn advance(&mut self) {
111+
fn advance(&mut self) {
97112

98113
// Drain inter-thread activations.
99114
while let Ok(path) = self.rx.try_recv() {
@@ -128,15 +143,15 @@ impl Activations {
128143
self.clean = self.bounds.len();
129144
}
130145

131-
/// Maps a function across activated paths.
132-
pub fn map_active(&self, logic: impl Fn(&[usize])) {
133-
for (offset, length) in self.bounds.iter() {
134-
logic(&self.slices[*offset .. (*offset + *length)]);
135-
}
136-
}
137-
138146
/// Sets as active any symbols that follow `path`.
139-
pub fn for_extensions(&self, path: &[usize], mut action: impl FnMut(usize)) {
147+
fn for_extensions(&mut self, path: &[usize], mut action: impl FnMut(usize)) {
148+
149+
// Each call for the root path is a moment where the worker has reset.
150+
// This relies on a worker implementation that follows the scheduling
151+
// instructions perfectly; if any offered paths are not explored, oops.
152+
if path.is_empty() {
153+
self.advance();
154+
}
140155

141156
let position =
142157
self.bounds[..self.clean]
@@ -209,13 +224,14 @@ impl Activations {
209224
std::thread::park();
210225
}
211226
}
227+
}
212228

213-
/// True iff there are no immediate activations.
214-
///
215-
/// Used by others to guard work done in anticipation of potentially parking.
216-
/// An alternate method name could be `would_park`.
217-
pub fn is_idle(&self) -> bool {
218-
self.bounds.is_empty() && self.timer.is_none()
229+
impl Scheduler for Activations {
230+
fn activate(&mut self, path: &[usize]) {
231+
self.activate(path);
232+
}
233+
fn extensions(&mut self, path: &[usize], dest: &mut BinaryHeap<Reverse<usize>>) {
234+
self.for_extensions(path, |index| dest.push(Reverse(index)));
219235
}
220236
}
221237

timely/src/worker.rs

+19-15
Original file line numberDiff line numberDiff line change
@@ -2,10 +2,11 @@
22
33
use std::rc::Rc;
44
use std::cell::{RefCell, RefMut};
5+
use std::cmp::Reverse;
56
use std::any::Any;
67
use std::str::FromStr;
78
use std::time::{Instant, Duration};
8-
use std::collections::HashMap;
9+
use std::collections::{HashMap, BinaryHeap};
910
use std::collections::hash_map::Entry;
1011
use std::sync::Arc;
1112

@@ -221,7 +222,7 @@ pub struct Worker<A: Allocate> {
221222
logging: Option<Rc<RefCell<crate::logging_core::Registry<crate::logging::WorkerIdentifier>>>>,
222223

223224
activations: Rc<RefCell<Activations>>,
224-
active_dataflows: Vec<usize>,
225+
active_dataflows: BinaryHeap<Reverse<usize>>,
225226

226227
// Temporary storage for channel identifiers during dataflow construction.
227228
// These are then associated with a dataflow once constructed.
@@ -355,12 +356,20 @@ impl<A: Allocate> Worker<A> {
355356
}
356357
}
357358

358-
// Organize activations.
359-
self.activations
360-
.borrow_mut()
361-
.advance();
359+
// Commence a new round of scheduling, starting with dataflows.
360+
// We probe the scheduler for active prefixes, where an empty response
361+
// indicates that the scheduler has no work for us at the moment.
362+
{ // Scoped to let borrow of `self.active_dataflows` drop.
363+
use crate::scheduling::activate::Scheduler;
364+
let active_dataflows = &mut self.active_dataflows;
365+
self.activations
366+
.borrow_mut()
367+
.extensions(&[], active_dataflows);
368+
}
369+
370+
// If no dataflows are active, there is nothing to do. Consider parking.
371+
if self.active_dataflows.is_empty() {
362372

363-
if self.activations.borrow().is_idle() {
364373
// If the timeout is zero, don't bother trying to park.
365374
// More generally, we could put some threshold in here.
366375
if timeout != Some(Duration::new(0, 0)) {
@@ -378,15 +387,10 @@ impl<A: Allocate> Worker<A> {
378387
self.logging().as_mut().map(|l| l.log(crate::logging::ParkEvent::unpark()));
379388
}
380389
}
381-
else { // Schedule active dataflows.
382-
383-
let active_dataflows = &mut self.active_dataflows;
384-
self.activations
385-
.borrow_mut()
386-
.for_extensions(&[], |index| active_dataflows.push(index));
390+
else { // Schedule all active dataflows.
387391

388392
let mut dataflows = self.dataflows.borrow_mut();
389-
for index in active_dataflows.drain(..) {
393+
for Reverse(index) in self.active_dataflows.drain() {
390394
// Step dataflow if it exists, remove if not incomplete.
391395
if let Entry::Occupied(mut entry) = dataflows.entry(index) {
392396
// TODO: This is a moment at which a scheduling decision is being made.
@@ -725,7 +729,7 @@ impl<A: Allocate> Clone for Worker<A> {
725729
dataflow_counter: self.dataflow_counter.clone(),
726730
logging: self.logging.clone(),
727731
activations: self.activations.clone(),
728-
active_dataflows: Vec::new(),
732+
active_dataflows: Default::default(),
729733
temp_channel_ids: self.temp_channel_ids.clone(),
730734
}
731735
}

0 commit comments

Comments
 (0)