Skip to content

Commit e00d695

Browse files
committed
Add JoinHandle::into_join_future().
This allows spawned threads to be incorporated into `Future`-based concurrency control without needing to add separate result-reporting channels and an additional layer of `catch_unwind()` to the thread functions. I believe this will be useful to async/blocking interop and for various applications which want to manage parallel tasks in a lightweight way. There is a small additional cost which is paid even if the mechanism is unused: the algorithm built into the shutdown of a spawned thread must obtain and invoke a `Waker`, and the `Packet` internal struct is larger by one `Mutex<Waker>`. In the future, this `Mutex` should be replaced by something equivalent to `futures::task::AtomicWaker`, which will be more efficient and eliminate deadlock and blocking hazards, but `std` doesn't contain one of those yet. This is not an `impl IntoFuture for JoinHandle` so that it can avoid being insta-stable; particularly because during the design discussion, concerns were raised that a proper implementation should obey structured concurrency via an `AsyncDrop` that forces waiting for the thread. I personally think that would be a mistake, and structured spawning should be its own thing, but this choice of API permits either option in the future by keeping everything unstable, where a trait implementation would not.
1 parent 3ae715c commit e00d695

File tree

4 files changed

+240
-17
lines changed

4 files changed

+240
-17
lines changed

library/std/src/lib.rs

+1
Original file line numberDiff line numberDiff line change
@@ -347,6 +347,7 @@
347347
#![feature(lazy_get)]
348348
#![feature(maybe_uninit_slice)]
349349
#![feature(maybe_uninit_write_slice)]
350+
#![feature(noop_waker)]
350351
#![feature(panic_can_unwind)]
351352
#![feature(panic_internals)]
352353
#![feature(pin_coerce_unsized_trait)]

library/std/src/thread/mod.rs

+171-15
Original file line numberDiff line numberDiff line change
@@ -161,17 +161,18 @@ mod tests;
161161
use crate::any::Any;
162162
use crate::cell::UnsafeCell;
163163
use crate::ffi::CStr;
164+
use crate::future::Future;
164165
use crate::marker::PhantomData;
165166
use crate::mem::{self, ManuallyDrop, forget};
166167
use crate::num::NonZero;
167168
use crate::pin::Pin;
168-
use crate::sync::Arc;
169169
use crate::sync::atomic::{AtomicUsize, Ordering};
170+
use crate::sync::{Arc, Mutex, PoisonError};
170171
use crate::sys::sync::Parker;
171172
use crate::sys::thread as imp;
172173
use crate::sys_common::{AsInner, IntoInner};
173174
use crate::time::{Duration, Instant};
174-
use crate::{env, fmt, io, panic, panicking, str};
175+
use crate::{env, fmt, io, panic, panicking, str, task};
175176

176177
#[stable(feature = "scoped_threads", since = "1.63.0")]
177178
mod scoped;
@@ -487,6 +488,7 @@ impl Builder {
487488
let my_packet: Arc<Packet<'scope, T>> = Arc::new(Packet {
488489
scope: scope_data,
489490
result: UnsafeCell::new(None),
491+
waker: Mutex::new(task::Waker::noop().clone()),
490492
_marker: PhantomData,
491493
});
492494
let their_packet = my_packet.clone();
@@ -532,15 +534,35 @@ impl Builder {
532534
let try_result = panic::catch_unwind(panic::AssertUnwindSafe(|| {
533535
crate::sys::backtrace::__rust_begin_short_backtrace(f)
534536
}));
537+
538+
// Store the `Result` of the thread that the `JoinHandle` can retrieve.
539+
//
535540
// SAFETY: `their_packet` as been built just above and moved by the
536541
// closure (it is an Arc<...>) and `my_packet` will be stored in the
537542
// same `JoinInner` as this closure meaning the mutation will be
538543
// safe (not modify it and affect a value far away).
539544
unsafe { *their_packet.result.get() = Some(try_result) };
540-
// Here `their_packet` gets dropped, and if this is the last `Arc` for that packet that
541-
// will call `decrement_num_running_threads` and therefore signal that this thread is
542-
// done.
545+
546+
// Fetch the `Waker` from the packet; this is needed to support `.into_join_future()`.
547+
// If unused, this just returns `Waker::noop()` which will do nothing.
548+
let waker: task::Waker = {
549+
let placeholder = task::Waker::noop().clone();
550+
let mut guard = their_packet.waker.lock().unwrap_or_else(PoisonError::into_inner);
551+
mem::replace(&mut *guard, placeholder)
552+
};
553+
554+
// Here `their_packet` gets dropped, and if this is the last `Arc` for that packet
555+
// (which happens if the `JoinHandle` has been dropped) that will call
556+
// `decrement_num_running_threads` and therefore signal to the scope (if there is one)
557+
// that this thread is done.
543558
drop(their_packet);
559+
560+
// Now that we have become visibly “finished” by dropping the packet
561+
// (`JoinInner::is_finished` will return true), we can use the `Waker` to signal
562+
// any waiting `JoinFuture`. If instead we are being waited for by
563+
// `JoinHandle::join()`, the actual platform thread termination will be the wakeup.
564+
waker.wake();
565+
544566
// Here, the lifetime `'scope` can end. `main` keeps running for a bit
545567
// after that before returning itself.
546568
};
@@ -1187,8 +1209,6 @@ impl ThreadId {
11871209
}
11881210
}
11891211
} else {
1190-
use crate::sync::{Mutex, PoisonError};
1191-
11921212
static COUNTER: Mutex<u64> = Mutex::new(1);
11931213

11941214
let mut counter = COUNTER.lock().unwrap_or_else(PoisonError::into_inner);
@@ -1569,16 +1589,30 @@ impl fmt::Debug for Thread {
15691589
#[stable(feature = "rust1", since = "1.0.0")]
15701590
pub type Result<T> = crate::result::Result<T, Box<dyn Any + Send + 'static>>;
15711591

1572-
// This packet is used to communicate the return value between the spawned
1573-
// thread and the rest of the program. It is shared through an `Arc` and
1574-
// there's no need for a mutex here because synchronization happens with `join()`
1575-
// (the caller will never read this packet until the thread has exited).
1576-
//
1577-
// An Arc to the packet is stored into a `JoinInner` which in turns is placed
1578-
// in `JoinHandle`.
1592+
/// This packet is used to communicate the return value between the spawned
1593+
/// thread and the rest of the program. It is shared through an [`Arc`].
1594+
///
1595+
/// An Arc to the packet is stored into a [`JoinInner`] which in turn is placed
1596+
/// in [`JoinHandle`] or [`ScopedJoinHandle`].
15791597
struct Packet<'scope, T> {
1598+
/// Communication with the enclosing thread scope if there is one.
15801599
scope: Option<Arc<scoped::ScopeData>>,
1600+
1601+
/// Holds the return value.
1602+
///
1603+
/// Synchronization happens via reference counting: as long as the `Arc<Packet>`
1604+
/// has two or more references, this field is never read, and will only be written
1605+
/// once as the thread terminates. After that happens, either the packet is dropped,
1606+
/// or [`JoinInner::join()`] will `take()` the result value from here.
15811607
result: UnsafeCell<Option<Result<T>>>,
1608+
1609+
/// If a [`JoinFuture`] for this thread exists and has been polled,
1610+
/// this is the waker from that poll. If it does not exist or has not
1611+
/// been polled yet, this is [`task::Waker::noop()`].
1612+
// FIXME: This should be an `AtomicWaker` instead of a `Mutex`,
1613+
// to be cheaper and impossible to deadlock.
1614+
waker: Mutex<task::Waker>,
1615+
15821616
_marker: PhantomData<Option<&'scope scoped::ScopeData>>,
15831617
}
15841618

@@ -1632,6 +1666,10 @@ impl<'scope, T> JoinInner<'scope, T> {
16321666
self.native.join();
16331667
Arc::get_mut(&mut self.packet).unwrap().result.get_mut().take().unwrap()
16341668
}
1669+
1670+
fn is_finished(&self) -> bool {
1671+
Arc::strong_count(&self.packet) == 1
1672+
}
16351673
}
16361674

16371675
/// An owned permission to join on a thread (block on its termination).
@@ -1778,6 +1816,45 @@ impl<T> JoinHandle<T> {
17781816
self.0.join()
17791817
}
17801818

1819+
/// Returns a [`Future`] that resolves when the thread has finished.
1820+
///
1821+
/// Its [output](Future::Output) value is identical to that of [`JoinHandle::join()`];
1822+
/// this is the `async` equivalent of that blocking function.
1823+
///
1824+
/// If the returned future is dropped (cancelled), the thread will become *detached*;
1825+
/// there will be no way to observe or wait for the thread’s termination.
1826+
/// This is identical to the behavior of `JoinHandle` itself.
1827+
///
1828+
/// # Example
1829+
///
1830+
// FIXME: ideally we would actually run this example, with the help of a trivial async executor
1831+
/// ```no_run
1832+
/// #![feature(thread_join_future)]
1833+
/// use std::thread;
1834+
///
1835+
/// async fn do_some_heavy_tasks_in_parallel() -> thread::Result<()> {
1836+
/// let future_1 = thread::spawn(|| {
1837+
/// // ... do something ...
1838+
/// }).into_join_future();
1839+
/// let future_2 = thread::spawn(|| {
1840+
/// // ... do something else ...
1841+
/// }).into_join_future();
1842+
///
1843+
/// // Both threads have been started; now await the completion of both.
1844+
/// future_1.await?;
1845+
/// future_2.await?;
1846+
/// Ok(())
1847+
/// }
1848+
/// ```
1849+
#[unstable(feature = "thread_join_future", issue = "none")]
1850+
pub fn into_join_future(self) -> JoinFuture<'static, T> {
1851+
// The method is not named `into_future()` to avoid overlapping with the stable
1852+
// `IntoFuture::into_future()`. We're not implementing `IntoFuture` in order to
1853+
// keep this unstable and preserve the *option* of compatibly making this obey structured
1854+
// concurrency via an async-Drop that waits for the thread to end.
1855+
JoinFuture::new(self.0)
1856+
}
1857+
17811858
/// Checks if the associated thread has finished running its main function.
17821859
///
17831860
/// `is_finished` supports implementing a non-blocking join operation, by checking
@@ -1790,7 +1867,7 @@ impl<T> JoinHandle<T> {
17901867
/// to return quickly, without blocking for any significant amount of time.
17911868
#[stable(feature = "thread_is_running", since = "1.61.0")]
17921869
pub fn is_finished(&self) -> bool {
1793-
Arc::strong_count(&self.0.packet) == 1
1870+
self.0.is_finished()
17941871
}
17951872
}
17961873

@@ -1816,9 +1893,88 @@ impl<T> fmt::Debug for JoinHandle<T> {
18161893
fn _assert_sync_and_send() {
18171894
fn _assert_both<T: Send + Sync>() {}
18181895
_assert_both::<JoinHandle<()>>();
1896+
_assert_both::<JoinFuture<'static, ()>>();
18191897
_assert_both::<Thread>();
18201898
}
18211899

1900+
/// A [`Future`] that resolves when a thread has finished.
1901+
///
1902+
/// Its [output](Future::Output) value is identical to that of [`JoinHandle::join()`];
1903+
/// this is the `async` equivalent of that blocking function.
1904+
/// Obtain it by calling [`JoinHandle::into_join_future()`] or
1905+
/// [`ScopedJoinHandle::into_join_future()`].
1906+
///
1907+
/// If a `JoinFuture` is dropped (cancelled), and the thread does not belong to a [scope],
1908+
/// the associated thread will become *detached*;
1909+
/// there will be no way to observe or wait for the thread’s termination.
1910+
#[unstable(feature = "thread_join_future", issue = "none")]
1911+
pub struct JoinFuture<'scope, T>(Option<JoinInner<'scope, T>>);
1912+
1913+
impl<'scope, T> JoinFuture<'scope, T> {
1914+
fn new(inner: JoinInner<'scope, T>) -> Self {
1915+
Self(Some(inner))
1916+
}
1917+
1918+
/// Implements the “getting a result” part of joining/polling, without blocking or changing
1919+
/// the `Waker`. Part of the implementation of `poll()`.
1920+
///
1921+
/// If this returns `Some`, then `self.0` is now `None` and the future will panic
1922+
/// if polled again.
1923+
fn take_result(&mut self) -> Option<Result<T>> {
1924+
self.0.take_if(|i| i.is_finished()).map(JoinInner::join)
1925+
}
1926+
}
1927+
1928+
#[unstable(feature = "thread_join_future", issue = "none")]
1929+
impl<T> Future for JoinFuture<'_, T> {
1930+
type Output = Result<T>;
1931+
fn poll(mut self: Pin<&mut Self>, cx: &mut task::Context<'_>) -> task::Poll<Self::Output> {
1932+
if let Some(result) = self.take_result() {
1933+
return task::Poll::Ready(result);
1934+
}
1935+
1936+
// Update the `Waker` the thread should wake when it completes.
1937+
{
1938+
let Some(inner) = &mut self.0 else {
1939+
panic!("polled after complete");
1940+
};
1941+
1942+
let new_waker = cx.waker();
1943+
1944+
// Lock the mutex, and ignore the poison state because there are no meaningful ways
1945+
// the existing contents can be corrupted; they will be overwritten completely and the
1946+
// overwrite is atomic-in-the-database-sense.
1947+
let mut current_waker_guard =
1948+
inner.packet.waker.lock().unwrap_or_else(PoisonError::into_inner);
1949+
1950+
// Overwrite the waker. Note that we are executing the new waker’s clone and the old
1951+
// waker’s destructor; these could panic (which will merely poison the lock) or hang,
1952+
// which will hold the lock, but the most that can do is prevent the thread from
1953+
// exiting because it's trying to acquire `packet.waker`, which it won't do while
1954+
// holding any *other* locks (...unless the thread’s data includes a lock guard that
1955+
// the waker also wants).
1956+
if !new_waker.will_wake(&*current_waker_guard) {
1957+
*current_waker_guard = new_waker.clone();
1958+
}
1959+
}
1960+
1961+
// Check for completion again in case the thread finished while we were busy
1962+
// setting the waker, to prevent a lost wakeup in that case.
1963+
if let Some(result) = self.take_result() {
1964+
task::Poll::Ready(result)
1965+
} else {
1966+
task::Poll::Pending
1967+
}
1968+
}
1969+
}
1970+
1971+
#[unstable(feature = "thread_join_future", issue = "none")]
1972+
impl<T> fmt::Debug for JoinFuture<'_, T> {
1973+
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
1974+
f.debug_struct("JoinHandle").finish_non_exhaustive()
1975+
}
1976+
}
1977+
18221978
/// Returns an estimate of the default amount of parallelism a program should use.
18231979
///
18241980
/// Parallelism is a resource. A given machine provides a certain capacity for

library/std/src/thread/scoped.rs

+21-1
Original file line numberDiff line numberDiff line change
@@ -313,6 +313,26 @@ impl<'scope, T> ScopedJoinHandle<'scope, T> {
313313
self.0.join()
314314
}
315315

316+
/// Returns a [`Future`] that resolves when the thread has finished.
317+
///
318+
/// Its [output] value is identical to that of [`ScopedJoinHandle::join()`];
319+
/// this is the `async` equivalent of that blocking function.
320+
///
321+
/// Note that while this function allows waiting for a scoped thread from `async`
322+
/// functions, the original [`scope()`] is still a blocking function which should
323+
/// not be used in `async` functions.
324+
///
325+
/// [`Future`]: crate::future::Future
326+
/// [output]: crate::future::Future::Output
327+
#[unstable(feature = "thread_join_future", issue = "none")]
328+
pub fn into_join_future(self) -> super::JoinFuture<'scope, T> {
329+
// There is no `ScopedJoinFuture` because the only difference between `JoinHandle`
330+
// and `ScopedJoinHandle` is that `JoinHandle` has no lifetime parameter, because
331+
// it was introduced before scoped threads. `JoinFuture` is new enough that we don’t
332+
// need to make two versions of it.
333+
super::JoinFuture::new(self.0)
334+
}
335+
316336
/// Checks if the associated thread has finished running its main function.
317337
///
318338
/// `is_finished` supports implementing a non-blocking join operation, by checking
@@ -325,7 +345,7 @@ impl<'scope, T> ScopedJoinHandle<'scope, T> {
325345
/// to return quickly, without blocking for any significant amount of time.
326346
#[stable(feature = "scoped_threads", since = "1.63.0")]
327347
pub fn is_finished(&self) -> bool {
328-
Arc::strong_count(&self.0.packet) == 1
348+
self.0.is_finished()
329349
}
330350
}
331351

library/std/src/thread/tests.rs

+47-1
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,14 @@
11
use super::Builder;
22
use crate::any::Any;
3+
use crate::assert_matches::assert_matches;
4+
use crate::future::Future as _;
35
use crate::panic::panic_any;
46
use crate::sync::atomic::{AtomicBool, Ordering};
57
use crate::sync::mpsc::{Sender, channel};
68
use crate::sync::{Arc, Barrier};
79
use crate::thread::{self, Scope, ThreadId};
810
use crate::time::{Duration, Instant};
9-
use crate::{mem, result};
11+
use crate::{mem, result, task};
1012

1113
// !!! These tests are dangerous. If something is buggy, they will hang, !!!
1214
// !!! instead of exiting cleanly. This might wedge the buildbots. !!!
@@ -410,3 +412,47 @@ fn test_minimal_thread_stack() {
410412
assert_eq!(before, 0);
411413
assert_eq!(COUNT.load(Ordering::Relaxed), 1);
412414
}
415+
416+
fn join_future_test(scoped: bool) {
417+
/// Simple `Waker` implementation.
418+
/// If `std` ever gains a `block_on()`, we can consider replacing this with that.
419+
struct MyWaker(Sender<()>);
420+
impl task::Wake for MyWaker {
421+
fn wake(self: Arc<Self>) {
422+
_ = self.0.send(());
423+
}
424+
}
425+
426+
// Communication setup.
427+
let (thread_delay_tx, thread_delay_rx) = channel();
428+
let (waker_tx, waker_rx) = channel();
429+
let waker = task::Waker::from(Arc::new(MyWaker(waker_tx)));
430+
let ctx = &mut task::Context::from_waker(&waker);
431+
432+
thread::scope(|s| {
433+
// Create the thread and the future under test
434+
let thread_body = move || {
435+
thread_delay_rx.recv().unwrap();
436+
"hello"
437+
};
438+
let mut future = crate::pin::pin!(if scoped {
439+
s.spawn(thread_body).into_join_future()
440+
} else {
441+
thread::spawn(thread_body).into_join_future()
442+
});
443+
444+
// Actual test
445+
assert_matches!(future.as_mut().poll(ctx), task::Poll::Pending);
446+
thread_delay_tx.send(()).unwrap(); // Unblock the thread
447+
waker_rx.recv().unwrap(); // Wait for waking (as an executor would)
448+
assert_matches!(future.as_mut().poll(ctx), task::Poll::Ready(Ok("hello")));
449+
});
450+
}
451+
#[test]
452+
fn join_future_unscoped() {
453+
join_future_test(false)
454+
}
455+
#[test]
456+
fn join_future_scoped() {
457+
join_future_test(true)
458+
}

0 commit comments

Comments
 (0)