//! Thread pool for blocking operations

use crate::loom::sync::{Arc, Condvar, Mutex};
use crate::loom::thread;
use crate::runtime::blocking::schedule::BlockingSchedule;
use crate::runtime::blocking::{shutdown, BlockingTask};
use crate::runtime::builder::ThreadNameFn;
use crate::runtime::task::{self, JoinHandle};
use crate::runtime::{Builder, Callback, Handle, BOX_FUTURE_THRESHOLD};
use crate::util::metric_atomics::MetricAtomicUsize;
use crate::util::trace::{blocking_task, SpawnMeta};

use std::collections::{HashMap, VecDeque};
use std::fmt;
use std::io;
use std::sync::atomic::Ordering;
use std::time::Duration;

pub(crate) struct BlockingPool {
    spawner: Spawner,
    shutdown_rx: shutdown::Receiver,
}

#[derive(Clone)]
pub(crate) struct Spawner {
    inner: Arc<Inner>,
}

#[derive(Default)]
pub(crate) struct SpawnerMetrics {
    num_threads: MetricAtomicUsize,
    num_idle_threads: MetricAtomicUsize,
    queue_depth: MetricAtomicUsize,
}

impl SpawnerMetrics {
    fn num_threads(&self) -> usize {
        self.num_threads.load(Ordering::Relaxed)
    }

    fn num_idle_threads(&self) -> usize {
        self.num_idle_threads.load(Ordering::Relaxed)
    }

    cfg_unstable_metrics! {
        fn queue_depth(&self) -> usize {
            self.queue_depth.load(Ordering::Relaxed)
        }
    }

    fn inc_num_threads(&self) {
        self.num_threads.increment();
    }

    fn dec_num_threads(&self) {
        self.num_threads.decrement();
    }

    fn inc_num_idle_threads(&self) {
        self.num_idle_threads.increment();
    }

    fn dec_num_idle_threads(&self) -> usize {
        self.num_idle_threads.decrement()
    }

    fn inc_queue_depth(&self) {
        self.queue_depth.increment();
    }

    fn dec_queue_depth(&self) {
        self.queue_depth.decrement();
    }
}
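
// For reference, a minimal sketch of the counter API assumed above. The real
// type lives in `crate::util::metric_atomics`; the property relied on here is
// that `decrement` returns the *previous* value (fetch_sub semantics), which
// the thread-exit assertion in `Inner::run` depends on.
//
//     struct MetricAtomicUsize(std::sync::atomic::AtomicUsize);
//
//     impl MetricAtomicUsize {
//         fn load(&self, ordering: Ordering) -> usize { self.0.load(ordering) }
//         fn increment(&self) -> usize { self.0.fetch_add(1, Ordering::Relaxed) }
//         fn decrement(&self) -> usize { self.0.fetch_sub(1, Ordering::Relaxed) }
//     }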

struct Inner {
    /// State shared between worker threads.
    shared: Mutex<Shared>,

    /// Pool threads wait on this.
    condvar: Condvar,

    /// Spawned threads use this name.
    thread_name: ThreadNameFn,

    /// Spawned thread stack size.
    stack_size: Option<usize>,

    /// Call after a thread starts.
    after_start: Option<Callback>,

    /// Call before a thread stops.
    before_stop: Option<Callback>,

    /// Maximum number of threads.
    thread_cap: usize,

    /// Customizable wait timeout.
    keep_alive: Duration,

    /// Metrics about the pool.
    metrics: SpawnerMetrics,
}

struct Shared {
    queue: VecDeque<Task>,
    num_notify: u32,
    shutdown: bool,
    shutdown_tx: Option<shutdown::Sender>,
    /// Prior to shutdown, we clean up `JoinHandle`s by having each timed-out
    /// thread join on the previous timed-out thread. This is not strictly
    /// necessary but helps avoid Valgrind false positives; see
    /// <https://github.com/tokio-rs/tokio/commit/646fbae76535e397ef79dbcaacb945d4c829f666>
    /// for more information.
    last_exiting_thread: Option<thread::JoinHandle<()>>,
    /// This holds the `JoinHandle`s for all running threads; on shutdown, the
    /// thread calling shutdown handles joining on these.
    worker_threads: HashMap<usize, thread::JoinHandle<()>>,
    /// This is a counter used to iterate `worker_threads` in a consistent
    /// order (for loom's benefit).
    worker_thread_index: usize,
}

pub(crate) struct Task {
    task: task::UnownedTask<BlockingSchedule>,
    mandatory: Mandatory,
}

#[derive(PartialEq, Eq)]
pub(crate) enum Mandatory {
    #[cfg_attr(not(feature = "fs"), allow(dead_code))]
    Mandatory,
    NonMandatory,
}

pub(crate) enum SpawnError {
    /// The pool is shutting down and the task was not scheduled.
    ShuttingDown,
    /// There are no worker threads available to take the task,
    /// and the OS failed to spawn a new one.
    NoThreads(io::Error),
}

impl From<SpawnError> for io::Error {
    fn from(e: SpawnError) -> Self {
        match e {
            SpawnError::ShuttingDown => {
                io::Error::new(io::ErrorKind::Other, "blocking pool shutting down")
            }
            SpawnError::NoThreads(e) => e,
        }
    }
}

impl Task {
    pub(crate) fn new(task: task::UnownedTask<BlockingSchedule>, mandatory: Mandatory) -> Task {
        Task { task, mandatory }
    }

    fn run(self) {
        self.task.run();
    }

    fn shutdown_or_run_if_mandatory(self) {
        match self.mandatory {
            Mandatory::NonMandatory => self.task.shutdown(),
            Mandatory::Mandatory => self.task.run(),
        }
    }
}

const KEEP_ALIVE: Duration = Duration::from_secs(10);
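
// The default keep-alive above can be overridden through the runtime builder.
// A minimal sketch, assuming the public `tokio::runtime::Builder` API:
//
//     let rt = tokio::runtime::Builder::new_multi_thread()
//         .thread_keep_alive(std::time::Duration::from_secs(30))
//         .build()
//         .unwrap();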

/// Runs the provided function on an executor dedicated to blocking operations.
/// Tasks will be scheduled as non-mandatory, meaning they may not get executed
/// in case of runtime shutdown.
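///
/// A minimal usage sketch through the public `tokio::task::spawn_blocking`
/// re-export, assuming a running multi-threaded runtime (`ignore`d because
/// this private module provides no doctest context):
///
/// ```ignore
/// let handle = tokio::task::spawn_blocking(|| {
///     // Blocking or CPU-heavy work runs off the async worker threads.
///     std::fs::read_to_string("Cargo.toml")
/// });
/// let result = handle.await.expect("blocking task panicked");
/// ```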
#[track_caller]
#[cfg_attr(target_os = "wasi", allow(dead_code))]
pub(crate) fn spawn_blocking<F, R>(func: F) -> JoinHandle<R>
where
    F: FnOnce() -> R + Send + 'static,
    R: Send + 'static,
{
    let rt = Handle::current();
    rt.spawn_blocking(func)
}

cfg_fs! {
    #[cfg_attr(any(
        all(loom, not(test)), // the function is covered by loom tests
        test
    ), allow(dead_code))]
    /// Runs the provided function on an executor dedicated to blocking
    /// operations. Tasks will be scheduled as mandatory, meaning they are
    /// guaranteed to run unless a shutdown is already taking place. In case a
    /// shutdown is already taking place, `None` will be returned.
    pub(crate) fn spawn_mandatory_blocking<F, R>(func: F) -> Option<JoinHandle<R>>
    where
        F: FnOnce() -> R + Send + 'static,
        R: Send + 'static,
    {
        let rt = Handle::current();
        rt.inner.blocking_spawner().spawn_mandatory_blocking(&rt, func)
    }
}
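
// Usage sketch for the mandatory variant (hypothetical `cfg_fs` caller;
// `data` and `write_all_blocking` are illustrative names, not real APIs):
//
//     match spawn_mandatory_blocking(move || write_all_blocking(&data)) {
//         Some(handle) => { /* the write is guaranteed to run */ }
//         None => { /* runtime already shutting down; surface an error */ }
//     }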

// ===== impl BlockingPool =====

impl BlockingPool {
    pub(crate) fn new(builder: &Builder, thread_cap: usize) -> BlockingPool {
        let (shutdown_tx, shutdown_rx) = shutdown::channel();
        let keep_alive = builder.keep_alive.unwrap_or(KEEP_ALIVE);

        BlockingPool {
            spawner: Spawner {
                inner: Arc::new(Inner {
                    shared: Mutex::new(Shared {
                        queue: VecDeque::new(),
                        num_notify: 0,
                        shutdown: false,
                        shutdown_tx: Some(shutdown_tx),
                        last_exiting_thread: None,
                        worker_threads: HashMap::new(),
                        worker_thread_index: 0,
                    }),
                    condvar: Condvar::new(),
                    thread_name: builder.thread_name.clone(),
                    stack_size: builder.thread_stack_size,
                    after_start: builder.after_start.clone(),
                    before_stop: builder.before_stop.clone(),
                    thread_cap,
                    keep_alive,
                    metrics: SpawnerMetrics::default(),
                }),
            },
            shutdown_rx,
        }
    }

    pub(crate) fn spawner(&self) -> &Spawner {
        &self.spawner
    }

    pub(crate) fn shutdown(&mut self, timeout: Option<Duration>) {
        let mut shared = self.spawner.inner.shared.lock();

        // This function can be called multiple times: first by an explicit
        // call to `shutdown`, then again by the drop handler. The flag
        // prevents shutting down twice.
        if shared.shutdown {
            return;
        }

        shared.shutdown = true;
        shared.shutdown_tx = None;
        self.spawner.inner.condvar.notify_all();

        let last_exited_thread = std::mem::take(&mut shared.last_exiting_thread);
        let workers = std::mem::take(&mut shared.worker_threads);

        drop(shared);

        if self.shutdown_rx.wait(timeout) {
            let _ = last_exited_thread.map(thread::JoinHandle::join);

            // Loom requires that execution be deterministic, so sort by thread ID before joining.
            // (HashMaps use a randomly-seeded hash function, so the order is nondeterministic.)
            #[cfg(loom)]
            let workers: Vec<(usize, thread::JoinHandle<()>)> = {
                let mut workers: Vec<_> = workers.into_iter().collect();
                workers.sort_by_key(|(id, _)| *id);
                workers
            };

            for (_id, handle) in workers {
                let _ = handle.join();
            }
        }
    }
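
    // From the public API, this path is reached via `Runtime::shutdown_timeout`
    // (or implicitly on drop, with no timeout). A minimal sketch:
    //
    //     let rt = tokio::runtime::Runtime::new().unwrap();
    //     rt.shutdown_timeout(std::time::Duration::from_secs(1));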
}

impl Drop for BlockingPool {
    fn drop(&mut self) {
        self.shutdown(None);
    }
}

impl fmt::Debug for BlockingPool {
    fn fmt(&self, fmt: &mut fmt::Formatter<'_>) -> fmt::Result {
        fmt.debug_struct("BlockingPool").finish()
    }
}

// ===== impl Spawner =====

impl Spawner {
    #[track_caller]
    pub(crate) fn spawn_blocking<F, R>(&self, rt: &Handle, func: F) -> JoinHandle<R>
    where
        F: FnOnce() -> R + Send + 'static,
        R: Send + 'static,
    {
        let fn_size = std::mem::size_of::<F>();
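        // Closures larger than `BOX_FUTURE_THRESHOLD` are boxed before being
        // wrapped in a task, keeping the task allocation itself small.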
        let (join_handle, spawn_result) = if fn_size > BOX_FUTURE_THRESHOLD {
            self.spawn_blocking_inner(
                Box::new(func),
                Mandatory::NonMandatory,
                SpawnMeta::new_unnamed(fn_size),
                rt,
            )
        } else {
            self.spawn_blocking_inner(
                func,
                Mandatory::NonMandatory,
                SpawnMeta::new_unnamed(fn_size),
                rt,
            )
        };

        match spawn_result {
            Ok(()) => join_handle,
            // Compat: do not panic here; return the join_handle even though it will never resolve.
            Err(SpawnError::ShuttingDown) => join_handle,
            Err(SpawnError::NoThreads(e)) => {
                panic!("OS can't spawn worker thread: {e}")
            }
        }
    }

    cfg_fs! {
        #[track_caller]
        #[cfg_attr(any(
            all(loom, not(test)), // the function is covered by loom tests
            test
        ), allow(dead_code))]
        pub(crate) fn spawn_mandatory_blocking<F, R>(&self, rt: &Handle, func: F) -> Option<JoinHandle<R>>
        where
            F: FnOnce() -> R + Send + 'static,
            R: Send + 'static,
        {
            let fn_size = std::mem::size_of::<F>();
            let (join_handle, spawn_result) = if fn_size > BOX_FUTURE_THRESHOLD {
                self.spawn_blocking_inner(
                    Box::new(func),
                    Mandatory::Mandatory,
                    SpawnMeta::new_unnamed(fn_size),
                    rt,
                )
            } else {
                self.spawn_blocking_inner(
                    func,
                    Mandatory::Mandatory,
                    SpawnMeta::new_unnamed(fn_size),
                    rt,
                )
            };

            if spawn_result.is_ok() {
                Some(join_handle)
            } else {
                None
            }
        }
    }

    #[track_caller]
    pub(crate) fn spawn_blocking_inner<F, R>(
        &self,
        func: F,
        is_mandatory: Mandatory,
        spawn_meta: SpawnMeta<'_>,
        rt: &Handle,
    ) -> (JoinHandle<R>, Result<(), SpawnError>)
    where
        F: FnOnce() -> R + Send + 'static,
        R: Send + 'static,
    {
        let id = task::Id::next();
        let fut =
            blocking_task::<F, BlockingTask<F>>(BlockingTask::new(func), spawn_meta, id.as_u64());

        let (task, handle) = task::unowned(fut, BlockingSchedule::new(rt), id);

        let spawned = self.spawn_task(Task::new(task, is_mandatory), rt);
        (handle, spawned)
    }

    fn spawn_task(&self, task: Task, rt: &Handle) -> Result<(), SpawnError> {
        let mut shared = self.inner.shared.lock();

        if shared.shutdown {
            // Shut down the task: it's fine to shut down this task (even if
            // mandatory) because it was scheduled after the shutdown of the
            // runtime began.
            task.task.shutdown();

            // No need to even push this task; it would never get picked up.
            return Err(SpawnError::ShuttingDown);
        }

        shared.queue.push_back(task);
        self.inner.metrics.inc_queue_depth();

        if self.inner.metrics.num_idle_threads() == 0 {
            // No threads are able to process the task.

            if self.inner.metrics.num_threads() == self.inner.thread_cap {
                // At the maximum number of threads; the task waits in the queue.
            } else {
                assert!(shared.shutdown_tx.is_some());
                let shutdown_tx = shared.shutdown_tx.clone();

                if let Some(shutdown_tx) = shutdown_tx {
                    let id = shared.worker_thread_index;

                    match self.spawn_thread(shutdown_tx, rt, id) {
                        Ok(handle) => {
                            self.inner.metrics.inc_num_threads();
                            shared.worker_thread_index += 1;
                            shared.worker_threads.insert(id, handle);
                        }
                        Err(ref e)
                            if is_temporary_os_thread_error(e)
                                && self.inner.metrics.num_threads() > 0 =>
                        {
                            // The OS temporarily failed to spawn a new thread.
                            // The task will be picked up eventually by a
                            // currently busy thread.
                        }
                        Err(e) => {
                            // The OS refused to spawn the thread and there is
                            // no thread to pick up the task that has just been
                            // pushed to the queue.
                            return Err(SpawnError::NoThreads(e));
                        }
                    }
                }
            }
        } else {
            // Notify an idle worker thread. The notification counter tracks
            // exactly how many notifications are needed: condition variables
            // can wake spuriously, and counting keeps the wakeup accounting
            // consistent.
            self.inner.metrics.dec_num_idle_threads();
            shared.num_notify += 1;
            self.inner.condvar.notify_one();
        }

        Ok(())
    }

    fn spawn_thread(
        &self,
        shutdown_tx: shutdown::Sender,
        rt: &Handle,
        id: usize,
    ) -> io::Result<thread::JoinHandle<()>> {
        let mut builder = thread::Builder::new().name((self.inner.thread_name)());

        if let Some(stack_size) = self.inner.stack_size {
            builder = builder.stack_size(stack_size);
        }

        let rt = rt.clone();

        builder.spawn(move || {
            // Only the reference should be moved into the closure.
            let _enter = rt.enter();
            rt.inner.blocking_spawner().inner.run(id);
            drop(shutdown_tx);
        })
    }
}

cfg_unstable_metrics! {
    impl Spawner {
        pub(crate) fn num_threads(&self) -> usize {
            self.inner.metrics.num_threads()
        }

        pub(crate) fn num_idle_threads(&self) -> usize {
            self.inner.metrics.num_idle_threads()
        }

        pub(crate) fn queue_depth(&self) -> usize {
            self.inner.metrics.queue_depth()
        }
    }
}

// Tells whether the error when spawning a thread is temporary.
#[inline]
fn is_temporary_os_thread_error(error: &io::Error) -> bool {
    matches!(error.kind(), io::ErrorKind::WouldBlock)
}

impl Inner {
    fn run(&self, worker_thread_id: usize) {
        if let Some(f) = &self.after_start {
            f();
        }

        let mut shared = self.shared.lock();
        let mut join_on_thread = None;

        'main: loop {
            // BUSY
            while let Some(task) = shared.queue.pop_front() {
                self.metrics.dec_queue_depth();
                drop(shared);
                task.run();

                shared = self.shared.lock();
            }

            // IDLE
            self.metrics.inc_num_idle_threads();

            while !shared.shutdown {
                let lock_result = self.condvar.wait_timeout(shared, self.keep_alive).unwrap();

                shared = lock_result.0;
                let timeout_result = lock_result.1;

                if shared.num_notify != 0 {
                    // We have received a legitimate wakeup; acknowledge it by
                    // decrementing the counter and transition to the BUSY
                    // state.
                    shared.num_notify -= 1;
                    break;
                }

                // Even if the condvar "timed out", if the pool is entering the
                // shutdown phase, we want to perform the cleanup logic.
                if !shared.shutdown && timeout_result.timed_out() {
                    // We'll join the prior timed-out thread's JoinHandle after dropping the lock.
                    // This isn't done when shutting down, because the thread calling shutdown will
                    // handle joining everything.
                    let my_handle = shared.worker_threads.remove(&worker_thread_id);
                    join_on_thread = std::mem::replace(&mut shared.last_exiting_thread, my_handle);

                    break 'main;
                }

                // Spurious wakeup detected; go back to sleep.
            }

            if shared.shutdown {
                // Drain the queue.
                while let Some(task) = shared.queue.pop_front() {
                    self.metrics.dec_queue_depth();
                    drop(shared);

                    task.shutdown_or_run_if_mandatory();

                    shared = self.shared.lock();
                }

                // Work was produced, and we "took" it (by decrementing num_notify).
                // This means that num_idle was decremented once for our wakeup.
                // But, since we are exiting, we need to "undo" that, as we'll stay idle.
                self.metrics.inc_num_idle_threads();
                // NOTE: Technically we should also do num_notify++ and notify again,
                // but since we're shutting down anyway, that won't be necessary.
                break;
            }
        }

        // Thread exit
        self.metrics.dec_num_threads();

        // num_idle should now be tracked exactly; panic with a descriptive
        // message if it is not the case.
        let prev_idle = self.metrics.dec_num_idle_threads();
        assert!(
            prev_idle >= self.metrics.num_idle_threads(),
            "num_idle_threads underflowed on thread exit"
        );

        if shared.shutdown && self.metrics.num_threads() == 0 {
            self.condvar.notify_one();
        }

        drop(shared);

        if let Some(f) = &self.before_stop {
            f();
        }

        if let Some(handle) = join_on_thread {
            let _ = handle.join();
        }
    }
}
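
// The notify-counting pattern in `run` above, reduced to a standalone sketch
// (illustrative only; `guard` is a `Shared`-like struct behind a std mutex):
//
//     let mut guard = mutex.lock().unwrap();
//     loop {
//         if guard.num_notify != 0 {
//             guard.num_notify -= 1; // consume exactly one notification
//             break;
//         }
//         let (g, timeout) = condvar.wait_timeout(guard, keep_alive).unwrap();
//         guard = g;
//         if timeout.timed_out() { break; } // idle too long: exit the thread
//         // Otherwise it was a spurious wakeup; loop and re-check.
//     }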

impl fmt::Debug for Spawner {
    fn fmt(&self, fmt: &mut fmt::Formatter<'_>) -> fmt::Result {
        fmt.debug_struct("blocking::Spawner").finish()
    }
}