# Copyright 2009 Brian Quinlan. All Rights Reserved.
# Licensed to PSF under a Contributor Agreement.

"""Implements ThreadPoolExecutor."""

__author__ = 'Brian Quinlan (brian@sweetapp.com)'

from concurrent.futures import _base
import itertools
import queue
import threading
import types
import weakref
import os


# Maps each worker thread to the work queue it consumes so that
# _python_exit() can wake up and join every worker. Threads are held weakly.
_threads_queues = weakref.WeakKeyDictionary()
# Becomes True once _python_exit() has run; workers and submit() check it.
_shutdown = False
# Lock that ensures that new workers are not created while the interpreter is
# shutting down. Must be held while mutating _threads_queues and _shutdown.
_global_shutdown_lock = threading.Lock()

def _python_exit():
    """Stop all registered worker threads.

    Sets the module-level ``_shutdown`` flag while holding
    ``_global_shutdown_lock``, then puts a ``None`` wake-up sentinel on every
    queue registered in ``_threads_queues`` and joins the matching threads.
    """
    global _shutdown
    with _global_shutdown_lock:
        _shutdown = True
    # Snapshot the weak dictionary so it cannot change size while iterating.
    items = list(_threads_queues.items())
    # Wake every worker first, then wait for them, so they wind down
    # concurrently instead of one after another.
    for _, q in items:
        q.put(None)
    for t, _ in items:
        t.join()

# Register for `_python_exit()` to be called just before joining all
# non-daemon threads. This is used instead of `atexit.register()` for
# compatibility with subinterpreters, which no longer support daemon threads.
# See bpo-39812 for context.
threading._register_atexit(_python_exit)


class _WorkItem:
    """A queued call: the callable, its arguments and the future to resolve."""

    def __init__(self, future, fn, args, kwargs):
        self.future = future
        self.fn = fn
        self.args = args
        self.kwargs = kwargs

    def run(self):
        """Call ``fn(*args, **kwargs)`` and record the outcome on the future.

        Returns without calling ``fn`` when
        ``future.set_running_or_notify_cancel()`` returns a false value.
        Any ``BaseException`` raised by ``fn`` is stored on the future rather
        than propagated; otherwise the return value is stored as the result.
        """
        if not self.future.set_running_or_notify_cancel():
            return

        try:
            result = self.fn(*self.args, **self.kwargs)
        except BaseException as exc:
            self.future.set_exception(exc)
            # Break a reference cycle with the exception 'exc'
            self = None
        else:
            self.future.set_result(result)

    # Allows subscripting the class itself, e.g. ``_WorkItem[int]``.
    __class_getitem__ = classmethod(types.GenericAlias)


def _worker(executor_reference, work_queue, initializer, initargs):
    """Thread target: run work items from ``work_queue`` until told to stop.

    Args:
        executor_reference: A callable (a weak reference) returning the owning
            executor, or None once it has been collected.
        work_queue: Queue yielding work items, or ``None`` as a wake-up
            sentinel.
        initializer: Optional callable run once before any work item.
        initargs: Arguments passed to ``initializer``.

    If the initializer raises, the error is logged, the executor (if still
    alive) is notified through ``_initializer_failed()`` and the thread exits.
    Any exception escaping the main loop is logged rather than propagated.
    """
    if initializer is not None:
        try:
            initializer(*initargs)
        except BaseException:
            _base.LOGGER.critical('Exception in initializer:', exc_info=True)
            executor = executor_reference()
            if executor is not None:
                executor._initializer_failed()
            return
    try:
        while True:
            work_item = work_queue.get(block=True)
            if work_item is not None:
                work_item.run()
                # Delete references to object. See issue16284
                del work_item

                # attempt to increment idle count
                executor = executor_reference()
                if executor is not None:
                    executor._idle_semaphore.release()
                # Drop the strong reference so this thread does not keep the
                # executor alive while blocked on the queue.
                del executor
                continue

            # A None item is only a wake-up call: decide whether to exit.
            executor = executor_reference()
            # Exit if:
            #   - The interpreter is shutting down OR
            #   - The executor that owns the worker has been collected OR
            #   - The executor that owns the worker has been shutdown.
            if _shutdown or executor is None or executor._shutdown:
                # Flag the executor as shutting down as early as possible if it
                # is not gc-ed yet.
                if executor is not None:
                    executor._shutdown = True
                # Notice other workers
                work_queue.put(None)
                return
            del executor
    except BaseException:
        _base.LOGGER.critical('Exception in worker', exc_info=True)


class BrokenThreadPool(_base.BrokenExecutor):
    """
    Raised when a worker thread in a ThreadPoolExecutor failed initializing.
    """


class ThreadPoolExecutor(_base.Executor):
    """Executor that runs submitted callables on lazily started threads."""

    # Used to assign unique thread names when thread_name_prefix is not supplied.
    _counter = itertools.count().__next__

    def __init__(self, max_workers=None, thread_name_prefix='',
                 initializer=None, initargs=()):
        """Initializes a new ThreadPoolExecutor instance.

        Args:
            max_workers: The maximum number of threads that can be used to
                execute the given calls.
            thread_name_prefix: An optional name prefix to give our threads.
            initializer: A callable used to initialize worker threads.
            initargs: A tuple of arguments to pass to the initializer.

        Raises:
            ValueError: If max_workers is not greater than 0.
            TypeError: If initializer is given but is not callable.
        """
        if max_workers is None:
            # ThreadPoolExecutor is often used to:
            # * CPU bound task which releases GIL
            # * I/O bound task (which releases GIL, of course)
            #
            # We use cpu_count + 4 for both types of tasks.
            # But we limit it to 32 to avoid consuming surprisingly large resource
            # on many core machine.
            max_workers = min(32, (os.cpu_count() or 1) + 4)
        if max_workers <= 0:
            raise ValueError("max_workers must be greater than 0")

        if initializer is not None and not callable(initializer):
            raise TypeError("initializer must be a callable")

        self._max_workers = max_workers
        self._work_queue = queue.SimpleQueue()
        # Released by a worker after each finished item; a successful
        # non-blocking acquire in _adjust_thread_count() skips spawning.
        self._idle_semaphore = threading.Semaphore(0)
        self._threads = set()
        # False while healthy; replaced by an error message string once a
        # worker initializer has failed.
        self._broken = False
        self._shutdown = False
        self._shutdown_lock = threading.Lock()
        self._thread_name_prefix = (thread_name_prefix or
                                    ("ThreadPoolExecutor-%d" % self._counter()))
        self._initializer = initializer
        self._initargs = initargs

    def submit(self, fn, /, *args, **kwargs):
        # The docstring is copied from _base.Executor.submit below.
        # Both locks are held so that neither this executor nor the
        # interpreter can begin shutting down while the item is enqueued.
        with self._shutdown_lock, _global_shutdown_lock:
            if self._broken:
                raise BrokenThreadPool(self._broken)

            if self._shutdown:
                raise RuntimeError('cannot schedule new futures after shutdown')
            if _shutdown:
                raise RuntimeError('cannot schedule new futures after '
                                   'interpreter shutdown')

            f = _base.Future()
            w = _WorkItem(f, fn, args, kwargs)

            self._work_queue.put(w)
            self._adjust_thread_count()
            return f
    submit.__doc__ = _base.Executor.submit.__doc__

    def _adjust_thread_count(self):
        """Start one more worker thread unless an idle one is available."""
        # if idle threads are available, don't spin new threads
        if self._idle_semaphore.acquire(timeout=0):
            return

        # When the executor gets lost, the weakref callback will wake up
        # the worker threads.
        def weakref_cb(_, q=self._work_queue):
            q.put(None)

        num_threads = len(self._threads)
        if num_threads < self._max_workers:
            thread_name = '%s_%d' % (self._thread_name_prefix or self,
                                     num_threads)
            # The worker only receives a weak reference, so it does not keep
            # this executor alive.
            t = threading.Thread(name=thread_name, target=_worker,
                                 args=(weakref.ref(self, weakref_cb),
                                       self._work_queue,
                                       self._initializer,
                                       self._initargs))
            t.start()
            self._threads.add(t)
            _threads_queues[t] = self._work_queue

    def _initializer_failed(self):
        """Mark the pool as broken and fail every work item still queued."""
        with self._shutdown_lock:
            self._broken = ('A thread initializer failed, the thread pool '
                            'is not usable anymore')
            # Drain work queue and mark pending futures failed
            while True:
                try:
                    work_item = self._work_queue.get_nowait()
                except queue.Empty:
                    break
                if work_item is not None:
                    work_item.future.set_exception(BrokenThreadPool(self._broken))

    def shutdown(self, wait=True, *, cancel_futures=False):
        # The docstring is copied from _base.Executor.shutdown below.
        with self._shutdown_lock:
            self._shutdown = True
            if cancel_futures:
                # Drain all work items from the queue, and then cancel their
                # associated futures.
                while True:
                    try:
                        work_item = self._work_queue.get_nowait()
                    except queue.Empty:
                        break
                    if work_item is not None:
                        work_item.future.cancel()

            # Send a wake-up to prevent threads calling
            # _work_queue.get(block=True) from permanently blocking.
            self._work_queue.put(None)
        # Join outside the lock so workers are not blocked on it while exiting.
        if wait:
            for t in self._threads:
                t.join()
    shutdown.__doc__ = _base.Executor.shutdown.__doc__