blob: 51c942f51abd371e80ffa07c2b212336afb8eae2 [file] [log] [blame]
# Copyright 2009 Brian Quinlan. All Rights Reserved.
# Licensed to PSF under a Contributor Agreement.
3
4"""Implements ThreadPoolExecutor."""
5
6__author__ = 'Brian Quinlan (brian@sweetapp.com)'
7
Brian Quinlan81c4d362010-09-18 22:35:02 +00008from concurrent.futures import _base
Gregory P. Smitha3d91b42017-06-21 23:41:13 -07009import itertools
Brian Quinlan81c4d362010-09-18 22:35:02 +000010import queue
11import threading
Batuhan Taşkaya03615562020-04-10 17:46:36 +030012import types
Brian Quinlan81c4d362010-09-18 22:35:02 +000013import weakref
Guido van Rossumcfd46612014-09-02 10:39:18 -070014import os
Brian Quinlan81c4d362010-09-18 22:35:02 +000015
Brian Quinlan81c4d362010-09-18 22:35:02 +000016
# Becomes True once interpreter shutdown has started (see `_python_exit`).
_shutdown = False
# Serializes interpreter shutdown against worker creation: this lock must be
# held while mutating `_shutdown` or `_threads_queues`, so that no new worker
# is created while the interpreter is shutting down.
_global_shutdown_lock = threading.Lock()
# Maps each worker thread to the work queue it reads from.  Keys are held
# weakly, so an entry disappears when its thread object is collected.
_threads_queues = weakref.WeakKeyDictionary()
Brian Quinlan81c4d362010-09-18 22:35:02 +000022
def _python_exit():
    """Stop every registered worker thread and wait for it to finish.

    Sets the module-wide `_shutdown` flag under `_global_shutdown_lock`,
    posts a ``None`` wake-up to the queue of every thread recorded in
    `_threads_queues`, and then joins each of those threads.
    """
    global _shutdown
    with _global_shutdown_lock:
        _shutdown = True
    # Work from a snapshot so both passes see the same (thread, queue) pairs.
    registered = list(_threads_queues.items())
    # Wake everybody up first, then wait, so the workers wind down together.
    for _, work_queue in registered:
        work_queue.put(None)
    for thread, _ in registered:
        thread.join()
Brian Quinlan81c4d362010-09-18 22:35:02 +000032
# Arrange for `_python_exit()` to run just before all non-daemon threads are
# joined.  `threading._register_atexit()` is used instead of
# `atexit.register()` for compatibility with subinterpreters, which no longer
# support daemon threads.  See bpo-39812 for context.
threading._register_atexit(_python_exit)

# Where fork hooks exist, hold `_global_shutdown_lock` across the fork: it is
# acquired before forking, released again in the parent, and reinitialized in
# the child process.
if hasattr(os, "register_at_fork"):
    os.register_at_fork(
        before=_global_shutdown_lock.acquire,
        after_in_parent=_global_shutdown_lock.release,
        after_in_child=_global_shutdown_lock._at_fork_reinit,
    )
44
Antoine Pitrou63ff4132017-11-04 11:05:49 +010045
class _WorkItem:
    """A pending call paired with the future that will report its outcome."""

    def __init__(self, future, fn, args, kwargs):
        self.future, self.fn = future, fn
        self.args, self.kwargs = args, kwargs

    def run(self):
        """Invoke the stored callable and publish the outcome on the future.

        Does nothing when `set_running_or_notify_cancel()` returns a false
        value.  Any exception raised by the callable (BaseException
        included) is stored on the future rather than propagated.
        """
        if not self.future.set_running_or_notify_cancel():
            return

        try:
            outcome = self.fn(*self.args, **self.kwargs)
        except BaseException as exc:
            self.future.set_exception(exc)
            # Break a reference cycle with the exception 'exc'
            self = None
            return

        self.future.set_result(outcome)

    __class_getitem__ = classmethod(types.GenericAlias)
67
Antoine Pitrou63ff4132017-11-04 11:05:49 +010068
def _worker(executor_reference, work_queue, initializer, initargs):
    """Thread target: run work items from *work_queue* until told to exit.

    Args:
        executor_reference: Zero-argument callable (a weak reference to the
            owning executor) returning the executor, or None once it has
            been collected.
        work_queue: Queue of work items.  A ``None`` entry is a wake-up
            sentinel that makes the worker re-check its exit conditions.
        initializer: Optional callable run once before any work item.
        initargs: Positional arguments passed to *initializer*.

    If *initializer* raises, the failure is logged, the executor (when still
    alive) is notified through `_initializer_failed()`, and the thread exits
    without processing any work.  Any exception escaping the main loop is
    logged and ends the thread.
    """
    if initializer is not None:
        try:
            initializer(*initargs)
        except BaseException:
            _base.LOGGER.critical('Exception in initializer:', exc_info=True)
            executor = executor_reference()
            if executor is not None:
                executor._initializer_failed()
            return
    try:
        while True:
            try:
                work_item = work_queue.get_nowait()
            except queue.Empty:
                # Advertise this thread as idle only when there really is
                # nothing left to do.  Releasing the semaphore after every
                # completed item (even with more work already queued)
                # inflates the idle count, and the executor then skips
                # spawning threads it actually needs.
                executor = executor_reference()
                if executor is not None:
                    executor._idle_semaphore.release()
                del executor
                work_item = work_queue.get(block=True)

            if work_item is not None:
                work_item.run()
                # Delete references to object. See issue16284
                del work_item
                continue

            executor = executor_reference()
            # Exit if:
            #   - The interpreter is shutting down OR
            #   - The executor that owns the worker has been collected OR
            #   - The executor that owns the worker has been shutdown.
            if _shutdown or executor is None or executor._shutdown:
                # Flag the executor as shutting down as early as possible if it
                # is not gc-ed yet.
                if executor is not None:
                    executor._shutdown = True
                # Notice other workers
                work_queue.put(None)
                return
            del executor
    except BaseException:
        _base.LOGGER.critical('Exception in worker', exc_info=True)
110
Antoine Pitrou63ff4132017-11-04 11:05:49 +0100111
class BrokenThreadPool(_base.BrokenExecutor):
    """Raised when a ThreadPoolExecutor worker thread fails to initialize."""
116
117
class ThreadPoolExecutor(_base.Executor):
    """Executor that runs submitted calls on a pool of worker threads."""

    # Used to assign unique thread names when thread_name_prefix is not supplied.
    _counter = itertools.count().__next__

    def __init__(self, max_workers=None, thread_name_prefix='',
                 initializer=None, initargs=()):
        """Initializes a new ThreadPoolExecutor instance.

        Args:
            max_workers: The maximum number of threads that can be used to
                execute the given calls.
            thread_name_prefix: An optional name prefix to give our threads.
            initializer: A callable used to initialize worker threads.
            initargs: A tuple of arguments to pass to the initializer.

        Raises:
            ValueError: If max_workers is not greater than 0.
            TypeError: If initializer is given but is not callable.
        """
        if max_workers is None:
            # ThreadPoolExecutor is often used for:
            # * CPU bound tasks which release the GIL
            # * I/O bound tasks (which release the GIL, of course)
            #
            # cpu_count + 4 is used for both kinds of task, capped at 32 to
            # avoid consuming surprisingly large resources on many-core
            # machines.
            cpu_total = os.cpu_count() or 1
            max_workers = min(32, cpu_total + 4)
        if max_workers <= 0:
            raise ValueError("max_workers must be greater than 0")

        if not (initializer is None or callable(initializer)):
            raise TypeError("initializer must be a callable")

        # Only draw from the shared counter when no prefix was supplied.
        if not thread_name_prefix:
            thread_name_prefix = "ThreadPoolExecutor-%d" % self._counter()

        self._max_workers = max_workers
        self._work_queue = queue.SimpleQueue()
        self._idle_semaphore = threading.Semaphore(0)
        self._threads = set()
        self._broken = False
        self._shutdown = False
        self._shutdown_lock = threading.Lock()
        self._thread_name_prefix = thread_name_prefix
        self._initializer = initializer
        self._initargs = initargs

    def submit(self, fn, /, *args, **kwargs):
        with self._shutdown_lock, _global_shutdown_lock:
            if self._broken:
                raise BrokenThreadPool(self._broken)

            if self._shutdown:
                raise RuntimeError('cannot schedule new futures after shutdown')
            if _shutdown:
                raise RuntimeError('cannot schedule new futures '
                                   'after interpreter shutdown')

            future = _base.Future()
            self._work_queue.put(_WorkItem(future, fn, args, kwargs))
            self._adjust_thread_count()
            return future
    submit.__doc__ = _base.Executor.submit.__doc__

    def _adjust_thread_count(self):
        """Start one more worker thread unless an idle one can take the work."""
        # An idle worker is available: let it pick the item up.
        if self._idle_semaphore.acquire(timeout=0):
            return

        thread_total = len(self._threads)
        if thread_total >= self._max_workers:
            return

        # When the executor gets lost, the weakref callback will wake up
        # the worker threads.
        def weakref_cb(_, q=self._work_queue):
            q.put(None)

        worker = threading.Thread(
            target=_worker,
            name='%s_%d' % (self._thread_name_prefix or self, thread_total),
            args=(
                weakref.ref(self, weakref_cb),
                self._work_queue,
                self._initializer,
                self._initargs,
            ),
        )
        worker.start()
        self._threads.add(worker)
        _threads_queues[worker] = self._work_queue

    def _initializer_failed(self):
        """Mark the pool as broken and fail every queued work item."""
        with self._shutdown_lock:
            self._broken = ('A thread initializer failed, the thread pool '
                            'is not usable anymore')
            # Drain work queue and mark pending futures failed
            while True:
                try:
                    pending = self._work_queue.get_nowait()
                except queue.Empty:
                    break
                if pending is None:
                    # Wake-up sentinel, not a work item.
                    continue
                pending.future.set_exception(BrokenThreadPool(self._broken))

    def shutdown(self, wait=True, *, cancel_futures=False):
        with self._shutdown_lock:
            self._shutdown = True
            # Only entered when cancel_futures is set: drain all work items
            # from the queue and cancel their associated futures.
            while cancel_futures:
                try:
                    pending = self._work_queue.get_nowait()
                except queue.Empty:
                    break
                if pending is not None:
                    pending.future.cancel()

            # Send a wake-up to prevent threads calling
            # _work_queue.get(block=True) from permanently blocking.
            self._work_queue.put(None)
        if not wait:
            return
        for worker in self._threads:
            worker.join()
    shutdown.__doc__ = _base.Executor.shutdown.__doc__