blob: 0a61e3a9ac1bd1b8232eb8bb893b97a4327bc46c [file] [log] [blame]
Brian Quinlan81c4d362010-09-18 22:35:02 +00001# Copyright 2009 Brian Quinlan. All Rights Reserved.
2# Licensed to PSF under a Contributor Agreement.
3
4"""Implements ThreadPoolExecutor."""
5
6__author__ = 'Brian Quinlan (brian@sweetapp.com)'
7
8import atexit
9from concurrent.futures import _base
Gregory P. Smitha3d91b42017-06-21 23:41:13 -070010import itertools
Brian Quinlan81c4d362010-09-18 22:35:02 +000011import queue
12import threading
13import weakref
Guido van Rossumcfd46612014-09-02 10:39:18 -070014import os
Brian Quinlan81c4d362010-09-18 22:35:02 +000015
# Workers are created as daemon threads. This is done to allow the interpreter
# to exit when there are still idle threads in a ThreadPoolExecutor's thread
# pool (i.e. shutdown() was not called). However, allowing workers to die with
# the interpreter has two undesirable properties:
#   - The workers would still be running during interpreter shutdown,
#     meaning that they would fail in unpredictable ways.
#   - The workers could be killed while evaluating a work item, which could
#     be bad if the callable being evaluated has external side-effects e.g.
#     writing to a file.
#
# To work around this problem, an exit handler is installed which tells the
# workers to exit when their work queues are empty and then waits until the
# threads finish.
29
# Maps each worker thread to the queue it reads from. Keys are held weakly,
# so an entry disappears once its thread object is garbage-collected.
_threads_queues = weakref.WeakKeyDictionary()
# Set to True by the exit handler below; checked by _worker() and by
# ThreadPoolExecutor.submit().
_shutdown = False


def _python_exit():
    """Exit handler: wake every registered worker, then wait for each one.

    Sets the module-level ``_shutdown`` flag, posts a ``None`` sentinel on
    every registered work queue and finally joins every registered thread.
    """
    global _shutdown
    _shutdown = True
    # Take a snapshot first: the list holds strong references, so the weak
    # dictionary cannot change between the two passes.
    registered = list(_threads_queues.items())
    # Post all sentinels before joining anything, so every worker is woken
    # before this function starts blocking on the first join().
    for _, work_queue in registered:
        work_queue.put(None)
    for thread, _ in registered:
        thread.join()


atexit.register(_python_exit)
43
Antoine Pitrou63ff4132017-11-04 11:05:49 +010044
class _WorkItem:
    """A pending call: the callable, its arguments and the future to fulfil."""

    def __init__(self, future, fn, args, kwargs):
        self.future, self.fn = future, fn
        self.args, self.kwargs = args, kwargs

    def run(self):
        """Invoke the stored callable and record the outcome on the future.

        Does nothing when ``set_running_or_notify_cancel()`` returns a false
        value. Otherwise the return value is stored with ``set_result()``,
        or any raised ``BaseException`` is stored with ``set_exception()``.
        """
        if not self.future.set_running_or_notify_cancel():
            return

        try:
            outcome = self.fn(*self.args, **self.kwargs)
        except BaseException as exc:
            self.future.set_exception(exc)
            # Break a reference cycle with the exception 'exc'
            self = None
            return
        # Reached only when the callable returned normally; errors raised by
        # set_result() itself are deliberately not caught here.
        self.future.set_result(outcome)
64
Antoine Pitrou63ff4132017-11-04 11:05:49 +010065
def _worker(executor_reference, work_queue, initializer, initargs):
    """Thread body: run the initializer, then process work items until told to stop.

    Args:
        executor_reference: A callable (a weak reference in practice) that
            returns the owning executor, or None once it has been collected.
        work_queue: Queue yielding work items; a ``None`` entry is a wake-up
            sentinel rather than work.
        initializer: Optional callable invoked once before the loop starts.
        initargs: Positional arguments for ``initializer``.

    Any exception escaping the processing loop is logged, not propagated.
    """
    if initializer is not None:
        try:
            initializer(*initargs)
        except BaseException:
            _base.LOGGER.critical('Exception in initializer:', exc_info=True)
            owner = executor_reference()
            if owner is not None:
                owner._initializer_failed()
            return
    try:
        while True:
            task = work_queue.get(block=True)
            if task is None:
                # Sentinel: decide whether this is a real request to stop.
                owner = executor_reference()
                # Keep running unless:
                #   - The interpreter is shutting down OR
                #   - The executor that owns the worker has been collected OR
                #   - The executor that owns the worker has been shutdown.
                if not (_shutdown or owner is None or owner._shutdown):
                    # Drop the strong reference before blocking again.
                    del owner
                    continue
                # Flag the executor as shutting down as early as possible if
                # it is not gc-ed yet.
                if owner is not None:
                    owner._shutdown = True
                # Notice other workers
                work_queue.put(None)
                return
            task.run()
            # Delete references to object. See issue16284
            del task
    except BaseException:
        _base.LOGGER.critical('Exception in worker', exc_info=True)
100
Antoine Pitrou63ff4132017-11-04 11:05:49 +0100101
class BrokenThreadPool(_base.BrokenExecutor):
    """Raised when a worker thread in a ThreadPoolExecutor failed initializing."""
106
107
class ThreadPoolExecutor(_base.Executor):
    """Executor that runs submitted callables on a pool of daemon threads.

    Threads are started lazily: each submit() starts one more worker while
    fewer than ``max_workers`` threads exist. All workers share a single
    work queue; a ``None`` entry on that queue is a wake-up sentinel.
    """

    # Used to assign unique thread names when thread_name_prefix is not supplied.
    _counter = itertools.count().__next__

    def __init__(self, max_workers=None, thread_name_prefix='',
                 initializer=None, initargs=()):
        """Initializes a new ThreadPoolExecutor instance.

        Args:
            max_workers: The maximum number of threads that can be used to
                execute the given calls. Defaults to five times the CPU
                count (or 5 when the CPU count is unknown).
            thread_name_prefix: An optional name prefix to give our threads.
            initializer: A callable used to initialize worker threads.
            initargs: A tuple of arguments to pass to the initializer.

        Raises:
            ValueError: If max_workers is less than or equal to 0.
            TypeError: If initializer is neither None nor callable.
        """
        if max_workers is None:
            # Use this number because ThreadPoolExecutor is often
            # used to overlap I/O instead of CPU work.
            max_workers = (os.cpu_count() or 1) * 5
        if max_workers <= 0:
            raise ValueError("max_workers must be greater than 0")

        if initializer is not None and not callable(initializer):
            raise TypeError("initializer must be a callable")

        self._max_workers = max_workers
        self._work_queue = queue.SimpleQueue()
        self._threads = set()
        # False while healthy; replaced by an error message string once a
        # worker's initializer has failed.
        self._broken = False
        self._shutdown = False
        self._shutdown_lock = threading.Lock()
        self._thread_name_prefix = (thread_name_prefix or
                                    ("ThreadPoolExecutor-%d" % self._counter()))
        self._initializer = initializer
        self._initargs = initargs

    # The signature is (*args, **kwargs) so that callers may still pass their
    # own 'self' or 'fn' keyword arguments through to the submitted callable;
    # passing the callable itself as fn=... is accepted but deprecated.
    def submit(*args, **kwargs):
        if len(args) >= 2:
            self, fn, *args = args
        elif not args:
            raise TypeError("descriptor 'submit' of 'ThreadPoolExecutor' object "
                            "needs an argument")
        elif 'fn' in kwargs:
            fn = kwargs.pop('fn')
            self, *args = args
            import warnings
            warnings.warn("Passing 'fn' as keyword argument is deprecated",
                          DeprecationWarning, stacklevel=2)
        else:
            raise TypeError('submit expected at least 1 positional argument, '
                            'got %d' % (len(args)-1))

        with self._shutdown_lock:
            if self._broken:
                raise BrokenThreadPool(self._broken)

            if self._shutdown:
                raise RuntimeError('cannot schedule new futures after shutdown')
            if _shutdown:
                raise RuntimeError('cannot schedule new futures after '
                                   'interpreter shutdown')

            f = _base.Future()
            w = _WorkItem(f, fn, args, kwargs)

            self._work_queue.put(w)
            self._adjust_thread_count()
            return f
    submit.__doc__ = _base.Executor.submit.__doc__

    def _adjust_thread_count(self):
        """Start one more worker thread if the pool is below max_workers."""
        # When the executor gets lost, the weakref callback will wake up
        # the worker threads.
        def weakref_cb(_, q=self._work_queue):
            q.put(None)
        # TODO(bquinlan): Should avoid creating new threads if there are more
        # idle threads than items in the work queue.
        num_threads = len(self._threads)
        if num_threads < self._max_workers:
            thread_name = '%s_%d' % (self._thread_name_prefix or self,
                                     num_threads)
            # The worker only receives a weak reference to this executor.
            t = threading.Thread(name=thread_name, target=_worker,
                                 args=(weakref.ref(self, weakref_cb),
                                       self._work_queue,
                                       self._initializer,
                                       self._initargs))
            t.daemon = True
            t.start()
            self._threads.add(t)
            # Register with the module-level exit handler's registry.
            _threads_queues[t] = self._work_queue

    def _initializer_failed(self):
        """Mark the pool as broken and fail every call still waiting in the queue."""
        with self._shutdown_lock:
            self._broken = ('A thread initializer failed, the thread pool '
                            'is not usable anymore')
            # Drain work queue and mark pending futures failed
            while True:
                try:
                    work_item = self._work_queue.get_nowait()
                except queue.Empty:
                    break
                if work_item is None:
                    # Wake-up sentinel, not a call.
                    continue
                future = work_item.future
                # A queued future may already have been cancelled by its
                # owner. Only set the exception when the future accepts the
                # transition to running, so a cancelled future stays
                # cancelled and cannot abort the drain half-way through.
                if future.set_running_or_notify_cancel():
                    future.set_exception(BrokenThreadPool(self._broken))

    def shutdown(self, wait=True):
        with self._shutdown_lock:
            self._shutdown = True
            # Wake one worker; each exiting worker re-posts the sentinel for
            # the next one.
            self._work_queue.put(None)
        if wait:
            for t in self._threads:
                t.join()
    shutdown.__doc__ = _base.Executor.shutdown.__doc__