blob: b004a6acfaeaf6208b24e29a5e8462374af7017a [file] [log] [blame]
Benjamin Petersone711caf2008-06-11 16:44:04 +00001#
2# Module implementing queues
3#
4# multiprocessing/queues.py
5#
R. David Murray3fc969a2010-12-14 01:38:16 +00006# Copyright (c) 2006-2008, R Oudkerk
Richard Oudkerk3e268aa2012-04-30 12:13:55 +01007# Licensed to PSF under a Contributor Agreement.
Benjamin Petersone711caf2008-06-11 16:44:04 +00008#
9
Jesse Noller14f3ae22009-03-31 03:37:07 +000010__all__ = ['Queue', 'SimpleQueue', 'JoinableQueue']
Benjamin Petersone711caf2008-06-11 16:44:04 +000011
12import sys
13import os
14import threading
15import collections
16import time
Benjamin Petersone711caf2008-06-11 16:44:04 +000017import weakref
Antoine Pitroudc19c242011-07-16 01:51:58 +020018import errno
Benjamin Petersone711caf2008-06-11 16:44:04 +000019
20from queue import Empty, Full
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010021
Benjamin Petersone711caf2008-06-11 16:44:04 +000022import _multiprocessing
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010023
24from . import connection
Richard Oudkerkb1694cf2013-10-16 16:41:56 +010025from . import context
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010026
27from .util import debug, info, Finalize, register_after_fork, is_exiting
28from .reduction import ForkingPickler
Benjamin Petersone711caf2008-06-11 16:44:04 +000029
30#
31# Queue type using a pipe, buffer and thread
32#
33
class Queue(object):
    """Queue built from a pipe, an in-process buffer and a feeder thread.

    put() appends the object to a local deque and returns; a daemon
    thread (started lazily on the first put()) pickles buffered objects
    and writes them to the pipe.  get() reads one pickled message from
    the pipe and unpickles it.  A bounded semaphore tracks free slots:
    put() acquires it and get() releases it.
    """

    def __init__(self, maxsize=0, *, ctx):
        """Create the pipe and the locks/semaphore guarding it.

        maxsize -- capacity of the queue; any value <= 0 is replaced by
                   SEM_VALUE_MAX.
        ctx     -- keyword-only object supplying the Lock() and
                   BoundedSemaphore() factories.
        """
        if maxsize <= 0:
            # Can raise ImportError (see issues #3770 and #23400)
            from .synchronize import SEM_VALUE_MAX as maxsize
        self._maxsize = maxsize
        self._reader, self._writer = connection.Pipe(duplex=False)
        self._rlock = ctx.Lock()
        self._opid = os.getpid()
        if sys.platform == 'win32':
            self._wlock = None
        else:
            self._wlock = ctx.Lock()
        self._sem = ctx.BoundedSemaphore(maxsize)
        # For use by concurrent.futures
        self._ignore_epipe = False

        self._after_fork()

        if sys.platform != 'win32':
            register_after_fork(self, Queue._after_fork)

    def __getstate__(self):
        """Return the picklable state; only allowed while spawning."""
        context.assert_spawning(self)
        return (self._ignore_epipe, self._maxsize, self._reader, self._writer,
                self._rlock, self._wlock, self._sem, self._opid)

    def __setstate__(self, state):
        """Restore the shared state, then rebuild the per-process state."""
        (self._ignore_epipe, self._maxsize, self._reader, self._writer,
         self._rlock, self._wlock, self._sem, self._opid) = state
        self._after_fork()

    def _after_fork(self):
        """(Re)initialise everything that is local to the current process.

        The buffer, its condition variable, the feeder thread and the
        finalizers are reset; the bound pipe methods are cached.
        """
        debug('Queue._after_fork()')
        self._notempty = threading.Condition(threading.Lock())
        self._buffer = collections.deque()
        self._thread = None
        self._jointhread = None
        self._joincancelled = False
        self._closed = False
        self._close = None
        self._send_bytes = self._writer.send_bytes
        self._recv_bytes = self._reader.recv_bytes
        self._poll = self._reader.poll

    def put(self, obj, block=True, timeout=None):
        """Buffer *obj* for the feeder thread.

        Raises ValueError if the queue has been closed, and Full if a
        slot could not be acquired (subject to *block* / *timeout*).
        """
        # An explicit check rather than ``assert`` so that the guard is
        # still enforced when Python runs with -O.
        if self._closed:
            raise ValueError("Queue %r is closed" % (self,))
        if not self._sem.acquire(block, timeout):
            raise Full

        with self._notempty:
            if self._thread is None:
                self._start_thread()
            self._buffer.append(obj)
            self._notempty.notify()

    def get(self, block=True, timeout=None):
        """Read one object from the pipe and return it unpickled.

        With block=True and timeout=None this waits indefinitely.
        Otherwise Empty is raised if the read lock cannot be acquired or
        no data is available (immediately when block is false, or once
        *timeout* seconds have elapsed).
        """
        if block and timeout is None:
            with self._rlock:
                res = self._recv_bytes()
            self._sem.release()
        else:
            if block:
                # Monotonic clock: the deadline must not move when the
                # wall clock is adjusted.
                deadline = time.monotonic() + timeout
            if not self._rlock.acquire(block, timeout):
                raise Empty
            try:
                if block:
                    # Only the time left after waiting for the lock may
                    # be spent polling the pipe.
                    timeout = deadline - time.monotonic()
                    if timeout < 0 or not self._poll(timeout):
                        raise Empty
                elif not self._poll():
                    raise Empty
                res = self._recv_bytes()
                self._sem.release()
            finally:
                self._rlock.release()
        # unserialize the data after having released the lock
        return ForkingPickler.loads(res)

    def qsize(self):
        """Return the number of slots currently taken."""
        # Raises NotImplementedError on Mac OSX because of broken sem_getvalue()
        return self._maxsize - self._sem._semlock._get_value()

    def empty(self):
        """Return True if nothing is currently readable from the pipe."""
        return not self._poll()

    def full(self):
        """Return True if the slot semaphore is exhausted."""
        return self._sem._semlock._is_zero()

    def get_nowait(self):
        """Equivalent to get(False)."""
        return self.get(False)

    def put_nowait(self, obj):
        """Equivalent to put(obj, False)."""
        return self.put(obj, False)

    def close(self):
        """Mark the queue closed, close the reader, stop the feeder thread."""
        self._closed = True
        try:
            self._reader.close()
        finally:
            # Run the feeder finalizer even if closing the reader failed;
            # otherwise the feeder thread would never receive its sentinel.
            finalizer = self._close
            if finalizer:
                self._close = None
                finalizer()

    def join_thread(self):
        """Wait for the feeder thread, if a join finalizer was registered.

        May only be called after close().
        """
        debug('Queue.join_thread()')
        assert self._closed
        if self._jointhread:
            self._jointhread()

    def cancel_join_thread(self):
        """Prevent the feeder thread from being joined at process exit."""
        debug('Queue.cancel_join_thread()')
        self._joincancelled = True
        # _jointhread stays None until a join finalizer has been registered.
        if self._jointhread is not None:
            self._jointhread.cancel()

    def _start_thread(self):
        """Start the feeder thread and register its finalizers."""
        debug('Queue._start_thread()')

        # Start thread which transfers data from buffer to pipe
        self._buffer.clear()
        self._thread = threading.Thread(
            target=Queue._feed,
            args=(self._buffer, self._notempty, self._send_bytes,
                  self._wlock, self._writer.close, self._ignore_epipe),
            name='QueueFeederThread'
        )
        self._thread.daemon = True

        debug('doing self._thread.start()')
        self._thread.start()
        debug('... done self._thread.start()')

        # On process exit we will wait for data to be flushed to pipe.
        #
        # However, if this process created the queue then all
        # processes which use the queue will be descendants of this
        # process.  Therefore waiting for the queue to be flushed
        # is pointless once all the child processes have been joined.
        created_by_this_process = (self._opid == os.getpid())
        if not self._joincancelled and not created_by_this_process:
            self._jointhread = Finalize(
                self._thread, Queue._finalize_join,
                [weakref.ref(self._thread)],
                exitpriority=-5
            )

        # Send sentinel to the thread queue object when garbage collected
        self._close = Finalize(
            self, Queue._finalize_close,
            [self._buffer, self._notempty],
            exitpriority=10
        )

    @staticmethod
    def _finalize_join(twr):
        """Join the thread behind the weak reference *twr*, if still alive."""
        debug('joining queue thread')
        thread = twr()
        if thread is not None:
            thread.join()
            debug('... queue thread joined')
        else:
            debug('... queue thread already dead')

    @staticmethod
    def _finalize_close(buffer, notempty):
        """Append the sentinel to *buffer* and wake the feeder thread."""
        debug('telling queue thread to quit')
        with notempty:
            buffer.append(_sentinel)
            notempty.notify()

    @staticmethod
    def _feed(buffer, notempty, send_bytes, writelock, close, ignore_epipe):
        """Feeder thread body: move objects from *buffer* to the pipe.

        buffer       -- deque filled by put()
        notempty     -- condition notified whenever *buffer* gains an item
        send_bytes   -- callable writing one pickled message to the pipe
        writelock    -- lock serialising writers (not used on win32)
        close        -- callable invoked once the sentinel is received
        ignore_epipe -- if true, exit silently when a send fails with EPIPE

        An error while pickling or sending one object is reported and the
        loop carries on with the next object, so a single bad item does
        not silently disable the queue for every later put().
        """
        debug('starting thread to feed data to pipe')
        bpopleft = buffer.popleft
        sentinel = _sentinel
        dumps = ForkingPickler.dumps
        # The write lock is only taken on non-win32 platforms.
        use_writelock = sys.platform != 'win32'

        while True:
            try:
                with notempty:
                    if not buffer:
                        notempty.wait()
                try:
                    while True:
                        obj = bpopleft()
                        if obj is sentinel:
                            debug('feeder thread got sentinel -- exiting')
                            close()
                            return

                        # serialize the data before acquiring the lock
                        data = dumps(obj)
                        if use_writelock:
                            with writelock:
                                send_bytes(data)
                        else:
                            send_bytes(data)
                except IndexError:
                    # Buffer drained; go back to waiting on the condition.
                    pass
            except Exception as e:
                if ignore_epipe and getattr(e, 'errno', 0) == errno.EPIPE:
                    return
                # Since this runs in a daemon thread the resources it uses
                # may become unusable while the process is cleaning up.
                # We ignore errors which happen after the process has
                # started to cleanup.
                try:
                    if is_exiting():
                        info('error in queue thread: %s', e)
                        return
                    import traceback
                    traceback.print_exc()
                except Exception:
                    # Even reporting failed, so the process is most likely
                    # being torn down: stop feeding.
                    return


# Unique marker appended to the buffer to tell the feeder thread to exit.
_sentinel = object()
265
266#
267# A queue type which also supports join() and task_done() methods
268#
269# Note that if you do not call task_done() for each finished task then
270# eventually the counter's semaphore may overflow causing Bad Things
271# to happen.
272#
273
class JoinableQueue(Queue):
    """Queue variant that counts unfinished tasks.

    Every put() increments a semaphore-based counter and every
    task_done() decrements it; join() waits on a condition that
    task_done() notifies once the counter reaches zero.
    """

    def __init__(self, maxsize=0, *, ctx):
        """Set up the base queue plus the task counter and its condition.

        *ctx* must additionally supply Semaphore() and Condition().
        """
        Queue.__init__(self, maxsize, ctx=ctx)
        self._unfinished_tasks = ctx.Semaphore(0)
        self._cond = ctx.Condition()

    def __getstate__(self):
        """Return the base queue state extended with the two extra fields."""
        return Queue.__getstate__(self) + (self._cond, self._unfinished_tasks)

    def __setstate__(self, state):
        """Restore the base queue state, then the two trailing fields."""
        Queue.__setstate__(self, state[:-2])
        self._cond, self._unfinished_tasks = state[-2:]

    def put(self, obj, block=True, timeout=None):
        """Buffer *obj* and count it as an unfinished task.

        Raises ValueError if the queue has been closed, and Full if a
        slot could not be acquired (subject to *block* / *timeout*).
        """
        # An explicit check rather than ``assert`` so that the guard is
        # still enforced when Python runs with -O.
        if self._closed:
            raise ValueError("Queue %r is closed" % (self,))
        if not self._sem.acquire(block, timeout):
            raise Full

        # Both locks are held so that buffering the object and bumping
        # the task counter happen together.
        with self._notempty, self._cond:
            if self._thread is None:
                self._start_thread()
            self._buffer.append(obj)
            self._unfinished_tasks.release()
            self._notempty.notify()

    def task_done(self):
        """Record that one previously queued task is complete.

        Raises ValueError if called more times than put().
        """
        with self._cond:
            if not self._unfinished_tasks.acquire(False):
                raise ValueError('task_done() called too many times')
            if self._unfinished_tasks._semlock._is_zero():
                self._cond.notify_all()

    def join(self):
        """If tasks are still unfinished, wait until task_done() notifies."""
        with self._cond:
            if not self._unfinished_tasks._semlock._is_zero():
                self._cond.wait()
312#
313# Simplified Queue type -- really just a locked pipe
314#
315
class SimpleQueue(object):
    """Minimal queue: a one-way pipe guarded by a read lock and a write lock.

    There is no buffer and no feeder thread; put() writes to the pipe
    directly and get() reads from it directly.
    """

    def __init__(self, *, ctx):
        """Create the pipe and its locks using the factories on *ctx*."""
        self._reader, self._writer = connection.Pipe(duplex=False)
        self._rlock = ctx.Lock()
        self._poll = self._reader.poll
        if sys.platform == 'win32':
            self._wlock = None
        else:
            self._wlock = ctx.Lock()

    def empty(self):
        """Return True if nothing is currently readable from the pipe."""
        return not self._poll()

    def __getstate__(self):
        """Return the picklable state; only allowed while spawning."""
        context.assert_spawning(self)
        return (self._reader, self._writer, self._rlock, self._wlock)

    def __setstate__(self, state):
        """Restore the pipe ends and locks from *state*."""
        (self._reader, self._writer, self._rlock, self._wlock) = state
        # _poll is not part of the pickled state, so it has to be rebound
        # here; without it empty() fails with AttributeError on every
        # unpickled instance.
        self._poll = self._reader.poll

    def get(self):
        """Read one message from the pipe and return it unpickled."""
        with self._rlock:
            res = self._reader.recv_bytes()
        # unserialize the data after having released the lock
        return ForkingPickler.loads(res)

    def put(self, obj):
        """Pickle *obj* and write it to the pipe."""
        # serialize the data before acquiring the lock
        obj = ForkingPickler.dumps(obj)
        if self._wlock is None:
            # writes to a message oriented win32 pipe are atomic
            self._writer.send_bytes(obj)
        else:
            with self._wlock:
                self._writer.send_bytes(obj)