blob: 293ad7673c603c4191d47123403344369415d2e0 [file] [log] [blame]
Benjamin Petersone711caf2008-06-11 16:44:04 +00001#
2# Module implementing queues
3#
4# multiprocessing/queues.py
5#
R. David Murray3fc969a2010-12-14 01:38:16 +00006# Copyright (c) 2006-2008, R Oudkerk
Richard Oudkerk3e268aa2012-04-30 12:13:55 +01007# Licensed to PSF under a Contributor Agreement.
Benjamin Petersone711caf2008-06-11 16:44:04 +00008#
9
Jesse Noller14f3ae22009-03-31 03:37:07 +000010__all__ = ['Queue', 'SimpleQueue', 'JoinableQueue']
Benjamin Petersone711caf2008-06-11 16:44:04 +000011
12import sys
13import os
14import threading
15import collections
16import time
Benjamin Petersone711caf2008-06-11 16:44:04 +000017import weakref
Antoine Pitroudc19c242011-07-16 01:51:58 +020018import errno
Benjamin Petersone711caf2008-06-11 16:44:04 +000019
20from queue import Empty, Full
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010021
Benjamin Petersone711caf2008-06-11 16:44:04 +000022import _multiprocessing
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010023
24from . import connection
Richard Oudkerkb1694cf2013-10-16 16:41:56 +010025from . import context
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010026
27from .util import debug, info, Finalize, register_after_fork, is_exiting
28from .reduction import ForkingPickler
Benjamin Petersone711caf2008-06-11 16:44:04 +000029
30#
31# Queue type using a pipe, buffer and thread
32#
33
class Queue(object):
    """Queue type using a pipe, a buffer and a feeder thread.

    put() appends objects to an in-process deque.  A daemon thread, started
    lazily on the first put(), pickles buffered objects and writes them to
    the write end of a one-way pipe.  get() reads the pickled bytes from the
    read end and unpickles them.  A bounded semaphore created from *maxsize*
    is acquired by put() and released by get().
    """

    def __init__(self, maxsize=0, *, ctx):
        """Create the pipe, locks and semaphore using the context *ctx*.

        A *maxsize* of zero or less is replaced by SEM_VALUE_MAX.
        """
        if maxsize <= 0:
            # Can raise ImportError (see issues #3770 and #23400)
            from .synchronize import SEM_VALUE_MAX as maxsize
        self._maxsize = maxsize
        self._reader, self._writer = connection.Pipe(duplex=False)
        self._rlock = ctx.Lock()
        # pid of the creating process; consulted in _start_thread()
        self._opid = os.getpid()
        if sys.platform == 'win32':
            self._wlock = None
        else:
            self._wlock = ctx.Lock()
        self._sem = ctx.BoundedSemaphore(maxsize)
        # For use by concurrent.futures
        self._ignore_epipe = False

        self._after_fork()

        if sys.platform != 'win32':
            register_after_fork(self, Queue._after_fork)

    def __getstate__(self):
        """Return the picklable state; only permitted while spawning."""
        context.assert_spawning(self)
        return (self._ignore_epipe, self._maxsize, self._reader, self._writer,
                self._rlock, self._wlock, self._sem, self._opid)

    def __setstate__(self, state):
        """Restore the shared state and rebuild the per-process state."""
        (self._ignore_epipe, self._maxsize, self._reader, self._writer,
         self._rlock, self._wlock, self._sem, self._opid) = state
        self._after_fork()

    def _after_fork(self):
        """(Re)initialise the state that is local to the current process."""
        debug('Queue._after_fork()')
        self._notempty = threading.Condition(threading.Lock())
        self._buffer = collections.deque()
        self._thread = None
        self._jointhread = None
        self._joincancelled = False
        self._closed = False
        self._close = None
        self._send_bytes = self._writer.send_bytes
        self._recv_bytes = self._reader.recv_bytes
        self._poll = self._reader.poll

    def put(self, obj, block=True, timeout=None):
        """Append *obj* to the buffer, starting the feeder thread if needed.

        Raises Full when the semaphore cannot be acquired with the given
        *block* / *timeout* arguments.
        """
        assert not self._closed
        if not self._sem.acquire(block, timeout):
            raise Full

        with self._notempty:
            if self._thread is None:
                self._start_thread()
            self._buffer.append(obj)
            self._notempty.notify()

    def get(self, block=True, timeout=None):
        """Read one pickled object from the pipe and return it unpickled.

        With *block* true and *timeout* None, wait until data arrives.
        Otherwise raise Empty when the reader lock or the data does not
        become available in time (immediately when *block* is false).
        """
        if block and timeout is None:
            with self._rlock:
                res = self._recv_bytes()
            self._sem.release()
        else:
            if block:
                # A monotonic clock keeps the deadline immune to
                # adjustments of the system (wall-clock) time.
                deadline = time.monotonic() + timeout
            if not self._rlock.acquire(block, timeout):
                raise Empty
            try:
                if block:
                    # Only the time left after acquiring the lock may be
                    # spent polling.
                    timeout = deadline - time.monotonic()
                    if timeout < 0 or not self._poll(timeout):
                        raise Empty
                elif not self._poll():
                    raise Empty
                res = self._recv_bytes()
                self._sem.release()
            finally:
                self._rlock.release()
        # unserialize the data after having released the lock
        return ForkingPickler.loads(res)

    def qsize(self):
        """Return maxsize minus the current value of the semaphore."""
        # Raises NotImplementedError on Mac OSX because of broken sem_getvalue()
        return self._maxsize - self._sem._semlock._get_value()

    def empty(self):
        """Return True when polling the read end finds no data."""
        return not self._poll()

    def full(self):
        """Return True when the semaphore's value is zero."""
        return self._sem._semlock._is_zero()

    def get_nowait(self):
        """Equivalent to get(False)."""
        return self.get(False)

    def put_nowait(self, obj):
        """Equivalent to put(obj, False)."""
        return self.put(obj, False)

    def close(self):
        """Mark the queue closed, close the read end and run the close hook."""
        self._closed = True
        try:
            self._reader.close()
        finally:
            # Run the finalizer at most once, even if closing the reader
            # raised.
            close = self._close
            if close:
                self._close = None
                close()

    def join_thread(self):
        """Run the join finalizer, if one was registered; requires close()."""
        debug('Queue.join_thread()')
        assert self._closed
        if self._jointhread:
            self._jointhread()

    def cancel_join_thread(self):
        """Cancel the join finalizer and prevent one from being registered."""
        debug('Queue.cancel_join_thread()')
        self._joincancelled = True
        try:
            self._jointhread.cancel()
        except AttributeError:
            # No finalizer has been registered (self._jointhread is None).
            pass

    def _start_thread(self):
        """Start the daemon feeder thread and register its finalizers."""
        debug('Queue._start_thread()')

        # Start thread which transfers data from buffer to pipe
        self._buffer.clear()
        self._thread = threading.Thread(
            target=Queue._feed,
            args=(self._buffer, self._notempty, self._send_bytes,
                  self._wlock, self._writer.close, self._ignore_epipe),
            name='QueueFeederThread'
        )
        self._thread.daemon = True

        debug('doing self._thread.start()')
        self._thread.start()
        debug('... done self._thread.start()')

        # On process exit we will wait for data to be flushed to pipe.
        #
        # However, if this process created the queue then all
        # processes which use the queue will be descendants of this
        # process.  Therefore waiting for the queue to be flushed
        # is pointless once all the child processes have been joined.
        created_by_this_process = (self._opid == os.getpid())
        if not self._joincancelled and not created_by_this_process:
            self._jointhread = Finalize(
                self._thread, Queue._finalize_join,
                [weakref.ref(self._thread)],
                exitpriority=-5
            )

        # Send sentinel to the thread queue object when garbage collected
        self._close = Finalize(
            self, Queue._finalize_close,
            [self._buffer, self._notempty],
            exitpriority=10
        )

    @staticmethod
    def _finalize_join(twr):
        """Join the thread referenced by the weak reference *twr*, if alive."""
        debug('joining queue thread')
        thread = twr()
        if thread is not None:
            thread.join()
            debug('... queue thread joined')
        else:
            debug('... queue thread already dead')

    @staticmethod
    def _finalize_close(buffer, notempty):
        """Append the sentinel to *buffer* and wake the feeder thread."""
        debug('telling queue thread to quit')
        with notempty:
            buffer.append(_sentinel)
            notempty.notify()

    @staticmethod
    def _feed(buffer, notempty, send_bytes, writelock, close, ignore_epipe):
        """Feeder thread body: move objects from *buffer* to the pipe.

        Waits on *notempty* while *buffer* is empty, then pickles and sends
        each buffered object with *send_bytes* (under *writelock* except on
        win32).  On popping the sentinel it calls *close* and returns.

        A failure while handling one object is reported and the loop keeps
        running, so that one bad item does not stop delivery of all later
        items.  The thread stops on EPIPE when *ignore_epipe* is true, when
        the process is exiting, or when reporting the error fails.
        """
        debug('starting thread to feed data to pipe')
        nacquire = notempty.acquire
        nrelease = notempty.release
        nwait = notempty.wait
        bpopleft = buffer.popleft
        sentinel = _sentinel
        if sys.platform != 'win32':
            wacquire = writelock.acquire
            wrelease = writelock.release
        else:
            wacquire = None

        while 1:
            try:
                nacquire()
                try:
                    if not buffer:
                        nwait()
                finally:
                    nrelease()
                try:
                    while 1:
                        obj = bpopleft()
                        if obj is sentinel:
                            debug('feeder thread got sentinel -- exiting')
                            close()
                            return

                        # serialize the data before acquiring the lock
                        obj = ForkingPickler.dumps(obj)
                        if wacquire is None:
                            send_bytes(obj)
                        else:
                            wacquire()
                            try:
                                send_bytes(obj)
                            finally:
                                wrelease()
                except IndexError:
                    # Buffer drained; go back to waiting on notempty.
                    pass
            except Exception as e:
                if ignore_epipe and getattr(e, 'errno', 0) == errno.EPIPE:
                    return
                # Since this runs in a daemon thread the resources it uses
                # may become unusable while the process is cleaning up.
                # We ignore errors which happen after the process has
                # started to cleanup.
                try:
                    if is_exiting():
                        info('error in queue thread: %s', e)
                        return
                    import traceback
                    traceback.print_exc()
                except Exception:
                    # Even reporting failed; stop instead of risking a
                    # tight loop of repeated failures.
                    return
273
# Unique marker object: Queue._finalize_close() appends it to the buffer and
# the feeder thread (Queue._feed) exits when it pops it (identity comparison).
_sentinel = object()
275
276#
277# A queue type which also supports join() and task_done() methods
278#
279# Note that if you do not call task_done() for each finished task then
280# eventually the counter's semaphore may overflow causing Bad Things
281# to happen.
282#
283
class JoinableQueue(Queue):
    """Queue subclass that additionally supports task_done() and join().

    A semaphore counts the items that have been put but not yet reported
    finished through task_done(); join() waits on a condition that is
    notified when that count reaches zero.
    """

    def __init__(self, maxsize=0, *, ctx):
        """Initialise the base queue plus the task counter and condition."""
        Queue.__init__(self, maxsize, ctx=ctx)
        self._unfinished_tasks = ctx.Semaphore(0)
        self._cond = ctx.Condition()

    def __getstate__(self):
        """Return the base queue state extended with the join machinery."""
        return Queue.__getstate__(self) + (self._cond, self._unfinished_tasks)

    def __setstate__(self, state):
        """Restore the base queue state, then the two trailing items."""
        Queue.__setstate__(self, state[:-2])
        self._cond, self._unfinished_tasks = state[-2:]

    def put(self, obj, block=True, timeout=None):
        """Buffer *obj* and count it as an unfinished task.

        Raises Full when the semaphore cannot be acquired with the given
        *block* / *timeout* arguments.
        """
        assert not self._closed
        if not self._sem.acquire(block, timeout):
            raise Full

        # Acquire both locks through one `with` statement so that
        # _notempty is released again even if acquiring _cond is
        # interrupted; the locks are released in reverse order.
        with self._notempty, self._cond:
            if self._thread is None:
                self._start_thread()
            self._buffer.append(obj)
            self._unfinished_tasks.release()
            self._notempty.notify()

    def task_done(self):
        """Record one finished task; wake join() callers at zero.

        Raises ValueError when there is no unfinished task left to mark.
        """
        with self._cond:
            if not self._unfinished_tasks.acquire(False):
                raise ValueError('task_done() called too many times')
            if self._unfinished_tasks._semlock._is_zero():
                self._cond.notify_all()

    def join(self):
        """Wait on the condition unless the unfinished-task count is zero."""
        with self._cond:
            if not self._unfinished_tasks._semlock._is_zero():
                self._cond.wait()
332
333#
334# Simplified Queue type -- really just a locked pipe
335#
336
class SimpleQueue(object):
    """Simplified queue type -- really just a locked pipe.

    Objects are pickled and written straight to a one-way pipe by put()
    and read back and unpickled by get(); there is no buffer or thread.
    """

    def __init__(self, *, ctx):
        """Create the pipe and its locks using the context *ctx*."""
        self._reader, self._writer = connection.Pipe(duplex=False)
        self._rlock = ctx.Lock()
        self._poll = self._reader.poll
        if sys.platform == 'win32':
            self._wlock = None
        else:
            self._wlock = ctx.Lock()

    def empty(self):
        """Return True when polling the read end finds no data."""
        return not self._poll()

    def __getstate__(self):
        """Return the picklable state; only permitted while spawning."""
        context.assert_spawning(self)
        return (self._reader, self._writer, self._rlock, self._wlock)

    def __setstate__(self, state):
        """Restore the pipe ends and locks and rebind the poll shortcut."""
        (self._reader, self._writer, self._rlock, self._wlock) = state
        # _poll is not part of the pickled state; without rebinding it,
        # empty() would raise AttributeError on an unpickled instance.
        self._poll = self._reader.poll

    def get(self):
        """Read one pickled object from the pipe and return it unpickled."""
        with self._rlock:
            res = self._reader.recv_bytes()
        # unserialize the data after having released the lock
        return ForkingPickler.loads(res)

    def put(self, obj):
        """Pickle *obj* and write it to the pipe."""
        # serialize the data before acquiring the lock
        obj = ForkingPickler.dumps(obj)
        if self._wlock is None:
            # writes to a message oriented win32 pipe are atomic
            self._writer.send_bytes(obj)
        else:
            with self._wlock:
                self._writer.send_bytes(obj)