blob: c07ad40cbcd913c0c11fc9b197fc025639a9d3c6 [file] [log] [blame]
Benjamin Petersone711caf2008-06-11 16:44:04 +00001#
2# Module implementing queues
3#
4# multiprocessing/queues.py
5#
R. David Murray3fc969a2010-12-14 01:38:16 +00006# Copyright (c) 2006-2008, R Oudkerk
Richard Oudkerk3e268aa2012-04-30 12:13:55 +01007# Licensed to PSF under a Contributor Agreement.
Benjamin Petersone711caf2008-06-11 16:44:04 +00008#
9
Jesse Noller14f3ae22009-03-31 03:37:07 +000010__all__ = ['Queue', 'SimpleQueue', 'JoinableQueue']
Benjamin Petersone711caf2008-06-11 16:44:04 +000011
12import sys
13import os
14import threading
15import collections
16import time
Benjamin Petersone711caf2008-06-11 16:44:04 +000017import weakref
Antoine Pitroudc19c242011-07-16 01:51:58 +020018import errno
Benjamin Petersone711caf2008-06-11 16:44:04 +000019
20from queue import Empty, Full
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010021
Benjamin Petersone711caf2008-06-11 16:44:04 +000022import _multiprocessing
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010023
24from . import connection
Richard Oudkerkb1694cf2013-10-16 16:41:56 +010025from . import context
Richard Oudkerk84ed9a62013-08-14 15:35:41 +010026
27from .util import debug, info, Finalize, register_after_fork, is_exiting
28from .reduction import ForkingPickler
Benjamin Petersone711caf2008-06-11 16:44:04 +000029
30#
31# Queue type using a pipe, buffer and thread
32#
33
class Queue(object):
    """Process-shared FIFO queue built from a pipe, a buffer and a thread.

    put() appends the object to an in-process deque.  A lazily started
    "feeder" thread pickles buffered objects and writes them to the pipe.
    get() reads pickled bytes from the pipe and unpickles them.  A bounded
    semaphore counts free slots: put() acquires it and get() releases it.
    """

    def __init__(self, maxsize=0, *, ctx):
        """Create the pipe, locks and semaphore backing the queue.

        maxsize -- capacity; values <= 0 select SemLock.SEM_VALUE_MAX.
        ctx     -- object providing the Lock() and BoundedSemaphore()
                   factories used for the cross-process primitives.
        """
        if maxsize <= 0:
            maxsize = _multiprocessing.SemLock.SEM_VALUE_MAX
        self._maxsize = maxsize
        self._reader, self._writer = connection.Pipe(duplex=False)
        self._rlock = ctx.Lock()
        # Pid of the creating process; consulted by _start_thread().
        self._opid = os.getpid()
        if sys.platform == 'win32':
            # No write lock is used on win32.
            self._wlock = None
        else:
            self._wlock = ctx.Lock()
        self._sem = ctx.BoundedSemaphore(maxsize)
        # For use by concurrent.futures
        self._ignore_epipe = False

        self._after_fork()

        if sys.platform != 'win32':
            register_after_fork(self, Queue._after_fork)

    def __getstate__(self):
        """Return the picklable state (only allowed while spawning)."""
        context.assert_spawning(self)
        return (self._ignore_epipe, self._maxsize, self._reader, self._writer,
                self._rlock, self._wlock, self._sem, self._opid)

    def __setstate__(self, state):
        """Restore the shared state, then rebuild the per-process state."""
        (self._ignore_epipe, self._maxsize, self._reader, self._writer,
         self._rlock, self._wlock, self._sem, self._opid) = state
        self._after_fork()

    def _after_fork(self):
        """Reset the per-process state: empty buffer and no feeder thread."""
        debug('Queue._after_fork()')
        self._notempty = threading.Condition(threading.Lock())
        self._buffer = collections.deque()
        self._thread = None
        self._jointhread = None
        self._joincancelled = False
        self._closed = False
        self._close = None
        # Cache the bound connection methods used by get()/empty()/_feed().
        self._send_bytes = self._writer.send_bytes
        self._recv_bytes = self._reader.recv_bytes
        self._poll = self._reader.poll

    def put(self, obj, block=True, timeout=None):
        """Buffer obj for the feeder thread.

        Raises ValueError if the queue has been closed, and Full if no free
        slot could be acquired (subject to block/timeout).
        """
        # An explicit check is used instead of ``assert`` so that the guard
        # is still enforced when Python runs with -O.
        if self._closed:
            raise ValueError('Queue {0!r} is closed'.format(self))
        if not self._sem.acquire(block, timeout):
            raise Full

        with self._notempty:
            if self._thread is None:
                self._start_thread()
            self._buffer.append(obj)
            self._notempty.notify()

    def get(self, block=True, timeout=None):
        """Remove and return one object from the queue.

        Raises Empty when nothing could be read within the constraints given
        by block/timeout.
        """
        if block and timeout is None:
            with self._rlock:
                res = self._recv_bytes()
            self._sem.release()
        else:
            if block:
                # A monotonic clock keeps the deadline unaffected by
                # adjustments of the system (wall-clock) time.
                deadline = time.monotonic() + timeout
            if not self._rlock.acquire(block, timeout):
                raise Empty
            try:
                if block:
                    # Part of the budget may have been spent on the lock.
                    timeout = deadline - time.monotonic()
                    if timeout < 0 or not self._poll(timeout):
                        raise Empty
                elif not self._poll():
                    raise Empty
                res = self._recv_bytes()
                self._sem.release()
            finally:
                self._rlock.release()
        # unserialize the data after having released the lock
        return ForkingPickler.loads(res)

    def qsize(self):
        """Return the number of slots currently taken from the semaphore."""
        # Raises NotImplementedError on Mac OSX because of broken sem_getvalue()
        return self._maxsize - self._sem._semlock._get_value()

    def empty(self):
        """Return True if the reader end has no data ready to be read."""
        return not self._poll()

    def full(self):
        """Return True if the slot semaphore is at zero."""
        return self._sem._semlock._is_zero()

    def get_nowait(self):
        """Equivalent to get(False)."""
        return self.get(False)

    def put_nowait(self, obj):
        """Equivalent to put(obj, False)."""
        return self.put(obj, False)

    def close(self):
        """Mark the queue closed, close the reader and notify the feeder."""
        self._closed = True
        try:
            self._reader.close()
        finally:
            # Run the finalizer even if closing the reader failed, so the
            # feeder thread is always asked to quit.
            if self._close:
                self._close()

    def join_thread(self):
        """Run the feeder-thread join finalizer; close() must come first."""
        debug('Queue.join_thread()')
        assert self._closed, 'Queue {0!r} not closed'.format(self)
        if self._jointhread:
            self._jointhread()

    def cancel_join_thread(self):
        """Cancel the feeder-thread join finalizer, now and in future."""
        debug('Queue.cancel_join_thread()')
        self._joincancelled = True
        try:
            self._jointhread.cancel()
        except AttributeError:
            # No join finalizer has been registered (self._jointhread is None).
            pass

    def _start_thread(self):
        """Start the feeder thread and register its finalizers."""
        debug('Queue._start_thread()')

        # Start thread which transfers data from buffer to pipe
        self._buffer.clear()
        self._thread = threading.Thread(
            target=Queue._feed,
            args=(self._buffer, self._notempty, self._send_bytes,
                  self._wlock, self._writer.close, self._ignore_epipe),
            name='QueueFeederThread'
        )
        self._thread.daemon = True

        debug('doing self._thread.start()')
        self._thread.start()
        debug('... done self._thread.start()')

        # On process exit we will wait for data to be flushed to pipe.
        #
        # However, if this process created the queue then all
        # processes which use the queue will be descendants of this
        # process.  Therefore waiting for the queue to be flushed
        # is pointless once all the child processes have been joined.
        created_by_this_process = (self._opid == os.getpid())
        if not self._joincancelled and not created_by_this_process:
            self._jointhread = Finalize(
                self._thread, Queue._finalize_join,
                [weakref.ref(self._thread)],
                exitpriority=-5
            )

        # Send sentinel to the thread queue object when garbage collected
        self._close = Finalize(
            self, Queue._finalize_close,
            [self._buffer, self._notempty],
            exitpriority=10
        )

    @staticmethod
    def _finalize_join(twr):
        """Join the thread behind weak reference twr if it still exists."""
        debug('joining queue thread')
        thread = twr()
        if thread is not None:
            thread.join()
            debug('... queue thread joined')
        else:
            debug('... queue thread already dead')

    @staticmethod
    def _finalize_close(buffer, notempty):
        """Append the sentinel to buffer and wake the feeder thread."""
        debug('telling queue thread to quit')
        with notempty:
            buffer.append(_sentinel)
            notempty.notify()

    @staticmethod
    def _feed(buffer, notempty, send_bytes, writelock, close, ignore_epipe):
        """Feeder-thread main loop: move objects from buffer to the pipe.

        Waits on notempty until buffer has items, then pops, pickles and
        sends each one.  Popping the sentinel calls close() and returns.
        An error while handling one item is reported and the loop continues
        with the next item, so a single bad object does not stop the queue.
        """
        debug('starting thread to feed data to pipe')
        nacquire = notempty.acquire
        nrelease = notempty.release
        nwait = notempty.wait
        bpopleft = buffer.popleft
        sentinel = _sentinel
        if sys.platform != 'win32':
            wacquire = writelock.acquire
            wrelease = writelock.release
        else:
            wacquire = None

        while 1:
            try:
                nacquire()
                try:
                    if not buffer:
                        nwait()
                finally:
                    nrelease()
                try:
                    while 1:
                        obj = bpopleft()
                        if obj is sentinel:
                            debug('feeder thread got sentinel -- exiting')
                            close()
                            return

                        # serialize the data before acquiring the lock
                        obj = ForkingPickler.dumps(obj)
                        if wacquire is None:
                            send_bytes(obj)
                        else:
                            wacquire()
                            try:
                                send_bytes(obj)
                            finally:
                                wrelease()
                except IndexError:
                    # Buffer drained; go back to waiting on the condition.
                    pass
            except Exception as e:
                if ignore_epipe and getattr(e, 'errno', 0) == errno.EPIPE:
                    return
                # Since this runs in a daemon thread the resources it uses
                # may become unusable while the process is cleaning up.
                # We ignore errors which happen after the process has
                # started to cleanup.
                # NOTE: the item that failed is dropped; the slot that put()
                # acquired for it is not released here.
                try:
                    exiting = is_exiting()
                    if exiting:
                        info('error in queue thread: %s', e)
                    else:
                        import traceback
                        traceback.print_exc()
                except Exception:
                    # Reporting is best effort; if even that fails, stop.
                    return
                if exiting:
                    return
262
# Unique marker appended to a Queue's buffer by Queue._finalize_close().
# When the feeder thread (Queue._feed) pops this object it closes the pipe
# writer and exits.
_sentinel = object()
264
#
# A queue type which also supports join() and task_done() methods
#
# Note that if you do not call task_done() for each finished task then
# the semaphore counting unfinished tasks keeps growing and may
# eventually overflow.
#
272
class JoinableQueue(Queue):
    """Queue that also counts unfinished tasks for task_done() and join().

    Every put() releases the _unfinished_tasks semaphore once and every
    task_done() acquires it once; join() waits on _cond while the
    semaphore is non-zero.
    """

    def __init__(self, maxsize=0, *, ctx):
        """Create the queue plus the task counter and its condition."""
        Queue.__init__(self, maxsize, ctx=ctx)
        self._unfinished_tasks = ctx.Semaphore(0)
        self._cond = ctx.Condition()

    def __getstate__(self):
        """Return Queue's state extended with the condition and counter."""
        return Queue.__getstate__(self) + (self._cond, self._unfinished_tasks)

    def __setstate__(self, state):
        """Restore Queue's state, then the trailing condition and counter."""
        Queue.__setstate__(self, state[:-2])
        self._cond, self._unfinished_tasks = state[-2:]

    def put(self, obj, block=True, timeout=None):
        """Buffer obj for the feeder thread and count it as unfinished.

        Raises ValueError if the queue has been closed, and Full if no free
        slot could be acquired (subject to block/timeout).
        """
        # An explicit check is used instead of ``assert`` so that the guard
        # is still enforced when Python runs with -O.
        if self._closed:
            raise ValueError('Queue {0!r} is closed'.format(self))
        if not self._sem.acquire(block, timeout):
            raise Full

        # Hold both locks so buffering the item and bumping the task
        # counter happen together.
        with self._notempty, self._cond:
            if self._thread is None:
                self._start_thread()
            self._buffer.append(obj)
            self._unfinished_tasks.release()
            self._notempty.notify()

    def task_done(self):
        """Mark one task as finished.

        Raises ValueError when called more often than put().  Wakes all
        join() waiters once the counter reaches zero.
        """
        with self._cond:
            if not self._unfinished_tasks.acquire(False):
                raise ValueError('task_done() called too many times')
            if self._unfinished_tasks._semlock._is_zero():
                self._cond.notify_all()

    def join(self):
        """Wait on the condition if any task is still unfinished."""
        with self._cond:
            if not self._unfinished_tasks._semlock._is_zero():
                self._cond.wait()
Benjamin Petersone711caf2008-06-11 16:44:04 +0000310
311#
312# Simplified Queue type -- really just a locked pipe
313#
314
class SimpleQueue(object):
    """Minimal queue: a one-way pipe guarded by a read and a write lock."""

    def __init__(self, *, ctx):
        """Create the pipe and the locks; ctx provides the Lock() factory."""
        self._reader, self._writer = connection.Pipe(duplex=False)
        self._rlock = ctx.Lock()
        self._poll = self._reader.poll
        if sys.platform == 'win32':
            self._wlock = None
        else:
            self._wlock = ctx.Lock()

    def empty(self):
        """Return True if the reader end has no data ready to be read."""
        return not self._poll()

    def __getstate__(self):
        """Return the picklable state (only allowed while spawning)."""
        context.assert_spawning(self)
        return (self._reader, self._writer, self._rlock, self._wlock)

    def __setstate__(self, state):
        """Restore the pipe ends and locks from state."""
        (self._reader, self._writer, self._rlock, self._wlock) = state
        # _poll is not part of the pickled state, so rebind it here;
        # otherwise empty() fails on an unpickled instance.
        self._poll = self._reader.poll

    def get(self):
        """Read one pickled object from the pipe and return it unpickled."""
        with self._rlock:
            res = self._reader.recv_bytes()
        # unserialize the data after having released the lock
        return ForkingPickler.loads(res)

    def put(self, obj):
        """Pickle obj and write it to the pipe."""
        # serialize the data before acquiring the lock
        obj = ForkingPickler.dumps(obj)
        if self._wlock is None:
            # writes to a message oriented win32 pipe are atomic
            self._writer.send_bytes(obj)
        else:
            with self._wlock:
                self._writer.send_bytes(obj)