| # |
| # Module which supports allocation of memory from an mmap |
| # |
| # multiprocessing/heap.py |
| # |
| # Copyright (c) 2006-2008, R Oudkerk |
| # Licensed to PSF under a Contributor Agreement. |
| # |
| |
| import bisect |
| from collections import defaultdict |
| import mmap |
| import os |
| import sys |
| import tempfile |
| import threading |
| |
| from .context import reduction, assert_spawning |
| from . import util |
| |
| __all__ = ['BufferWrapper'] |
| |
| # |
| # Inheritable class which wraps an mmap, and from which blocks can be allocated |
| # |
| |
| if sys.platform == 'win32': |
| |
| import _winapi |
| |
class Arena(object):
    """
    A shared memory area backed by anonymous memory (Windows).

    The mapping is created under a tag name of the form
    ``pym-<pid>-<random>``; the pickled state is the ``(size, name)`` pair,
    which is used to reopen the mapping by name on unpickling.
    """

    _rand = tempfile._RandomNameSequence()

    def __init__(self, size):
        """Create a new tagged anonymous mmap of *size* bytes.

        Up to 100 random names are tried.  Raises FileExistsError when
        every attempt reopened a mapping that already existed.
        """
        self.size = size
        fresh = None
        for _attempt in range(100):
            name = 'pym-%d-%s' % (os.getpid(), next(self._rand))
            candidate = mmap.mmap(-1, size, tagname=name)
            if _winapi.GetLastError() != 0:
                # We have reopened a preexisting mmap: drop it and retry
                # with another name.
                candidate.close()
                continue
            fresh = candidate
            break
        if fresh is None:
            raise FileExistsError('Cannot find name for new mmap')
        self.name = name
        self.buffer = fresh
        self._state = (self.size, self.name)

    def __getstate__(self):
        """Return the ``(size, name)`` state after assert_spawning(self)."""
        assert_spawning(self)
        return self._state

    def __setstate__(self, state):
        """Restore from ``(size, name)`` and reopen the existing mmap."""
        size, name = state
        self.size = size
        self.name = name
        self._state = state
        # Reopen existing mmap
        self.buffer = mmap.mmap(-1, size, tagname=name)
        # XXX The check that GetLastError() reports ERROR_ALREADY_EXISTS
        # XXX here is disabled to prevent buildbot failures while the
        # XXX correct long-term fix is determined.  See issue 23060.
| |
| else: |
| |
class Arena(object):
    """
    A shared memory area backed by a temporary file (POSIX).

    Attributes set by the constructor:
      size   -- length in bytes of the mapping
      fd     -- file descriptor backing the mapping
      buffer -- the mmap object covering the whole file
    """

    if sys.platform == 'linux':
        _dir_candidates = ['/dev/shm']
    else:
        _dir_candidates = []

    def __init__(self, size, fd=-1):
        """Map *size* bytes, creating the backing file unless *fd* is given.

        With the default ``fd == -1`` a temporary file is created in the
        directory picked by _choose_dir(), unlinked immediately, sized with
        ftruncate() and scheduled for closing through util.Finalize.  When
        *fd* is supplied (see rebuild_arena()) the descriptor is mapped
        as-is and no close finalizer is registered here.
        """
        self.size = size
        self.fd = fd
        if fd == -1:
            # Arena is created anew (if fd != -1, it means we're coming
            # from rebuild_arena() below)
            self.fd, name = tempfile.mkstemp(
                prefix='pym-%d-' % os.getpid(),
                dir=self._choose_dir(size))
            # The file only needs to live as long as the descriptor does.
            os.unlink(name)
            util.Finalize(self, os.close, (self.fd,))
            os.ftruncate(self.fd, size)
        self.buffer = mmap.mmap(self.fd, self.size)

    def _choose_dir(self, size):
        """Return the directory in which to create a *size*-byte arena file.

        Choose a non-storage backed directory if possible, to improve
        performance.  Candidates that cannot be inspected or that lack
        enough free space are skipped; util.get_temp_dir() is the fallback.
        """
        for d in self._dir_candidates:
            try:
                st = os.statvfs(d)
            except OSError:
                # The candidate is missing or unreadable (for instance no
                # /dev/shm in a minimal container): this is only an
                # optimisation, so move on instead of failing the arena.
                continue
            if st.f_bavail * st.f_frsize >= size:  # enough free space?
                return d
        return util.get_temp_dir()
| |
def reduce_arena(a):
    """Reduction function for Arena objects.

    Returns ``(rebuild_arena, (size, DupFd(fd)))`` for an arena that owns a
    file descriptor, and raises ValueError when ``a.fd`` is -1.
    """
    if a.fd != -1:
        return rebuild_arena, (a.size, reduction.DupFd(a.fd))
    raise ValueError('Arena is unpicklable because '
                     'forking was enabled when it was created')
| |
def rebuild_arena(size, dupfd):
    """Recreate an Arena of *size* bytes from the descriptor held by *dupfd*.

    The descriptor is taken from ``dupfd.detach()`` and handed to Arena as
    its *fd* argument.
    """
    fd = dupfd.detach()
    return Arena(size, fd)
| |
| reduction.register(Arena, reduce_arena) |
| |
| # |
| # Class allowing allocation of chunks of memory from arenas |
| # |
| |
class Heap(object):
    """
    Allocator handing out `(arena, start, stop)` blocks carved from arenas.

    Free blocks are indexed by length, by start offset and by stop offset,
    so that a released block can be merged with free neighbours of the same
    arena.  malloc() and free() are the entry points; the state-mutating
    helpers are only called from them while self._lock is held.
    """

    # Minimum malloc() alignment
    _alignment = 8

    _DISCARD_FREE_SPACE_LARGER_THAN = 4 * 1024 ** 2  # 4 MB
    _DOUBLE_ARENA_SIZE_UNTIL = 4 * 1024 ** 2

    def __init__(self, size=mmap.PAGESIZE):
        """Set up an empty heap whose first arena will be *size* bytes."""
        # Pid of the process that initialised this state; malloc() and
        # free() compare it with os.getpid().
        self._lastpid = os.getpid()
        self._lock = threading.Lock()
        # Current arena allocation size
        self._size = size
        # A sorted list of available block sizes in arenas
        self._lengths = []

        # Free block management:
        # - map each block size to a list of `(Arena, start, stop)` blocks
        self._len_to_seq = {}
        # - map `(Arena, start)` tuple to the `(Arena, start, stop)` block
        #   starting at that offset
        self._start_to_block = {}
        # - map `(Arena, stop)` tuple to the `(Arena, start, stop)` block
        #   ending at that offset
        self._stop_to_block = {}

        # Map arenas to their `(start, stop)` ranges in use
        self._allocated_blocks = defaultdict(set)
        self._arenas = []

        # List of pending blocks to free - see comment in free() below
        self._pending_free_blocks = []

        # Statistics: number of malloc() calls, and number of blocks
        # actually returned to the free lists (deferred ones included).
        self._n_mallocs = 0
        self._n_frees = 0

    @staticmethod
    def _roundup(n, alignment):
        """Round *n* up to a multiple of *alignment* (a power of 2)."""
        mask = alignment - 1
        return (n + mask) & ~mask

    def _new_arena(self, size):
        """Create an arena of at least *size* bytes.

        Returns the whole arena as a single `(arena, 0, length)` block; the
        block is not entered in the free-block indexes.
        """
        length = self._roundup(max(self._size, size), mmap.PAGESIZE)
        # We carve larger and larger arenas, for efficiency, until we
        # reach a large-ish size (roughly L3 cache-sized)
        if self._size < self._DOUBLE_ARENA_SIZE_UNTIL:
            self._size *= 2
        util.info('allocating a new mmap of length %d', length)
        arena = Arena(length)
        self._arenas.append(arena)
        return (arena, 0, length)

    def _discard_arena(self, arena):
        """Possibly forget the given (entirely unused) arena.

        Arenas smaller than _DISCARD_FREE_SPACE_LARGER_THAN are kept.
        """
        length = arena.size
        # Reusing an existing arena is faster than creating a new one, so
        # we only reclaim space if it's large enough.
        if length < self._DISCARD_FREE_SPACE_LARGER_THAN:
            return
        blocks = self._allocated_blocks.pop(arena)
        assert not blocks
        # The arena is one single free block at this point: remove it from
        # every index.
        del self._start_to_block[(arena, 0)]
        del self._stop_to_block[(arena, length)]
        self._arenas.remove(arena)
        seq = self._len_to_seq[length]
        seq.remove((arena, 0, length))
        if not seq:
            del self._len_to_seq[length]
            self._lengths.remove(length)

    def _malloc(self, size):
        """Return a free block of at least *size* bytes.

        The block might be much larger than requested; the caller trims it.
        """
        i = bisect.bisect_left(self._lengths, size)
        if i == len(self._lengths):
            # No free block is large enough: carve a fresh arena.
            return self._new_arena(size)

        length = self._lengths[i]
        seq = self._len_to_seq[length]
        block = seq.pop()
        if not seq:
            del self._len_to_seq[length], self._lengths[i]

        (arena, start, stop) = block
        del self._start_to_block[(arena, start)]
        del self._stop_to_block[(arena, stop)]
        return block

    def _add_free_block(self, block):
        """Make *block* available, merging it with free neighbours."""
        (arena, start, stop) = block

        # Merge with the free block ending where this one starts, if any.
        try:
            prev_block = self._stop_to_block[(arena, start)]
        except KeyError:
            pass
        else:
            start, _ = self._absorb(prev_block)

        # Merge with the free block starting where this one stops, if any.
        try:
            next_block = self._start_to_block[(arena, stop)]
        except KeyError:
            pass
        else:
            _, stop = self._absorb(next_block)

        block = (arena, start, stop)
        length = stop - start

        try:
            self._len_to_seq[length].append(block)
        except KeyError:
            self._len_to_seq[length] = [block]
            bisect.insort(self._lengths, length)

        self._start_to_block[(arena, start)] = block
        self._stop_to_block[(arena, stop)] = block

    def _absorb(self, block):
        """Deregister free *block* so it can be merged with a neighbour.

        Returns the block's `(start, stop)` offsets.
        """
        (arena, start, stop) = block
        del self._start_to_block[(arena, start)]
        del self._stop_to_block[(arena, stop)]

        length = stop - start
        seq = self._len_to_seq[length]
        seq.remove(block)
        if not seq:
            del self._len_to_seq[length]
            self._lengths.remove(length)

        return start, stop

    def _remove_allocated_block(self, block):
        """Drop *block* from the in-use set of its arena."""
        arena, start, stop = block
        blocks = self._allocated_blocks[arena]
        blocks.remove((start, stop))
        if not blocks:
            # Arena is entirely free, discard it from this process
            self._discard_arena(arena)

    def _do_free(self, block):
        """Return one allocated block to the free lists (lock held)."""
        # Counted here so that blocks released through the pending list
        # are included in the statistics as well.
        self._n_frees += 1
        self._add_free_block(block)
        self._remove_allocated_block(block)

    def _free_pending_blocks(self):
        """Free all the blocks in the pending list (lock held)."""
        while True:
            try:
                block = self._pending_free_blocks.pop()
            except IndexError:
                break
            self._do_free(block)

    def free(self, block):
        """Free a block returned by malloc().

        Raises ValueError when called from a process whose pid differs
        from the one recorded at initialisation.
        """
        # Since free() can be called asynchronously by the GC, it could happen
        # that it's called while self._lock is held: in that case,
        # self._lock.acquire() would deadlock (issue #12352). To avoid that, a
        # trylock is used instead, and if the lock can't be acquired
        # immediately, the block is added to a list of blocks to be freed
        # synchronously some time later from malloc() or free(), by calling
        # _free_pending_blocks() (appending and retrieving from a list is not
        # strictly thread-safe but under CPython it's atomic thanks to the GIL).
        if os.getpid() != self._lastpid:
            raise ValueError(
                "My pid ({0:n}) is not last pid {1:n}".format(
                    os.getpid(), self._lastpid))
        if not self._lock.acquire(False):
            # can't acquire the lock right now, add the block to the list of
            # pending blocks to free
            self._pending_free_blocks.append(block)
        else:
            # we hold the lock
            try:
                self._free_pending_blocks()
                self._do_free(block)
            finally:
                self._lock.release()

    def malloc(self, size):
        """Return an `(arena, start, stop)` block of *size* bytes.

        The size is rounded up to a multiple of _alignment (and to at
        least one byte).  Raises ValueError for a negative size and
        OverflowError for a size of sys.maxsize or more.
        """
        if size < 0:
            raise ValueError("Size {0:n} out of range".format(size))
        if sys.maxsize <= size:
            raise OverflowError("Size {0:n} too large".format(size))
        if os.getpid() != self._lastpid:
            self.__init__()                     # reinitialize after fork
        with self._lock:
            self._n_mallocs += 1
            # allow pending blocks to be marked available
            self._free_pending_blocks()
            size = self._roundup(max(size, 1), self._alignment)
            (arena, start, stop) = self._malloc(size)
            real_stop = start + size
            if real_stop < stop:
                # if the returned block is larger than necessary, mark
                # the remainder available
                self._add_free_block((arena, real_stop, stop))
            self._allocated_blocks[arena].add((start, real_stop))
            return (arena, start, real_stop)
| |
| # |
| # Class wrapping a block allocated out of a Heap -- can be inherited by child process |
| # |
| |
class BufferWrapper(object):
    """
    A block of *size* bytes allocated from the class-wide Heap.

    The block is handed back to the heap through a util.Finalize callback
    registered on the wrapper.
    """

    _heap = Heap()

    def __init__(self, size):
        """Allocate *size* bytes.

        Raises ValueError for a negative size and OverflowError for a size
        of sys.maxsize or more.
        """
        if size < 0:
            raise ValueError("Size {0:n} out of range".format(size))
        if sys.maxsize <= size:
            raise OverflowError("Size {0:n} too large".format(size))
        heap = BufferWrapper._heap
        block = heap.malloc(size)
        self._state = (block, size)
        util.Finalize(self, heap.free, args=(block,))

    def create_memoryview(self):
        """Return a memoryview over the first *size* bytes of the block."""
        block, size = self._state
        arena, start, _stop = block
        view = memoryview(arena.buffer)
        return view[start:start + size]