|  | # | 
|  | # Module which supports allocation of memory from an mmap | 
|  | # | 
|  | # multiprocessing/heap.py | 
|  | # | 
|  | # Copyright (c) 2006-2008, R Oudkerk | 
|  | # Licensed to PSF under a Contributor Agreement. | 
|  | # | 
|  |  | 
|  | import bisect | 
|  | from collections import defaultdict | 
|  | import mmap | 
|  | import os | 
|  | import sys | 
|  | import tempfile | 
|  | import threading | 
|  |  | 
|  | from .context import reduction, assert_spawning | 
|  | from . import util | 
|  |  | 
|  | __all__ = ['BufferWrapper'] | 
|  |  | 
|  | # | 
|  | # Inheritable class which wraps an mmap, and from which blocks can be allocated | 
|  | # | 
|  |  | 
|  | if sys.platform == 'win32': | 
|  |  | 
|  | import _winapi | 
|  |  | 
|  | class Arena(object): | 
|  | """ | 
|  | A shared memory area backed by anonymous memory (Windows). | 
|  | """ | 
|  |  | 
|  | _rand = tempfile._RandomNameSequence() | 
|  |  | 
|  | def __init__(self, size): | 
|  | self.size = size | 
|  | for i in range(100): | 
|  | name = 'pym-%d-%s' % (os.getpid(), next(self._rand)) | 
|  | buf = mmap.mmap(-1, size, tagname=name) | 
|  | if _winapi.GetLastError() == 0: | 
|  | break | 
|  | # We have reopened a preexisting mmap. | 
|  | buf.close() | 
|  | else: | 
|  | raise FileExistsError('Cannot find name for new mmap') | 
|  | self.name = name | 
|  | self.buffer = buf | 
|  | self._state = (self.size, self.name) | 
|  |  | 
|  | def __getstate__(self): | 
|  | assert_spawning(self) | 
|  | return self._state | 
|  |  | 
|  | def __setstate__(self, state): | 
|  | self.size, self.name = self._state = state | 
|  | # Reopen existing mmap | 
|  | self.buffer = mmap.mmap(-1, self.size, tagname=self.name) | 
|  | # XXX Temporarily preventing buildbot failures while determining | 
|  | # XXX the correct long-term fix. See issue 23060 | 
|  | #assert _winapi.GetLastError() == _winapi.ERROR_ALREADY_EXISTS | 
|  |  | 
|  | else: | 
|  |  | 
|  | class Arena(object): | 
|  | """ | 
|  | A shared memory area backed by a temporary file (POSIX). | 
|  | """ | 
|  |  | 
|  | if sys.platform == 'linux': | 
|  | _dir_candidates = ['/dev/shm'] | 
|  | else: | 
|  | _dir_candidates = [] | 
|  |  | 
|  | def __init__(self, size, fd=-1): | 
|  | self.size = size | 
|  | self.fd = fd | 
|  | if fd == -1: | 
|  | # Arena is created anew (if fd != -1, it means we're coming | 
|  | # from rebuild_arena() below) | 
|  | self.fd, name = tempfile.mkstemp( | 
|  | prefix='pym-%d-'%os.getpid(), | 
|  | dir=self._choose_dir(size)) | 
|  | os.unlink(name) | 
|  | util.Finalize(self, os.close, (self.fd,)) | 
|  | os.ftruncate(self.fd, size) | 
|  | self.buffer = mmap.mmap(self.fd, self.size) | 
|  |  | 
|  | def _choose_dir(self, size): | 
|  | # Choose a non-storage backed directory if possible, | 
|  | # to improve performance | 
|  | for d in self._dir_candidates: | 
|  | st = os.statvfs(d) | 
|  | if st.f_bavail * st.f_frsize >= size:  # enough free space? | 
|  | return d | 
|  | return util.get_temp_dir() | 
|  |  | 
|  | def reduce_arena(a): | 
|  | if a.fd == -1: | 
|  | raise ValueError('Arena is unpicklable because ' | 
|  | 'forking was enabled when it was created') | 
|  | return rebuild_arena, (a.size, reduction.DupFd(a.fd)) | 
|  |  | 
|  | def rebuild_arena(size, dupfd): | 
|  | return Arena(size, dupfd.detach()) | 
|  |  | 
|  | reduction.register(Arena, reduce_arena) | 
|  |  | 
|  | # | 
|  | # Class allowing allocation of chunks of memory from arenas | 
|  | # | 
|  |  | 
|  | class Heap(object): | 
|  |  | 
|  | # Minimum malloc() alignment | 
|  | _alignment = 8 | 
|  |  | 
|  | _DISCARD_FREE_SPACE_LARGER_THAN = 4 * 1024 ** 2  # 4 MB | 
|  | _DOUBLE_ARENA_SIZE_UNTIL = 4 * 1024 ** 2 | 
|  |  | 
|  | def __init__(self, size=mmap.PAGESIZE): | 
|  | self._lastpid = os.getpid() | 
|  | self._lock = threading.Lock() | 
|  | # Current arena allocation size | 
|  | self._size = size | 
|  | # A sorted list of available block sizes in arenas | 
|  | self._lengths = [] | 
|  |  | 
|  | # Free block management: | 
|  | # - map each block size to a list of `(Arena, start, stop)` blocks | 
|  | self._len_to_seq = {} | 
|  | # - map `(Arena, start)` tuple to the `(Arena, start, stop)` block | 
|  | #   starting at that offset | 
|  | self._start_to_block = {} | 
|  | # - map `(Arena, stop)` tuple to the `(Arena, start, stop)` block | 
|  | #   ending at that offset | 
|  | self._stop_to_block = {} | 
|  |  | 
|  | # Map arenas to their `(Arena, start, stop)` blocks in use | 
|  | self._allocated_blocks = defaultdict(set) | 
|  | self._arenas = [] | 
|  |  | 
|  | # List of pending blocks to free - see comment in free() below | 
|  | self._pending_free_blocks = [] | 
|  |  | 
|  | # Statistics | 
|  | self._n_mallocs = 0 | 
|  | self._n_frees = 0 | 
|  |  | 
|  | @staticmethod | 
|  | def _roundup(n, alignment): | 
|  | # alignment must be a power of 2 | 
|  | mask = alignment - 1 | 
|  | return (n + mask) & ~mask | 
|  |  | 
|  | def _new_arena(self, size): | 
|  | # Create a new arena with at least the given *size* | 
|  | length = self._roundup(max(self._size, size), mmap.PAGESIZE) | 
|  | # We carve larger and larger arenas, for efficiency, until we | 
|  | # reach a large-ish size (roughly L3 cache-sized) | 
|  | if self._size < self._DOUBLE_ARENA_SIZE_UNTIL: | 
|  | self._size *= 2 | 
|  | util.info('allocating a new mmap of length %d', length) | 
|  | arena = Arena(length) | 
|  | self._arenas.append(arena) | 
|  | return (arena, 0, length) | 
|  |  | 
|  | def _discard_arena(self, arena): | 
|  | # Possibly delete the given (unused) arena | 
|  | length = arena.size | 
|  | # Reusing an existing arena is faster than creating a new one, so | 
|  | # we only reclaim space if it's large enough. | 
|  | if length < self._DISCARD_FREE_SPACE_LARGER_THAN: | 
|  | return | 
|  | blocks = self._allocated_blocks.pop(arena) | 
|  | assert not blocks | 
|  | del self._start_to_block[(arena, 0)] | 
|  | del self._stop_to_block[(arena, length)] | 
|  | self._arenas.remove(arena) | 
|  | seq = self._len_to_seq[length] | 
|  | seq.remove((arena, 0, length)) | 
|  | if not seq: | 
|  | del self._len_to_seq[length] | 
|  | self._lengths.remove(length) | 
|  |  | 
|  | def _malloc(self, size): | 
|  | # returns a large enough block -- it might be much larger | 
|  | i = bisect.bisect_left(self._lengths, size) | 
|  | if i == len(self._lengths): | 
|  | return self._new_arena(size) | 
|  | else: | 
|  | length = self._lengths[i] | 
|  | seq = self._len_to_seq[length] | 
|  | block = seq.pop() | 
|  | if not seq: | 
|  | del self._len_to_seq[length], self._lengths[i] | 
|  |  | 
|  | (arena, start, stop) = block | 
|  | del self._start_to_block[(arena, start)] | 
|  | del self._stop_to_block[(arena, stop)] | 
|  | return block | 
|  |  | 
|  | def _add_free_block(self, block): | 
|  | # make block available and try to merge with its neighbours in the arena | 
|  | (arena, start, stop) = block | 
|  |  | 
|  | try: | 
|  | prev_block = self._stop_to_block[(arena, start)] | 
|  | except KeyError: | 
|  | pass | 
|  | else: | 
|  | start, _ = self._absorb(prev_block) | 
|  |  | 
|  | try: | 
|  | next_block = self._start_to_block[(arena, stop)] | 
|  | except KeyError: | 
|  | pass | 
|  | else: | 
|  | _, stop = self._absorb(next_block) | 
|  |  | 
|  | block = (arena, start, stop) | 
|  | length = stop - start | 
|  |  | 
|  | try: | 
|  | self._len_to_seq[length].append(block) | 
|  | except KeyError: | 
|  | self._len_to_seq[length] = [block] | 
|  | bisect.insort(self._lengths, length) | 
|  |  | 
|  | self._start_to_block[(arena, start)] = block | 
|  | self._stop_to_block[(arena, stop)] = block | 
|  |  | 
|  | def _absorb(self, block): | 
|  | # deregister this block so it can be merged with a neighbour | 
|  | (arena, start, stop) = block | 
|  | del self._start_to_block[(arena, start)] | 
|  | del self._stop_to_block[(arena, stop)] | 
|  |  | 
|  | length = stop - start | 
|  | seq = self._len_to_seq[length] | 
|  | seq.remove(block) | 
|  | if not seq: | 
|  | del self._len_to_seq[length] | 
|  | self._lengths.remove(length) | 
|  |  | 
|  | return start, stop | 
|  |  | 
|  | def _remove_allocated_block(self, block): | 
|  | arena, start, stop = block | 
|  | blocks = self._allocated_blocks[arena] | 
|  | blocks.remove((start, stop)) | 
|  | if not blocks: | 
|  | # Arena is entirely free, discard it from this process | 
|  | self._discard_arena(arena) | 
|  |  | 
|  | def _free_pending_blocks(self): | 
|  | # Free all the blocks in the pending list - called with the lock held. | 
|  | while True: | 
|  | try: | 
|  | block = self._pending_free_blocks.pop() | 
|  | except IndexError: | 
|  | break | 
|  | self._add_free_block(block) | 
|  | self._remove_allocated_block(block) | 
|  |  | 
|  | def free(self, block): | 
|  | # free a block returned by malloc() | 
|  | # Since free() can be called asynchronously by the GC, it could happen | 
|  | # that it's called while self._lock is held: in that case, | 
|  | # self._lock.acquire() would deadlock (issue #12352). To avoid that, a | 
|  | # trylock is used instead, and if the lock can't be acquired | 
|  | # immediately, the block is added to a list of blocks to be freed | 
|  | # synchronously sometimes later from malloc() or free(), by calling | 
|  | # _free_pending_blocks() (appending and retrieving from a list is not | 
|  | # strictly thread-safe but under CPython it's atomic thanks to the GIL). | 
|  | if os.getpid() != self._lastpid: | 
|  | raise ValueError( | 
|  | "My pid ({0:n}) is not last pid {1:n}".format( | 
|  | os.getpid(),self._lastpid)) | 
|  | if not self._lock.acquire(False): | 
|  | # can't acquire the lock right now, add the block to the list of | 
|  | # pending blocks to free | 
|  | self._pending_free_blocks.append(block) | 
|  | else: | 
|  | # we hold the lock | 
|  | try: | 
|  | self._n_frees += 1 | 
|  | self._free_pending_blocks() | 
|  | self._add_free_block(block) | 
|  | self._remove_allocated_block(block) | 
|  | finally: | 
|  | self._lock.release() | 
|  |  | 
|  | def malloc(self, size): | 
|  | # return a block of right size (possibly rounded up) | 
|  | if size < 0: | 
|  | raise ValueError("Size {0:n} out of range".format(size)) | 
|  | if sys.maxsize <= size: | 
|  | raise OverflowError("Size {0:n} too large".format(size)) | 
|  | if os.getpid() != self._lastpid: | 
|  | self.__init__()                     # reinitialize after fork | 
|  | with self._lock: | 
|  | self._n_mallocs += 1 | 
|  | # allow pending blocks to be marked available | 
|  | self._free_pending_blocks() | 
|  | size = self._roundup(max(size, 1), self._alignment) | 
|  | (arena, start, stop) = self._malloc(size) | 
|  | real_stop = start + size | 
|  | if real_stop < stop: | 
|  | # if the returned block is larger than necessary, mark | 
|  | # the remainder available | 
|  | self._add_free_block((arena, real_stop, stop)) | 
|  | self._allocated_blocks[arena].add((start, real_stop)) | 
|  | return (arena, start, real_stop) | 
|  |  | 
|  | # | 
|  | # Class wrapping a block allocated out of a Heap -- can be inherited by child process | 
|  | # | 
|  |  | 
|  | class BufferWrapper(object): | 
|  |  | 
|  | _heap = Heap() | 
|  |  | 
|  | def __init__(self, size): | 
|  | if size < 0: | 
|  | raise ValueError("Size {0:n} out of range".format(size)) | 
|  | if sys.maxsize <= size: | 
|  | raise OverflowError("Size {0:n} too large".format(size)) | 
|  | block = BufferWrapper._heap.malloc(size) | 
|  | self._state = (block, size) | 
|  | util.Finalize(self, BufferWrapper._heap.free, args=(block,)) | 
|  |  | 
|  | def create_memoryview(self): | 
|  | (arena, start, stop), size = self._state | 
|  | return memoryview(arena.buffer)[start:start+size] |