Lib/multiprocessing/heap.py - platform/external/python/cpython3 - Git at Google

 #
 # Module which supports allocation of memory from an mmap
 #
 # multiprocessing/heap.py
 #
 # Copyright (c) 2006-2008, R Oudkerk
 # Licensed to PSF under a Contributor Agreement.
 #

 import bisect
 from collections import defaultdict
 import mmap
 import os
 import sys
 import tempfile
 import threading

 from .context import reduction, assert_spawning
 from . import util

 __all__ = ['BufferWrapper']

 #
 # Inheritable class which wraps an mmap, and from which blocks can be allocated
 #

 if sys.platform == 'win32':

     import _winapi

     class Arena(object):
         """
         A shared memory area backed by anonymous memory (Windows).

         The mapping is created under a freshly generated tag name.  The
         size and that name form the pickled state, and unpickling reopens
         the mapping through the same tag name.
         """

         # Source of the random suffixes used in mapping tag names.
         _rand = tempfile._RandomNameSequence()

         def __init__(self, size):
             """Create a new anonymous mapping of *size* bytes.

             Raises FileExistsError when none of the 100 generated tag
             names turned out to be unused.
             """
             self.size = size
             for _ in range(100):
                 name = 'pym-%d-%s' % (os.getpid(), next(self._rand))
                 buf = mmap.mmap(-1, size, tagname=name)
                 if _winapi.GetLastError() != 0:
                     # We have reopened a preexisting mmap: drop it and
                     # try again with another name.
                     buf.close()
                     continue
                 break
             else:
                 raise FileExistsError('Cannot find name for new mmap')
             self.name = name
             self.buffer = buf
             self._state = (size, name)

         def __getstate__(self):
             """Return the `(size, name)` pair used as pickled state."""
             # NOTE(review): assert_spawning() is defined elsewhere;
             # presumably it rejects pickling outside of process spawning.
             assert_spawning(self)
             return self._state

         def __setstate__(self, state):
             """Restore from a `(size, name)` pair and reopen the mapping."""
             size, name = state
             self.size = size
             self.name = name
             self._state = state
             # Reopen existing mmap
             self.buffer = mmap.mmap(-1, size, tagname=name)
             # XXX Temporarily preventing buildbot failures while determining
             # XXX the correct long-term fix. See issue 23060
             #assert _winapi.GetLastError() == _winapi.ERROR_ALREADY_EXISTS

 else:

     class Arena(object):
         """
         A shared memory area backed by a temporary file (POSIX).

         The backing file is unlinked as soon as it has been created, so
         only the file descriptor (kept in `self.fd`) refers to it.
         """

         # Directories tried first for the backing file, in order.
         _dir_candidates = ['/dev/shm'] if sys.platform == 'linux' else []

         def __init__(self, size, fd=-1):
             """Map *size* bytes of the file behind *fd*.

             With the default `fd=-1` a new backing file is created first;
             any other value is used as an already open descriptor (this is
             how rebuild_arena() constructs an arena).
             """
             self.size = size
             self.fd = fd
             if fd == -1:
                 # Arena is created anew: make the backing file, remove its
                 # name right away and grow it to the requested size.
                 backing_dir = self._choose_dir(size)
                 self.fd, path = tempfile.mkstemp(
                     prefix='pym-%d-' % os.getpid(), dir=backing_dir)
                 os.unlink(path)
                 # Registered before ftruncate() so that the descriptor is
                 # handed to the finalizer even if resizing fails.
                 util.Finalize(self, os.close, (self.fd,))
                 os.ftruncate(self.fd, size)
             self.buffer = mmap.mmap(self.fd, self.size)

         def _choose_dir(self, size):
             """Return the directory in which to create the backing file.

             The first entry of `_dir_candidates` with at least *size* bytes
             available wins; otherwise util.get_temp_dir() is used.
             """
             # Choose a non-storage backed directory if possible,
             # to improve performance
             for candidate in self._dir_candidates:
                 stats = os.statvfs(candidate)
                 available = stats.f_bavail * stats.f_frsize
                 if available >= size:  # enough free space?
                     return candidate
             return util.get_temp_dir()

     def reduce_arena(a):
         """Reduction function for Arena objects.

         Returns `(rebuild_arena, (size, DupFd))` so that the arena can be
         rebuilt from its size and a duplicate of its file descriptor.
         Raises ValueError when the arena has no descriptor (`fd == -1`).
         """
         if a.fd != -1:
             return rebuild_arena, (a.size, reduction.DupFd(a.fd))
         raise ValueError('Arena is unpicklable because '
                          'forking was enabled when it was created')

     def rebuild_arena(size, dupfd):
         """Recreate an Arena of *size* bytes from the descriptor in *dupfd*.

         Counterpart of reduce_arena(): *dupfd* is the object that was built
         there with reduction.DupFd(); its detach() result is passed to Arena
         as the file descriptor.
         """
         fd = dupfd.detach()
         return Arena(size, fd)

     reduction.register(Arena, reduce_arena)

 #
 # Class allowing allocation of chunks of memory from arenas
 #

 class Heap(object):
     """
     Allocator handing out `(arena, start, stop)` blocks carved from arenas.

     Free blocks are indexed by length, by start offset and by stop offset,
     which lets a released block be merged with the free blocks next to it
     in the same arena.  `malloc()` and `free()` update that bookkeeping
     while holding `self._lock`; `free()` never waits for the lock and
     queues the block for later when the lock is busy.
     """

     # Minimum malloc() alignment
     _alignment = 8

     # An entirely free arena is only dropped when it is at least this big
     _DISCARD_FREE_SPACE_LARGER_THAN = 4 * 1024 ** 2  # 4 MB
     # The size used for new arenas doubles until it reaches this value
     _DOUBLE_ARENA_SIZE_UNTIL = 4 * 1024 ** 2

     def __init__(self, size=mmap.PAGESIZE):
         """Create an empty heap; *size* is the minimum size of new arenas."""
         # Pid of the process owning this state, used to detect a fork
         self._lastpid = os.getpid()
         self._lock = threading.Lock()
         # Current arena allocation size
         self._size = size
         # A sorted list of available block sizes in arenas
         self._lengths = []

         # Free block management:
         # - map each block size to a list of `(Arena, start, stop)` blocks
         self._len_to_seq = {}
         # - map `(Arena, start)` tuple to the `(Arena, start, stop)` block
         #   starting at that offset
         self._start_to_block = {}
         # - map `(Arena, stop)` tuple to the `(Arena, start, stop)` block
         #   ending at that offset
         self._stop_to_block = {}

         # Map arenas to the set of `(start, stop)` ranges in use in them
         self._allocated_blocks = defaultdict(set)
         self._arenas = []

         # List of pending blocks to free - see comment in free() below
         self._pending_free_blocks = []

         # Statistics: number of malloc() calls that reached the allocator
         # and number of blocks handed back to the free lists
         self._n_mallocs = 0
         self._n_frees = 0

     @staticmethod
     def _roundup(n, alignment):
         """Return *n* rounded up to a multiple of *alignment*."""
         # alignment must be a power of 2
         mask = alignment - 1
         return (n + mask) & ~mask

     def _new_arena(self, size):
         """Create an arena of at least *size* bytes.

         Returns the `(arena, 0, length)` block spanning the whole arena.
         The block is not registered as free: the caller owns it.
         """
         # The length is the larger of the request and the current arena
         # size, rounded up to a whole number of pages
         length = self._roundup(max(self._size, size), mmap.PAGESIZE)
         # We carve larger and larger arenas, for efficiency, until we
         # reach a large-ish size (roughly L3 cache-sized)
         if self._size < self._DOUBLE_ARENA_SIZE_UNTIL:
             self._size *= 2
         util.info('allocating a new mmap of length %d', length)
         arena = Arena(length)
         self._arenas.append(arena)
         return (arena, 0, length)

     def _discard_arena(self, arena):
         """Possibly forget the given arena, which must be entirely free.

         Arenas smaller than `_DISCARD_FREE_SPACE_LARGER_THAN` are kept.
         """
         length = arena.size
         # Reusing an existing arena is faster than creating a new one, so
         # we only reclaim space if it's large enough.
         if length < self._DISCARD_FREE_SPACE_LARGER_THAN:
             return
         blocks = self._allocated_blocks.pop(arena)
         assert not blocks
         # The arena is one single free block `(arena, 0, length)`: remove
         # every index entry referring to it
         del self._start_to_block[(arena, 0)]
         del self._stop_to_block[(arena, length)]
         self._arenas.remove(arena)
         seq = self._len_to_seq[length]
         seq.remove((arena, 0, length))
         if not seq:
             del self._len_to_seq[length]
             self._lengths.remove(length)

     def _malloc(self, size):
         """Return a block of at least *size* bytes, removed from the free
         lists.  The block might be much larger than requested."""
         # Smallest free length that is >= size
         i = bisect.bisect_left(self._lengths, size)
         if i == len(self._lengths):
             # No free block is large enough
             return self._new_arena(size)
         else:
             length = self._lengths[i]
             seq = self._len_to_seq[length]
             block = seq.pop()
             if not seq:
                 del self._len_to_seq[length], self._lengths[i]

         (arena, start, stop) = block
         del self._start_to_block[(arena, start)]
         del self._stop_to_block[(arena, stop)]
         return block

     def _add_free_block(self, block):
         """Make *block* available, merging it with the free blocks that
         touch it on either side in the same arena."""
         (arena, start, stop) = block

         # A free block ending where this one starts?
         try:
             prev_block = self._stop_to_block[(arena, start)]
         except KeyError:
             pass
         else:
             start, _ = self._absorb(prev_block)

         # A free block starting where this one ends?
         try:
             next_block = self._start_to_block[(arena, stop)]
         except KeyError:
             pass
         else:
             _, stop = self._absorb(next_block)

         block = (arena, start, stop)
         length = stop - start

         try:
             self._len_to_seq[length].append(block)
         except KeyError:
             # First free block of this length
             self._len_to_seq[length] = [block]
             bisect.insort(self._lengths, length)

         self._start_to_block[(arena, start)] = block
         self._stop_to_block[(arena, stop)] = block

     def _absorb(self, block):
         """Deregister the free *block* so it can be merged with a neighbour.

         Returns its `(start, stop)` offsets.
         """
         (arena, start, stop) = block
         del self._start_to_block[(arena, start)]
         del self._stop_to_block[(arena, stop)]

         length = stop - start
         seq = self._len_to_seq[length]
         seq.remove(block)
         if not seq:
             del self._len_to_seq[length]
             self._lengths.remove(length)

         return start, stop

     def _remove_allocated_block(self, block):
         """Forget that *block* is in use; discard its arena if that was the
         last block in use in it."""
         arena, start, stop = block
         blocks = self._allocated_blocks[arena]
         blocks.remove((start, stop))
         if not blocks:
             # Arena is entirely free, discard it from this process
             self._discard_arena(arena)

     def _free_pending_blocks(self):
         """Free all the blocks in the pending list.

         Must be called with the lock held.
         """
         while True:
             try:
                 block = self._pending_free_blocks.pop()
             except IndexError:
                 break
             # A deferred free was not counted by free(); count it now that
             # it is carried out so that the statistics do not miss it.
             self._n_frees += 1
             self._add_free_block(block)
             self._remove_allocated_block(block)

     def free(self, block):
         """Free a block returned by malloc().

         Raises ValueError when called from a process other than the one
         recorded in `self._lastpid`.
         """
         # Since free() can be called asynchronously by the GC, it could happen
         # that it's called while self._lock is held: in that case,
         # self._lock.acquire() would deadlock (issue #12352). To avoid that, a
         # trylock is used instead, and if the lock can't be acquired
         # immediately, the block is added to a list of blocks to be freed
         # synchronously sometimes later from malloc() or free(), by calling
         # _free_pending_blocks() (appending and retrieving from a list is not
         # strictly thread-safe but under CPython it's atomic thanks to the GIL).
         if os.getpid() != self._lastpid:
             raise ValueError(
                 "My pid ({0:n}) is not last pid {1:n}".format(
                     os.getpid(),self._lastpid))
         if not self._lock.acquire(False):
             # can't acquire the lock right now, add the block to the list of
             # pending blocks to free
             self._pending_free_blocks.append(block)
         else:
             # we hold the lock
             try:
                 self._n_frees += 1
                 self._free_pending_blocks()
                 self._add_free_block(block)
                 self._remove_allocated_block(block)
             finally:
                 self._lock.release()

     def malloc(self, size):
         """Return an `(arena, start, stop)` block of *size* bytes.

         The size is rounded up to a multiple of `_alignment` (and to at
         least one aligned unit for a size of 0).  Raises ValueError for a
         negative size and OverflowError for a size >= sys.maxsize.
         """
         if size < 0:
             raise ValueError("Size {0:n} out of range".format(size))
         if sys.maxsize <= size:
             raise OverflowError("Size {0:n} too large".format(size))
         if os.getpid() != self._lastpid:
             self.__init__()                     # reinitialize after fork
         with self._lock:
             self._n_mallocs += 1
             # allow pending blocks to be marked available
             self._free_pending_blocks()
             size = self._roundup(max(size, 1), self._alignment)
             (arena, start, stop) = self._malloc(size)
             real_stop = start + size
             if real_stop < stop:
                 # if the returned block is larger than necessary, mark
                 # the remainder available
                 self._add_free_block((arena, real_stop, stop))
             self._allocated_blocks[arena].add((start, real_stop))
             return (arena, start, real_stop)

 #
 # Class wrapping a block allocated out of a Heap -- can be inherited by child process
 #

 class BufferWrapper(object):
     """
     A block of memory allocated from the heap shared by all instances.

     The block is handed back to the heap through a util.Finalize callback
     registered on the wrapper.
     """

     # Heap shared by every BufferWrapper
     _heap = Heap()

     def __init__(self, size):
         """Allocate a block of *size* bytes.

         Raises ValueError for a negative size and OverflowError for a
         size >= sys.maxsize.
         """
         if size < 0:
             raise ValueError("Size {0:n} out of range".format(size))
         if sys.maxsize <= size:
             raise OverflowError("Size {0:n} too large".format(size))
         heap = BufferWrapper._heap
         block = heap.malloc(size)
         # The requested size is kept next to the block because the block
         # itself may have been rounded up by the heap
         self._state = (block, size)
         util.Finalize(self, heap.free, args=(block,))

     def create_memoryview(self):
         """Return a memoryview over the requested bytes of the block."""
         (arena, start, _stop), size = self._state
         whole_arena = memoryview(arena.buffer)
         return whole_arena[start:start+size]
	#
	# Module which supports allocation of memory from an mmap
	#
	# multiprocessing/heap.py
	#
	# Copyright (c) 2006-2008, R Oudkerk
	# Licensed to PSF under a Contributor Agreement.
	#

	import bisect
	from collections import defaultdict
	import mmap
	import os
	import sys
	import tempfile
	import threading

	from .context import reduction, assert_spawning
	from . import util

	__all__ = ['BufferWrapper']

	#
	# Inheritable class which wraps an mmap, and from which blocks can be allocated
	#

	if sys.platform == 'win32':

	    import _winapi

	    class Arena(object):
	        """
	        A shared memory area backed by anonymous memory (Windows).

	        The mapping is created under a freshly generated tag name.  The
	        size and that name form the pickled state, and unpickling
	        reopens the mapping through the same tag name.
	        """

	        # Source of the random suffixes used in mapping tag names.
	        _rand = tempfile._RandomNameSequence()

	        def __init__(self, size):
	            """Create a new anonymous mapping of *size* bytes.

	            Raises FileExistsError when none of the 100 generated tag
	            names turned out to be unused.
	            """
	            self.size = size
	            for i in range(100):
	                name = 'pym-%d-%s' % (os.getpid(), next(self._rand))
	                buf = mmap.mmap(-1, size, tagname=name)
	                if _winapi.GetLastError() == 0:
	                    break
	                # We have reopened a preexisting mmap.
	                buf.close()
	            else:
	                raise FileExistsError('Cannot find name for new mmap')
	            self.name = name
	            self.buffer = buf
	            self._state = (self.size, self.name)

	        def __getstate__(self):
	            """Return the `(size, name)` pair used as pickled state."""
	            # NOTE(review): assert_spawning() is defined elsewhere;
	            # presumably it rejects pickling outside of process spawning.
	            assert_spawning(self)
	            return self._state

	        def __setstate__(self, state):
	            """Restore from a `(size, name)` pair and reopen the mapping."""
	            self.size, self.name = self._state = state
	            # Reopen existing mmap
	            self.buffer = mmap.mmap(-1, self.size, tagname=self.name)
	            # XXX Temporarily preventing buildbot failures while determining
	            # XXX the correct long-term fix. See issue 23060
	            #assert _winapi.GetLastError() == _winapi.ERROR_ALREADY_EXISTS

	else:

	    class Arena(object):
	        """
	        A shared memory area backed by a temporary file (POSIX).

	        The backing file is unlinked as soon as it has been created, so
	        only the file descriptor (kept in `self.fd`) refers to it.
	        """

	        # Directories tried first for the backing file, in order.
	        if sys.platform == 'linux':
	            _dir_candidates = ['/dev/shm']
	        else:
	            _dir_candidates = []

	        def __init__(self, size, fd=-1):
	            """Map *size* bytes of the file behind *fd*.

	            With the default `fd=-1` a new backing file is created
	            first; any other value is used as an already open
	            descriptor (this is how rebuild_arena() builds an arena).
	            """
	            self.size = size
	            self.fd = fd
	            if fd == -1:
	                # Arena is created anew (if fd != -1, it means we're coming
	                # from rebuild_arena() below)
	                self.fd, name = tempfile.mkstemp(
	                    prefix='pym-%d-'%os.getpid(),
	                    dir=self._choose_dir(size))
	                os.unlink(name)
	                # Registered before ftruncate() so that the descriptor is
	                # handed to the finalizer even if resizing fails.
	                util.Finalize(self, os.close, (self.fd,))
	                os.ftruncate(self.fd, size)
	            self.buffer = mmap.mmap(self.fd, self.size)

	        def _choose_dir(self, size):
	            """Return the directory in which to create the backing file.

	            The first entry of `_dir_candidates` with at least *size*
	            bytes available wins; otherwise util.get_temp_dir() is used.
	            """
	            # Choose a non-storage backed directory if possible,
	            # to improve performance
	            for d in self._dir_candidates:
	                st = os.statvfs(d)
	                if st.f_bavail * st.f_frsize >= size:  # enough free space?
	                    return d
	            return util.get_temp_dir()

	    def reduce_arena(a):
	        """Reduction function for Arena objects.

	        Returns `(rebuild_arena, (size, DupFd))`; raises ValueError when
	        the arena has no descriptor (`fd == -1`).
	        """
	        if a.fd == -1:
	            raise ValueError('Arena is unpicklable because '
	                             'forking was enabled when it was created')
	        return rebuild_arena, (a.size, reduction.DupFd(a.fd))

	    def rebuild_arena(size, dupfd):
	        """Recreate an Arena of *size* bytes from the descriptor obtained
	        with `dupfd.detach()`."""
	        return Arena(size, dupfd.detach())

	    reduction.register(Arena, reduce_arena)

	#
	# Class allowing allocation of chunks of memory from arenas
	#

	class Heap(object):
	    """
	    Allocator handing out `(arena, start, stop)` blocks carved from arenas.

	    Free blocks are indexed by length, by start offset and by stop offset,
	    which lets a released block be merged with the free blocks next to it
	    in the same arena.  `malloc()` and `free()` update that bookkeeping
	    while holding `self._lock`; `free()` never waits for the lock and
	    queues the block for later when the lock is busy.
	    """

	    # Minimum malloc() alignment
	    _alignment = 8

	    # An entirely free arena is only dropped when it is at least this big
	    _DISCARD_FREE_SPACE_LARGER_THAN = 4 * 1024 ** 2  # 4 MB
	    # The size used for new arenas doubles until it reaches this value
	    _DOUBLE_ARENA_SIZE_UNTIL = 4 * 1024 ** 2

	    def __init__(self, size=mmap.PAGESIZE):
	        """Create an empty heap; *size* is the minimum size of new arenas."""
	        # Pid of the process owning this state, used to detect a fork
	        self._lastpid = os.getpid()
	        self._lock = threading.Lock()
	        # Current arena allocation size
	        self._size = size
	        # A sorted list of available block sizes in arenas
	        self._lengths = []

	        # Free block management:
	        # - map each block size to a list of `(Arena, start, stop)` blocks
	        self._len_to_seq = {}
	        # - map `(Arena, start)` tuple to the `(Arena, start, stop)` block
	        #   starting at that offset
	        self._start_to_block = {}
	        # - map `(Arena, stop)` tuple to the `(Arena, start, stop)` block
	        #   ending at that offset
	        self._stop_to_block = {}

	        # Map arenas to the set of `(start, stop)` ranges in use in them
	        self._allocated_blocks = defaultdict(set)
	        self._arenas = []

	        # List of pending blocks to free - see comment in free() below
	        self._pending_free_blocks = []

	        # Statistics: number of malloc() calls that reached the allocator
	        # and number of blocks handed back to the free lists
	        self._n_mallocs = 0
	        self._n_frees = 0

	    @staticmethod
	    def _roundup(n, alignment):
	        """Return *n* rounded up to a multiple of *alignment*."""
	        # alignment must be a power of 2
	        mask = alignment - 1
	        return (n + mask) & ~mask

	    def _new_arena(self, size):
	        """Create an arena of at least *size* bytes.

	        Returns the `(arena, 0, length)` block spanning the whole arena.
	        The block is not registered as free: the caller owns it.
	        """
	        # The length is the larger of the request and the current arena
	        # size, rounded up to a whole number of pages
	        length = self._roundup(max(self._size, size), mmap.PAGESIZE)
	        # We carve larger and larger arenas, for efficiency, until we
	        # reach a large-ish size (roughly L3 cache-sized)
	        if self._size < self._DOUBLE_ARENA_SIZE_UNTIL:
	            self._size *= 2
	        util.info('allocating a new mmap of length %d', length)
	        arena = Arena(length)
	        self._arenas.append(arena)
	        return (arena, 0, length)

	    def _discard_arena(self, arena):
	        """Possibly forget the given arena, which must be entirely free.

	        Arenas smaller than `_DISCARD_FREE_SPACE_LARGER_THAN` are kept.
	        """
	        length = arena.size
	        # Reusing an existing arena is faster than creating a new one, so
	        # we only reclaim space if it's large enough.
	        if length < self._DISCARD_FREE_SPACE_LARGER_THAN:
	            return
	        blocks = self._allocated_blocks.pop(arena)
	        assert not blocks
	        # The arena is one single free block `(arena, 0, length)`: remove
	        # every index entry referring to it
	        del self._start_to_block[(arena, 0)]
	        del self._stop_to_block[(arena, length)]
	        self._arenas.remove(arena)
	        seq = self._len_to_seq[length]
	        seq.remove((arena, 0, length))
	        if not seq:
	            del self._len_to_seq[length]
	            self._lengths.remove(length)

	    def _malloc(self, size):
	        """Return a block of at least *size* bytes, removed from the free
	        lists.  The block might be much larger than requested."""
	        # Smallest free length that is >= size
	        i = bisect.bisect_left(self._lengths, size)
	        if i == len(self._lengths):
	            # No free block is large enough
	            return self._new_arena(size)
	        else:
	            length = self._lengths[i]
	            seq = self._len_to_seq[length]
	            block = seq.pop()
	            if not seq:
	                del self._len_to_seq[length], self._lengths[i]

	        (arena, start, stop) = block
	        del self._start_to_block[(arena, start)]
	        del self._stop_to_block[(arena, stop)]
	        return block

	    def _add_free_block(self, block):
	        """Make *block* available, merging it with the free blocks that
	        touch it on either side in the same arena."""
	        (arena, start, stop) = block

	        # A free block ending where this one starts?
	        try:
	            prev_block = self._stop_to_block[(arena, start)]
	        except KeyError:
	            pass
	        else:
	            start, _ = self._absorb(prev_block)

	        # A free block starting where this one ends?
	        try:
	            next_block = self._start_to_block[(arena, stop)]
	        except KeyError:
	            pass
	        else:
	            _, stop = self._absorb(next_block)

	        block = (arena, start, stop)
	        length = stop - start

	        try:
	            self._len_to_seq[length].append(block)
	        except KeyError:
	            # First free block of this length
	            self._len_to_seq[length] = [block]
	            bisect.insort(self._lengths, length)

	        self._start_to_block[(arena, start)] = block
	        self._stop_to_block[(arena, stop)] = block

	    def _absorb(self, block):
	        """Deregister the free *block* so it can be merged with a neighbour.

	        Returns its `(start, stop)` offsets.
	        """
	        (arena, start, stop) = block
	        del self._start_to_block[(arena, start)]
	        del self._stop_to_block[(arena, stop)]

	        length = stop - start
	        seq = self._len_to_seq[length]
	        seq.remove(block)
	        if not seq:
	            del self._len_to_seq[length]
	            self._lengths.remove(length)

	        return start, stop

	    def _remove_allocated_block(self, block):
	        """Forget that *block* is in use; discard its arena if that was the
	        last block in use in it."""
	        arena, start, stop = block
	        blocks = self._allocated_blocks[arena]
	        blocks.remove((start, stop))
	        if not blocks:
	            # Arena is entirely free, discard it from this process
	            self._discard_arena(arena)

	    def _free_pending_blocks(self):
	        """Free all the blocks in the pending list.

	        Must be called with the lock held.
	        """
	        while True:
	            try:
	                block = self._pending_free_blocks.pop()
	            except IndexError:
	                break
	            # A deferred free was not counted by free(); count it now that
	            # it is carried out so that the statistics do not miss it.
	            self._n_frees += 1
	            self._add_free_block(block)
	            self._remove_allocated_block(block)

	    def free(self, block):
	        """Free a block returned by malloc().

	        Raises ValueError when called from a process other than the one
	        recorded in `self._lastpid`.
	        """
	        # Since free() can be called asynchronously by the GC, it could happen
	        # that it's called while self._lock is held: in that case,
	        # self._lock.acquire() would deadlock (issue #12352). To avoid that, a
	        # trylock is used instead, and if the lock can't be acquired
	        # immediately, the block is added to a list of blocks to be freed
	        # synchronously sometimes later from malloc() or free(), by calling
	        # _free_pending_blocks() (appending and retrieving from a list is not
	        # strictly thread-safe but under CPython it's atomic thanks to the GIL).
	        if os.getpid() != self._lastpid:
	            raise ValueError(
	                "My pid ({0:n}) is not last pid {1:n}".format(
	                    os.getpid(),self._lastpid))
	        if not self._lock.acquire(False):
	            # can't acquire the lock right now, add the block to the list of
	            # pending blocks to free
	            self._pending_free_blocks.append(block)
	        else:
	            # we hold the lock
	            try:
	                self._n_frees += 1
	                self._free_pending_blocks()
	                self._add_free_block(block)
	                self._remove_allocated_block(block)
	            finally:
	                self._lock.release()

	    def malloc(self, size):
	        """Return an `(arena, start, stop)` block of *size* bytes.

	        The size is rounded up to a multiple of `_alignment` (and to at
	        least one aligned unit for a size of 0).  Raises ValueError for a
	        negative size and OverflowError for a size >= sys.maxsize.
	        """
	        if size < 0:
	            raise ValueError("Size {0:n} out of range".format(size))
	        if sys.maxsize <= size:
	            raise OverflowError("Size {0:n} too large".format(size))
	        if os.getpid() != self._lastpid:
	            self.__init__()                     # reinitialize after fork
	        with self._lock:
	            self._n_mallocs += 1
	            # allow pending blocks to be marked available
	            self._free_pending_blocks()
	            size = self._roundup(max(size, 1), self._alignment)
	            (arena, start, stop) = self._malloc(size)
	            real_stop = start + size
	            if real_stop < stop:
	                # if the returned block is larger than necessary, mark
	                # the remainder available
	                self._add_free_block((arena, real_stop, stop))
	            self._allocated_blocks[arena].add((start, real_stop))
	            return (arena, start, real_stop)

	#
	# Class wrapping a block allocated out of a Heap -- can be inherited by child process
	#

	class BufferWrapper(object):
	    """
	    A block of memory allocated from the heap shared by all instances.

	    The block is handed back to the heap through a util.Finalize callback
	    registered on the wrapper.
	    """

	    # Heap shared by every BufferWrapper
	    _heap = Heap()

	    def __init__(self, size):
	        """Allocate a block of *size* bytes.

	        Raises ValueError for a negative size and OverflowError for a
	        size >= sys.maxsize.
	        """
	        if size < 0:
	            raise ValueError("Size {0:n} out of range".format(size))
	        if sys.maxsize <= size:
	            raise OverflowError("Size {0:n} too large".format(size))
	        block = BufferWrapper._heap.malloc(size)
	        # The requested size is kept next to the block because the block
	        # itself may have been rounded up by the heap
	        self._state = (block, size)
	        util.Finalize(self, BufferWrapper._heap.free, args=(block,))

	    def create_memoryview(self):
	        """Return a memoryview over the requested bytes of the block."""
	        (arena, start, stop), size = self._state
	        return memoryview(arena.buffer)[start:start+size]