123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337 |
- #
- # Module which supports allocation of memory from an mmap
- #
- # multiprocessing/heap.py
- #
- # Copyright (c) 2006-2008, R Oudkerk
- # Licensed to PSF under a Contributor Agreement.
- #
- import bisect
- from collections import defaultdict
- import mmap
- import os
- import sys
- import tempfile
- import threading
- from .context import reduction, assert_spawning
- from . import util
- __all__ = ['BufferWrapper']
- #
- # Inheritable class which wraps an mmap, and from which blocks can be allocated
- #
- if sys.platform == 'win32':
- import _winapi
- class Arena(object):
- """
- A shared memory area backed by anonymous memory (Windows).
- """
- _rand = tempfile._RandomNameSequence()
- def __init__(self, size):
- self.size = size
- for i in range(100):
- name = 'pym-%d-%s' % (os.getpid(), next(self._rand))
- buf = mmap.mmap(-1, size, tagname=name)
- if _winapi.GetLastError() == 0:
- break
- # We have reopened a preexisting mmap.
- buf.close()
- else:
- raise FileExistsError('Cannot find name for new mmap')
- self.name = name
- self.buffer = buf
- self._state = (self.size, self.name)
- def __getstate__(self):
- assert_spawning(self)
- return self._state
- def __setstate__(self, state):
- self.size, self.name = self._state = state
- # Reopen existing mmap
- self.buffer = mmap.mmap(-1, self.size, tagname=self.name)
- # XXX Temporarily preventing buildbot failures while determining
- # XXX the correct long-term fix. See issue 23060
- #assert _winapi.GetLastError() == _winapi.ERROR_ALREADY_EXISTS
- else:
- class Arena(object):
- """
- A shared memory area backed by a temporary file (POSIX).
- """
- if sys.platform == 'linux':
- _dir_candidates = ['/dev/shm']
- else:
- _dir_candidates = []
- def __init__(self, size, fd=-1):
- self.size = size
- self.fd = fd
- if fd == -1:
- # Arena is created anew (if fd != -1, it means we're coming
- # from rebuild_arena() below)
- self.fd, name = tempfile.mkstemp(
- prefix='pym-%d-'%os.getpid(),
- dir=self._choose_dir(size))
- os.unlink(name)
- util.Finalize(self, os.close, (self.fd,))
- os.ftruncate(self.fd, size)
- self.buffer = mmap.mmap(self.fd, self.size)
- def _choose_dir(self, size):
- # Choose a non-storage backed directory if possible,
- # to improve performance
- for d in self._dir_candidates:
- st = os.statvfs(d)
- if st.f_bavail * st.f_frsize >= size: # enough free space?
- return d
- return util.get_temp_dir()
- def reduce_arena(a):
- if a.fd == -1:
- raise ValueError('Arena is unpicklable because '
- 'forking was enabled when it was created')
- return rebuild_arena, (a.size, reduction.DupFd(a.fd))
- def rebuild_arena(size, dupfd):
- return Arena(size, dupfd.detach())
- reduction.register(Arena, reduce_arena)
- #
- # Class allowing allocation of chunks of memory from arenas
- #
- class Heap(object):
- # Minimum malloc() alignment
- _alignment = 8
- _DISCARD_FREE_SPACE_LARGER_THAN = 4 * 1024 ** 2 # 4 MB
- _DOUBLE_ARENA_SIZE_UNTIL = 4 * 1024 ** 2
- def __init__(self, size=mmap.PAGESIZE):
- self._lastpid = os.getpid()
- self._lock = threading.Lock()
- # Current arena allocation size
- self._size = size
- # A sorted list of available block sizes in arenas
- self._lengths = []
- # Free block management:
- # - map each block size to a list of `(Arena, start, stop)` blocks
- self._len_to_seq = {}
- # - map `(Arena, start)` tuple to the `(Arena, start, stop)` block
- # starting at that offset
- self._start_to_block = {}
- # - map `(Arena, stop)` tuple to the `(Arena, start, stop)` block
- # ending at that offset
- self._stop_to_block = {}
- # Map arenas to their `(Arena, start, stop)` blocks in use
- self._allocated_blocks = defaultdict(set)
- self._arenas = []
- # List of pending blocks to free - see comment in free() below
- self._pending_free_blocks = []
- # Statistics
- self._n_mallocs = 0
- self._n_frees = 0
- @staticmethod
- def _roundup(n, alignment):
- # alignment must be a power of 2
- mask = alignment - 1
- return (n + mask) & ~mask
- def _new_arena(self, size):
- # Create a new arena with at least the given *size*
- length = self._roundup(max(self._size, size), mmap.PAGESIZE)
- # We carve larger and larger arenas, for efficiency, until we
- # reach a large-ish size (roughly L3 cache-sized)
- if self._size < self._DOUBLE_ARENA_SIZE_UNTIL:
- self._size *= 2
- util.info('allocating a new mmap of length %d', length)
- arena = Arena(length)
- self._arenas.append(arena)
- return (arena, 0, length)
- def _discard_arena(self, arena):
- # Possibly delete the given (unused) arena
- length = arena.size
- # Reusing an existing arena is faster than creating a new one, so
- # we only reclaim space if it's large enough.
- if length < self._DISCARD_FREE_SPACE_LARGER_THAN:
- return
- blocks = self._allocated_blocks.pop(arena)
- assert not blocks
- del self._start_to_block[(arena, 0)]
- del self._stop_to_block[(arena, length)]
- self._arenas.remove(arena)
- seq = self._len_to_seq[length]
- seq.remove((arena, 0, length))
- if not seq:
- del self._len_to_seq[length]
- self._lengths.remove(length)
- def _malloc(self, size):
- # returns a large enough block -- it might be much larger
- i = bisect.bisect_left(self._lengths, size)
- if i == len(self._lengths):
- return self._new_arena(size)
- else:
- length = self._lengths[i]
- seq = self._len_to_seq[length]
- block = seq.pop()
- if not seq:
- del self._len_to_seq[length], self._lengths[i]
- (arena, start, stop) = block
- del self._start_to_block[(arena, start)]
- del self._stop_to_block[(arena, stop)]
- return block
- def _add_free_block(self, block):
- # make block available and try to merge with its neighbours in the arena
- (arena, start, stop) = block
- try:
- prev_block = self._stop_to_block[(arena, start)]
- except KeyError:
- pass
- else:
- start, _ = self._absorb(prev_block)
- try:
- next_block = self._start_to_block[(arena, stop)]
- except KeyError:
- pass
- else:
- _, stop = self._absorb(next_block)
- block = (arena, start, stop)
- length = stop - start
- try:
- self._len_to_seq[length].append(block)
- except KeyError:
- self._len_to_seq[length] = [block]
- bisect.insort(self._lengths, length)
- self._start_to_block[(arena, start)] = block
- self._stop_to_block[(arena, stop)] = block
- def _absorb(self, block):
- # deregister this block so it can be merged with a neighbour
- (arena, start, stop) = block
- del self._start_to_block[(arena, start)]
- del self._stop_to_block[(arena, stop)]
- length = stop - start
- seq = self._len_to_seq[length]
- seq.remove(block)
- if not seq:
- del self._len_to_seq[length]
- self._lengths.remove(length)
- return start, stop
- def _remove_allocated_block(self, block):
- arena, start, stop = block
- blocks = self._allocated_blocks[arena]
- blocks.remove((start, stop))
- if not blocks:
- # Arena is entirely free, discard it from this process
- self._discard_arena(arena)
- def _free_pending_blocks(self):
- # Free all the blocks in the pending list - called with the lock held.
- while True:
- try:
- block = self._pending_free_blocks.pop()
- except IndexError:
- break
- self._add_free_block(block)
- self._remove_allocated_block(block)
- def free(self, block):
- # free a block returned by malloc()
- # Since free() can be called asynchronously by the GC, it could happen
- # that it's called while self._lock is held: in that case,
- # self._lock.acquire() would deadlock (issue #12352). To avoid that, a
- # trylock is used instead, and if the lock can't be acquired
- # immediately, the block is added to a list of blocks to be freed
- # synchronously sometimes later from malloc() or free(), by calling
- # _free_pending_blocks() (appending and retrieving from a list is not
- # strictly thread-safe but under CPython it's atomic thanks to the GIL).
- if os.getpid() != self._lastpid:
- raise ValueError(
- "My pid ({0:n}) is not last pid {1:n}".format(
- os.getpid(),self._lastpid))
- if not self._lock.acquire(False):
- # can't acquire the lock right now, add the block to the list of
- # pending blocks to free
- self._pending_free_blocks.append(block)
- else:
- # we hold the lock
- try:
- self._n_frees += 1
- self._free_pending_blocks()
- self._add_free_block(block)
- self._remove_allocated_block(block)
- finally:
- self._lock.release()
- def malloc(self, size):
- # return a block of right size (possibly rounded up)
- if size < 0:
- raise ValueError("Size {0:n} out of range".format(size))
- if sys.maxsize <= size:
- raise OverflowError("Size {0:n} too large".format(size))
- if os.getpid() != self._lastpid:
- self.__init__() # reinitialize after fork
- with self._lock:
- self._n_mallocs += 1
- # allow pending blocks to be marked available
- self._free_pending_blocks()
- size = self._roundup(max(size, 1), self._alignment)
- (arena, start, stop) = self._malloc(size)
- real_stop = start + size
- if real_stop < stop:
- # if the returned block is larger than necessary, mark
- # the remainder available
- self._add_free_block((arena, real_stop, stop))
- self._allocated_blocks[arena].add((start, real_stop))
- return (arena, start, real_stop)
- #
- # Class wrapping a block allocated out of a Heap -- can be inherited by child process
- #
- class BufferWrapper(object):
- _heap = Heap()
- def __init__(self, size):
- if size < 0:
- raise ValueError("Size {0:n} out of range".format(size))
- if sys.maxsize <= size:
- raise OverflowError("Size {0:n} too large".format(size))
- block = BufferWrapper._heap.malloc(size)
- self._state = (block, size)
- util.Finalize(self, BufferWrapper._heap.free, args=(block,))
- def create_memoryview(self):
- (arena, start, stop), size = self._state
- return memoryview(arena.buffer)[start:start+size]
|