mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 02:43:41 +00:00 
			
		
		
		
	 e4679cd644
			
		
	
	
		e4679cd644
		
			
		
	
	
	
	
		
			
			Large shared arrays allocated using multiprocessing would remain allocated until the process ends.
		
			
				
	
	
		
			337 lines
		
	
	
	
		
			11 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			337 lines
		
	
	
	
		
			11 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #
 | |
| # Module which supports allocation of memory from an mmap
 | |
| #
 | |
| # multiprocessing/heap.py
 | |
| #
 | |
| # Copyright (c) 2006-2008, R Oudkerk
 | |
| # Licensed to PSF under a Contributor Agreement.
 | |
| #
 | |
| 
 | |
| import bisect
 | |
| from collections import defaultdict
 | |
| import mmap
 | |
| import os
 | |
| import sys
 | |
| import tempfile
 | |
| import threading
 | |
| 
 | |
| from .context import reduction, assert_spawning
 | |
| from . import util
 | |
| 
 | |
| __all__ = ['BufferWrapper']
 | |
| 
 | |
| #
 | |
| # Inheritable class which wraps an mmap, and from which blocks can be allocated
 | |
| #
 | |
| 
 | |
| if sys.platform == 'win32':
 | |
| 
 | |
|     import _winapi
 | |
| 
 | |
|     class Arena(object):
 | |
|         """
 | |
|         A shared memory area backed by anonymous memory (Windows).
 | |
|         """
 | |
| 
 | |
|         _rand = tempfile._RandomNameSequence()
 | |
| 
 | |
|         def __init__(self, size):
 | |
|             self.size = size
 | |
|             for i in range(100):
 | |
|                 name = 'pym-%d-%s' % (os.getpid(), next(self._rand))
 | |
|                 buf = mmap.mmap(-1, size, tagname=name)
 | |
|                 if _winapi.GetLastError() == 0:
 | |
|                     break
 | |
|                 # We have reopened a preexisting mmap.
 | |
|                 buf.close()
 | |
|             else:
 | |
|                 raise FileExistsError('Cannot find name for new mmap')
 | |
|             self.name = name
 | |
|             self.buffer = buf
 | |
|             self._state = (self.size, self.name)
 | |
| 
 | |
|         def __getstate__(self):
 | |
|             assert_spawning(self)
 | |
|             return self._state
 | |
| 
 | |
|         def __setstate__(self, state):
 | |
|             self.size, self.name = self._state = state
 | |
|             # Reopen existing mmap
 | |
|             self.buffer = mmap.mmap(-1, self.size, tagname=self.name)
 | |
|             # XXX Temporarily preventing buildbot failures while determining
 | |
|             # XXX the correct long-term fix. See issue 23060
 | |
|             #assert _winapi.GetLastError() == _winapi.ERROR_ALREADY_EXISTS
 | |
| 
 | |
| else:
 | |
| 
 | |
|     class Arena(object):
 | |
|         """
 | |
|         A shared memory area backed by a temporary file (POSIX).
 | |
|         """
 | |
| 
 | |
|         if sys.platform == 'linux':
 | |
|             _dir_candidates = ['/dev/shm']
 | |
|         else:
 | |
|             _dir_candidates = []
 | |
| 
 | |
|         def __init__(self, size, fd=-1):
 | |
|             self.size = size
 | |
|             self.fd = fd
 | |
|             if fd == -1:
 | |
|                 # Arena is created anew (if fd != -1, it means we're coming
 | |
|                 # from rebuild_arena() below)
 | |
|                 self.fd, name = tempfile.mkstemp(
 | |
|                      prefix='pym-%d-'%os.getpid(),
 | |
|                      dir=self._choose_dir(size))
 | |
|                 os.unlink(name)
 | |
|                 util.Finalize(self, os.close, (self.fd,))
 | |
|                 os.ftruncate(self.fd, size)
 | |
|             self.buffer = mmap.mmap(self.fd, self.size)
 | |
| 
 | |
|         def _choose_dir(self, size):
 | |
|             # Choose a non-storage backed directory if possible,
 | |
|             # to improve performance
 | |
|             for d in self._dir_candidates:
 | |
|                 st = os.statvfs(d)
 | |
|                 if st.f_bavail * st.f_frsize >= size:  # enough free space?
 | |
|                     return d
 | |
|             return util.get_temp_dir()
 | |
| 
 | |
|     def reduce_arena(a):
 | |
|         if a.fd == -1:
 | |
|             raise ValueError('Arena is unpicklable because '
 | |
|                              'forking was enabled when it was created')
 | |
|         return rebuild_arena, (a.size, reduction.DupFd(a.fd))
 | |
| 
 | |
|     def rebuild_arena(size, dupfd):
 | |
|         return Arena(size, dupfd.detach())
 | |
| 
 | |
|     reduction.register(Arena, reduce_arena)
 | |
| 
 | |
| #
 | |
| # Class allowing allocation of chunks of memory from arenas
 | |
| #
 | |
| 
 | |
class Heap(object):
    """
    Allocator handing out ``(arena, start, stop)`` blocks carved from arenas.

    Free blocks are indexed by length and by their start and stop offsets,
    so a freed block can be merged with adjacent free blocks of the same
    arena.  An arena whose blocks have all been freed is dropped from the
    bookkeeping when it is at least ``_DISCARD_FREE_SPACE_LARGER_THAN``
    bytes long.
    """

    # Minimum malloc() alignment
    _alignment = 8

    # Entirely free arenas of at least this size are discarded
    _DISCARD_FREE_SPACE_LARGER_THAN = 4 * 1024 ** 2  # 4 MB
    # The size used for the next arena doubles until it reaches this value
    _DOUBLE_ARENA_SIZE_UNTIL = 4 * 1024 ** 2

    def __init__(self, size=mmap.PAGESIZE):
        """Create an empty heap whose first arena is at least *size* bytes."""
        self._lastpid = os.getpid()
        self._lock = threading.Lock()
        # Current arena allocation size
        self._size = size
        # A sorted list of available block sizes in arenas
        self._lengths = []

        # Free block management:
        # - map each block size to a list of `(Arena, start, stop)` blocks
        self._len_to_seq = {}
        # - map `(Arena, start)` tuple to the `(Arena, start, stop)` block
        #   starting at that offset
        self._start_to_block = {}
        # - map `(Arena, stop)` tuple to the `(Arena, start, stop)` block
        #   ending at that offset
        self._stop_to_block = {}

        # Map arenas to their `(start, stop)` blocks in use
        self._allocated_blocks = defaultdict(set)
        self._arenas = []

        # List of pending blocks to free - see comment in free() below
        self._pending_free_blocks = []

        # Statistics
        self._n_mallocs = 0
        self._n_frees = 0

    @staticmethod
    def _roundup(n, alignment):
        """Round *n* up to the next multiple of *alignment*."""
        # alignment must be a power of 2
        mask = alignment - 1
        return (n + mask) & ~mask

    def _new_arena(self, size):
        """Create an arena of at least *size* bytes.

        Returns the ``(arena, 0, length)`` block spanning the whole arena.
        The block is not entered in the free-block maps.
        """
        # Create a new arena with at least the given *size*
        length = self._roundup(max(self._size, size), mmap.PAGESIZE)
        # We carve larger and larger arenas, for efficiency, until we
        # reach a large-ish size (roughly L3 cache-sized)
        if self._size < self._DOUBLE_ARENA_SIZE_UNTIL:
            self._size *= 2
        util.info('allocating a new mmap of length %d', length)
        arena = Arena(length)
        self._arenas.append(arena)
        return (arena, 0, length)

    def _discard_arena(self, arena):
        """Forget the entirely free *arena* if it is large enough.

        The caller must already have merged the arena's free space into a
        single ``(arena, 0, arena.size)`` block.
        """
        # Possibly delete the given (unused) arena
        length = arena.size
        # Reusing an existing arena is faster than creating a new one, so
        # we only reclaim space if it's large enough.
        if length < self._DISCARD_FREE_SPACE_LARGER_THAN:
            return
        blocks = self._allocated_blocks.pop(arena)
        assert not blocks
        del self._start_to_block[(arena, 0)]
        del self._stop_to_block[(arena, length)]
        self._arenas.remove(arena)
        seq = self._len_to_seq[length]
        seq.remove((arena, 0, length))
        if not seq:
            del self._len_to_seq[length]
            self._lengths.remove(length)

    def _malloc(self, size):
        """Return a free block of at least *size* bytes.

        The block may be much larger than requested.  It is removed from
        the free-block maps; a new arena is created when no free block
        is big enough.
        """
        # returns a large enough block -- it might be much larger
        i = bisect.bisect_left(self._lengths, size)
        if i == len(self._lengths):
            return self._new_arena(size)

        length = self._lengths[i]
        seq = self._len_to_seq[length]
        block = seq.pop()
        if not seq:
            del self._len_to_seq[length], self._lengths[i]

        (arena, start, stop) = block
        del self._start_to_block[(arena, start)]
        del self._stop_to_block[(arena, stop)]
        return block

    def _add_free_block(self, block):
        """Mark *block* free, merging it with adjacent free blocks."""
        # make block available and try to merge with its neighbours in the arena
        (arena, start, stop) = block

        try:
            prev_block = self._stop_to_block[(arena, start)]
        except KeyError:
            pass
        else:
            start, _ = self._absorb(prev_block)

        try:
            next_block = self._start_to_block[(arena, stop)]
        except KeyError:
            pass
        else:
            _, stop = self._absorb(next_block)

        block = (arena, start, stop)
        length = stop - start

        try:
            self._len_to_seq[length].append(block)
        except KeyError:
            self._len_to_seq[length] = [block]
            bisect.insort(self._lengths, length)

        self._start_to_block[(arena, start)] = block
        self._stop_to_block[(arena, stop)] = block

    def _absorb(self, block):
        """Remove free *block* from all maps and return ``(start, stop)``."""
        # deregister this block so it can be merged with a neighbour
        (arena, start, stop) = block
        del self._start_to_block[(arena, start)]
        del self._stop_to_block[(arena, stop)]

        length = stop - start
        seq = self._len_to_seq[length]
        seq.remove(block)
        if not seq:
            del self._len_to_seq[length]
            self._lengths.remove(length)

        return start, stop

    def _remove_allocated_block(self, block):
        """Drop *block* from the in-use set; maybe discard its arena."""
        arena, start, stop = block
        blocks = self._allocated_blocks[arena]
        blocks.remove((start, stop))
        if not blocks:
            # Arena is entirely free, discard it from this process
            self._discard_arena(arena)

    def _free_pending_blocks(self):
        """Free every block queued by free() while the lock was busy."""
        # Free all the blocks in the pending list - called with the lock held.
        while True:
            try:
                block = self._pending_free_blocks.pop()
            except IndexError:
                break
            # Deferred frees are counted here, when they actually happen;
            # free() does not count a block it only queued.
            self._n_frees += 1
            self._add_free_block(block)
            self._remove_allocated_block(block)

    def free(self, block):
        """Free a block returned by malloc().

        Raises ValueError when called from a process other than the one
        that initialised this heap.
        """
        # free a block returned by malloc()
        # Since free() can be called asynchronously by the GC, it could happen
        # that it's called while self._lock is held: in that case,
        # self._lock.acquire() would deadlock (issue #12352). To avoid that, a
        # trylock is used instead, and if the lock can't be acquired
        # immediately, the block is added to a list of blocks to be freed
        # synchronously sometimes later from malloc() or free(), by calling
        # _free_pending_blocks() (appending and retrieving from a list is not
        # strictly thread-safe but under CPython it's atomic thanks to the GIL).
        if os.getpid() != self._lastpid:
            raise ValueError(
                "My pid ({0:n}) is not last pid {1:n}".format(
                    os.getpid(),self._lastpid))
        if not self._lock.acquire(False):
            # can't acquire the lock right now, add the block to the list of
            # pending blocks to free
            self._pending_free_blocks.append(block)
        else:
            # we hold the lock
            try:
                self._n_frees += 1
                self._free_pending_blocks()
                self._add_free_block(block)
                self._remove_allocated_block(block)
            finally:
                self._lock.release()

    def malloc(self, size):
        """Allocate and return an ``(arena, start, stop)`` block.

        *size* is rounded up to a multiple of ``_alignment`` (at least one
        alignment unit).  Raises ValueError for a negative *size* and
        OverflowError when *size* is ``sys.maxsize`` or more.
        """
        # return a block of right size (possibly rounded up)
        if size < 0:
            raise ValueError("Size {0:n} out of range".format(size))
        if sys.maxsize <= size:
            raise OverflowError("Size {0:n} too large".format(size))
        if os.getpid() != self._lastpid:
            # reinitialize after fork (this resets all bookkeeping and
            # the arena size to the defaults)
            self.__init__()
        with self._lock:
            self._n_mallocs += 1
            # allow pending blocks to be marked available
            self._free_pending_blocks()
            size = self._roundup(max(size, 1), self._alignment)
            (arena, start, stop) = self._malloc(size)
            real_stop = start + size
            if real_stop < stop:
                # if the returned block is larger than necessary, mark
                # the remainder available
                self._add_free_block((arena, real_stop, stop))
            self._allocated_blocks[arena].add((start, real_stop))
            return (arena, start, real_stop)
| 
 | |
| #
 | |
| # Class wrapping a block allocated out of a Heap -- can be inherited by child process
 | |
| #
 | |
| 
 | |
class BufferWrapper(object):
    """
    A block of *size* bytes allocated from the class-wide Heap.

    The block is handed back to the heap through a ``util.Finalize``
    callback registered on the wrapper.
    """

    # Heap shared by every BufferWrapper
    _heap = Heap()

    def __init__(self, size):
        """Allocate a block of *size* bytes.

        Raises ValueError for a negative *size* and OverflowError when
        *size* is ``sys.maxsize`` or more.
        """
        if size < 0:
            raise ValueError("Size {0:n} out of range".format(size))
        if sys.maxsize <= size:
            raise OverflowError("Size {0:n} too large".format(size))
        block = BufferWrapper._heap.malloc(size)
        # The block may be longer than requested, so the requested size
        # is kept alongside it.
        self._state = (block, size)
        util.Finalize(self, BufferWrapper._heap.free, args=(block,))

    def create_memoryview(self):
        """Return a memoryview over the first *size* bytes of the block."""
        (arena, start, stop), size = self._state
        return memoryview(arena.buffer)[start:start+size]