mirror of
				https://github.com/python/cpython.git
				synced 2025-10-31 13:41:24 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			343 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			343 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import os
 | |
| import tempfile
 | |
| 
 | |
| from . import abc as resources_abc
 | |
| from contextlib import contextmanager, suppress
 | |
| from importlib import import_module
 | |
| from importlib.abc import ResourceLoader
 | |
| from io import BytesIO, TextIOWrapper
 | |
| from pathlib import Path
 | |
| from types import ModuleType
 | |
| from typing import Iterable, Iterator, Optional, Set, Union   # noqa: F401
 | |
| from typing import cast
 | |
| from typing.io import BinaryIO, TextIO
 | |
| from zipimport import ZipImportError
 | |
| 
 | |
| 
 | |
| __all__ = [
 | |
|     'Package',
 | |
|     'Resource',
 | |
|     'contents',
 | |
|     'is_resource',
 | |
|     'open_binary',
 | |
|     'open_text',
 | |
|     'path',
 | |
|     'read_binary',
 | |
|     'read_text',
 | |
|     ]
 | |
| 
 | |
| 
 | |
| Package = Union[str, ModuleType]
 | |
| Resource = Union[str, os.PathLike]
 | |
| 
 | |
| 
 | |
| def _get_package(package) -> ModuleType:
 | |
|     """Take a package name or module object and return the module.
 | |
| 
 | |
|     If a name, the module is imported.  If the passed or imported module
 | |
|     object is not a package, raise an exception.
 | |
|     """
 | |
|     if hasattr(package, '__spec__'):
 | |
|         if package.__spec__.submodule_search_locations is None:
 | |
|             raise TypeError('{!r} is not a package'.format(
 | |
|                 package.__spec__.name))
 | |
|         else:
 | |
|             return package
 | |
|     else:
 | |
|         module = import_module(package)
 | |
|         if module.__spec__.submodule_search_locations is None:
 | |
|             raise TypeError('{!r} is not a package'.format(package))
 | |
|         else:
 | |
|             return module
 | |
| 
 | |
| 
 | |
| def _normalize_path(path) -> str:
 | |
|     """Normalize a path by ensuring it is a string.
 | |
| 
 | |
|     If the resulting string contains path separators, an exception is raised.
 | |
|     """
 | |
|     parent, file_name = os.path.split(path)
 | |
|     if parent:
 | |
|         raise ValueError('{!r} must be only a file name'.format(path))
 | |
|     else:
 | |
|         return file_name
 | |
| 
 | |
| 
 | |
| def _get_resource_reader(
 | |
|         package: ModuleType) -> Optional[resources_abc.ResourceReader]:
 | |
|     # Return the package's loader if it's a ResourceReader.  We can't use
 | |
|     # a issubclass() check here because apparently abc.'s __subclasscheck__()
 | |
|     # hook wants to create a weak reference to the object, but
 | |
|     # zipimport.zipimporter does not support weak references, resulting in a
 | |
|     # TypeError.  That seems terrible.
 | |
|     spec = package.__spec__
 | |
|     if hasattr(spec.loader, 'get_resource_reader'):
 | |
|         return cast(resources_abc.ResourceReader,
 | |
|                     spec.loader.get_resource_reader(spec.name))
 | |
|     return None
 | |
| 
 | |
| 
 | |
| def _check_location(package):
 | |
|     if package.__spec__.origin is None or not package.__spec__.has_location:
 | |
|         raise FileNotFoundError(f'Package has no location {package!r}')
 | |
| 
 | |
| 
 | |
| def open_binary(package: Package, resource: Resource) -> BinaryIO:
 | |
|     """Return a file-like object opened for binary reading of the resource."""
 | |
|     resource = _normalize_path(resource)
 | |
|     package = _get_package(package)
 | |
|     reader = _get_resource_reader(package)
 | |
|     if reader is not None:
 | |
|         return reader.open_resource(resource)
 | |
|     _check_location(package)
 | |
|     absolute_package_path = os.path.abspath(package.__spec__.origin)
 | |
|     package_path = os.path.dirname(absolute_package_path)
 | |
|     full_path = os.path.join(package_path, resource)
 | |
|     try:
 | |
|         return open(full_path, mode='rb')
 | |
|     except OSError:
 | |
|         # Just assume the loader is a resource loader; all the relevant
 | |
|         # importlib.machinery loaders are and an AttributeError for
 | |
|         # get_data() will make it clear what is needed from the loader.
 | |
|         loader = cast(ResourceLoader, package.__spec__.loader)
 | |
|         data = None
 | |
|         if hasattr(package.__spec__.loader, 'get_data'):
 | |
|             with suppress(OSError):
 | |
|                 data = loader.get_data(full_path)
 | |
|         if data is None:
 | |
|             package_name = package.__spec__.name
 | |
|             message = '{!r} resource not found in {!r}'.format(
 | |
|                 resource, package_name)
 | |
|             raise FileNotFoundError(message)
 | |
|         else:
 | |
|             return BytesIO(data)
 | |
| 
 | |
| 
 | |
| def open_text(package: Package,
 | |
|               resource: Resource,
 | |
|               encoding: str = 'utf-8',
 | |
|               errors: str = 'strict') -> TextIO:
 | |
|     """Return a file-like object opened for text reading of the resource."""
 | |
|     resource = _normalize_path(resource)
 | |
|     package = _get_package(package)
 | |
|     reader = _get_resource_reader(package)
 | |
|     if reader is not None:
 | |
|         return TextIOWrapper(reader.open_resource(resource), encoding, errors)
 | |
|     _check_location(package)
 | |
|     absolute_package_path = os.path.abspath(package.__spec__.origin)
 | |
|     package_path = os.path.dirname(absolute_package_path)
 | |
|     full_path = os.path.join(package_path, resource)
 | |
|     try:
 | |
|         return open(full_path, mode='r', encoding=encoding, errors=errors)
 | |
|     except OSError:
 | |
|         # Just assume the loader is a resource loader; all the relevant
 | |
|         # importlib.machinery loaders are and an AttributeError for
 | |
|         # get_data() will make it clear what is needed from the loader.
 | |
|         loader = cast(ResourceLoader, package.__spec__.loader)
 | |
|         data = None
 | |
|         if hasattr(package.__spec__.loader, 'get_data'):
 | |
|             with suppress(OSError):
 | |
|                 data = loader.get_data(full_path)
 | |
|         if data is None:
 | |
|             package_name = package.__spec__.name
 | |
|             message = '{!r} resource not found in {!r}'.format(
 | |
|                 resource, package_name)
 | |
|             raise FileNotFoundError(message)
 | |
|         else:
 | |
|             return TextIOWrapper(BytesIO(data), encoding, errors)
 | |
| 
 | |
| 
 | |
| def read_binary(package: Package, resource: Resource) -> bytes:
 | |
|     """Return the binary contents of the resource."""
 | |
|     resource = _normalize_path(resource)
 | |
|     package = _get_package(package)
 | |
|     with open_binary(package, resource) as fp:
 | |
|         return fp.read()
 | |
| 
 | |
| 
 | |
| def read_text(package: Package,
 | |
|               resource: Resource,
 | |
|               encoding: str = 'utf-8',
 | |
|               errors: str = 'strict') -> str:
 | |
|     """Return the decoded string of the resource.
 | |
| 
 | |
|     The decoding-related arguments have the same semantics as those of
 | |
|     bytes.decode().
 | |
|     """
 | |
|     resource = _normalize_path(resource)
 | |
|     package = _get_package(package)
 | |
|     with open_text(package, resource, encoding, errors) as fp:
 | |
|         return fp.read()
 | |
| 
 | |
| 
 | |
| @contextmanager
 | |
| def path(package: Package, resource: Resource) -> Iterator[Path]:
 | |
|     """A context manager providing a file path object to the resource.
 | |
| 
 | |
|     If the resource does not already exist on its own on the file system,
 | |
|     a temporary file will be created. If the file was created, the file
 | |
|     will be deleted upon exiting the context manager (no exception is
 | |
|     raised if the file was deleted prior to the context manager
 | |
|     exiting).
 | |
|     """
 | |
|     resource = _normalize_path(resource)
 | |
|     package = _get_package(package)
 | |
|     reader = _get_resource_reader(package)
 | |
|     if reader is not None:
 | |
|         try:
 | |
|             yield Path(reader.resource_path(resource))
 | |
|             return
 | |
|         except FileNotFoundError:
 | |
|             pass
 | |
|     else:
 | |
|         _check_location(package)
 | |
|     # Fall-through for both the lack of resource_path() *and* if
 | |
|     # resource_path() raises FileNotFoundError.
 | |
|     package_directory = Path(package.__spec__.origin).parent
 | |
|     file_path = package_directory / resource
 | |
|     if file_path.exists():
 | |
|         yield file_path
 | |
|     else:
 | |
|         with open_binary(package, resource) as fp:
 | |
|             data = fp.read()
 | |
|         # Not using tempfile.NamedTemporaryFile as it leads to deeper 'try'
 | |
|         # blocks due to the need to close the temporary file to work on
 | |
|         # Windows properly.
 | |
|         fd, raw_path = tempfile.mkstemp()
 | |
|         try:
 | |
|             os.write(fd, data)
 | |
|             os.close(fd)
 | |
|             yield Path(raw_path)
 | |
|         finally:
 | |
|             try:
 | |
|                 os.remove(raw_path)
 | |
|             except FileNotFoundError:
 | |
|                 pass
 | |
| 
 | |
| 
 | |
| def is_resource(package: Package, name: str) -> bool:
 | |
|     """True if 'name' is a resource inside 'package'.
 | |
| 
 | |
|     Directories are *not* resources.
 | |
|     """
 | |
|     package = _get_package(package)
 | |
|     _normalize_path(name)
 | |
|     reader = _get_resource_reader(package)
 | |
|     if reader is not None:
 | |
|         return reader.is_resource(name)
 | |
|     try:
 | |
|         package_contents = set(contents(package))
 | |
|     except (NotADirectoryError, FileNotFoundError):
 | |
|         return False
 | |
|     if name not in package_contents:
 | |
|         return False
 | |
|     # Just because the given file_name lives as an entry in the package's
 | |
|     # contents doesn't necessarily mean it's a resource.  Directories are not
 | |
|     # resources, so let's try to find out if it's a directory or not.
 | |
|     path = Path(package.__spec__.origin).parent / name
 | |
|     return path.is_file()
 | |
| 
 | |
| 
 | |
| def contents(package: Package) -> Iterable[str]:
 | |
|     """Return an iterable of entries in 'package'.
 | |
| 
 | |
|     Note that not all entries are resources.  Specifically, directories are
 | |
|     not considered resources.  Use `is_resource()` on each entry returned here
 | |
|     to check if it is a resource or not.
 | |
|     """
 | |
|     package = _get_package(package)
 | |
|     reader = _get_resource_reader(package)
 | |
|     if reader is not None:
 | |
|         return reader.contents()
 | |
|     # Is the package a namespace package?  By definition, namespace packages
 | |
|     # cannot have resources.  We could use _check_location() and catch the
 | |
|     # exception, but that's extra work, so just inline the check.
 | |
|     elif package.__spec__.origin is None or not package.__spec__.has_location:
 | |
|         return ()
 | |
|     else:
 | |
|         package_directory = Path(package.__spec__.origin).parent
 | |
|         return os.listdir(package_directory)
 | |
| 
 | |
| 
 | |
| # Private implementation of ResourceReader and get_resource_reader() called
 | |
| # from zipimport.c.  Don't use these directly!  We're implementing these in
 | |
| # Python because 1) it's easier, 2) zipimport may get rewritten in Python
 | |
| # itself at some point, so doing this all in C would difficult and a waste of
 | |
| # effort.
 | |
| 
 | |
| class _ZipImportResourceReader(resources_abc.ResourceReader):
 | |
|     """Private class used to support ZipImport.get_resource_reader().
 | |
| 
 | |
|     This class is allowed to reference all the innards and private parts of
 | |
|     the zipimporter.
 | |
|     """
 | |
| 
 | |
|     def __init__(self, zipimporter, fullname):
 | |
|         self.zipimporter = zipimporter
 | |
|         self.fullname = fullname
 | |
| 
 | |
|     def open_resource(self, resource):
 | |
|         fullname_as_path = self.fullname.replace('.', '/')
 | |
|         path = f'{fullname_as_path}/{resource}'
 | |
|         try:
 | |
|             return BytesIO(self.zipimporter.get_data(path))
 | |
|         except OSError:
 | |
|             raise FileNotFoundError(path)
 | |
| 
 | |
|     def resource_path(self, resource):
 | |
|         # All resources are in the zip file, so there is no path to the file.
 | |
|         # Raising FileNotFoundError tells the higher level API to extract the
 | |
|         # binary data and create a temporary file.
 | |
|         raise FileNotFoundError
 | |
| 
 | |
|     def is_resource(self, name):
 | |
|         # Maybe we could do better, but if we can get the data, it's a
 | |
|         # resource.  Otherwise it isn't.
 | |
|         fullname_as_path = self.fullname.replace('.', '/')
 | |
|         path = f'{fullname_as_path}/{name}'
 | |
|         try:
 | |
|             self.zipimporter.get_data(path)
 | |
|         except OSError:
 | |
|             return False
 | |
|         return True
 | |
| 
 | |
|     def contents(self):
 | |
|         # This is a bit convoluted, because fullname will be a module path,
 | |
|         # but _files is a list of file names relative to the top of the
 | |
|         # archive's namespace.  We want to compare file paths to find all the
 | |
|         # names of things inside the module represented by fullname.  So we
 | |
|         # turn the module path of fullname into a file path relative to the
 | |
|         # top of the archive, and then we iterate through _files looking for
 | |
|         # names inside that "directory".
 | |
|         fullname_path = Path(self.zipimporter.get_filename(self.fullname))
 | |
|         relative_path = fullname_path.relative_to(self.zipimporter.archive)
 | |
|         # Don't forget that fullname names a package, so its path will include
 | |
|         # __init__.py, which we want to ignore.
 | |
|         assert relative_path.name == '__init__.py'
 | |
|         package_path = relative_path.parent
 | |
|         subdirs_seen = set()
 | |
|         for filename in self.zipimporter._files:
 | |
|             try:
 | |
|                 relative = Path(filename).relative_to(package_path)
 | |
|             except ValueError:
 | |
|                 continue
 | |
|             # If the path of the file (which is relative to the top of the zip
 | |
|             # namespace), relative to the package given when the resource
 | |
|             # reader was created, has a parent, then it's a name in a
 | |
|             # subdirectory and thus we skip it.
 | |
|             parent_name = relative.parent.name
 | |
|             if len(parent_name) == 0:
 | |
|                 yield relative.name
 | |
|             elif parent_name not in subdirs_seen:
 | |
|                 subdirs_seen.add(parent_name)
 | |
|                 yield parent_name
 | |
| 
 | |
| 
 | |
| # Called from zipimport.c
 | |
| def _zipimport_get_resource_reader(zipimporter, fullname):
 | |
|     try:
 | |
|         if not zipimporter.is_package(fullname):
 | |
|             return None
 | |
|     except ZipImportError:
 | |
|         return None
 | |
|     return _ZipImportResourceReader(zipimporter, fullname)
 | 
