mirror of
				https://github.com/python/cpython.git
				synced 2025-11-04 11:49:12 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			332 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			332 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
import os
 | 
						|
import tempfile
 | 
						|
 | 
						|
from . import abc as resources_abc
 | 
						|
from builtins import open as builtins_open
 | 
						|
from contextlib import contextmanager, suppress
 | 
						|
from importlib import import_module
 | 
						|
from importlib.abc import ResourceLoader
 | 
						|
from io import BytesIO, TextIOWrapper
 | 
						|
from pathlib import Path
 | 
						|
from types import ModuleType
 | 
						|
from typing import Iterator, Optional, Set, Union   # noqa: F401
 | 
						|
from typing import cast
 | 
						|
from typing.io import BinaryIO, TextIO
 | 
						|
from zipimport import ZipImportError
 | 
						|
 | 
						|
 | 
						|
Package = Union[str, ModuleType]
 | 
						|
Resource = Union[str, os.PathLike]
 | 
						|
 | 
						|
 | 
						|
def _get_package(package) -> ModuleType:
 | 
						|
    """Take a package name or module object and return the module.
 | 
						|
 | 
						|
    If a name, the module is imported.  If the passed or imported module
 | 
						|
    object is not a package, raise an exception.
 | 
						|
    """
 | 
						|
    if hasattr(package, '__spec__'):
 | 
						|
        if package.__spec__.submodule_search_locations is None:
 | 
						|
            raise TypeError('{!r} is not a package'.format(
 | 
						|
                package.__spec__.name))
 | 
						|
        else:
 | 
						|
            return package
 | 
						|
    else:
 | 
						|
        module = import_module(package)
 | 
						|
        if module.__spec__.submodule_search_locations is None:
 | 
						|
            raise TypeError('{!r} is not a package'.format(package))
 | 
						|
        else:
 | 
						|
            return module
 | 
						|
 | 
						|
 | 
						|
def _normalize_path(path) -> str:
 | 
						|
    """Normalize a path by ensuring it is a string.
 | 
						|
 | 
						|
    If the resulting string contains path separators, an exception is raised.
 | 
						|
    """
 | 
						|
    str_path = str(path)
 | 
						|
    parent, file_name = os.path.split(str_path)
 | 
						|
    if parent:
 | 
						|
        raise ValueError('{!r} must be only a file name'.format(path))
 | 
						|
    else:
 | 
						|
        return file_name
 | 
						|
 | 
						|
 | 
						|
def _get_resource_reader(
 | 
						|
        package: ModuleType) -> Optional[resources_abc.ResourceReader]:
 | 
						|
    # Return the package's loader if it's a ResourceReader.  We can't use
 | 
						|
    # a issubclass() check here because apparently abc.'s __subclasscheck__()
 | 
						|
    # hook wants to create a weak reference to the object, but
 | 
						|
    # zipimport.zipimporter does not support weak references, resulting in a
 | 
						|
    # TypeError.  That seems terrible.
 | 
						|
    spec = package.__spec__
 | 
						|
    if hasattr(spec.loader, 'get_resource_reader'):
 | 
						|
        return cast(resources_abc.ResourceReader,
 | 
						|
                    spec.loader.get_resource_reader(spec.name))
 | 
						|
    return None
 | 
						|
 | 
						|
 | 
						|
def _check_location(package):
 | 
						|
    if package.__spec__.origin is None or not package.__spec__.has_location:
 | 
						|
        raise FileNotFoundError(f'Package has no location {package!r}')
 | 
						|
 | 
						|
 | 
						|
def open_binary(package: Package, resource: Resource) -> BinaryIO:
 | 
						|
    """Return a file-like object opened for binary reading of the resource."""
 | 
						|
    resource = _normalize_path(resource)
 | 
						|
    package = _get_package(package)
 | 
						|
    reader = _get_resource_reader(package)
 | 
						|
    if reader is not None:
 | 
						|
        return reader.open_resource(resource)
 | 
						|
    _check_location(package)
 | 
						|
    absolute_package_path = os.path.abspath(package.__spec__.origin)
 | 
						|
    package_path = os.path.dirname(absolute_package_path)
 | 
						|
    full_path = os.path.join(package_path, resource)
 | 
						|
    try:
 | 
						|
        return builtins_open(full_path, mode='rb')
 | 
						|
    except OSError:
 | 
						|
        # Just assume the loader is a resource loader; all the relevant
 | 
						|
        # importlib.machinery loaders are and an AttributeError for
 | 
						|
        # get_data() will make it clear what is needed from the loader.
 | 
						|
        loader = cast(ResourceLoader, package.__spec__.loader)
 | 
						|
        data = None
 | 
						|
        if hasattr(package.__spec__.loader, 'get_data'):
 | 
						|
            with suppress(OSError):
 | 
						|
                data = loader.get_data(full_path)
 | 
						|
        if data is None:
 | 
						|
            package_name = package.__spec__.name
 | 
						|
            message = '{!r} resource not found in {!r}'.format(
 | 
						|
                resource, package_name)
 | 
						|
            raise FileNotFoundError(message)
 | 
						|
        else:
 | 
						|
            return BytesIO(data)
 | 
						|
 | 
						|
 | 
						|
def open_text(package: Package,
 | 
						|
              resource: Resource,
 | 
						|
              encoding: str = 'utf-8',
 | 
						|
              errors: str = 'strict') -> TextIO:
 | 
						|
    """Return a file-like object opened for text reading of the resource."""
 | 
						|
    resource = _normalize_path(resource)
 | 
						|
    package = _get_package(package)
 | 
						|
    reader = _get_resource_reader(package)
 | 
						|
    if reader is not None:
 | 
						|
        return TextIOWrapper(reader.open_resource(resource), encoding, errors)
 | 
						|
    _check_location(package)
 | 
						|
    absolute_package_path = os.path.abspath(package.__spec__.origin)
 | 
						|
    package_path = os.path.dirname(absolute_package_path)
 | 
						|
    full_path = os.path.join(package_path, resource)
 | 
						|
    try:
 | 
						|
        return builtins_open(
 | 
						|
            full_path, mode='r', encoding=encoding, errors=errors)
 | 
						|
    except OSError:
 | 
						|
        # Just assume the loader is a resource loader; all the relevant
 | 
						|
        # importlib.machinery loaders are and an AttributeError for
 | 
						|
        # get_data() will make it clear what is needed from the loader.
 | 
						|
        loader = cast(ResourceLoader, package.__spec__.loader)
 | 
						|
        data = None
 | 
						|
        if hasattr(package.__spec__.loader, 'get_data'):
 | 
						|
            with suppress(OSError):
 | 
						|
                data = loader.get_data(full_path)
 | 
						|
        if data is None:
 | 
						|
            package_name = package.__spec__.name
 | 
						|
            message = '{!r} resource not found in {!r}'.format(
 | 
						|
                resource, package_name)
 | 
						|
            raise FileNotFoundError(message)
 | 
						|
        else:
 | 
						|
            return TextIOWrapper(BytesIO(data), encoding, errors)
 | 
						|
 | 
						|
 | 
						|
def read_binary(package: Package, resource: Resource) -> bytes:
 | 
						|
    """Return the binary contents of the resource."""
 | 
						|
    resource = _normalize_path(resource)
 | 
						|
    package = _get_package(package)
 | 
						|
    with open_binary(package, resource) as fp:
 | 
						|
        return fp.read()
 | 
						|
 | 
						|
 | 
						|
def read_text(package: Package,
 | 
						|
              resource: Resource,
 | 
						|
              encoding: str = 'utf-8',
 | 
						|
              errors: str = 'strict') -> str:
 | 
						|
    """Return the decoded string of the resource.
 | 
						|
 | 
						|
    The decoding-related arguments have the same semantics as those of
 | 
						|
    bytes.decode().
 | 
						|
    """
 | 
						|
    resource = _normalize_path(resource)
 | 
						|
    package = _get_package(package)
 | 
						|
    with open_text(package, resource, encoding, errors) as fp:
 | 
						|
        return fp.read()
 | 
						|
 | 
						|
 | 
						|
@contextmanager
 | 
						|
def path(package: Package, resource: Resource) -> Iterator[Path]:
 | 
						|
    """A context manager providing a file path object to the resource.
 | 
						|
 | 
						|
    If the resource does not already exist on its own on the file system,
 | 
						|
    a temporary file will be created. If the file was created, the file
 | 
						|
    will be deleted upon exiting the context manager (no exception is
 | 
						|
    raised if the file was deleted prior to the context manager
 | 
						|
    exiting).
 | 
						|
    """
 | 
						|
    resource = _normalize_path(resource)
 | 
						|
    package = _get_package(package)
 | 
						|
    reader = _get_resource_reader(package)
 | 
						|
    if reader is not None:
 | 
						|
        try:
 | 
						|
            yield Path(reader.resource_path(resource))
 | 
						|
            return
 | 
						|
        except FileNotFoundError:
 | 
						|
            pass
 | 
						|
    else:
 | 
						|
        _check_location(package)
 | 
						|
    # Fall-through for both the lack of resource_path() *and* if
 | 
						|
    # resource_path() raises FileNotFoundError.
 | 
						|
    package_directory = Path(package.__spec__.origin).parent
 | 
						|
    file_path = package_directory / resource
 | 
						|
    if file_path.exists():
 | 
						|
        yield file_path
 | 
						|
    else:
 | 
						|
        with open_binary(package, resource) as fp:
 | 
						|
            data = fp.read()
 | 
						|
        # Not using tempfile.NamedTemporaryFile as it leads to deeper 'try'
 | 
						|
        # blocks due to the need to close the temporary file to work on
 | 
						|
        # Windows properly.
 | 
						|
        fd, raw_path = tempfile.mkstemp()
 | 
						|
        try:
 | 
						|
            os.write(fd, data)
 | 
						|
            os.close(fd)
 | 
						|
            yield Path(raw_path)
 | 
						|
        finally:
 | 
						|
            try:
 | 
						|
                os.remove(raw_path)
 | 
						|
            except FileNotFoundError:
 | 
						|
                pass
 | 
						|
 | 
						|
 | 
						|
def is_resource(package: Package, name: str) -> bool:
 | 
						|
    """True if 'name' is a resource inside 'package'.
 | 
						|
 | 
						|
    Directories are *not* resources.
 | 
						|
    """
 | 
						|
    package = _get_package(package)
 | 
						|
    _normalize_path(name)
 | 
						|
    reader = _get_resource_reader(package)
 | 
						|
    if reader is not None:
 | 
						|
        return reader.is_resource(name)
 | 
						|
    try:
 | 
						|
        package_contents = set(contents(package))
 | 
						|
    except (NotADirectoryError, FileNotFoundError):
 | 
						|
        return False
 | 
						|
    if name not in package_contents:
 | 
						|
        return False
 | 
						|
    # Just because the given file_name lives as an entry in the package's
 | 
						|
    # contents doesn't necessarily mean it's a resource.  Directories are not
 | 
						|
    # resources, so let's try to find out if it's a directory or not.
 | 
						|
    path = Path(package.__spec__.origin).parent / name
 | 
						|
    return path.is_file()
 | 
						|
 | 
						|
 | 
						|
def contents(package: Package) -> Iterator[str]:
 | 
						|
    """Return the list of entries in 'package'.
 | 
						|
 | 
						|
    Note that not all entries are resources.  Specifically, directories are
 | 
						|
    not considered resources.  Use `is_resource()` on each entry returned here
 | 
						|
    to check if it is a resource or not.
 | 
						|
    """
 | 
						|
    package = _get_package(package)
 | 
						|
    reader = _get_resource_reader(package)
 | 
						|
    if reader is not None:
 | 
						|
        yield from reader.contents()
 | 
						|
        return
 | 
						|
    # Is the package a namespace package?  By definition, namespace packages
 | 
						|
    # cannot have resources.  We could use _check_location() and catch the
 | 
						|
    # exception, but that's extra work, so just inline the check.
 | 
						|
    if package.__spec__.origin is None or not package.__spec__.has_location:
 | 
						|
        return []
 | 
						|
    package_directory = Path(package.__spec__.origin).parent
 | 
						|
    yield from os.listdir(str(package_directory))
 | 
						|
 | 
						|
 | 
						|
# Private implementation of ResourceReader and get_resource_reader() for
 | 
						|
# zipimport.  Don't use these directly!  We're implementing these in Python
 | 
						|
# because 1) it's easier, 2) zipimport will likely get rewritten in Python
 | 
						|
# itself at some point, so doing this all in C would just be a waste of
 | 
						|
# effort.
 | 
						|
 | 
						|
class _ZipImportResourceReader(resources_abc.ResourceReader):
 | 
						|
    """Private class used to support ZipImport.get_resource_reader().
 | 
						|
 | 
						|
    This class is allowed to reference all the innards and private parts of
 | 
						|
    the zipimporter.
 | 
						|
    """
 | 
						|
 | 
						|
    def __init__(self, zipimporter, fullname):
 | 
						|
        self.zipimporter = zipimporter
 | 
						|
        self.fullname = fullname
 | 
						|
 | 
						|
    def open_resource(self, resource):
 | 
						|
        fullname_as_path = self.fullname.replace('.', '/')
 | 
						|
        path = f'{fullname_as_path}/{resource}'
 | 
						|
        try:
 | 
						|
            return BytesIO(self.zipimporter.get_data(path))
 | 
						|
        except OSError:
 | 
						|
            raise FileNotFoundError(path)
 | 
						|
 | 
						|
    def resource_path(self, resource):
 | 
						|
        # All resources are in the zip file, so there is no path to the file.
 | 
						|
        # Raising FileNotFoundError tells the higher level API to extract the
 | 
						|
        # binary data and create a temporary file.
 | 
						|
        raise FileNotFoundError
 | 
						|
 | 
						|
    def is_resource(self, name):
 | 
						|
        # Maybe we could do better, but if we can get the data, it's a
 | 
						|
        # resource.  Otherwise it isn't.
 | 
						|
        fullname_as_path = self.fullname.replace('.', '/')
 | 
						|
        path = f'{fullname_as_path}/{name}'
 | 
						|
        try:
 | 
						|
            self.zipimporter.get_data(path)
 | 
						|
        except OSError:
 | 
						|
            return False
 | 
						|
        return True
 | 
						|
 | 
						|
    def contents(self):
 | 
						|
        # This is a bit convoluted, because fullname will be a module path,
 | 
						|
        # but _files is a list of file names relative to the top of the
 | 
						|
        # archive's namespace.  We want to compare file paths to find all the
 | 
						|
        # names of things inside the module represented by fullname.  So we
 | 
						|
        # turn the module path of fullname into a file path relative to the
 | 
						|
        # top of the archive, and then we iterate through _files looking for
 | 
						|
        # names inside that "directory".
 | 
						|
        fullname_path = Path(self.zipimporter.get_filename(self.fullname))
 | 
						|
        relative_path = fullname_path.relative_to(self.zipimporter.archive)
 | 
						|
        # Don't forget that fullname names a package, so its path will include
 | 
						|
        # __init__.py, which we want to ignore.
 | 
						|
        assert relative_path.name == '__init__.py'
 | 
						|
        package_path = relative_path.parent
 | 
						|
        subdirs_seen = set()
 | 
						|
        for filename in self.zipimporter._files:
 | 
						|
            try:
 | 
						|
                relative = Path(filename).relative_to(package_path)
 | 
						|
            except ValueError:
 | 
						|
                continue
 | 
						|
            # If the path of the file (which is relative to the top of the zip
 | 
						|
            # namespace), relative to the package given when the resource
 | 
						|
            # reader was created, has a parent, then it's a name in a
 | 
						|
            # subdirectory and thus we skip it.
 | 
						|
            parent_name = relative.parent.name
 | 
						|
            if len(parent_name) == 0:
 | 
						|
                yield relative.name
 | 
						|
            elif parent_name not in subdirs_seen:
 | 
						|
                subdirs_seen.add(parent_name)
 | 
						|
                yield parent_name
 | 
						|
 | 
						|
 | 
						|
def _zipimport_get_resource_reader(zipimporter, fullname):
 | 
						|
    try:
 | 
						|
        if not zipimporter.is_package(fullname):
 | 
						|
            return None
 | 
						|
    except ZipImportError:
 | 
						|
        return None
 | 
						|
    return _ZipImportResourceReader(zipimporter, fullname)
 |