| """Utility functions to expand configuration directives or special values |
| (such glob patterns). |
| |
| We can split the process of interpreting configuration files into 2 steps: |
| |
| 1. The parsing the file contents from strings to value objects |
| that can be understand by Python (for example a string with a comma |
| separated list of keywords into an actual Python list of strings). |
| |
| 2. The expansion (or post-processing) of these values according to the |
| semantics ``setuptools`` assign to them (for example a configuration field |
| with the ``file:`` directive should be expanded from a list of file paths to |
| a single string with the contents of those files concatenated) |
| |
| This module focus on the second step, and therefore allow sharing the expansion |
| functions among several configuration file formats. |
| |
| **PRIVATE MODULE**: API reserved for setuptools internal usage only. |
| """ |
| import ast |
| import importlib |
| import io |
| import os |
| import sys |
| import warnings |
| from glob import iglob |
| from configparser import ConfigParser |
| from importlib.machinery import ModuleSpec |
| from itertools import chain |
| from typing import ( |
| TYPE_CHECKING, |
| Callable, |
| Dict, |
| Iterable, |
| Iterator, |
| List, |
| Mapping, |
| Optional, |
| Tuple, |
| TypeVar, |
| Union, |
| cast |
| ) |
| from types import ModuleType |
| |
| from distutils.errors import DistutilsOptionError |
| |
| if TYPE_CHECKING: |
| from setuptools.dist import Distribution # noqa |
| from setuptools.discovery import ConfigDiscovery # noqa |
| from distutils.dist import DistributionMetadata # noqa |
| |
| chain_iter = chain.from_iterable |
| _Path = Union[str, os.PathLike] |
| _K = TypeVar("_K") |
| _V = TypeVar("_V", covariant=True) |
| |
| |
| class StaticModule: |
| """Proxy to a module object that avoids executing arbitrary code.""" |
| |
| def __init__(self, name: str, spec: ModuleSpec): |
| with open(spec.origin) as strm: # type: ignore |
| src = strm.read() |
| module = ast.parse(src) |
| vars(self).update(locals()) |
| del self.self |
| |
| def _find_assignments(self) -> Iterator[Tuple[ast.AST, ast.AST]]: |
| for statement in self.module.body: |
| if isinstance(statement, ast.Assign): |
| yield from ((target, statement.value) for target in statement.targets) |
| elif isinstance(statement, ast.AnnAssign) and statement.value: |
| yield (statement.target, statement.value) |
| |
| def __getattr__(self, attr): |
| """Attempt to load an attribute "statically", via :func:`ast.literal_eval`.""" |
| try: |
| return next( |
| ast.literal_eval(value) |
| for target, value in self._find_assignments() |
| if isinstance(target, ast.Name) and target.id == attr |
| ) |
| except Exception as e: |
| raise AttributeError(f"{self.name} has no attribute {attr}") from e |
| |
| |
| def glob_relative( |
| patterns: Iterable[str], root_dir: Optional[_Path] = None |
| ) -> List[str]: |
| """Expand the list of glob patterns, but preserving relative paths. |
| |
| :param list[str] patterns: List of glob patterns |
| :param str root_dir: Path to which globs should be relative |
| (current directory by default) |
| :rtype: list |
| """ |
| glob_characters = {'*', '?', '[', ']', '{', '}'} |
| expanded_values = [] |
| root_dir = root_dir or os.getcwd() |
| for value in patterns: |
| |
| # Has globby characters? |
| if any(char in value for char in glob_characters): |
| # then expand the glob pattern while keeping paths *relative*: |
| glob_path = os.path.abspath(os.path.join(root_dir, value)) |
| expanded_values.extend(sorted( |
| os.path.relpath(path, root_dir).replace(os.sep, "/") |
| for path in iglob(glob_path, recursive=True))) |
| |
| else: |
| # take the value as-is |
| path = os.path.relpath(value, root_dir).replace(os.sep, "/") |
| expanded_values.append(path) |
| |
| return expanded_values |
| |
| |
| def read_files(filepaths: Union[str, bytes, Iterable[_Path]], root_dir=None) -> str: |
| """Return the content of the files concatenated using ``\n`` as str |
| |
| This function is sandboxed and won't reach anything outside ``root_dir`` |
| |
| (By default ``root_dir`` is the current directory). |
| """ |
| from setuptools.extern.more_itertools import always_iterable |
| |
| root_dir = os.path.abspath(root_dir or os.getcwd()) |
| _filepaths = (os.path.join(root_dir, path) for path in always_iterable(filepaths)) |
| return '\n'.join( |
| _read_file(path) |
| for path in _filter_existing_files(_filepaths) |
| if _assert_local(path, root_dir) |
| ) |
| |
| |
| def _filter_existing_files(filepaths: Iterable[_Path]) -> Iterator[_Path]: |
| for path in filepaths: |
| if os.path.isfile(path): |
| yield path |
| else: |
| warnings.warn(f"File {path!r} cannot be found") |
| |
| |
| def _read_file(filepath: Union[bytes, _Path]) -> str: |
| with io.open(filepath, encoding='utf-8') as f: |
| return f.read() |
| |
| |
| def _assert_local(filepath: _Path, root_dir: str): |
| if not os.path.abspath(filepath).startswith(root_dir): |
| msg = f"Cannot access {filepath!r} (or anything outside {root_dir!r})" |
| raise DistutilsOptionError(msg) |
| |
| return True |
| |
| |
| def read_attr( |
| attr_desc: str, |
| package_dir: Optional[Mapping[str, str]] = None, |
| root_dir: Optional[_Path] = None |
| ): |
| """Reads the value of an attribute from a module. |
| |
| This function will try to read the attributed statically first |
| (via :func:`ast.literal_eval`), and only evaluate the module if it fails. |
| |
| Examples: |
| read_attr("package.attr") |
| read_attr("package.module.attr") |
| |
| :param str attr_desc: Dot-separated string describing how to reach the |
| attribute (see examples above) |
| :param dict[str, str] package_dir: Mapping of package names to their |
| location in disk (represented by paths relative to ``root_dir``). |
| :param str root_dir: Path to directory containing all the packages in |
| ``package_dir`` (current directory by default). |
| :rtype: str |
| """ |
| root_dir = root_dir or os.getcwd() |
| attrs_path = attr_desc.strip().split('.') |
| attr_name = attrs_path.pop() |
| module_name = '.'.join(attrs_path) |
| module_name = module_name or '__init__' |
| _parent_path, path, module_name = _find_module(module_name, package_dir, root_dir) |
| spec = _find_spec(module_name, path) |
| |
| try: |
| return getattr(StaticModule(module_name, spec), attr_name) |
| except Exception: |
| # fallback to evaluate module |
| module = _load_spec(spec, module_name) |
| return getattr(module, attr_name) |
| |
| |
| def _find_spec(module_name: str, module_path: Optional[_Path]) -> ModuleSpec: |
| spec = importlib.util.spec_from_file_location(module_name, module_path) |
| spec = spec or importlib.util.find_spec(module_name) |
| |
| if spec is None: |
| raise ModuleNotFoundError(module_name) |
| |
| return spec |
| |
| |
| def _load_spec(spec: ModuleSpec, module_name: str) -> ModuleType: |
| name = getattr(spec, "__name__", module_name) |
| if name in sys.modules: |
| return sys.modules[name] |
| module = importlib.util.module_from_spec(spec) |
| sys.modules[name] = module # cache (it also ensures `==` works on loaded items) |
| spec.loader.exec_module(module) # type: ignore |
| return module |
| |
| |
| def _find_module( |
| module_name: str, package_dir: Optional[Mapping[str, str]], root_dir: _Path |
| ) -> Tuple[_Path, Optional[str], str]: |
| """Given a module (that could normally be imported by ``module_name`` |
| after the build is complete), find the path to the parent directory where |
| it is contained and the canonical name that could be used to import it |
| considering the ``package_dir`` in the build configuration and ``root_dir`` |
| """ |
| parent_path = root_dir |
| module_parts = module_name.split('.') |
| if package_dir: |
| if module_parts[0] in package_dir: |
| # A custom path was specified for the module we want to import |
| custom_path = package_dir[module_parts[0]] |
| parts = custom_path.rsplit('/', 1) |
| if len(parts) > 1: |
| parent_path = os.path.join(root_dir, parts[0]) |
| parent_module = parts[1] |
| else: |
| parent_module = custom_path |
| module_name = ".".join([parent_module, *module_parts[1:]]) |
| elif '' in package_dir: |
| # A custom parent directory was specified for all root modules |
| parent_path = os.path.join(root_dir, package_dir['']) |
| |
| path_start = os.path.join(parent_path, *module_name.split(".")) |
| candidates = chain( |
| (f"{path_start}.py", os.path.join(path_start, "__init__.py")), |
| iglob(f"{path_start}.*") |
| ) |
| module_path = next((x for x in candidates if os.path.isfile(x)), None) |
| return parent_path, module_path, module_name |
| |
| |
| def resolve_class( |
| qualified_class_name: str, |
| package_dir: Optional[Mapping[str, str]] = None, |
| root_dir: Optional[_Path] = None |
| ) -> Callable: |
| """Given a qualified class name, return the associated class object""" |
| root_dir = root_dir or os.getcwd() |
| idx = qualified_class_name.rfind('.') |
| class_name = qualified_class_name[idx + 1 :] |
| pkg_name = qualified_class_name[:idx] |
| |
| _parent_path, path, module_name = _find_module(pkg_name, package_dir, root_dir) |
| module = _load_spec(_find_spec(module_name, path), module_name) |
| return getattr(module, class_name) |
| |
| |
| def cmdclass( |
| values: Dict[str, str], |
| package_dir: Optional[Mapping[str, str]] = None, |
| root_dir: Optional[_Path] = None |
| ) -> Dict[str, Callable]: |
| """Given a dictionary mapping command names to strings for qualified class |
| names, apply :func:`resolve_class` to the dict values. |
| """ |
| return {k: resolve_class(v, package_dir, root_dir) for k, v in values.items()} |
| |
| |
| def find_packages( |
| *, |
| namespaces=True, |
| fill_package_dir: Optional[Dict[str, str]] = None, |
| root_dir: Optional[_Path] = None, |
| **kwargs |
| ) -> List[str]: |
| """Works similarly to :func:`setuptools.find_packages`, but with all |
| arguments given as keyword arguments. Moreover, ``where`` can be given |
| as a list (the results will be simply concatenated). |
| |
| When the additional keyword argument ``namespaces`` is ``True``, it will |
| behave like :func:`setuptools.find_namespace_packages`` (i.e. include |
| implicit namespaces as per :pep:`420`). |
| |
| The ``where`` argument will be considered relative to ``root_dir`` (or the current |
| working directory when ``root_dir`` is not given). |
| |
| If the ``fill_package_dir`` argument is passed, this function will consider it as a |
| similar data structure to the ``package_dir`` configuration parameter add fill-in |
| any missing package location. |
| |
| :rtype: list |
| """ |
| from setuptools.discovery import construct_package_dir |
| from setuptools.extern.more_itertools import unique_everseen, always_iterable |
| |
| if namespaces: |
| from setuptools.discovery import PEP420PackageFinder as PackageFinder |
| else: |
| from setuptools.discovery import PackageFinder # type: ignore |
| |
| root_dir = root_dir or os.curdir |
| where = kwargs.pop('where', ['.']) |
| packages: List[str] = [] |
| fill_package_dir = {} if fill_package_dir is None else fill_package_dir |
| search = list(unique_everseen(always_iterable(where))) |
| |
| if len(search) == 1 and all(not _same_path(search[0], x) for x in (".", root_dir)): |
| fill_package_dir.setdefault("", search[0]) |
| |
| for path in search: |
| package_path = _nest_path(root_dir, path) |
| pkgs = PackageFinder.find(package_path, **kwargs) |
| packages.extend(pkgs) |
| if pkgs and not ( |
| fill_package_dir.get("") == path |
| or os.path.samefile(package_path, root_dir) |
| ): |
| fill_package_dir.update(construct_package_dir(pkgs, path)) |
| |
| return packages |
| |
| |
| def _same_path(p1: _Path, p2: _Path) -> bool: |
| """Differs from os.path.samefile because it does not require paths to exist. |
| Purely string based (no comparison between i-nodes). |
| >>> _same_path("a/b", "./a/b") |
| True |
| >>> _same_path("a/b", "a/./b") |
| True |
| >>> _same_path("a/b", "././a/b") |
| True |
| >>> _same_path("a/b", "./a/b/c/..") |
| True |
| >>> _same_path("a/b", "../a/b/c") |
| False |
| >>> _same_path("a", "a/b") |
| False |
| """ |
| return os.path.normpath(p1) == os.path.normpath(p2) |
| |
| |
| def _nest_path(parent: _Path, path: _Path) -> str: |
| path = parent if path in {".", ""} else os.path.join(parent, path) |
| return os.path.normpath(path) |
| |
| |
| def version(value: Union[Callable, Iterable[Union[str, int]], str]) -> str: |
| """When getting the version directly from an attribute, |
| it should be normalised to string. |
| """ |
| if callable(value): |
| value = value() |
| |
| value = cast(Iterable[Union[str, int]], value) |
| |
| if not isinstance(value, str): |
| if hasattr(value, '__iter__'): |
| value = '.'.join(map(str, value)) |
| else: |
| value = '%s' % value |
| |
| return value |
| |
| |
| def canonic_package_data(package_data: dict) -> dict: |
| if "*" in package_data: |
| package_data[""] = package_data.pop("*") |
| return package_data |
| |
| |
| def canonic_data_files( |
| data_files: Union[list, dict], root_dir: Optional[_Path] = None |
| ) -> List[Tuple[str, List[str]]]: |
| """For compatibility with ``setup.py``, ``data_files`` should be a list |
| of pairs instead of a dict. |
| |
| This function also expands glob patterns. |
| """ |
| if isinstance(data_files, list): |
| return data_files |
| |
| return [ |
| (dest, glob_relative(patterns, root_dir)) |
| for dest, patterns in data_files.items() |
| ] |
| |
| |
| def entry_points(text: str, text_source="entry-points") -> Dict[str, dict]: |
| """Given the contents of entry-points file, |
| process it into a 2-level dictionary (``dict[str, dict[str, str]]``). |
| The first level keys are entry-point groups, the second level keys are |
| entry-point names, and the second level values are references to objects |
| (that correspond to the entry-point value). |
| """ |
| parser = ConfigParser(default_section=None, delimiters=("=",)) # type: ignore |
| parser.optionxform = str # case sensitive |
| parser.read_string(text, text_source) |
| groups = {k: dict(v.items()) for k, v in parser.items()} |
| groups.pop(parser.default_section, None) |
| return groups |
| |
| |
| class EnsurePackagesDiscovered: |
| """Some expand functions require all the packages to already be discovered before |
| they run, e.g. :func:`read_attr`, :func:`resolve_class`, :func:`cmdclass`. |
| |
| Therefore in some cases we will need to run autodiscovery during the evaluation of |
| the configuration. However, it is better to postpone calling package discovery as |
| much as possible, because some parameters can influence it (e.g. ``package_dir``), |
| and those might not have been processed yet. |
| """ |
| |
| def __init__(self, distribution: "Distribution"): |
| self._dist = distribution |
| self._called = False |
| |
| def __call__(self): |
| """Trigger the automatic package discovery, if it is still necessary.""" |
| if not self._called: |
| self._called = True |
| self._dist.set_defaults(name=False) # Skip name, we can still be parsing |
| |
| def __enter__(self): |
| return self |
| |
| def __exit__(self, _exc_type, _exc_value, _traceback): |
| if self._called: |
| self._dist.set_defaults.analyse_name() # Now we can set a default name |
| |
| def _get_package_dir(self) -> Mapping[str, str]: |
| self() |
| pkg_dir = self._dist.package_dir |
| return {} if pkg_dir is None else pkg_dir |
| |
| @property |
| def package_dir(self) -> Mapping[str, str]: |
| """Proxy to ``package_dir`` that may trigger auto-discovery when used.""" |
| return LazyMappingProxy(self._get_package_dir) |
| |
| |
| class LazyMappingProxy(Mapping[_K, _V]): |
| """Mapping proxy that delays resolving the target object, until really needed. |
| |
| >>> def obtain_mapping(): |
| ... print("Running expensive function!") |
| ... return {"key": "value", "other key": "other value"} |
| >>> mapping = LazyMappingProxy(obtain_mapping) |
| >>> mapping["key"] |
| Running expensive function! |
| 'value' |
| >>> mapping["other key"] |
| 'other value' |
| """ |
| |
| def __init__(self, obtain_mapping_value: Callable[[], Mapping[_K, _V]]): |
| self._obtain = obtain_mapping_value |
| self._value: Optional[Mapping[_K, _V]] = None |
| |
| def _target(self) -> Mapping[_K, _V]: |
| if self._value is None: |
| self._value = self._obtain() |
| return self._value |
| |
| def __getitem__(self, key: _K) -> _V: |
| return self._target()[key] |
| |
| def __len__(self) -> int: |
| return len(self._target()) |
| |
| def __iter__(self) -> Iterator[_K]: |
| return iter(self._target()) |