Source code for dwas._steps.steps

# Those are protocols...
# pylint: disable=unused-argument

from __future__ import annotations

from pathlib import Path  # noqa: TC003  required for Sphinx
from typing import TYPE_CHECKING, Any, Callable, Protocol, runtime_checkable

if TYPE_CHECKING:
    import os
    import subprocess

    from .._config import Config
    from .handlers import StepHandler



[docs]
@runtime_checkable
class Step(Protocol):
    """
    Holds the information about a :term:`step` in the pipeline.

    A :term:`step` is essentially a function that can be called and that has a
    :python:`__name__` attribute.

    .. todo:: Add a link to a high level tutorial like getting started

    Steps can then be parametrized by the help of :py:func:`dwas.parametrize`,
    and registered using :py:func:`register_step`. at which point they are
    usable  by dwas.

    :Examples:

        A step can either be a simple function:

        .. code-block::

            @step()
            def my_step(step: StepRunner) -> None:
                step.run(["echo", "hello!"])

        Or a class:

        .. code-block::

            # NOTE: you don't need to explicitely inherit from `Step`
            class MyStep:
                def __call__(self, step: StepRunner) -> None:
                    step.run(["echo", "hello!"])

            register_step(MyStep(), name="my_step")

    .. note::

        Use whichever method you prefer. Both are supported. Classes tend to be
        easier for reusability, but functions work well if you just use them
        in your project.

        We will strive to provide both types in examples.
    """

    # XXX: pylint will complain about the *args/**kwargs with 'arguments-differ'
    #      However, this is the canonical way mypy does for callback protocols
    #      that can accept any kind of parameters.
    #      To avoid the issue, you can also not inherit from 'Step', all the
    #      type checking should still work.
    #
    #      See https://github.com/python/mypy/issues/5876.
    #

[docs]
    def __call__(self, *args: Any, **kwargs: Any) -> None:
        """
        The method to run when the :term:`step` is invoked.

        :Parameters:

            It can take any amount of parameters, that can be passed by keyword, so
            positional only arguments are not supported.

            Parameters will then be passed using parametrization, with a few specific
            parameters being reserved by the system. Namely:

            - ``step``, which is used to pass the :py:class:`StepRunner`.
            - ``user_args``, which is used to pass arguments that the user would
              have passed on the cli. This can be useful, to allow users to
              interact with some cli tool your step might be calling.

            For passing other arguments, see :py:func:`dwas.parametrize` and
            :py:func:`dwas.set_defaults`.
        """  # noqa: D401





[docs]
@runtime_checkable
class StepWithSetup(Step, Protocol):
    """
    Defines a :term:`step` that needs some setup that can be cached.

    In addition to having a :py:attr:`~Step.__call__` method, a :py:class:`Step`, can
    implement a :py:func:`~StepWithSetup.setup` function, that gets called
    before the method.

    This can be useful to separate the actual running of the step, from the
    necessary preparations.

    .. warning::

        the :py:attr:`setup` is meant to contain work that does not necessarily
        needs to happen at every run of your step, and can be cached in between.

    .. tip::

        When running ``dwas`` repeatedly, you can pass a ``--no-setup`` flag to
        avoid running those steps again and thus speedup your run.

        .. todo:: Link to a document that gives tips on how to run dwas effectively

    :Examples:

        A setup method can be added on a step declaration:

        .. note:: A more complete pytest example is provided as :py:func:`dwas.predefined.pytest`.

        .. tab:: Using functions

            .. code-block::

                @step()
                def pytest(step: StepRunner) -> None:
                    step.run(["pytest"])

                def install_dependencies(step: StepRunner) -> None:
                    step.install("pytest")

                pytest.setup = install_dependencies

        .. tab:: Using a class

            .. code-block::

                class Pytest:
                    def setup(self, step: StepRunner) -> None:
                        step.install("pytest")

                    def __call__(self, step: StepRunner) -> None:
                        step.run(["pytest"])

                register_step(Pytest(), name="pytest")

        .. tip::

                This is what :py:func:`register_managed_step` does to install your
                python dependencies.
    """

    setup: Callable[..., None]
    """
    The setup method that will be invoked before running the step.

    This step should run work that is necessary for the test to be able to run
    but that does not require running every time, as it can be skipped when
    running dwas with `--no-setup`.

    :Parameters:

        Parameters are passed to this function the same way they are passed to
        :py:func:`~Step.__call__`
    """




[docs]
@runtime_checkable
class StepWithDependentSetup(Step, Protocol):
    """
    Defines a :term:`step` that will act in the context of its dependent steps.

    In addition to having a :py:func:`~Step.__call__` method, a
    :py:class:`Step` can act in the context of a dependent step, before this
    one runs.

    This allows another step to, for example, install the project it just built
    into another virtual environment.

    .. note:: This method is called *after* :py:func:`~StepWithSetup.setup`

    .. warning::

        This method is *always* called when running, and cannot be skipped like
        :py:func:`~StepWithSetup.setup` by passing ``--no-setup``.

    :Examples:

        You might want to have a step that builds a wheel of your current
        package and run your tests against it. This could be done like:

        .. note::

            A more complete packaging example is provided as
            :py:func:`dwas.predefined.package`

        .. tab:: Using functions

            .. code-block::

                @managed_step(dependencies=["build"])
                def package(step: StepRunner) -> None:
                    step.run([step.python, "-m", "build", f"--outdir={step.cache_path}"])

                def install(self, original_step: StepRunner, current_step: StepRunner) -> None:
                    wheels = list(original_step.cache_path.glob("*.whl"))
                    # Assuming this is a universal wheel
                    assert len(wheels) == 1

                    current_step.install(str(wheels[0]))

                package.setup_dependent = install

                # This can now be used as a dependency
                @step(requires=["package"])
                def my_step(step: StepRunner) -> None:
                    step.run(["myproject", "--help"])

        .. tab:: Using a class

            .. code-block::

                class Package:
                    def __call__(step: StepRunner) -> None:
                        step.run([step.python, "-m", "build", f"--outdir={step.cache_path}"])

                    def setup_dependent(
                        self,
                        original_step: StepRunner,
                        current_step: StepRunner,
                    ) -> None:
                        wheels = list(original_step.cache_path.glob("*.whl"))
                        # Assuming this is a universal wheel
                        assert len(wheels) == 1

                        current_step.install(str(wheels[0]))

                register_managed_step(Package(), name="package", dependencies=["build"])

                # This can now be used as a dependency
                @step(requires=["package"])
                def my_step(step: StepRunner) -> None:
                    step.run(["myproject", "--help"])
    """


[docs]
    def setup_dependent(
        self,
        original_step: StepRunner,
        current_step: StepRunner,
    ) -> None:
        """
        Run some logic into a dependent step.

        :param original_step: The original step handler that was used
            when the step defining this method was called.
        :param current_step: The current step handler, that contains the
            context of the step that is going to be executed.
        """





[docs]
@runtime_checkable
class StepWithArtifacts(Step, Protocol):
    """
    Defines a :term:`step` creating artifacts that can be consumed by dependent steps.

    Sometimes, you want to share artifacts between jobs. For example, you might
    have some ``pytest`` runs that generate coverage reports, and then you
    want to aggregate them together.

    This allows a programmatic interface between steps to access artifacts.
    See :py:func:`StepRunner.get_artifacts` for how to retrieve those artifacts
    from another step.

    :Examples:

        If you wanted to have multiple pytest steps, and one that aggregates
        the coverage, you could do:

        .. tip::

            This is what the provided :py:func:`dwas.predefined.pytest` step
            does.

        .. tab:: Using functions

            .. code-block::

                @step()
                @parametrize(python=["3.9", "3.10"])
                def pytest(step: StepRunner) -> None:
                    step.run(
                        ["pytest"],
                        env={
                            "COVERAGE_FILE": str(
                                step.cache_path.joinpath(step.python, "coverage")
                            ),
                        },
                    )

                def gather_artifacts(step: "StepRunner") -> Dict[str, List[Any]]:
                    return step.cache_path.joinpath(step.python, "coverage")

                pytest.gather_artifacts = gather_artifacts

        .. tab:: Using classes

            .. code-block::

                class Pytest:
                    def _get_coverage_file(self, step: StepRunner) -> str:
                        return str(step.cache_path / "reports" / "coverage")

                    def gather_artifacts(self, step: StepRunner) -> Dict[str, List[Any]]:
                        return {"coverage_files": [self._get_coverage_file(step)]}

                    def __call__(self, step: StepRunner) -> None:
                        step.run(
                            ["pytest", *args],
                            env={"COVERAGE_FILE": self._get_coverage_file(step)},
                        )

                register_step(parametrize("python", ["3.9", "3.10"])(Pytest()))

        And you could then combine and display the coverage like:

        .. code-block::

            @managed_step(dependencies=["coverage"], requires=["pytest"])
            def coverage(self, step: StepRunner) -> None:
                env = {"COVERAGE_FILE": str(step.cache_path / "coverage")}

                coverage_files = step.get_artifacts("coverage_files")
                if not coverage_files:
                    raise Exception("No coverage files provided. Can't proceed")

                step.run(["coverage", "combine", "--keep", *coverage_files], env=env)
                step.run(["coverage", "html"], env=env)

        .. tip:: The :py:func:`dwas.predefined.coverage` step does roughly this.
    """


[docs]
    def gather_artifacts(self, step: StepRunner) -> dict[str, list[Any]]:
        """
        Gather all artifacts exposed by this step.

        :param step: The step handler that was used when running the
            step.
        :return: A dictionary of artifact key to a list of arbitrary
            data. This **must** return a list, as they are merged with
            other steps' artifacts into a single list per artifact key.
        """





[docs]
@runtime_checkable
class StepWithCleanup(Step, Protocol):
    """
    Defines a :term:`step` that needs to do custom cleanup.

    Sometimes, a step might write outside of the dwas-managed cache, in which
    case it might be desirable for it to be able to clean that directory.

    This allows a step to hook on the ``dwas --clean`` invocation to cleanup
    such files.

    :Examples:

        If you wanted to generated documentation, and wanted to have it easily
        accessible, you could do:

        .. tip::

            This is a simplified example of what
            :py:func:`dwas.predefined.sphinx` does

        .. tab:: using functions

            .. code-block::

                @managed_step(dependencies=["sphinx"], output="./build/docs")
                def sphinx(step: StepRunner, output: str) -> None:
                    step.run(["sphinx-build", "-b=html", "docs/", output])

                def clean(output: str) -> None:
                    with suppress(FileNotFoundError):
                        shutil.rmtree(output)

                sphinx.clean = clean

        .. tab:: using classes

            .. code-block::

                class Sphinx(Step):
                    def __init__(self) -> None:
                        self.__name__ = "sphinx"

                    def __call__(self, step: StepRunner, output: str) -> None:
                        step.run(["sphinx-build", "-b=html", "docs/", output])

                    def clean(output: str) -> None:
                        with suppress(FileNotFoundError):
                            shutil.rmtree(output)
    """

    clean: Callable[..., None]




[docs]
class StepRunner:
    """
    Defines the runner for a :term:`step`, and provides utilities for the step to run.

    This is passed as an argument to every step that executes as ``step``.

    It provides various utilities to allow the step to run in an isolated,
    standardized environment.
    """

    def __init__(self, handler: StepHandler) -> None:
        self._handler = handler

    @property
    def name(self) -> str:
        """
        The name of the current step.
        """
        return self._handler.name

    @property
    def python(self) -> str:
        """
        The name of the current python interpreter.

        .. note:: This is not the absolute path to it, just its name.
        """
        return self._handler.python

    @property
    def config(self) -> Config:
        """
        The global configuration for the current run.

        At this point, you should not be modifying it. However, you can
        use it to act differently on what you are doing. For example,
        you might want to use the :py:attr:`Config.verbosity` to
        configure the output of some commands you run.
        """
        return self._handler.config

    @property
    def cache_path(self) -> Path:
        """
        The path to the cache for the current step.

        This can be used to store temporary files or any other
        artifacts.

        This will be cleaned up and emptied before the step runs.
        """
        name = self.name
        # Those chars regularly cause trouble with unescaped glob patterns and
        # such. As such, replace them with "-", hoping this does not cause
        # collisions
        for char in ["/", ":", "*", "[", "]"]:
            name = name.replace(char, "-")

        return self.config.cache_path / "cache" / name


[docs]
    def get_artifacts(self, key: str) -> list[Any]:
        """
        Get the artifacts exported by previous steps for the given key.

        See :py:func:`StepWithArtifacts.gather_artifacts` for how to expose
        artifacts from a step.

        .. note::

            This only returns artifacts exported by the direct dependencies of
            the current step, and does not go recursively. Unless this depends
            on a step group, in which case it returns the artifacts of all
            dependencies in the group.

        :param key: The name of the key for which to get the artifacts
        :return: A list of artifacts, one per step providing artifacts for the
                 given key.
        """
        return self._handler.get_artifacts(key)



[docs]
    def install(
        self,
        *packages: str,
        sync: bool = False,
        no_deps: bool = False,
        force_reinstall: bool = False,
    ) -> None:
        """
        Install the provided packages in the current environment.

        This is a wrapper around the canonical way of installing packages in
        the provided environment (e.g. `pip`), so that users don't need to
        handle the details when changing the type of virtual environment (e.g.
        if you wanted to move to conda.).

        :Examples:

        Here's a few ways of installing packages depending on what you want.

        .. code-block::

            ##
            # Without syncing files
            ##

            # Install a single package
            step.install(["mypy"])

            # Install dependencies from a requirements.txt file
            step.install(["--requirements=requirements.txt"])

            # Install only the package's dependencies but not the package
            step.install(["--requirements=pyproject.toml"])

            # Install the current package (See dwas.predefined.Package for a better way)
            step.install(["."])

            # Install a dependency group
            step.install(["--group=dev"])

            ##
            # Syncing files from a lockfile
            ##

            # Install only the package's dependencies but not the package
            step.install([], sync=True)

            # Install a group of the package
            step.install(["--only-group=dev"], sync=True)

            # Install the dependencies and a group
            step.install(["--group=dev"])

        :param packages: which packages to install
        :param sync: Use `uv sync` instead of `pip install` to install the
                     dependencies. This ensures is resolves dependencies
                     according to the lock file, and not installing the latest
                     versions. Note that semantics change a bit, so it is not
                     fully interchangeable with `sync=False`.
        :param no_deps: ignore the package's dependencies when installing
        :param force_reinstall: force the re-installation of the package and its
                                dependencies even if already installed
        :raise KeyboardInterrupt: If the user has tried aborting the program and
                                  is waiting for it to finish.
        """
        return self._handler.install(
            *packages,
            sync=sync,
            no_deps=no_deps,
            force_reinstall=force_reinstall,
        )



[docs]
    def run(
        self,
        command: list[str],
        *,
        cwd: str | bytes | os.PathLike[str] | os.PathLike[bytes] | None = None,
        env: dict[str, str] | None = None,
        external_command: bool = False,
        silent_on_success: bool = False,
    ) -> subprocess.CompletedProcess[None]:
        """
        Run the provided command in the current environment.

        This method makes it's best to ensure the process' environment is
        as isolated as possible. It should be used whenever possible, instead
        of calling :py:mod:`subprocess` directly.

        It will enforce that the first argument of the command is part of the
        python virtual environment that is specially created for the current
        step (in the case when there is isolation).

        It will also ensure that the environment in which it is run is clean,
        and will only get environment entries from :py:attr:`Config.environ`.
        To add more values, use `env`.

        :param command: The command to run, as a list of arguments.
        :param cwd: The working directory in which to run the command.
        :param env: Additional environment variables to pass to the process.
                    Those will be merged on top of the :py:attr:`Config.environ`
                    values and can override them, but not remove them.
        :param external_command: Set to true if you want to run a command that
                                 lives outside the current virtual environment.
                                 Otherwise, this will fail the command.
        :param silent_on_success: Whether to silence the command's output if it
                                  succeeds, or show it every time.
        :return: a :py:class:`subprocess.CompletedProcess` with `stderr` and
                 `stdout` set to ``None``.
        :raise KeyboardInterrupt: If the user has tried aborting the program and
                                  is waiting for it to finish.
        """
        return self._handler.run(
            command,
            cwd=cwd,
            env=env,
            external_command=external_command,
            silent_on_success=silent_on_success,
        )



[docs]
    def set_env(self, variable: str, value: str) -> None:
        """
        Set a specific environment variable for this runner.

        This can be useful for example to set environment variables
        inside another step when setting up a dependent.

        :param variable: The name of the environment variable to set.
        :param value: The value to set the variable to.
        """
        self._handler.set_env(variable, value)