Source code for passengersim.experiments

"""Run structured sets of PassengerSim simulations as experiments.

Supports defining parameter changes and scenario comparisons, running
individual simulations sequentially or in parallel across multiple
processes, and collecting results into a unified output.
"""

from __future__ import annotations

import concurrent.futures
import pathlib
import warnings
from collections.abc import Callable
from typing import TYPE_CHECKING, Literal

from pydantic import ValidationError
from rich.console import Group
from rich.live import Live
from rich.panel import Panel
from rich.progress import (
    BarColumn,
    MofNCompleteColumn,
    Progress,
    TextColumn,
    TimeRemainingColumn,
)

from passengersim import __version__ as _passengersim_version
from passengersim import contrast
from passengersim.callbacks import CallbackMixin
from passengersim.core import __version__ as _passengersim_core_version

from . import MultiSimulation, Simulation
from ._types import PathLike
from .config import Config
from .driver import check_summarizer, get_default_summarizer
from .mp_executor import JobExecutor
from .summaries import GenericSimulationTables, SimulationTables

if TYPE_CHECKING:
    from passengersim.contrast import Contrast

    UseExistingT = Literal[True, False, "ignore", "raise"]



[docs]
class OverwriteExperimentWarning(UserWarning):
    """An experiment is being overwritten with another of the same name."""




[docs]
class Experiment:

[docs]
    def __init__(
        self,
        title: str | None,
        tag: str | None = None,
        multiprocess: bool = True,
        *,
        external: GenericSimulationTables | PathLike | None = None,
    ):
        """
        Parameters
        ----------
        title : str
            A short human-friendly title for the experiment.  This title is used in
            generating an HTML report of the experiment results.  If not provided,
            the tag is used as the title in reporting.
        tag : str, optional
            A short machine-friendly tag for the experiment. Ideally this tag will not have
            spaces or other special character other than underscores. This tag is used as a key
            in the results dictionary returned by `Experiments.run()`, and it is used in
            generating filenames for the experiment outputs.  If not provided, the name of
            the decorated function is used as the tag.
        multiprocess : bool, default True
            If True, run the simulation for this experiment in multi-process mode.  If False,
            run the simulation for this experiment in single-process mode.  Note that
            multi-process mode is not compatible with all environments, and may cause issues
            in interactive environments such as Jupyter notebooks.  In those cases, set this to
            False to run in single-process mode.
        external : GenericSimulationTables or path-like, optional
            If provided, this should be an existing SimulationTables result or a path to an
            existing output file containing the results for this experiment.  If this is
            provided, the experiment will skip running the simulation and instead load the
            results from the given file.  This is useful for cases where the simulation has
            already been run and the results are saved, but you want to include those results
            in a report with other experiments, without re-running the simulation.  If given
            a path but the given file does not exist or cannot be loaded, an error will
            be raised.
        """
        self.title = title
        self.tag = tag
        self.multi = multiprocess
        self.external = external
        self.func = None
        if isinstance(self.external, SimulationTables):
            self.cached = self.external
            self.external = None
        else:
            self.cached = None


    def __call__(self, func: Callable[[Config], Config] | Config):
        if self.func is None:
            # decorate a function that takes a config and returns a modified config
            self.func = func
            if self.tag is None:
                self.tag = func.__name__
            if self.title == "__DEFERRED_INIT__":
                self.title = self.tag
            return self
        else:
            # if the function is already decorated, call it with the base config,
            # while making a deep copy to avoid modifying the original
            if isinstance(func, Config) or type(func).__name__ == "Config":
                return self.func(func.model_copy(deep=True))
            else:
                raise TypeError("Experiment already decorated, expected base_config as input")




[docs]
class Experiments(CallbackMixin):
    _report_filename = None

    def __init__(
        self,
        config: Config,
        output_dir: pathlib.Path | None | Literal[False] = None,
        *,
        pickle: bool | str = False,
        html: bool | str = "passengersim_output",
        hide_from_git: bool = True,
    ):
        self.experiments: list[Experiment] = []
        self.base_config = config
        self.output_dir = output_dir
        if isinstance(self.output_dir, str):
            self.output_dir = pathlib.Path(output_dir)
        self.extra_reporting = None
        if self.output_dir and hide_from_git:
            if not self.output_dir.exists():
                self.output_dir.mkdir(parents=True)
            if not self.output_dir.joinpath(".gitignore").exists():
                self.output_dir.joinpath(".gitignore").write_text("**\n")
        # ensure the base config has pickle output
        if pickle and self.base_config.outputs.pickle is None:
            if pickle is True:
                pickle = "passengersim_output"
            self.base_config.outputs.pickle = pathlib.Path(pickle)
        # ensure the base config has html output
        if html and self.base_config.outputs.html.filename is None:
            if html is True:
                html = "passengersim_output"
            self.base_config.outputs.html.filename = pathlib.Path(html)

        self._sims = None
        # sims are only retained if requested

    @property
    def sims(self):
        if self._sims is None:
            raise ValueError("sims not available; set retain_sims=True in run() to retain them")
        return self._sims

    def _rename_file(self, tag: str, filename: pathlib.Path):
        if not isinstance(filename, str | pathlib.Path):
            return filename
        if self.output_dir is None:
            return pathlib.Path(tag) / filename
        elif not self.output_dir:
            return None
        else:
            return pathlib.Path(self.output_dir) / tag / pathlib.Path(filename).name


[docs]
    def existing(self, external: GenericSimulationTables | PathLike | None = None) -> Experiment:
        """Create an experiment that uses existing results, rather than running a simulation.

        Parameters
        ----------
        external : GenericSimulationTables or path-like, optional
            If provided, this should be an existing SimulationTables result or a path to an
            existing output file containing the results for this experiment.  If this is
            provided, the experiment will skip running the simulation and instead load the
            results from the given file.  This is useful for cases where the simulation has
            already been run and the results are saved, but you want to include those results
            in a report with other experiments, without re-running the simulation.  If given
            a path but the given file does not exist or cannot be loaded, an error will
            be raised.

        Returns
        -------
        Experiment
            An experiment that will use the given existing results when run, rather than running
            a simulation.
        """
        return self(external=external)


    def __call__(
        self,
        title: str | Callable[[Config], Config] = "__DEFERRED_INIT__",
        tag: str | None = None,
        multiprocess: bool = True,
        *,
        external: GenericSimulationTables | PathLike | None = None,
    ) -> Experiment:
        if title == "__DEFERRED_INIT__":
            e = Experiment(title, tag, multiprocess, external=external)
        elif not isinstance(title, str):
            # called as a decorator, so the first argument is the function
            e = Experiment(None, tag, multiprocess, external=external)(title)
        else:
            e = Experiment(title, tag, multiprocess, external=external)
        # check if this is a duplicate of an existing experiment
        # if so, overwrite the existing experiment and warn the user
        for i in range(len(self.experiments)):
            if e.tag == self.experiments[i].tag:
                warnings.warn(
                    f"Overwriting existing experiment tag: {e.tag}", stacklevel=2, category=OverwriteExperimentWarning
                )
                self.experiments[i] = e
                return e
        # otherwise add the new experiment
        self.experiments.append(e)
        return e

    @staticmethod
    def _check_loaded_summary(
        summary: GenericSimulationTables,
        config: Config,
        tag: str,
        check_versions: bool = True,
        check_content: bool = True,
        source_file: str | None = None,
    ) -> tuple[str, GenericSimulationTables | None]:
        """
        Check if the loaded summary matches the config and PassengerSim versions.

        Parameters
        ----------
        summary : GenericSimulationTables
        config : Config
        tag : str
        check_versions : bool, optional
            If True, check the PassengerSim versions in the loaded summary.
        check_content : bool, optional
            If True, check the content of the loaded summary.

        Returns
        -------
        str
            A message about the loaded summary
        GenericSimulationTables
            The loaded summary if it matches the config, otherwise None
        """
        if source_file is None:
            try:
                source_file = summary.metadata("store.filename")
            except (KeyError, Exception):
                pass
        if source_file is None:
            source_file = config.outputs.pickle
        if source_file is None:
            source_file = config.outputs.disk
        msg = ""
        try:
            check = config.find_differences(summary.config)
        except ValidationError as e:
            check = e
        try:
            versions = summary.metadata("version")
        except KeyError:
            msg = f"Loaded {tag} from {source_file}, but the PassengerSim version is unknown"
            return msg, None

        public_version = versions.get("passengersim", None)
        core_version = versions.get("passengersim_core", None)

        if check_versions and public_version is None:
            msg = f"Loaded {tag} from {source_file}, but the PassengerSim version is unknown"
            return msg, None

        if check_versions and public_version != _passengersim_version:
            msg = (
                f"Loaded {tag} from {source_file}, "
                f"but the PassengerSim version has changed: "
                f"running {_passengersim_version}, found {public_version}"
            )
            return msg, None

        if check_versions and core_version is None:
            msg = f"Loaded {tag} from {source_file}, but the PassengerSim.Core version is unknown"
            return msg, None

        if check_versions and core_version != _passengersim_core_version:
            msg = (
                f"Loaded {tag} from {source_file}, "
                f"but the PassengerSim.Core version has changed: "
                f"running {_passengersim_core_version}, found {core_version}"
            )
            return msg, None

        if isinstance(check, ValidationError):
            msg = f"Loaded {tag} from {source_file}, but the config is invalid:\n{str(check)[:4000]}"
            return msg, None

        if check_content and check:
            msg = f"Loaded {tag} from {source_file}, but the config has changed:\n{str(check)[:4000]}"
            return msg, None

        if check:
            msg = f"Loaded {tag} from {source_file}, although the config has changed:\n{str(check)[:4000]}"
        else:
            msg = f"Loaded {tag} from {source_file}"

        return msg, summary

    def _write_report_after_run(self, write_report, results: Contrast):
        if isinstance(write_report, PathLike):
            write_report = pathlib.Path(write_report)
        else:
            write_report = pathlib.Path("experiments-summary.html")
        # if output directory is set, write the report there,
        # unless the path is absolute (then write it to the given path)
        if self.output_dir and not write_report.is_absolute():
            write_report = self.output_dir / write_report
        self._report_filename = results.write_report(
            write_report, base_config=self.base_config, extra=self.extra_reporting
        )

    def _run_experiments_in_sequence(
        self,
        use_existing: UseExistingT | dict[str, UseExistingT] = True,
        *,
        tag: str | None = None,
        check_versions: bool = True,
        check_content: bool = True,
        single_process: bool = False,
        retain_sims: bool = False,
        write_report: PathLike | bool | None = True,
        cache_results: bool = True,
    ):
        """
        Run the experiments in sequence.

        Parameters
        ----------
        use_existing : Literal[True, False, "ignore", "raise"] or dict
            This can either be a single value for all experiments, or a dictionary
            mapping tags to values.  For each value, the behavior is as follows:
            If True, load from existing output pickle files if they exist,
            otherwise run the simulation for each experiment.  If False, always
            run the simulation for each experiment. If "ignore", load results
            from output pickle or pxsim files if they exist, otherwise skip each
            experiment.  If "raise", raise an error if the output pickle or pxsim
            files do not exist for any experiment.
        tag : str, optional
            If provided, only run the experiment with the given tag.
        check_versions : bool, default True
            If True, check the PassengerSim versions in the loaded summary (if
            any), and re-run the simulation if they do not match the current
            environment. If False, do not check the PassengerSim versions.
        check_content : bool, default True
            If True, check the content of the loaded summary (if any), and
            re-run the simulation if the config has changed. If False, do not
            check the content of the loaded summary.
        single_process : bool, default False
            If True, force all the simulations to run in single process mode. If
            False, run allow each experiment's simulation to run multi-process,
            unless that individual experiment is set to run in single process mode.
        retain_sims : bool, default False
            If True, retain the simulation objects in the `sims` attribute after
            running each simulation. This is primarily useful for debugging.
        write_report : path-like or bool, default True
            If provided, write a report of the experiments to the given file.
            This will be relative to the output directory if that is set, and the
            filename given here is a relative path. If True, the report filename
            will be "experiments-summary.html". If False, do not write a report.
        cache_results : bool, default True
            If True, cache the results of each experiment in the `cached` attribute
            of the corresponding Experiment object.  This allows the results to be
            reused in future runs of the experiments, without needing to reload from
            disk.

        Returns
        -------
        contrast.Contrast or SimulationTables
        """

        results = contrast.Contrast()

        if retain_sims:
            self._sims = {}

        # validate that all experiments have unique tags
        tags = set()
        for e in self.experiments:
            if e.tag is None:
                if e.title is None:
                    raise ValueError("Experiment missing tag and title")
                raise ValueError("Experiment missing tag: " + e.title)
            if e.tag in tags:
                raise ValueError("Duplicate experiment tag: " + e.tag)
            tags.add(e.tag)

        if isinstance(tag, str):
            selected_experiments = [e for e in self.experiments if e.tag == tag]
            if not selected_experiments:
                raise ValueError(f"No experiment found with tag {tag}")
        elif tag is None:
            selected_experiments = self.experiments
        else:
            raise TypeError("tag must be a string or None")

        rich_progress = Progress(
            TextColumn("[progress.description]{task.description}"),
            BarColumn(),
            MofNCompleteColumn(),
            TimeRemainingColumn(),
            auto_refresh=False,
            transient=True,
        )
        top_progress = Progress(
            MofNCompleteColumn(),
            TextColumn("[progress.description]{task.description}"),
            auto_refresh=False,
            transient=True,
        )
        live_display = Live(
            Panel(
                Group(
                    top_progress,
                    rich_progress,
                ),
                title="Experiments",
                border_style="blue",
                expand=True,
            ),
            refresh_per_second=4,
            transient=True,
        )

        default_use_existing = True
        if not isinstance(use_existing, dict):
            default_use_existing = use_existing
            use_existing = {}

        with live_display:
            top_task = top_progress.add_task("[blue]Experiments", total=len(selected_experiments))

            for e in selected_experiments:
                top_progress.update(top_task, advance=1, description=f"[bold blue]{e.tag}", refresh=True)

                if e.cached:
                    # If a cached SimulationTables result is available, use it and skip the simulation.
                    # No checks are performed on the cached result, so it is the user's responsibility to
                    # ensure that the cached result is valid and matches the current config and PassengerSim
                    # versions, if applicable.
                    summary = e.cached
                    live_display.console.print(f"Using cached results for experiment {e.tag}")
                    results[e.tag] = summary
                    continue
                elif e.external:
                    # If an external file is provided, load it and skip the simulation.
                    # This is done without regard for the use_existing parameter, and
                    # the absence of the external file is always an error.
                    if isinstance(e.external, GenericSimulationTables):
                        summary = e.external
                    else:
                        summary = get_default_summarizer().from_file(e.external)
                    live_display.console.print(f"Loaded experiment {e.tag} from {e.external}")
                    results[e.tag] = summary
                    continue

                # Create the modified config for this experiment
                config = e.func(self.base_config.model_copy(deep=True))
                config.outputs.html.title = e.title or e.tag

                # Update the paths for the output files
                if config.outputs.html.filename:
                    config.outputs.html.filename = self._rename_file(e.tag, config.outputs.html.filename)
                if config.outputs.pickle:
                    config.outputs.pickle = self._rename_file(e.tag, config.outputs.pickle)
                if config.outputs.excel:
                    config.outputs.excel = self._rename_file(e.tag, config.outputs.excel)

                summary = None

                e_use_existing = use_existing.get(e.tag, default_use_existing)
                if e_use_existing:
                    try:
                        # Check if the output pickle files are defined and already exist
                        if config.outputs.pickle:
                            summary = get_default_summarizer().from_pickle(config.outputs.pickle)
                        else:
                            raise FileNotFoundError("No output pickle file specified")
                    except FileNotFoundError:
                        # At this point either the output pickle file is not defined
                        # (triggering the explicit FileNotFoundError) or does not exist,
                        # which raises the FileNotFoundError organically.  Either way,
                        # we also want to check if the pxsim-format disk file exists.

                        try:
                            second_file = config.outputs._get_disk_filename()
                            if second_file:
                                summary = get_default_summarizer().from_file(second_file)
                            else:
                                raise FileNotFoundError("No output disk file specified")
                        except FileNotFoundError as second_error:
                            if e_use_existing == "raise":
                                # Neither the output pickle file nor the pxsim-format disk file
                                # exist, so we need to raise an error.
                                raise second_error
                            elif e_use_existing == "ignore":
                                # Neither the output pickle file nor the pxsim-format disk file
                                # exist, but we have been instructed to ignore this.  The
                                # matching simulation will not be run, and will not be included
                                # in the results.
                                continue

                    if summary is not None:
                        # If we reach this point, we have successfully loaded the
                        # output from a pickle or pxsim file. But before we celebrate,
                        # we need to make sure the run we loaded matches the config
                        # we would otherwise run, and the versions of PassengerSim
                        # match between the run and the current environment.
                        msg, summary = self._check_loaded_summary(
                            summary,
                            config,
                            e.tag,
                            check_versions=check_versions,
                            check_content=check_content,
                        )
                        live_display.console.print(msg)
                        if summary is None:
                            if e_use_existing == "raise":
                                raise ValueError("existing result does not match requested experiment")
                            elif e_use_existing == "ignore":
                                continue

                if summary is None:
                    # If we reach this point, we need to run the simulation

                    # Initialize the simulation
                    if e.multi and not single_process:
                        sim = MultiSimulation(config)
                        if retain_sims:
                            self._sims[e.tag] = sim
                        self.apply_callback_functions(sim)
                        summary = sim.run(rich_progress=rich_progress)
                        del sim
                    else:
                        sim = Simulation(config)
                        if retain_sims:
                            self._sims[e.tag] = sim
                        self.apply_callback_functions(sim)
                        summary = sim.run(rich_progress=rich_progress)
                        del sim

                results[e.tag] = summary
                if cache_results:
                    e.cached = summary

            top_progress.update(
                top_task,
                description="[bold blue]Finished Experiments",
                refresh=True,
                visible=False,
            )

        if write_report:
            self._write_report_after_run(write_report, results)

        if tag is not None and len(selected_experiments) == 1:
            return results[selected_experiments[0].tag]
        return results

    def _run_together(
        self,
        use_existing: UseExistingT | dict[str, UseExistingT] = True,
        *,
        tag: str | None = None,
        check_versions: bool = True,
        check_content: bool = True,
        retain_sims: bool = False,
        write_report: PathLike | bool | None = True,
        cache_results: bool = True,
        summarizer: type | None = None,
    ):
        """
        Run the experiments.

        Parameters
        ----------
        use_existing : Literal[True, False, "ignore", "raise"] or dict
            This can either be a single value for all experiments, or a dictionary
            mapping tags to values.  For each value, the behavior is as follows:
            If True, load from existing output pickle files if they exist,
            otherwise run the simulation for each experiment.  If False, always
            run the simulation for each experiment. If "ignore", load results
            from output pickle or pxsim files if they exist, otherwise skip each
            experiment.  If "raise", raise an error if the output pickle or pxsim
            files do not exist for any experiment.
        tag : str, optional
            If provided, only run the experiment with the given tag.
        check_versions : bool, default True
            If True, check the PassengerSim versions in the loaded summary (if
            any), and re-run the simulation if they do not match the current
            environment. If False, do not check the PassengerSim versions.
        check_content : bool, default True
            If True, check the content of the loaded summary (if any), and
            re-run the simulation if the config has changed. If False, do not
            check the content of the loaded summary.
        single_process : bool, default False
            If True, force all the simulations to run in single process mode. If
            False, run allow each experiment's simulation to run multi-process,
            unless that individual experiment is set to run in single process mode.
        retain_sims : bool, default False
            If True, retain the simulation objects in the `sims` attribute after
            running each simulation. This is primarily useful for debugging.
        write_report : path-like or bool, default True
            If provided, write a report of the experiments to the given file.
            This will be relative to the output directory if that is set, and the
            filename given here is a relative path. If True, the report filename
            will be "experiments-summary.html". If False, do not write a report.
        cache_results : bool, default True
            If True, cache the results of each experiment in the `cached` attribute
            of the corresponding Experiment object.  This allows the results to be
            reused in future runs of the experiments, without needing to reload from
            disk.

        Returns
        -------
        contrast.Contrast or SimulationTables
        """
        jobber = JobExecutor().start()
        results = contrast.Contrast()
        pending_results: dict[str, concurrent.futures.Future] = {}

        summarizer = check_summarizer(summarizer)

        if retain_sims:
            self._sims = {}

        # validate that all experiments have unique tags
        tags = set()
        for e in self.experiments:
            if e.tag is None:
                if e.title is None:
                    raise ValueError("Experiment missing tag and title")
                raise ValueError("Experiment missing tag: " + e.title)
            if e.tag in tags:
                raise ValueError("Duplicate experiment tag: " + e.tag)
            tags.add(e.tag)

        if isinstance(tag, str):
            selected_experiments = [e for e in self.experiments if e.tag == tag]
            if not selected_experiments:
                raise ValueError(f"No experiment found with tag {tag}")
        elif tag is None:
            selected_experiments = self.experiments
        else:
            raise TypeError("tag must be a string or None")

        default_use_existing = True
        if not isinstance(use_existing, dict):
            default_use_existing = use_existing
            use_existing = {}

        for e in selected_experiments:
            if e.cached:
                # If a cached SimulationTables result is available, use it and skip the simulation.
                # No checks are performed on the cached result, so it is the user's responsibility to
                # ensure that the cached result is valid and matches the current config and PassengerSim
                # versions, if applicable.
                summary = e.cached
                jobber.rich_progress.console.print(f"Using cached results for experiment {e.tag}")
                results[e.tag] = summary
                continue
            elif e.external:
                # If an external file is provided, load it and skip the simulation.
                # This is done without regard for the use_existing parameter, and
                # the absence of the external file is always an error.
                if isinstance(e.external, GenericSimulationTables):
                    summary = e.external
                else:
                    summary = get_default_summarizer().from_file(e.external)
                jobber.rich_progress.console.print(f"Loaded experiment {e.tag} from {e.external}")
                results[e.tag] = summary
                continue

            # Create the modified config for this experiment
            config = e.func(self.base_config.model_copy(deep=True))
            # Revalidate the config now, which will ensure that all the changes that occur during validation
            # are captured. For example, the Experiment function might change a carrier to assign a standard
            # Frat5 curve, but that still needs to be loaded.
            config = config.model_validate(config)
            # make the config's title consistent with the experiment title or tag
            config.outputs.html.title = e.title or e.tag

            # Update the paths for the output files
            if not self.output_dir:
                config.outputs.base_dir = pathlib.Path(e.tag)
            else:
                config.outputs.base_dir = pathlib.Path(self.output_dir) / e.tag
            config.outputs.filename_stem = e.tag

            # TODO: FIND ALL THESE AND CHANGE TO config._resolve
            # if config.outputs.html.filename:
            #     config.outputs.html.filename = self._rename_file(e.tag, config.outputs.html.filename)
            # if config.outputs.pickle:
            #     config.outputs.pickle = self._rename_file(e.tag, config.outputs.pickle)
            # if config.outputs.excel:
            #     config.outputs.excel = self._rename_file(e.tag, config.outputs.excel)

            summary = None

            e_use_existing = use_existing.get(e.tag, default_use_existing)
            if e_use_existing:
                # At this point either the output pickle file is not defined
                # (triggering the explicit FileNotFoundError) or does not exist,
                # which raises the FileNotFoundError organically.  Either way,
                # we also want to check if the pxsim-format disk file exists.

                try:
                    disk_file = config.outputs.get_output_filename("disk", make_dirs=False)
                    if disk_file:
                        summary = get_default_summarizer().from_file(disk_file)
                    else:
                        raise FileNotFoundError("No output disk file specified")
                except FileNotFoundError as second_error:
                    if e_use_existing == "raise":
                        # Neither the output pickle file nor the pxsim-format disk file
                        # exist, so we need to raise an error.
                        raise second_error
                    elif e_use_existing == "ignore":
                        # The output pxsim-format disk file does not exist, but we have
                        # been instructed to ignore this.  The matching simulation will
                        # not be run, and will not be included in the results.
                        continue

                if summary is not None:
                    # If we reach this point, we have successfully loaded the
                    # output from a .pxsim file on disk. But before we celebrate,
                    # we need to make sure the run we loaded matches the config
                    # we would otherwise run, and the versions of PassengerSim
                    # match between the run and the current environment.
                    msg, summary = self._check_loaded_summary(
                        summary,
                        config,
                        e.tag,
                        check_versions=check_versions,
                        check_content=check_content,
                    )
                    jobber.rich_progress.console.print(msg)
                    if summary is None:
                        if e_use_existing == "raise":
                            raise ValueError("existing result does not match requested experiment")
                        elif e_use_existing == "ignore":
                            continue

            if summary is None:
                # If we reach this point, we need to run the simulation
                sim = MultiSimulation(config)
                if retain_sims:
                    self._sims[e.tag] = sim
                self.apply_callback_functions(sim)
                summary = sim._run_asynchronously(summarizer=summarizer, jobber=jobber, run_id=e.tag)
                del sim

            pending_results[e.tag] = summary
            results[e.tag] = summary
            if cache_results:
                e.cached = summary

        # convert cached results, which might be Futures, into finalized results
        results = contrast.Contrast(
            {k: (v.result() if isinstance(v, concurrent.futures.Future) else v) for k, v in results.items()}
        )

        # await results
        for k, v in pending_results.items():
            if isinstance(v, concurrent.futures.Future):
                results[k] = v.result()
            else:
                results[k] = v

        if write_report:
            self._write_report_after_run(write_report, results)

        if tag is not None and len(selected_experiments) == 1:
            return results[selected_experiments[0].tag]
        return results


[docs]
    def run(
        self,
        use_existing: UseExistingT | dict[str, UseExistingT] = True,
        *,
        tag: str | None = None,
        check_versions: bool = True,
        check_content: bool = True,
        single_process: bool = False,
        retain_sims: bool = False,
        write_report: PathLike | bool | None = True,
        cache_results: bool = True,
    ):
        """
        Run the experiments.

        Parameters
        ----------
        use_existing : Literal[True, False, "ignore", "raise"] or dict
            This can either be a single value for all experiments, or a dictionary
            mapping tags to values.  For each value, the behavior is as follows:
            If True, load from existing output pickle files if they exist,
            otherwise run the simulation for each experiment.  If False, always
            run the simulation for each experiment. If "ignore", load results
            from output pickle or pxsim files if they exist, otherwise skip each
            experiment.  If "raise", raise an error if the output pickle or pxsim
            files do not exist for any experiment.
        tag : str, optional
            If provided, only run the experiment with the given tag.
        check_versions : bool, default True
            If True, check the PassengerSim versions in the loaded summary (if
            any), and re-run the simulation if they do not match the current
            environment. If False, do not check the PassengerSim versions.
        check_content : bool, default True
            If True, check the content of the loaded summary (if any), and
            re-run the simulation if the config has changed. If False, do not
            check the content of the loaded summary.
        single_process : bool, default False
            If True, force all the simulations to run in single process mode. If
            False, run allow each experiment's simulation to run multi-process,
            unless that individual experiment is set to run in single process mode.
        retain_sims : bool, default False
            If True, retain the simulation objects in the `sims` attribute after
            running each simulation. This is primarily useful for debugging.
        write_report : path-like or bool, default True
            If provided, write a report of the experiments to the given file.
            This will be relative to the output directory if that is set, and the
            filename given here is a relative path. If True, the report filename
            will be "experiments-summary.html". If False, do not write a report.
        cache_results : bool, default True
            If True, cache the results of each experiment in the `cached` attribute
            of the corresponding Experiment object.  This allows the results to be
            reused in future runs of the experiments, without needing to reload from
            disk.

        Returns
        -------
        contrast.Contrast or SimulationTables
        """
        if single_process:
            return self._run_experiments_in_sequence(
                use_existing=use_existing,
                tag=tag,
                check_versions=check_versions,
                check_content=check_content,
                single_process=single_process,
                retain_sims=retain_sims,
                write_report=write_report,
                cache_results=cache_results,
            )
        else:
            return self._run_together(
                use_existing=use_existing,
                tag=tag,
                check_versions=check_versions,
                check_content=check_content,
                retain_sims=retain_sims,
                write_report=write_report,
                cache_results=cache_results,
            )


    @property
    def report_filename(self) -> pathlib.Path:
        """Filename of the written report.

        Unless disabled, a report is written to a file after running the experiments.
        The report filename is stored here for reference.

        Raises
        ------
        ValueError
            If no report has been written.
        """
        if self._report_filename is None:
            raise ValueError("no report has been written")
        return self._report_filename


[docs]
    def validate(self):
        """Validate the experiments.

        This checks that all the experiments can be initialized with the base config,
        and that there are no duplicate tags.  This does not check that the modified
        configs are valid, since some modifications might be mutually incompatible
        but still be useful for comparison.
        """
        tags = set()
        for e in self.experiments:
            if e.tag is None:
                if e.title is None:
                    raise ValueError("Experiment missing tag and title")
                raise ValueError("Experiment missing tag: " + e.title)
            if e.tag in tags:
                raise ValueError("Duplicate experiment tag: " + e.tag)
            tags.add(e.tag)
            try:
                config = e.func(self.base_config.model_copy(deep=True))
                config = config.model_validate(config)
            except Exception as ex:
                raise ValueError(f"Experiment {e.tag} failed to validate") from ex