# Source code for passengersim.summaries.generic

from __future__ import annotations

import glob
import inspect
import multiprocessing
import os
import pathlib
import platform
import time
import warnings
from collections.abc import Callable, Collection
from datetime import UTC, datetime
from functools import partialmethod
from typing import TYPE_CHECKING, Any, ClassVar, Literal, Self

import dill as pickle
import pandas as pd

from passengersim.callbacks import CallbackData
from passengersim.config import Config
from passengersim.utils.filenaming import (
    filename_with_timestamp,
    filenames_with_timestamp,
    make_parent_directory,
)
from passengersim.utils.kvstore import KVStore

if TYPE_CHECKING:
    from passengersim import Simulation
    from passengersim.database import Database



[docs]
class MissingDataError(KeyError):
    """Signal that a requested table is not present in a summary object.

    This is a ``KeyError`` subclass, so handlers written for ``KeyError``
    also catch it.
    """




[docs]
def initialize_metadata() -> dict[str, Any]:
    """Build the metadata dictionary attached to a new summary.

    The result records the UTC creation time, a set of ``platform`` facts
    about the host machine, the CPU count, and the installed versions of
    ``passengersim`` and ``passengersim_core``.  Keys are dotted strings
    such as ``"machine.system"``.
    """
    # imported here rather than at module level, as in the original layout
    from passengersim_core import __version__ as core_version

    from passengersim import __version__ as version

    return {
        "time.created": datetime.now(UTC).isoformat(),
        "machine.system": platform.system(),
        "machine.release": platform.release(),
        "machine.version": platform.version(),
        "machine.machine": platform.machine(),
        "machine.processor": platform.processor(),
        "machine.architecture": platform.architecture(),
        "machine.node": platform.node(),
        "machine.platform": platform.platform(),
        "machine.python_version": platform.python_version(),
        "machine.cpu_count": multiprocessing.cpu_count(),
        "version.passengersim": version,
        "version.passengersim_core": core_version,
    }




[docs]
class SimulationTableItem:
    # Descriptor for a summary table that is extracted from a Simulation.
    #
    # When assigned as a class attribute, it registers its aggregation and
    # extraction functions in the owner's `_std_agg` / `_std_extract` dicts
    # and installs a companion `_raw_<name>` property that returns the stored
    # table without the computed columns.
    #
    # (Comments are used instead of a class docstring because the `__doc__`
    # property defined below replaces any docstring in the class namespace.)

    def __init__(
        self,
        aggregation_func: Callable[[list[GenericSimulationTables]], pd.DataFrame | None],
        extraction_func: Callable[[Simulation], pd.DataFrame | None] = None,
        computed_fields: dict[str, Any] = None,
        doc: str | None = None,
    ):
        """Store the functions and options that define this table.

        Parameters
        ----------
        aggregation_func : callable
            Registered in the owner's ``_std_agg`` under this item's name.
        extraction_func : callable, optional
            Registered in the owner's ``_std_extract`` under this item's name.
        computed_fields : dict, optional
            Maps a column name to an expression passed to ``DataFrame.eval``
            when the table is read and the column is not already present.
        doc : str, optional
            Text returned by this descriptor's ``__doc__``.
        """
        self._aggregation_func = aggregation_func
        self._extraction_func = extraction_func
        self._computed_fields = computed_fields if computed_fields else {}
        self._doc = doc

    def __set_name__(self, owner, name):
        """Record the attribute name and register this item on the owner class."""
        self.name = name
        owner._std_extract[name] = self._extraction_func
        owner._std_agg[name] = self._aggregation_func
        setattr(owner, f"_raw_{name}", property(self._get_raw))

    def __get__(self, instance, owner):
        """Return the table for `instance`, adding any missing computed columns.

        Accessed on the class, the descriptor itself is returned.  A stored
        exception is re-raised; a missing table raises ``MissingDataError``.
        """
        if instance is None:
            return self
        try:
            if self.name not in instance._data and instance._file_store is not None:
                # not loaded yet: fall back to the file store, if it has this table
                try:
                    instance._data[self.name] = instance._file_store[self.name]
                except KeyError:
                    pass
            table = instance._data[self.name]

            # expressions may reference the sample count as `@n_total_samples`
            scope = {}
            total_samples = getattr(instance, "n_total_samples", None)
            if total_samples is not None:
                scope["n_total_samples"] = total_samples

            if isinstance(table, Exception):
                raise table
            if table is None:
                return table

            eval_engine = "numexpr" if len(table) >= 10000 else "python"
            for column, expression in self._computed_fields.items():
                if column not in table:
                    try:
                        table[column] = table.eval(expression, engine=eval_engine, local_dict=scope)
                    except Exception as e:
                        # a failed computed column is reported but does not block access
                        warnings.warn(
                            f"Error computing {column} for {self.name}: {e}",
                            stacklevel=2,
                        )
            return table
        except KeyError:
            raise MissingDataError(self.name) from None

    def __set__(self, instance, value):
        """Store `value` as this table; only DataFrames are accepted."""
        if not isinstance(value, pd.DataFrame):
            raise TypeError(f"expected DataFrame, got {type(value)}")
        instance._data[self.name] = value

    @property
    def __doc__(self):
        return self._doc

    def _get_raw(self, instance):
        """Return the stored table without computed columns, or None if absent."""
        stored = instance._data.get(self.name, None)
        if stored is None:
            return stored
        return stored.drop(columns=self._computed_fields.keys(), errors="ignore")




[docs]
class DatabaseTableItem:
    # Descriptor for a summary table that is produced by a database query.
    #
    # When assigned as a class attribute, it registers its aggregation and
    # query functions in the owner's `_std_agg` / `_std_query` dicts and
    # installs `_raw_<name>` (stored value, no query) and `_requery_<name>`
    # (re-run the query) on the owner.
    #
    # (Comments are used instead of a class docstring because the `__doc__`
    # property defined below replaces any docstring in the class namespace.)

    def __init__(
        self,
        query_func: Callable[[Database], pd.DataFrame],
        aggregation_func: Callable[[list[GenericSimulationTables]], pd.DataFrame | None],
        doc: str | None = None,
    ):
        """Store the query and aggregation functions for this table.

        Parameters
        ----------
        query_func : callable
            Registered in the owner's ``_std_query`` under this item's name.
        aggregation_func : callable
            Registered in the owner's ``_std_agg`` under this item's name.
        doc : str, optional
            Text returned by this descriptor's ``__doc__``.
        """
        self._query_func = query_func
        self._aggregation_func = aggregation_func
        self._doc = doc

    def __set_name__(self, owner, name):
        """Record the attribute name and register this item on the owner class."""
        self.name = name
        owner._std_query[name] = self._query_func
        owner._std_agg[name] = self._aggregation_func
        setattr(owner, f"_raw_{name}", property(self._get_raw))

        def _requery_entry(instance, *arg, **kwarg):
            # forward to the descriptor so the owner gets a `_requery_<name>` method
            return self._requery(instance, *arg, **kwarg)

        setattr(owner, f"_requery_{name}", partialmethod(_requery_entry))

    def __get__(self, instance, owner):
        """Return the table for `instance`, running its query on first access.

        Accessed on the class, the descriptor itself is returned.  A stored
        exception is re-raised; a table that is still missing after the query
        attempt raises ``MissingDataError``.
        """
        if instance is None:
            return self
        already_loaded = self.name in instance._data
        if not already_loaded:
            try:
                instance.run_queries(items=[self.name])
            except Exception as e:
                warnings.warn(f"Error querying {self.name}: {e}", stacklevel=2)
        try:
            result = instance._data[self.name]
            if isinstance(result, Exception):
                raise result
            return result
        except KeyError:
            raise MissingDataError(self.name) from None

    def __set__(self, instance, value):
        """Store `value` as this table without any type check."""
        instance._data[self.name] = value

    @property
    def __doc__(self):
        return self._doc

    def _get_raw(self, instance: GenericSimulationTables):
        """Return whatever is stored for this table, or None, without querying."""
        return instance._data.get(self.name, None)

    def _requery(self, instance: GenericSimulationTables, cnx: Database = None, **kwargs):
        """Re-run this table's query on `instance` and return the stored result."""
        instance.run_queries(cnx=cnx, items=[self.name], **kwargs)
        return self._get_raw(instance)




[docs]
class GenericSimulationTables:
    __subclasses: ClassVar[set[type[GenericSimulationTables]]] = set()


[docs]
    @classmethod
    def subclasses(cls) -> list[type[GenericSimulationTables]]:
        """Return a list of all concrete subclasses.

        User defined subclasses (those not in the passengersim package)
        are at the front of the list, so they come first in MRO and
        thus can override native subclasses.
        """
        subs = []
        for sub in cls.__subclasses:
            if getattr(sub, "__final__", False):
                # do not include classes marked as final
                continue
            if sub.__module__.startswith("passengersim.summaries"):
                # these are native subclasses
                subs.append(sub)
            else:
                subs.insert(0, sub)
        subs.append(GenericSimulationTables)
        return subs


    def __init_subclass__(cls, **kwargs):
        """Capture a set of all concrete subclasses"""
        super().__init_subclass__(**kwargs)
        if inspect.isabstract(cls):
            return  # do not include intermediate abstract base classes
        cls.__subclasses.add(cls)

    def __init__(
        self,
        data: dict[str, pd.DataFrame] = None,
        *,
        config: Config | None = None,
        cnx: Database | None = None,
        sim: Simulation | None = None,
        n_total_samples: int = 0,
        items: Collection[str] = (),
        callback_data: CallbackData | None = None,
    ):
        """Create a summary tables object.

        Parameters
        ----------
        data : dict, optional
            Tables keyed by name.  A falsy value is replaced by a new dict.
        config : Config, optional
            Configuration associated with the run.
        cnx : Database, optional
            Database connection associated with the run.
        sim : Simulation, optional
            Simulation object associated with the run.
        n_total_samples : int, default 0
            Number of samples behind these summaries.
        items : Collection[str], optional
            Names of the items to extract; empty means all.
        callback_data : CallbackData, optional
            Callback data; a falsy value is replaced by a new ``CallbackData``.
        """
        self._file_store = None
        """Store consulted for tables that are not already held in memory."""

        self._data = data if data else {}
        """Tables (dataframes) summarizing a Simulation run, keyed by name."""

        self.config = config
        """Configuration of the Simulation run."""

        self.cnx = cnx
        """Database connection of the Simulation run."""

        self.sim = sim
        """The Simulation object of the Simulation run."""

        self.n_total_samples = n_total_samples
        """Total count of sample departures simulated for these summaries.

        Burn samples are not counted.
        """

        self._items = items
        """Names of the items to extract for this summary.

        When empty, every item is extracted."""

        self.meta_summaries = []
        """The summaries that were aggregated into this one."""

        self._metadata = initialize_metadata()
        """Metadata describing this summary."""

        self.callback_data = callback_data if callback_data else CallbackData()
        """Data gathered by callbacks."""

    __writable_attrs = {
        "_file_store",
        "_data",
        "config",
        "_config",
        "cnx",
        "sim",
        "n_total_samples",
        "meta_summaries",
        "_preserve_meta_summaries",
        "_preserve_config",
        "_items",
        "_metadata",
        "callback_data",
        "_callback_data",
    }

    def __setattr__(self, item, value):
        """Deny setting of attributes that are not in __writable_attrs."""
        if item in self.__writable_attrs:
            # writable attributes are handled normally
            super().__setattr__(item, value)
        else:
            raise AttributeError(f"Cannot set attribute {item!r}")

    # Class-level registries keyed by table name.  The table descriptors in
    # this module (SimulationTableItem and DatabaseTableItem) write into these
    # dicts from their `__set_name__` hooks.
    # NOTE(review): these are mutable class attributes, so subclasses that do
    # not define their own dicts presumably share these — confirm that is intended.

    # table name -> function that aggregates a list of summaries into one table
    _std_agg: dict[str, Callable[[list[GenericSimulationTables]], pd.DataFrame | None]] = {}
    # table name -> function that extracts the table from a Simulation (may be None)
    _std_extract: dict[str, Callable[[Simulation], pd.DataFrame]] = {}
    # table name -> function that queries the table from a Database
    _std_query: dict[str, Callable[..., pd.DataFrame]] = {}


[docs]
    @classmethod
    def extract(cls, sim: Simulation, items: Collection[str] = ()) -> Self:
        """Extract summary data from a Simulation."""
        eng = sim.eng
        num_samples = eng.num_trials_completed * (eng.num_samples - eng.burn_samples)
        if num_samples <= 0:
            raise ValueError(
                "insufficient number of samples outside burn period for reporting"
                f"\n- num_trials = {eng.num_trials}"
                f"\n- num_trials_completed = {eng.num_trials_completed}"
                f"\n- num_samples = {eng.num_samples}"
                f"\n- burn_samples = {eng.burn_samples}"
            )

        data = {}
        items = set(items) or cls._std_extract.keys()
        for name, func in cls._std_extract.items():
            if name in items:
                if func is not None:
                    try:
                        data[name] = func(sim)
                    except Exception as err:
                        # do not let an exception here take down the whole report
                        warnings.warn(f"Exception {type(err).__name__} in {name}: {err}", stacklevel=2)
        return cls(
            data,
            sim=sim,
            config=sim.config,
            cnx=sim.cnx,
            n_total_samples=num_samples,
            callback_data=sim.callback_data,
        )


    def _extract(self: Self, sim: Simulation) -> Self:
        """Extract summary data from a Simulation."""
        return self.__class__.extract(sim, self._items)


[docs]
    def run_queries(
        self,
        cnx: Database = None,
        items: Collection[str] | None = None,
        *,
        scenario: str = None,
        burn_samples: int | None = None,
    ) -> Self:
        """Query summary data from a Database.

        The requested items will be queried from the database and stored in this
        summary object.  If the item is not available, an exception will be raised.

        Parameters
        ----------
        cnx : Database, optional
            Database connection to use for querying.
        items : Collection[str], optional
            The items to query.  If None, or if only "*" is given, then all
            available items will be queried.
        scenario : str, optional
            The scenario to use for querying.
        burn_samples : int, optional
            The number of burn samples to use for querying. If explicitly `None`,
            the burn_samples value from the configuration will be used if available,
            otherwise the default value of 100 will be used.
        """
        if cnx is None:
            cnx = self.cnx
        if items is None or len(items) == 1 and "*" in items:
            items = self._std_query.keys()
        else:
            items = set(items)
        if burn_samples is None:
            if self.config is not None:
                burn_samples = self.config.simulation_controls.burn_samples
            elif self.sim is not None:
                burn_samples = self.sim.config.simulation_controls.burn_samples
        if burn_samples is None:
            burn_samples = 100
        for name, query in self._std_query.items():
            if name in items:
                if cnx is None:
                    warnings.warn(f"no database connection available for {name}", stacklevel=2)
                    self._data[name] = ValueError(f"no database connection available for {name}")
                else:
                    try:
                        self._data[name] = query(cnx, scenario=scenario, burn_samples=burn_samples)
                    except Exception as e:
                        warnings.warn(f"error in query for {name}: {e}", stacklevel=2)
                        self._data[name] = e
        return self



[docs]
    @classmethod
    def aggregate(cls, summaries: Collection[GenericSimulationTables]) -> Self:
        """Combine several summary objects into one.

        Every aggregation function registered in ``_std_agg`` is applied to
        `summaries`.  The result also records the inputs as
        ``meta_summaries`` and the sums of their ``n_total_samples`` and
        ``callback_data``.  An empty input yields an empty summary and a
        warning.
        """
        if not summaries:
            warnings.warn("no summaries available", stacklevel=2)
            return cls({})

        combined = cls({})
        for name, func in cls._std_agg.items():
            if func is None:
                continue
            combined._data[name] = func(summaries)
        combined.meta_summaries = summaries
        combined.n_total_samples = sum(s.n_total_samples for s in summaries)
        combined.callback_data = sum(s.callback_data for s in summaries)
        return combined


    def __getstate__(self):
        state = self.__dict__.copy()
        if "cnx" in state:
            del state["cnx"]
        if "sim" in state:
            del state["sim"]
        if "config" in state:
            if state.get("_preserve_config", False):
                state["_config_yaml"] = state["config"].to_yaml()
            del state["config"]
        if "meta_trials" in state and not state.get("_preserve_meta_trials", True):
            del state["meta_trials"]
        if "_preserve_meta_trials" in state:
            del state["_preserve_meta_trials"]
        if "_preserve_config" in state:
            del state["_preserve_config"]
        return state

    def __setstate__(self, state):
        if "_config_yaml" in state:
            content = state.pop("_config_yaml")
            try:
                state["config"] = Config.from_raw_yaml(content)
            except Exception:
                try:
                    if isinstance(content, bytes):
                        content_lines = content.decode("utf-8").split("\n")
                    else:
                        content_lines = content.split("\n")
                    for i, line in enumerate(content_lines):
                        print(f"{i + 1:>4} | {line}")
                except Exception:
                    pass
                raise
        self.__dict__.update(state)
        if "cnx" not in self.__dict__:
            self.cnx = None
        if "sim" not in self.__dict__:
            self.sim = None
        if "_config" not in self.__dict__:
            self._config = None
        if "n_total_samples" not in self.__dict__:
            self.n_total_samples = 0
        if "_metadata" not in self.__dict__:
            self._metadata = {}
        if "_callback_data" not in self.__dict__:
            self._callback_data = CallbackData()


[docs]
    def to_pickle(
        self,
        filename: str | pathlib.Path,
        add_timestamp_ext: bool = True,
        *,
        preserve_meta_summaries: bool = False,
        preserve_config: bool = True,
        make_dirs: Literal[True, False, "git"] = True,
    ) -> pathlib.Path:
        """Save to a pickle file.

        This method uses lz4 compression if the lz4.frame module is available.

        Parameters
        ----------
        filename : str or Path-like
            The filename to save the object to.  An extension map be added or
            modified, to optionally add a time stamp and/or compression flag.
        add_timestamp_ext : bool, default True
            Add a timestamp extension to the filename.
        preserve_meta_summaries : bool, default False
            Preserve the meta_summaries attribute in the saved object.
        preserve_config : bool, default False
            Preserve the config attribute in the saved object.  This includes
            the entire network, and can potentially be a lot of data.
        make_dirs : bool or "git", default True
            If True, create the parent directory for the pickle file if it does
            not already exist.  If the directory is created, it will be created
            with a `.gitignore` file to prevent accidental inclusion of pickled
            output in Git repositories, unless the value is "git", in which case
            no `.gitignore` file is created and the results will be eligible for
            inclusion in Git.

        Returns
        -------
        Path-like
            The resolved filename for the saved outputs.
        """
        if add_timestamp_ext:
            filename = filename_with_timestamp(filename, suffix=".pkl")
        else:
            filename = pathlib.Path(filename)
        if make_dirs:
            if not filename.parent.exists():
                filename.parent.mkdir(parents=True, exist_ok=True)
                if make_dirs != "git":
                    with open(filename.parent / ".gitignore", "w") as f:
                        f.write(".gitignore\n")  # ignore this file itself
                        f.write("*.pkl\n")  # ignore pickles
                        f.write("*.pkl.lz4\n")  # ignore compressed pickles

        try:
            import lz4.frame
        except ImportError:
            with open(filename, "wb") as f:
                self._preserve_meta_summaries = preserve_meta_summaries
                self._preserve_config = preserve_config
                pickle.dump(self, f)
                del self._preserve_meta_summaries
                del self._preserve_config
            return filename
        else:
            use_filename = filename.with_suffix(filename.suffix + ".lz4")
            with lz4.frame.open(use_filename, "wb") as f:
                self._preserve_meta_summaries = preserve_meta_summaries
                self._preserve_config = preserve_config
                pickle.dump(self, f)
                del self._preserve_meta_summaries
                del self._preserve_config
            return use_filename



[docs]
    @classmethod
    def from_pickle(cls, filename: str | pathlib.Path, read_latest: bool = True):
        """Load the object from a pickle file.

        If the ``lz4.frame`` module can be imported, an lz4-compressed file is
        tried first; a file that fails lz4 decompression is re-read as a plain
        pickle.  Otherwise, or if no compressed file is found, a plain pickle
        file is read.

        Parameters
        ----------
        filename : str or Path-like
            The filename to load the object from.
        read_latest : bool, default True
            If True, read the latest file matching the pattern.  The pattern
            replaces the suffix of `filename` with ``.*.pkl.lz4`` (or
            ``.*.pkl``), and the last match in sorted order is used.  If
            nothing matches, `filename` itself is used when it exists.

        Returns
        -------
        object
            The unpickled object.  If it has a ``_metadata`` attribute, the
            keys ``loaded.filename`` and ``loaded.time`` are set on it.

        Raises
        ------
        FileNotFoundError
            If `read_latest` is set, nothing matches the pattern, and
            `filename` does not exist.
        RuntimeError
            If unpickling an lz4 file fails.
        TypeError
            On the plain-pickle path only, if the class name of the loaded
            object differs from ``cls.__name__``.
        """
        # NOTE(review): unpickling executes code from the file; only load
        # files from trusted sources.
        try:
            import lz4.frame
        except ImportError:
            pass
        else:
            # first try lz4 compressed files if available
            try:
                if read_latest:
                    filename_glob = pathlib.Path(filename).with_suffix(".*.pkl.lz4")
                    files = sorted(glob.glob(str(filename_glob)))
                    if not files:
                        if not os.path.exists(filename):
                            raise FileNotFoundError(filename)
                    else:
                        filename = files[-1]

                try:
                    with lz4.frame.open(filename, "rb") as f:
                        try:
                            result = pickle.load(f)
                        except Exception as e:
                            raise RuntimeError(f"Error loading {filename}: {e}") from e
                        # NOTE(review): the class-name check is disabled here
                        # but still active on the plain-pickle path at the end
                        # of this method — confirm which behavior is intended.
                        # if result.__class__.__name__ != cls.__name__:
                        #     raise TypeError(f"Expected {cls}, got {type(result)}")
                        if hasattr(result, "_metadata"):
                            result._metadata["loaded.filename"] = filename
                            result._metadata["loaded.time"] = datetime.now(UTC).isoformat()
                        return result
                except RuntimeError as err:
                    if "LZ4F_decompress failed" in str(err):
                        # lz4 frame error, try uncompressed file
                        with open(filename, "rb") as f:
                            result = pickle.load(f)
                            # if result.__class__.__name__ != cls.__name__:
                            #     raise TypeError(f"Expected {cls}, got {type(result)}")
                            if hasattr(result, "_metadata"):
                                result._metadata["loaded.filename"] = filename
                                result._metadata["loaded.time"] = datetime.now(UTC).isoformat()
                            return result
                    # any other RuntimeError is propagated to the caller
                    raise
            except FileNotFoundError:
                # no compressed file found: fall through to the plain-pickle path
                pass

        if read_latest:
            filename_glob = pathlib.Path(filename).with_suffix(".*.pkl")
            files = sorted(glob.glob(str(filename_glob)))
            if not files:
                if not os.path.exists(filename):
                    raise FileNotFoundError(filename)
            else:
                filename = files[-1]

        with open(filename, "rb") as f:
            result = pickle.load(f)
            if result.__class__.__name__ != cls.__name__:
                raise TypeError(f"Expected {cls}, got {type(result)}")
            if hasattr(result, "_metadata"):
                result._metadata["loaded.filename"] = filename
                result._metadata["loaded.time"] = datetime.now(UTC).isoformat()
            return result



[docs]
    def to_file(
        self,
        filename: str | pathlib.Path,
        add_timestamp_ext: bool = True,
        *,
        preserve_config: bool = True,
        make_dirs: Literal[True, False, "git"] = True,
    ) -> pathlib.Path:
        """Write simulation tables to a file.

        Parameters
        ----------
        filename : Path-like
            The file to write.
        add_timestamp_ext : bool, default True
            Add a timestamp extension to the filename.
        preserve_config : bool, default True
            Preserve the config attribute in the saved object.  This includes
            the entire network, and can potentially be a lot of data.  If no
            config is available, a warning is issued and none is saved.
        make_dirs : bool or "git", default True
            If True, create the parent directory for the file if it does
            not already exist.  If the directory is created, it will be created
            with a `.gitignore` file to prevent accidental inclusion of output
            in Git repositories, unless the value is "git", in which case
            no `.gitignore` file is created and the results will be eligible for
            inclusion in Git.

        Returns
        -------
        Path-like
            The resolved filename for the saved outputs.
        """
        if add_timestamp_ext:
            filename = filename_with_timestamp(filename, suffix=".pxsim")
        else:
            filename = pathlib.Path(filename)
        if make_dirs:
            git_ignores = ["*.pxsim", "*.pkl.lz4", "*.pkl"] if make_dirs != "git" else False
            make_parent_directory(filename, git_ignores)

        # Only treat the config as saved when there actually is one; summaries
        # built without a config would otherwise fail on `None.model_dump`.
        config = self.config if preserve_config else None
        if preserve_config and config is None:
            warnings.warn("no config available to preserve; writing file without it", stacklevel=2)

        kvs = KVStore(filename)
        try:
            for k, v in self._data.items():
                if config is not None and k.endswith("_defs"):
                    # do not save *_defs tables, as they can be regenerated from the
                    # config (which is being saved alongside them)
                    continue
                if k.endswith("_") and not k.startswith("_"):
                    # do not save data with names that end with "_" but do not begin
                    # with "_", as these are cached joins that are not meant to be saved
                    continue
                kvs[k] = v
            if config is not None:
                kvs["_config_"] = config.model_dump(serialize_as_any=True)
            kvs["_metadata_"] = self._metadata
            kvs["_n_total_samples_"] = self.n_total_samples
            if self.callback_data:
                kvs["_callback_data_"] = self.callback_data
        finally:
            # close the store even if a write fails part-way through
            kvs.close()
        return filename



[docs]
    @classmethod
    def from_file(cls, filename: str | pathlib.Path, read_latest: bool = True, lazy: bool = True):
        """Load the object from a file.

        Parameters
        ----------
        filename : str or Path-like
            The filename to load the object from.
        read_latest : bool, default True
            If True, read the latest file matching the pattern.
        lazy : bool, default True
            If True, load the data lazily (as needed).  Otherwise, load the data
            immediately.
        """

        # if the file is a *.pkl or *.pkl.lz4 file, read it with the from_pickle method instead
        if str(filename).endswith(".pkl") or str(filename).endswith(".pkl.lz4"):
            return cls.from_pickle(filename, read_latest=read_latest)

        if read_latest:
            filename_glob = pathlib.Path(filename).with_suffix(".*.pxsim")
            files = sorted(glob.glob(str(filename_glob)))
            if not files:
                if not os.path.exists(filename):
                    raise FileNotFoundError(filename)
            else:
                filename = files[-1]

        result = cls()
        result._file_store = KVStore(filename)
        result._metadata = result._file_store["_metadata_"]
        result.n_total_samples = result._file_store["_n_total_samples_"]
        result._metadata["store.filename"] = filename
        if not lazy:
            for k in result._file_store:
                if not (k.startswith("_") and k.endswith("_")):
                    result._data[k] = result._file_store[k]
                if k == "_callback_data_":
                    result._callback_data = result._file_store[k]
                if k == "_config_":
                    try:
                        temp = result._file_store["_config_"]
                    except KeyError:
                        pass
                    else:
                        if isinstance(temp, dict):
                            temp = Config.model_validate(temp)
                        result._config = temp
        return result



[docs]
    def file_info(self):
        """Describe the attached file store as text.

        Returns ``"No file store"`` when none is attached.  Otherwise the
        text names the store file and lists each stored element with its
        size, largest first.
        """
        from passengersim.utils.si import si_units

        if self._file_store is None:
            return "No file store"

        sizes = pd.Series(self._file_store.get_sizes()).sort_values(ascending=False)
        lines = [
            f"File store: {self.metadata('store.filename')}",
            f"  {'Data Element':30} Disk Usage",
        ]
        lines.extend(f"* {k:30} {si_units(v, 'B')}" for k, v in sizes.items())
        return "\n".join(lines)



[docs]
    def remove_data(self, keys: Collection[str] | str) -> Self:
        """Remove data from the summary tables.

        This can be used to reduce the size of the summary tables when saving
        to a file, or to remove sensitive data before sharing the summary tables.

        Parameters
        ----------
        keys : Collection[str] or str
            The key(s) of the data to remove.

        Returns
        -------
        Self
            The summary tables object, with the specified data removed.
        """
        if isinstance(keys, str):
            keys = [keys]
        for key in keys:
            if key in self._data:
                del self._data[key]
            if self._file_store is not None and key in self._file_store:
                del self._file_store[key]
        if self._file_store is not None:
            self._file_store.vacuum()
        return self



[docs]
    def to_xlsx(self, filename: str | pathlib.Path) -> None:
        """Write every stored DataFrame to an Excel workbook.

        Each DataFrame becomes one sheet named after its key; stored values
        that are not DataFrames are skipped.  The parent directory is created
        if needed.

        Parameters
        ----------
        filename : Path-like
            The excel file to write.
        """
        if isinstance(filename, str):
            filename = pathlib.Path(filename)
        filename.parent.mkdir(exist_ok=True, parents=True)
        with pd.ExcelWriter(filename) as writer:
            for sheet, table in self._data.items():
                if not isinstance(table, pd.DataFrame):
                    continue
                table.to_excel(writer, sheet_name=sheet)



[docs]
    def to_html(
        self,
        filename: str | pathlib.Path,
        *,
        cfg: Config | None = None,
        make_dirs: bool = True,
        extra: tuple = (),
        add_timestamp: bool = True,
    ) -> pathlib.Path:
        """Write an HTML report of these simulation tables.

        This forwards to ``passengersim.reporting.html.to_html``.

        Parameters
        ----------
        filename : Path-like
            The html file to write.
        cfg : Config, optional
            The configuration to use for the report.  If None, the
            configuration from the simulation object will be used.
        make_dirs : bool, default True
            If True, create any necessary directories.
        extra : tuple, optional
            Additional content for the report.  Each item should be either a
            section or subsection title, a tuple of (title, func), or just a
            function.  A function receives the summary as its only argument
            and returns a figure (altair.Chart or xmle.Elem) or a table
            (pandas.DataFrame).  Use `functools.partial` to supply any other
            arguments a function needs.
        add_timestamp : bool, default True
            If True, append a timestamp to the filename, so that each report
            is unique and does not overwrite earlier ones.  Set this to False
            to use the filename as-is, for example to overwrite an earlier
            report or when the timestamp has already been applied.

        Returns
        -------
        Path-like
            The resolved filename for the saved outputs.
        """
        from passengersim.reporting.html import to_html as write_report

        options = {
            "cfg": cfg,
            "make_dirs": make_dirs,
            "extra": extra,
            "add_timestamp": add_timestamp,
        }
        return write_report(self, filename, **options)



[docs]
    def save(
        self,
        filename: str | pathlib.Path,
        *,
        timestamp: float | time.struct_time | datetime | None = None,
        make_dirs: Literal[True, False, "git"] = True,
        cfg: Config | None = None,
        extra_html: tuple = (),
    ) -> dict[str, pathlib.Path]:
        """Save the object to a set of files.

        This method will write both an HTML report on this simulation tables
        object and a ".pxsim" file allowing the content to be restored.  Both
        files share the same timestamped stem.

        Parameters
        ----------
        filename : Path-like
            The file stem to use for writing files.
        timestamp : float or time.struct_time or datetime, optional
            The timestamp to use for the filenames.  If not provided, the current
            time will be used.
        make_dirs : bool or "git", default True
            If True, create the parent directory for the files if it does not
            already exist.  If the directory is created, it will be created with
            a `.gitignore` file to prevent accidental inclusion of output in Git
            repositories, unless the value is "git", in which case no `.gitignore`
            file is created and the results will be eligible for inclusion in Git.
        cfg : Config, optional
            The configuration to use for the HTML report.  If None, the configuration
            from the simulation object will be used if available.
        extra_html : tuple, optional
            Additional data to include in the HTML report. This argument is passed
            to `to_html`, see that function for more details.

        Returns
        -------
        dict
            A dictionary of filenames written, including the timestamp added.
        """
        if make_dirs:
            make_parent_directory(
                filename,
                git_ignore_things=False if make_dirs == "git" else ["*.pxsim", "*.html"],
            )
        filename = pathlib.Path(filename)
        filenames = filenames_with_timestamp(filename, timestamp=timestamp, suffix=[".pxsim", ".html"])
        # The names above already carry the timestamp, so neither writer may add
        # another one; otherwise the written files would not match the returned names.
        self.to_html(
            filenames[".html"],
            cfg=cfg,
            make_dirs=False,
            extra=extra_html,
            add_timestamp=False,
        )
        self.to_file(filenames[".pxsim"], make_dirs=False, add_timestamp_ext=False)
        return filenames



[docs]
    def metadata(self, key: str = ""):
        """Return a metadata value."""
        if key in self._metadata:
            return self._metadata[key]
        if "." in key:
            # dotted keys are always exact matches
            raise KeyError(key)
        if key == "":
            return self._metadata.copy()
        matches = {}
        for k in self._metadata:
            subkeys = k.split(".")
            subkey = subkeys[0]
            others = ".".join(subkeys[1:])
            if subkey == key:
                matches[others] = self._metadata[k]
        if not matches:
            raise KeyError(key)
        return matches


    @property
    def config(self):
        if self._config is None and self._file_store is not None:
            try:
                temp = self._file_store["_config_"]
            except KeyError:
                pass
            else:
                if isinstance(temp, dict):
                    temp = Config.model_validate(temp)
                self._config = temp
        return self._config

    @config.setter
    def config(self, value):
        self._config = value

    @config.deleter
    def config(self):
        self._config = None

    @property
    def callback_data(self):
        if not self._callback_data and self._file_store is not None:
            try:
                self._callback_data = self._file_store["_callback_data_"]
            except KeyError:
                pass
        return self._callback_data

    @callback_data.setter
    def callback_data(self, value):
        self._callback_data = value

    @callback_data.deleter
    def callback_data(self):
        self._callback_data = CallbackData()