Source code for amici.petab.petab_importer

"""PEtab v2 handling.

Functionality for importing and simulating
`PEtab v2 <https://petab.readthedocs.io/en/latest/v2/documentation_data_format.html#>`__
problems.

The relevant classes are:

* :class:`PetabImporter`: Import a PEtab problem as an AMICI model.
* :class:`PetabSimulator`: Simulate PEtab problems with AMICI.
* :class:`ExperimentManager`: Create :class:`amici.ExpData` objects for PEtab
  experiments.

See :doc:`/examples/example_petab/petab_v2` for example usage.
"""

from __future__ import annotations

import copy
import logging
import numbers
from collections import Counter
from collections.abc import Sequence
from pathlib import Path
from pprint import pprint
from typing import TYPE_CHECKING, Any

import numpy as np
import pandas as pd
import sympy as sp
from petab import v1 as v1
from petab import v2 as v2
from petab.v2 import ExperimentPeriod, Observable
from petab.v2.converters import ExperimentsToSbmlConverter
from petab.v2.models import MODEL_TYPE_PYSB, MODEL_TYPE_SBML

import amici

from .. import MeasurementChannel, SensitivityOrder, get_model_dir
from ..de_model import DEModel
from ..import_utils import amici_time_symbol
from ..logging import get_logger
from .sbml_import import _add_global_parameter
from .simulations import EDATAS, LLH, RDATAS, RES, S2LLH, SLLH, SRES

if TYPE_CHECKING:
    import pysb

    import amici.de_model_components

__all__ = [
    "PetabImporter",
    "ExperimentManager",
    "PetabSimulator",
    "rdatas_to_measurement_df",
    "rdatas_to_simulation_df",
    "flatten_timepoint_specific_output_overrides",
    "unflatten_simulation_df",
    "has_timepoint_specific_overrides",
    "EDATAS",
    "RDATAS",
    "LLH",
    "SLLH",
    "S2LLH",
    "RES",
    "SRES",
]
logger = get_logger(__name__, log_level=logging.INFO)


#: Default experiment ID to be used for measurements without an experiment ID.
_DEFAULT_EXPERIMENT_ID = "__default__"

#: PEtab measurement table columns to consider for detecting timepoint-specific
#:  parameter overrides
_POSSIBLE_GROUPVARS_FLATTENED_PROBLEM = [
    v2.C.MODEL_ID,
    v2.C.EXPERIMENT_ID,
    v2.C.OBSERVABLE_ID,
    v2.C.OBSERVABLE_PARAMETERS,
    v2.C.NOISE_PARAMETERS,
]

# TODO: how to handle SBML vs PySB, jax vs sundials?
#  -> separate importers or subclasses?
# TODO: How to handle multi-model-problems?



[docs]
class PetabImporter:
    """
    Importer for PEtab2 problems.

    This class is used to create an AMICI model from a PEtab problem.

    The underlying SBML or PySB model will be modified to encode the
    experiments defined in the PEtab problem as events or initial conditions.

    Be careful when using the imported model for anything other than the
    PEtab-encoded experiments.

    All PEtab experiments will be encoded in the model, independent of
    whether they have measurements. This is to make it easier to simulate
    the respective experiments with the resulting AMICI model.
    This may make the resulting model more bloated. If this is not desired,
    the problem should be simplified before import.

    :param petab_problem:
        The PEtab problem to import. The problem must not be changed after
        construction of the importer.
    """

    # TODO remove: extra debug output
    _debug = False


[docs]
    def __init__(
        self,
        petab_problem: v2.Problem | v1.Problem,
        *,
        compile_: bool = None,
        validate: bool = True,
        module_name: str = None,
        # TODO: model_id for selecting the model in multi-model problems
        # model_id: str = None,
        outdir: str | Path = None,
        jax: bool = False,
        output_parameter_defaults: dict[str, float] | None = None,
        verbose: int | bool = logging.INFO,
        non_estimated_parameters_as_constants: bool = True,
    ):
        """
        Create a new PetabImporter instance.

        :param petab_problem: The PEtab problem to import.
        :param compile_: Whether to compile the model extension after import.
        :param validate: Whether to validate the PEtab problem before import.
        :param module_name: The name of model module to generate.
        :param outdir:
            The output directory where the model files are written to.
        :param jax: Whether to generate a JAX model instead of a
            SUNDIALS model. Currently, only ``False`` is supported.
        :param output_parameter_defaults:
            Optional default parameter values for output parameters introduced
            in the PEtab observables table, in particular for placeholder
            parameters. A dictionary mapping parameter IDs to default values.
        :param verbose:
            The verbosity level. If ``True``, set to ``logging.INFO``.
            If ``False``, set to ``logging.WARNING``. Otherwise, use the given
            logging level.
        :param non_estimated_parameters_as_constants:
            Whether parameters marked as non-estimated in PEtab should be
            considered constant in AMICI. Setting this to ``True`` will reduce
            model size and simulation times. If sensitivities with respect to
            those parameters are required, this should be set to ``False``.
        """
        self.petab_problem: v2.Problem = self._upgrade_or_copy_if_needed(
            petab_problem
        )
        self._verbose = (
            logging.INFO
            if verbose is True
            else logging.WARNING
            if verbose is False
            else verbose
        )
        self._output_parameter_defaults = output_parameter_defaults

        if len(self.petab_problem.models) > 1:
            raise NotImplementedError(
                "PEtab v2 importer currently only supports single-model "
                "problems."
            )

        if self.petab_problem.model.type_id not in (
            MODEL_TYPE_SBML,
            MODEL_TYPE_PYSB,
        ):
            raise NotImplementedError(
                "PEtab v2 importer currently only supports SBML and PySB "
                f"models. Got {self.petab_problem.model.type_id!r}."
            )
        if jax:
            raise NotImplementedError(
                "PEtab v2 importer currently does not support JAX. "
            )

        if self._debug:
            print("PetabImpoter.__init__: petab_problem:")
            pprint(self.petab_problem.model_dump())
            if self.petab_problem.model.type_id == MODEL_TYPE_SBML:
                print(self.petab_problem.model.to_antimony())
            elif self.petab_problem.model.type_id == MODEL_TYPE_PYSB:
                print(self.petab_problem.model.to_str())

        self._compile = not jax if compile_ is None else compile_
        self._sym_model: DEModel | None = None
        self._model_id = self.petab_problem.model.model_id
        self._module_name = module_name or (
            f"{self.petab_problem.id}_{self.model_id}"
            if self.petab_problem.id
            else self.model_id
        )
        if self._module_name is None:
            raise ValueError(
                "No `module_name` was provided and no model ID "
                "was specified in the PEtab problem."
            )

        self._outdir: Path | None = (
            None if outdir is None else Path(outdir).absolute()
        )
        self._jax = jax
        self._non_estimated_parameters_as_constants: bool = (
            non_estimated_parameters_as_constants
        )

        if validate:
            logger.info("Validating PEtab problem ...")
            validation_result = petab_problem.validate()
            if validation_result:
                validation_result.log()

            if validation_result.has_errors():
                raise ValueError(
                    "PEtab problem is not valid, see log messages for details."
                )

        # ensure each measurement has an experimentId to simplify processing
        _set_default_experiment(self.petab_problem)

        if self.petab_problem.model.type_id == MODEL_TYPE_SBML:
            self._preprocess_sbml()
        elif self.petab_problem.model.type_id == MODEL_TYPE_PYSB:
            self._preprocess_pysb()
        else:
            raise AssertionError()


    def _preprocess_sbml(self):
        """Pre-process the SBML-based PEtab problem to make it
        amici-compatible."""
        from petab.v2.models.sbml_model import SbmlModel

        if not isinstance(self.petab_problem.model, SbmlModel):
            raise ValueError("The PEtab problem must contain an SBML model.")

        # Convert petab experiments to events, because so far,
        #  AMICI only supports preequilibration/presimulation/simulation, but
        #  no arbitrary list of periods.
        exp_event_conv = ExperimentsToSbmlConverter(self.petab_problem)
        # This will always create a copy of the problem.
        self.petab_problem = exp_event_conv.convert()
        for experiment in self.petab_problem.experiments:
            if len(experiment.periods) > 2:
                # This should never happen due to the conversion above
                raise NotImplementedError(
                    "AMICI currently does not support more than two periods."
                )

        if self._debug:
            print("PetabImpoter._preprocess_sbml: petab_problem:")
            pprint(self.petab_problem.model_dump())
            print(self.petab_problem.model.to_antimony())

    def _preprocess_pysb(self):
        """Pre-process the PySB-based PEtab problem to make it
        amici-compatible."""
        import pysb
        from petab.v2.models.pysb_model import PySBModel

        if not isinstance(self.petab_problem.model, PySBModel):
            raise ValueError("The PEtab problem must contain a PySB model.")

        _add_observation_model_pysb(self.petab_problem, self._jax)
        # TODO: clarify in PEtab whether its allowed to set initial amounts
        #  for a species without a pysb.Initial.
        #  Currently, we fail in that case.
        #  If so add a test case for changing the initial amount for a species
        #  without a pysb.Initial
        #  fixed_parameters = _add_initialization_variables(pysb_model,
        #                                                 petab_problem)

        pysb.bng.generate_equations(self.petab_problem.model.model)

        # Convert PEtab v2 experiments/conditions to events
        converter = ExperimentsToPySBConverter(self.petab_problem)
        self.petab_problem, self._events = converter.convert()

    def _upgrade_or_copy_if_needed(
        self, problem: v1.Problem | v2.Problem
    ) -> v2.Problem:
        """Upgrade the problem to petab v2 if necessary.
        Otherwise, create a deep copy of the problem."""
        if isinstance(problem, v2.Problem):
            return copy.deepcopy(problem)

        raise NotImplementedError(
            "'petab_problem' must be a `petab.v2.Problem`. "
            "`petab.v1.Problem` is not directly supported, but "
            "file-based PEtab v1 problems can be upgraded via "
            "`petab.v2.Problem.from_yaml(petab_v1_yaml_file)`."
        )

    @property
    def model_id(self) -> str:
        """The model ID."""
        if self._model_id is None:
            self._model_id = self.petab_problem.model.model_id

        return self._model_id

    @property
    def outdir(self) -> Path:
        """The output directory where the model files are written to."""
        if self._outdir is None:
            self._outdir = get_model_dir(self._module_name, jax=self._jax)
        return self._outdir

    def _do_import_sbml(self):
        """Import the model.

        Generate the symbolic model according to the given PEtab problem and
        generate the corresponding Python module.

        1. Encode all PEtab experiments as events and initial assignments
           in the SBML model.
           This leaves only (maybe) a pre-equilibration and a single
           simulation period.
        2. Add the observable parameters to the SBML model.
        """
        logger.info(f"Importing model {self.model_id!r}...")

        if not self.petab_problem.observables:
            raise NotImplementedError(
                "PEtab import without observables table "
                "is currently not supported."
            )

        logger.info(
            f"Module name is '{self._module_name}'.\n"
            f"Writing model code to '{self.outdir}'."
        )

        observation_model = self._get_observation_model()

        logger.info(f"#Observables: {len(observation_model)}")
        logger.debug(f"Observables: {observation_model}")

        self._workaround_observable_parameters_sbml(
            output_parameter_defaults=self._output_parameter_defaults,
        )

        # All indicator variables, i.e., all remaining targets after
        #  experiments-to-event in the PEtab problem must be converted
        #  to fixed parameters
        fixed_parameters = {
            change.target_id
            for experiment in self.petab_problem.experiments
            for period in experiment.periods
            for condition_id in period.condition_ids
            for change in self.petab_problem[condition_id].changes
        }

        from amici.petab.sbml_import import show_model_info

        show_model_info(self.petab_problem.model.sbml_model)
        sbml_importer = amici.SbmlImporter(
            self.petab_problem.model.sbml_model,
        )

        self._check_placeholders()

        fixed_parameters |= _get_fixed_parameters_sbml(
            petab_problem=self.petab_problem,
            non_estimated_parameters_as_constants=self._non_estimated_parameters_as_constants,
        )

        fixed_parameters = list(sorted(fixed_parameters))
        logger.info(f"Number of fixed parameters: {len(fixed_parameters)}")
        logger.debug(f"Fixed parameters are {fixed_parameters}")

        # Create Python module from SBML model
        if self._jax:
            sbml_importer.sbml2jax(
                model_name=self._module_name,
                output_dir=self.outdir,
                observation_model=observation_model,
                verbose=self._verbose,
                # **kwargs,
            )
            return sbml_importer
        else:
            # TODO:
            allow_reinit_fixpar_initcond = True
            sbml_importer.sbml2amici(
                model_name=self._module_name,
                output_dir=self.outdir,
                observation_model=observation_model,
                constant_parameters=fixed_parameters,
                allow_reinit_fixpar_initcond=allow_reinit_fixpar_initcond,
                verbose=self._verbose,
                compile=self._compile,
                # FIXME: simplification takes ages for Smith_BMCSystBiol2013
                #  due to nested piecewises / Heavisides?!
                simplify=None,
                # **kwargs,
            )
        # TODO check_model(amici_model=model, petab_problem=petab_problem)

        return sbml_importer

    def _do_import_pysb(
        self,
    ):
        """Import the PySB model.

        Generate the symbolic model according to the given PEtab problem and
        generate the corresponding Python module.
        """
        logger.info(f"Importing PySB model {self.model_id!r}...")

        if not self.petab_problem.observables:
            raise NotImplementedError(
                "PEtab import without observables table "
                "is currently not supported."
            )

        logger.info(
            f"Module name is '{self._module_name}'.\n"
            f"Writing model code to '{self.outdir}'."
        )

        observation_model = self._get_observation_model()

        logger.info(f"#Observables: {len(observation_model)}")
        logger.debug(f"Observables: {observation_model}")

        pysb_model = self.petab_problem.model.model

        # All indicator variables, i.e., all remaining targets after
        #  experiments-to-event in the PEtab problem must be converted
        #  to fixed parameters
        fixed_parameters = {
            change.target_id
            for experiment in self.petab_problem.experiments
            for period in experiment.periods
            for condition_id in period.condition_ids
            for change in self.petab_problem[condition_id].changes
        }
        # TODO: handle self._non_estimated_parameters_as_constants

        self._check_placeholders()
        fixed_parameters = list(sorted(fixed_parameters))

        logger.info(f"Number of fixed parameters: {len(fixed_parameters)}")
        logger.debug(f"Fixed parameters are {fixed_parameters}")

        from amici.pysb_import import pysb2amici, pysb2jax

        # Create Python module from PySB model
        if self._jax:
            pysb2jax(
                model=pysb_model,
                model_name=self._module_name,
                output_dir=self.outdir,
                observation_model=observation_model,
                verbose=self._verbose,
                pysb_model_has_obs_and_noise=True,
                # TODO: events
                # **kwargs,
            )
            return
        else:
            pysb2amici(
                model=pysb_model,
                model_name=self._module_name,
                output_dir=self.outdir,
                verbose=True,
                constant_parameters=fixed_parameters,
                observation_model=observation_model,
                pysb_model_has_obs_and_noise=True,
                compile=self._compile,
                _events=self._events,
                # **kwargs,
            )

        if self._compile:
            # check that the model extension was compiled successfully
            _ = self.import_module()
            # model = model_module.getModel()
            # TODO check_model(amici_model=model, petab_problem=petab_problem)

        return

    def _check_placeholders(self):
        # check for time-point-specific placeholders
        #  for now, we only support:
        #  * observable placeholders that are replaced by the same expression
        #    for all measurements for a given experiment
        #  * noise placeholders that are replaced by the same expression
        #    for all measurements for a given experiment
        #  * noise placeholders if there is only a single placeholder which
        #    is replaced by literals for all measurements for a given
        #    experiment
        for experiment in self.petab_problem.experiments:
            measurements = self.petab_problem.get_measurements_for_experiment(
                experiment
            )
            observable_overrides = {}
            noise_overrides = {}
            for measurement in measurements:
                observable_overrides.setdefault(
                    measurement.observable_id, set()
                ).add(tuple(measurement.observable_parameters))
                noise_overrides.setdefault(
                    measurement.observable_id, set()
                ).add(tuple(measurement.noise_parameters))

            for observable_id, overrides in observable_overrides.items():
                if len(overrides) > 1:
                    raise NotImplementedError(
                        f"Observable {observable_id} has multiple "
                        "timepoint-specific mappings for observable "
                        "parameters. "
                        "This is not supported by AMICI."
                    )
            for observable_id, overrides in noise_overrides.items():
                if len(overrides) > 1:
                    if len(next(iter(overrides))) == 1 and all(
                        isinstance(p[0], numbers.Number) for p in overrides
                    ):
                        continue

                    raise NotImplementedError(
                        f"Observable {observable_id} has multiple "
                        "timepoint-specific mappings for noise parameters. "
                        "This is not supported by AMICI."
                    )
                if len(overrides) == 1 and next(iter(overrides)) == ():
                    # this is a single literal, which is fine
                    continue
            if self._debug:
                print(experiment.id)
                print(observable_overrides)
                print(noise_overrides)

    def _workaround_observable_parameters_sbml(
        self, output_parameter_defaults: dict[str, float] = None
    ) -> None:
        """
        Add any output parameters that are introduced via PEtab to the model.

        This can be placeholder parameters or any other parameters that are
        introduced in observableFormula or noiseFormula in the observable
        table, or in observableParameters or noiseParameters in the measurement
        table.
        """
        problem = self.petab_problem
        output_parameters = problem.get_output_parameters()

        logger.debug(
            "Adding output parameters to model: "
            f"{list(sorted(output_parameters))}"
        )
        output_parameter_defaults = output_parameter_defaults or {}
        if extra_pars := (
            set(output_parameter_defaults) - set(output_parameters)
        ):
            raise ValueError(
                "Default output parameter values were given for "
                f"{extra_pars}, but they those are not output parameters."
            )

        for par in sorted(output_parameters):
            _add_global_parameter(
                sbml_model=problem.model.sbml_model,
                parameter_id=par,
                value=output_parameter_defaults.get(par, 0.0),
            )

    def _get_observation_model(
        self,
    ) -> list[MeasurementChannel]:
        """Get the observation model from the PEtab problem."""
        return [
            MeasurementChannel(
                id_=observable.id,
                name=observable.name or observable.id,
                formula=observable.formula,
                noise_distribution=observable.noise_distribution,
                sigma=observable.noise_formula,
            )
            for observable in self.petab_problem.observables or []
        ]


[docs]
    def import_module(self, force_import: bool = False) -> amici.ModelModule:
        """Import the generated model module.

        :param force_import:
            Whether to force re-import even if the model module already exists.
        :return: The imported model module.
        """
        if not self.outdir.is_dir() or force_import:
            if self.petab_problem.model.type_id == MODEL_TYPE_SBML:
                self._do_import_sbml()
            else:
                self._do_import_pysb()

        return amici.import_model_module(
            self._module_name,
            self.outdir,
        )



[docs]
    def create_model(self) -> amici.Model:
        """Create a :class:`amici.Model` instance from the imported model."""
        return self.import_module().get_model()



[docs]
    def create_simulator(self, force_import: bool = False) -> PetabSimulator:
        """
        Create a PEtab simulator for the imported model.

        :param force_import:
            Whether to force re-import even if the model module already exists.
        :return: The created PEtab simulator.
        """
        model = self.import_module(force_import=force_import).get_model()
        em = ExperimentManager(model=model, petab_problem=self.petab_problem)
        return PetabSimulator(em=em)





[docs]
class ExperimentManager:
    # TODO: support for pscale?
    """
    Handles the creation of :class:`ExpData` objects for a given model and
    PEtab problem.

    The assumption is that we have a set of :class:`amici.ExpData` objects,
    one for each PEtab experiment.
    Those are updated based on a set of global parameters (PEtab
    problem parameters, as opposed to model parameters for a single experiment
    period).
    """

    # TODO debug, remove
    _debug = False


[docs]
    def __init__(
        self,
        model: amici.Model,
        petab_problem: v2.Problem,
    ):
        """
        Initialize the `ExperimentManager`.

        :param model: The AMICI model to use.
        :param petab_problem: The PEtab problem to use.
            This is expected to be the output of
            :class:`petab.v2.ExperimentsToSbmlConverter` or an equivalent problem.
            This object must not be modified after the creation of this
            :class:`ExperimentManager` instance.
        """
        self._model: amici.Model = model
        self._petab_problem: v2.Problem = petab_problem
        self._state_ids: tuple[str, ...] = tuple(self._model.get_state_ids())
        self._parameter_ids: tuple[str, ...] = tuple(
            self._model.get_parameter_ids()
        )
        self._fixed_parameter_ids: tuple[str, ...] = tuple(
            self._model.get_fixed_parameter_ids()
        )
        # maps parameter IDs to parameter indices in the model
        self._pid_to_idx: dict[str, int] = {
            id_: i for i, id_ in enumerate(self._parameter_ids)
        }
        self._fixed_pid_to_idx: dict[str, int] = {
            id_: i for i, id_ in enumerate(self._fixed_parameter_ids)
        }
        # maps PEtab observable IDs to petab Observable instances
        self._petab_id_to_obs: dict[str, v2.Observable] = {
            obs.id: obs for obs in self._petab_problem.observables
        }

        # create a new model instance from the model module from which
        #  we can get the default parameters
        model0 = model.module.get_model()
        self._original_p = np.array(model0.get_parameters())
        self._original_k = np.array(model0.get_fixed_parameters())



[docs]
    def create_edatas(self) -> list[amici.ExpData]:
        """Create ExpData objects for all experiments."""
        return [
            self.create_edata(experiment)
            for experiment in self._petab_problem.experiments
        ]



[docs]
    def create_edata(
        self,
        experiment: v2.core.Experiment | str | None,
        problem_parameters: dict[str, float] | None = None,
    ) -> amici.ExpData:
        """Create an ExpData object for a single experiment.

        Sets timepoints, measurements, initial conditions, ... based on the
        given experiment and the nominal parameters of the PEtab problem.

        :param experiment:
            The experiment or experiment ID to create the `ExpData` for.
        :param problem_parameters:
            Optional dictionary of problem parameters to apply to the
            `ExpData`. If `None`, the nominal parameters of the PEtab problem
            are used.
        :return:
            The created `ExpData` object for the given experiment.
        """
        if isinstance(experiment, str):
            experiment = self._petab_problem[experiment]

        if len(experiment.periods) > 2:
            raise AssertionError(
                f"Expected <= 2 periods, got {len(experiment.periods)} "
                f"for experiment {experiment.id}."
            )

        edata = amici.ExpData(self._model)
        edata.id = experiment.id

        self._set_constants(edata, experiment)
        self._set_timepoints_and_measurements(edata, experiment)

        if self._debug:
            logger.debug(
                f"Created ExpData id={edata.id}, "
                f"k_preeq={edata.fixed_parameters_pre_equilibration}, "
                f"k={edata.fixed_parameters}"
            )

        if problem_parameters is None:
            problem_parameters = self._petab_problem.get_x_nominal_dict()
        self.apply_parameters(edata, problem_parameters=problem_parameters)

        return edata


    def _set_constants(
        self, edata: amici.ExpData, experiment: v2.core.Experiment
    ) -> None:
        """
        Set constant parameters for the given experiment.

        :param edata:
            The ExpData instance to set the constants for.
        :param experiment:
            The PEtab experiment to set the constants for.
        """
        # After converting experiments to events, all remaining
        # condition parameters are constants.
        if not experiment.periods:
            # No periods, no changes to apply.
            # Use the original fixed parameters that are encoded in the model.
            return

        def get_k(period: ExperimentPeriod):
            """Get the fixed parameters for the period."""
            changes = self._petab_problem.get_changes_for_period(period)
            fixed_pars_vals = self._original_k.copy()
            for change in changes:
                pid = self._fixed_pid_to_idx[change.target_id]
                # those are only indicator variables that are always number
                #  literals
                fixed_pars_vals[pid] = change.target_value
            return fixed_pars_vals

        if experiment.sorted_periods[0].time == -np.inf:
            # pre-equilibration period
            edata.fixed_parameters_pre_equilibration = get_k(
                experiment.sorted_periods[0]
            )
            # In PEtab, pre-equilibration always starts at t=0, since SBML
            # does not support specifying a different start time (yet).
            edata.t_start_preeq = 0

        if len(experiment.periods) >= int(1 + experiment.has_preequilibration):
            # simulation period
            main_period = experiment.sorted_periods[
                int(experiment.has_preequilibration)
            ]
            edata.fixed_parameters = get_k(main_period)
            edata.t_start = main_period.time

    def _set_timepoints_and_measurements(
        self, edata: amici.ExpData, experiment: v2.core.Experiment
    ) -> None:
        """
        Set timepoints and measurements for the given experiment.

        :param edata:
            The `ExpData` instance to update.
        :param experiment:
            The PEtab experiment to set the timepoints and measurements for.
        """
        # Get the required time points: this is the superset of timepoints
        #  of the measurements of all observables, including the different
        #  replicates
        measurements = self._petab_problem.get_measurements_for_experiment(
            experiment
        )
        t_counters = {o.id: Counter() for o in self._petab_problem.observables}
        unique_t = set()
        for m in measurements:
            t_counters[m.observable_id].update([m.time])
            unique_t.add(m.time)

        max_counter = Counter()
        for t in unique_t:
            for counter in t_counters.values():
                max_counter[t] = max(max_counter[t], counter[t])

        timepoints_w_reps = sorted(max_counter.elements())

        edata.set_timepoints(timepoints_w_reps)

        # measurements and sigmas
        y, sigma_y = self._get_measurements_and_sigmas(
            measurements=measurements,
            timepoints_w_reps=timepoints_w_reps,
            observable_ids=self._model.get_observable_ids(),
        )
        edata.set_observed_data(y.flatten())
        edata.set_observed_data_std_dev(sigma_y.flatten())

    def _get_measurements_and_sigmas(
        self,
        measurements: list[v2.Measurement],
        timepoints_w_reps: Sequence[numbers.Number],
        observable_ids: Sequence[str],
    ) -> tuple[np.ndarray, np.ndarray]:
        """
        Get measurements and sigmas

        Generate arrays with measured values and sigmas in AMICI format from a
        list of PEtab measurements.

        :param measurements:
            Subset of PEtab measurement table for one experiment
        :param timepoints_w_reps:
            Timepoints for which there exist measurements, including
            replicates.
        :param observable_ids:
            List of observable IDs for mapping IDs to indices.
        :return:
            arrays for measurement and sigmas
        """
        # prepare measurement matrix
        y = np.full(
            shape=(len(timepoints_w_reps), len(observable_ids)),
            fill_value=np.nan,
        )
        # prepare sigma matrix
        sigma_y = y.copy()

        time_to_meas = {}
        for m in measurements:
            time_to_meas.setdefault(m.time, []).append(m)

        for time in sorted(time_to_meas):
            # subselect for time
            time_ix_0 = timepoints_w_reps.index(time)

            # remember used time indices for each observable
            time_ix_for_obs_ix = {}

            # iterate over measurements
            for m in time_to_meas[time]:
                # extract observable index
                observable_ix = observable_ids.index(m.observable_id)

                # update time index for observable
                if observable_ix in time_ix_for_obs_ix:
                    time_ix_for_obs_ix[observable_ix] += 1
                else:
                    time_ix_for_obs_ix[observable_ix] = time_ix_0

                # fill observable and possibly noise parameter
                y[time_ix_for_obs_ix[observable_ix], observable_ix] = (
                    m.measurement
                )
                if (
                    len(m.noise_parameters) == 1
                    and m.noise_parameters[0].is_Number
                ):
                    sigma_y[
                        time_ix_for_obs_ix[observable_ix], observable_ix
                    ] = float(m.noise_parameters[0])
        return y, sigma_y


[docs]
    def apply_parameters(
        self, edata: amici.ExpData, problem_parameters: dict[str, float]
    ) -> None:
        """Apply problem parameters.

        Update the parameter-dependent values of the given `ExpData` instance
        according to the provided problem parameters (i.e., values of the
        parameters in the PEtab parameter table).

        This assumes that:

        * the `ExpData` instance was created by :meth:`create_edata`,
        * no other changes except for calls to :meth:`apply_parameters`
          were made,
        * and the PEtab problem was not modified since the creation of this
          :class:`ExperimentManager` instance.

        :param edata: The :class:`ExpData` instance to be updated.
            In case of errors, the state of `edata` is undefined.
        :param problem_parameters: Problem parameters to be applied.
        """
        # TODO: support ndarray in addition to dict?

        # check parameter IDs
        if set(problem_parameters) != set(self._petab_problem.x_ids):
            missing = set(self._petab_problem.x_ids) - set(problem_parameters)
            extra = set(problem_parameters) - set(self._petab_problem.x_ids)
            msg_parts = []
            if missing:
                # TODO: support a subset of parameters?
                #  if so, update only those parameters and leave the rest as is
                #  or use nominal values for missing ones?
                msg_parts.append(f"missing parameters: {missing}")
            if extra:
                msg_parts.append(f"unknown parameters: {extra}")
            raise ValueError(
                "Provided problem parameters do not match "
                "PEtab problem parameters: " + "; ".join(msg_parts)
            )

        # get the original parameter values
        #  (model parameters set during model creation)
        par_vals = np.array(self._original_p)
        pid_to_idx = self._pid_to_idx
        experiment_id = edata.id
        experiment = self._petab_problem[experiment_id]

        # plist -- estimated parameters + those mapped via placeholders
        # TODO sufficient to set them during creation of edata
        #   or allow dynamic fixing of parameters?
        plist = []
        placeholder_mappings = self._get_placeholder_mapping(experiment)
        estimated_par_ids = self._petab_problem.x_free_ids
        for model_par_idx, model_par_id in enumerate(
            self._model.get_parameter_ids()
        ):
            if model_par_id in estimated_par_ids or (
                (maps_to := placeholder_mappings.get(model_par_id)) is not None
                and maps_to in estimated_par_ids
            ):
                plist.append(model_par_idx)
        edata.plist = plist

        # Update fixed parameters in case they are affected by problem
        #  parameters (i.e., parameter table parameters)
        fixed_par_vals = np.asarray(edata.fixed_parameters)
        for p_id, p_val in problem_parameters.items():
            if (p_idx := self._fixed_pid_to_idx.get(p_id)) is not None:
                fixed_par_vals[p_idx] = p_val
        edata.fixed_parameters = fixed_par_vals

        if edata.fixed_parameters_pre_equilibration:
            fixed_par_vals = np.array(edata.fixed_parameters_pre_equilibration)
            for p_id, p_val in problem_parameters.items():
                if (p_idx := self._fixed_pid_to_idx.get(p_id)) is not None:
                    fixed_par_vals[p_idx] = p_val
            edata.fixed_parameters_pre_equilibration = fixed_par_vals

        # Apply problem parameter values to identical model parameters.
        #  Any other parameter mapping, except for output parameter
        #  placeholders, is handled by events.
        for k, v in problem_parameters.items():
            if (idx := pid_to_idx.get(k)) is not None:
                par_vals[idx] = v

        # Handle measurement-specific mappings to placeholders
        measurements = self._petab_problem.get_measurements_for_experiment(
            experiment
        )

        def apply_override(placeholder: str, override: sp.Basic):
            """Apply a single placeholder override."""
            if (idx := pid_to_idx.get(placeholder)) is not None:
                if override.is_Number:
                    par_vals[idx] = float(override)
                elif override.is_Symbol:
                    par_vals[idx] = problem_parameters[str(override)]
                else:
                    raise AssertionError(
                        f"Unexpected override type: {override} for {placeholder} in experiment {experiment_id}"
                    )
            else:
                raise NotImplementedError(
                    f"Cannot handle override `{placeholder}' => '{override}'"
                )

        # tracks encountered placeholders and their overrides
        # (across all observables -- placeholders IDs are globally unique)
        #  and check that all periods use the same overrides
        #  (except for numeric sigmas)
        # TODO: this can be simplified. we only need to process overrides
        #  that are parameters. the rest was handled during create_edata
        overrides = {}
        for m in measurements:
            obs = self._petab_id_to_obs[m.observable_id]
            if obs.observable_placeholders:
                for placeholder, override in zip(
                    obs.observable_placeholders,
                    m.observable_parameters,
                    strict=True,
                ):
                    placeholder = str(placeholder)
                    if (
                        prev_override := overrides.get(placeholder)
                    ) is not None and prev_override != override:
                        raise NotImplementedError(
                            "Timepoint-specific observable placeholder "
                            "overrides are not supported"
                        )
                    apply_override(placeholder, override)
            if obs.noise_placeholders:
                for placeholder, override in zip(
                    obs.noise_placeholders, m.noise_parameters, strict=True
                ):
                    placeholder = str(placeholder)
                    if (
                        prev_override := overrides.get(placeholder)
                    ) is not None and prev_override != override:
                        # TODO: this might have been handled
                        #  via .sigmay if numeric
                        raise NotImplementedError(
                            "Timepoint-specific observable placeholder "
                            "overrides are not supported"
                        )
                    apply_override(placeholder, override)

        # TODO: set all unused placeholders to NaN to make it easier to spot problems?
        edata.parameters = par_vals

        if self._debug:
            logger.debug("ExperimentManager.apply_parameters:")
            logger.debug(
                f"Parameters: "
                f"{dict(zip(self._parameter_ids, map(float, par_vals)))}"
            )


    @property
    def petab_problem(self) -> v2.Problem:
        """The PEtab problem used by this ExperimentManager.

        This must not be modified.
        """
        return self._petab_problem

    @property
    def model(self) -> amici.Model:
        """The AMICI model used by this ExperimentManager."""
        return self._model

    def _get_placeholder_mapping(
        self, experiment: v2.Experiment
    ) -> dict[str, str]:
        """Get the mapping from model parameter IDs (= PEtab placeholder ID)
        to problem parameter IDs for placeholders in the given experiment.

        Because AMICI does not support timepoint-specific overrides,
        this mapping is unique.

        :param experiment: The experiment to get the mapping for.
        :return: The mapping from model parameter IDs to problem parameter IDs.
        """
        mapping = {}
        for measurement in self._petab_problem.get_measurements_for_experiment(
            experiment
        ):
            observable = self._petab_problem[measurement.observable_id]
            for placeholder, override in zip(
                observable.observable_placeholders,
                measurement.observable_parameters,
                strict=True,
            ):
                # we don't care about numeric overrides here
                if isinstance(override, sp.Symbol):
                    mapping[str(placeholder)] = str(override)

            for placeholder, override in zip(
                observable.noise_placeholders,
                measurement.noise_parameters,
                strict=True,
            ):
                # we don't care about numeric overrides here
                if isinstance(override, sp.Symbol):
                    mapping[str(placeholder)] = str(override)
        return mapping




[docs]
class PetabSimulator:
    """
    Simulator for PEtab2 problems.

    This class is used to simulate all experiments of a given PEtab problem
    using a given AMICI model and solver, and to aggregate the results.
    """


[docs]
    def __init__(
        self,
        em: ExperimentManager,
        solver: amici.Solver | None = None,
        num_threads: int = 1,
        # TODO: allow selecting specific experiments?
        # TODO: store_edatas: bool
    ):
        """
        Initialize the simulator.

        :param em:
            The :class:`ExperimentManager` to generate the :class:`amici.ExpData`
            objects.
        :param solver: The AMICI solver to use for the simulations.
            If not provided, a new solver with default settings will be used.
        :param num_threads:
            The number of threads to use for parallel simulation of experiments.
            Only relevant if multiple experiments are present in the PEtab problem,
            and if AMICI was compiled with OpenMP support.
        """
        self._petab_problem: v2.Problem = em.petab_problem
        self._model = em.model
        self._solver = (
            solver if solver is not None else self._model.create_solver()
        )
        self._exp_man: ExperimentManager = em
        self.num_threads = num_threads


    @property
    def model(self) -> amici.Model:
        """The AMICI model used by this simulator."""
        return self._model

    @property
    def solver(self) -> amici.Solver:
        """The AMICI solver used by this simulator."""
        return self._solver

    @property
    def exp_man(self) -> ExperimentManager:
        """The ExperimentManager used by this simulator."""
        return self._exp_man


[docs]
    def simulate(
        self, problem_parameters: dict[str, float] = None
    ) -> dict[str, Any]:
        # TODO params: dict|np.ndarray|None?
        """Simulate all experiments of the given PEtab problem.

        :return:
            Dictionary of

            * the summed cost function value (``LLH``),
            * list of :class:`amici.amici.ReturnData` (``RDATAS``)
              for each experiment,
            * list of :class:`amici.amici.ExpData` (``EDATAS``)
              for each experiment

           Note that the returned :class:`amici.amici.ExpData` instances
           may be changed by subsequent calls to this function.
           Create a copy if needed.
        """
        if problem_parameters is None:
            # use default parameters, i.e., nominal values for all parameters
            # TODO: Nominal parameters, or previously used parameters?
            problem_parameters = {}

        # use nominal values for all unspecified parameters
        problem_parameters_default = self._petab_problem.get_x_nominal_dict()
        problem_parameters = problem_parameters_default | problem_parameters

        # TODO cache edatas
        edatas = self._exp_man.create_edatas()

        for edata in edatas:
            self._exp_man.apply_parameters(
                edata=edata, problem_parameters=problem_parameters
            )

        rdatas = amici.run_simulations(
            self._model, self._solver, edatas, num_threads=self.num_threads
        )

        return {
            EDATAS: edatas,
            RDATAS: rdatas,
            LLH: sum(rdata.llh for rdata in rdatas),
            SLLH: self._aggregate_sllh(rdatas),
            S2LLH: self._aggregate_s2llh(rdatas, use_fim=True),
            RES: np.hstack([rdata.res for rdata in rdatas]),
            # TODO: implement residual sensitivity aggregation
            SRES: None,
        }


    def _aggregate_sllh(
        self, rdatas: Sequence[amici.ReturnDataView]
    ) -> dict[str, float] | None:
        """Aggregate the sensitivities of the log-likelihoods.

        :param rdatas:
            The ReturnData objects to aggregate the sensitivities from.
        :return:
            The aggregated sensitivities (parameter ID -> sensitivity value).
        """
        if self._solver.get_sensitivity_order() < SensitivityOrder.first:
            return None

        sllh_total: dict[str, float] = {}

        # Check for issues in all condition simulation results.
        for rdata in rdatas:
            # Condition failed during simulation.
            if rdata.status != amici.AMICI_SUCCESS:
                return None
            # Condition simulation result does not provide SLLH.
            if rdata.sllh is None:
                raise ValueError(
                    f"The sensitivities of the likelihood for experiment "
                    f"{rdata.id} were not computed."
                )

        parameter_ids = self._model.get_parameter_ids()

        # still needs parameter mapping for placeholders
        for rdata in rdatas:
            experiment = self._petab_problem[rdata.id]
            placeholder_mappings = self._exp_man._get_placeholder_mapping(
                experiment
            )
            for model_par_idx, sllh in zip(
                rdata.plist, rdata.sllh, strict=True
            ):
                model_par_id = problem_par_id = parameter_ids[model_par_idx]
                if maps_to := placeholder_mappings.get(model_par_id):
                    problem_par_id = maps_to

                sllh_total[problem_par_id] = (
                    sllh_total.get(problem_par_id, 0.0) + sllh
                )
        return sllh_total

    def _aggregate_s2llh(
        self,
        rdatas: Sequence[amici.ReturnDataView],
        use_fim: bool = True,
    ) -> np.ndarray | None:
        """Aggregate the Hessians from individual experiments.

        Compute the total second-order sensitivities of the log-likelihoods
        w.r.t. estimated PEtab problem parameters.

        :param rdatas:
            The ReturnData objects to aggregate the sensitivities from.
        :param use_fim:
            Whether to use the Fisher Information Matrix (FIM) to compute
            the 2nd order sensitivities. Only ``True`` is currently supported.
        :return:
            The aggregated 2nd order sensitivities as a 2D numpy array
            in the order of the estimated PEtab problem parameters
            (``Problem.x_free_ids``),
            or `None` if sensitivities were not computed.
        """
        # TODO: add tests
        if self._solver.get_sensitivity_order() < SensitivityOrder.first:
            return None

        if not use_fim:
            raise NotImplementedError(
                "Computation of 2nd order sensitivities without FIM is not "
                "implemented yet."
            )

        # Check for issues in all condition simulation results.
        for rdata in rdatas:
            # Condition failed during simulation.
            if rdata.status != amici.AMICI_SUCCESS:
                return None
            # Condition simulation result does not provide FIM.
            if rdata.FIM is None:
                raise ValueError(
                    f"The FIM was not computed for experiment {rdata.id!r}."
                )

        # Model parameter index to problem parameter index map for estimated
        #  parameters except placeholders.
        #  This is the same for all experiments.
        global_ix_map: dict[int, int] = {
            model_ix: self._petab_problem.x_free_ids.index(model_pid)
            for model_ix, model_pid in enumerate(
                self._model.get_parameter_ids()
            )
            if model_pid in self._petab_problem.x_free_ids
        }
        s2llh_total = np.zeros(
            shape=(
                self._petab_problem.n_estimated,
                self._petab_problem.n_estimated,
            ),
            dtype=float,
        )

        for rdata in rdatas:
            ix_map = global_ix_map.copy()
            # still needs experiment-specific parameter mapping for
            # placeholders
            experiment = self._petab_problem[rdata.id]
            placeholder_mappings = self._exp_man._get_placeholder_mapping(
                experiment
            )
            for model_pid, problem_pid in placeholder_mappings.items():
                try:
                    ix_map[self.model.get_parameter_ids().index(model_pid)] = (
                        self._petab_problem.x_free_ids.index(problem_pid)
                    )
                except ValueError:
                    # mapped-to parameter is not estimated
                    pass

            # translate model parameter index to plist index
            ix_map: dict[int, int] = {
                tuple(rdata.plist).index(model_par_ix): problem_par_ix
                for model_par_ix, problem_par_ix in ix_map.items()
            }
            if use_fim:
                model_s2llh = rdata.FIM
            else:
                raise NotImplementedError()

            model_par_slice = np.fromiter(ix_map.keys(), dtype=int)
            problem_par_slice = np.fromiter(ix_map.values(), dtype=int)

            # handle possible non-unique indices in problem_par_slice
            # (i.e. multiple model parameters mapping to the same problem
            # parameter)
            problem_par_slice_unique, unique_index = np.unique(
                problem_par_slice, return_index=True
            )
            # handle unique mappings
            s2llh_total[
                np.ix_(problem_par_slice_unique, problem_par_slice_unique)
            ] += model_s2llh[
                np.ix_(
                    model_par_slice[unique_index],
                    model_par_slice[unique_index],
                )
            ]
            # handle non-unique mappings if any
            if problem_par_slice_unique.size < problem_par_slice.size:
                # index in the mapping arrays of non-unique entries
                non_unique_indices = [
                    idx
                    for idx in range(len(problem_par_slice))
                    if idx not in unique_index
                ]
                for idx in non_unique_indices:
                    s2llh_total[
                        problem_par_slice[idx], problem_par_slice_unique
                    ] += model_s2llh[
                        model_par_slice[idx], model_par_slice[unique_index]
                    ]
                    s2llh_total[
                        problem_par_slice_unique, problem_par_slice[idx]
                    ] += model_s2llh[
                        model_par_slice[unique_index], model_par_slice[idx]
                    ]
                    for jdx in non_unique_indices:
                        s2llh_total[
                            problem_par_slice[idx], problem_par_slice[jdx]
                        ] += model_s2llh[
                            model_par_slice[idx], model_par_slice[jdx]
                        ]

        return s2llh_total



def _set_default_experiment(
    problem: v2.Problem, id_: str = _DEFAULT_EXPERIMENT_ID
) -> None:
    """Replace any empty experiment ID in the measurement table by
    a new dummy experiment with ID ``id_``.

    :param problem: The PEtab problem. This will be modified in place.
    """
    if not any(m.experiment_id is None for m in problem.measurements):
        return

    # create dummy experiment
    problem += v2.core.Experiment(
        id=id_,
    )

    for m in problem.measurements:
        if m.experiment_id is None:
            m.experiment_id = id_



[docs]
def rdatas_to_measurement_df(
    rdatas: Sequence[amici.ReturnData],
    model: amici.AmiciModel,
    petab_problem: v2.Problem,
) -> pd.DataFrame:
    """
    Create a measurement dataframe in the PEtab format from the passed
    ``rdatas`` and own information.

    :param rdatas:
        A sequence of :class:`amici.ReturnData`.
    :param model:
        AMICI model used to generate ``rdatas``.
    :param petab_problem:
        The PEtab problem used to generate ``rdatas``.
    :return:
        A dataframe built from simulation results in `rdatas` in the format
        of the PEtab measurement table.
    """

    measurement_df = petab_problem.measurement_df
    observable_ids = model.get_observable_ids()
    rows = []
    # iterate over conditions
    for rdata in rdatas:
        experiment_id = rdata.id

        # current simulation matrix
        y = rdata.y
        # time array used in rdata
        t = list(rdata.ts)

        # extract rows for condition
        cur_measurement_df = measurement_df[
            measurement_df[v2.C.EXPERIMENT_ID] == experiment_id
        ]

        # iterate over entries for the given condition
        # note: this way we only generate a dataframe entry for every
        # row that existed in the original dataframe. if we want to
        # e.g. have also timepoints non-existent in the original file,
        # we need to instead iterate over the rdata['y'] entries
        for _, row in cur_measurement_df.iterrows():
            # copy row
            row_sim = copy.deepcopy(row)

            # extract simulated measurement value
            timepoint_idx = t.index(row[v2.C.TIME])
            observable_idx = observable_ids.index(row[v2.C.OBSERVABLE_ID])
            measurement_sim = y[timepoint_idx, observable_idx]

            # change measurement entry
            row_sim[v2.C.MEASUREMENT] = measurement_sim

            rows.append(row_sim)

    return pd.DataFrame(rows)




[docs]
def rdatas_to_simulation_df(
    rdatas: Sequence[amici.ReturnData],
    model: amici.AmiciModel,
    petab_problem: v2.Problem,
) -> pd.DataFrame:
    """
    Create a simulation dataframe in the PEtab format from the passed
    ``rdatas`` and own information.

    :param rdatas:
        A sequence of :class:`amici.ReturnData`.
    :param model:
        AMICI model used to generate ``rdatas``.
    :param petab_problem:
        The PEtab problem used to generate ``rdatas``.
    :return:
        A dataframe built from simulation results in `rdatas` in the format
        of the PEtab simulation table.
    """
    measurement_df = rdatas_to_measurement_df(rdatas, model, petab_problem)

    simulation_df = measurement_df.rename(
        columns={v2.C.MEASUREMENT: v2.C.SIMULATION}
    )

    # revert setting default experiment Id
    simulation_df.loc[
        simulation_df[v2.C.EXPERIMENT_ID] == _DEFAULT_EXPERIMENT_ID,
        v2.C.EXPERIMENT_ID,
    ] = np.nan

    return simulation_df




[docs]
def has_timepoint_specific_overrides(
    petab_problem: v2.Problem,
    ignore_scalar_numeric_noise_parameters: bool = False,
    ignore_scalar_numeric_observable_parameters: bool = False,
) -> bool:
    """Check if the measurements have timepoint-specific observable or
    noise parameter overrides.

    :param petab_problem:
        PEtab problem to check.
    :param ignore_scalar_numeric_noise_parameters:
        ignore scalar numeric assignments to noiseParameter placeholders
    :param ignore_scalar_numeric_observable_parameters:
        ignore scalar numeric assignments to observableParameter
        placeholders
    :return: `True` if the problem has timepoint-specific overrides, `False`
        otherwise.
    """
    if not petab_problem.measurements:
        return False

    from petab.v1.core import get_notnull_columns
    from petab.v1.lint import is_scalar_float

    measurement_df = petab_problem.measurement_df

    # mask numeric values
    for col, allow_scalar_numeric in [
        (
            v2.C.OBSERVABLE_PARAMETERS,
            ignore_scalar_numeric_observable_parameters,
        ),
        (v2.C.NOISE_PARAMETERS, ignore_scalar_numeric_noise_parameters),
    ]:
        if col not in measurement_df:
            continue

        measurement_df[col] = measurement_df[col].apply(str)

        if allow_scalar_numeric:
            measurement_df.loc[
                measurement_df[col].apply(is_scalar_float), col
            ] = ""

    grouping_cols = get_notnull_columns(
        measurement_df,
        _POSSIBLE_GROUPVARS_FLATTENED_PROBLEM,
    )
    grouped_df = measurement_df.groupby(grouping_cols, dropna=False)

    grouping_cols = get_notnull_columns(
        measurement_df,
        [
            v2.C.MODEL_ID,
            v2.C.OBSERVABLE_ID,
            v2.C.EXPERIMENT_ID,
        ],
    )
    grouped_df2 = measurement_df.groupby(grouping_cols)

    # data frame has timepoint specific overrides if grouping by noise
    # parameters and observable parameters in addition to observable and
    # experiment id yields more groups
    return len(grouped_df) != len(grouped_df2)



def _get_flattened_id_mappings(
    petab_problem: v2.Problem,
) -> dict[str, str]:
    """Get mapping from flattened to unflattened observable IDs.

    :param petab_problem:
        The unflattened PEtab problem.
    :returns:
        A mapping from flattened ID to original observable ID.
    """
    from petab.v1.core import (
        get_notnull_columns,
        get_observable_replacement_id,
    )

    groupvars = get_notnull_columns(
        petab_problem.measurement_df, _POSSIBLE_GROUPVARS_FLATTENED_PROBLEM
    )
    mappings: dict[str, str] = {}

    old_observable_ids = {obs.id for obs in petab_problem.observables}
    for groupvar, _ in petab_problem.measurement_df.groupby(
        groupvars, dropna=False
    ):
        observable_id = groupvar[groupvars.index(v2.C.OBSERVABLE_ID)]
        observable_replacement_id = get_observable_replacement_id(
            groupvars, groupvar
        )

        logger.debug(f"Creating synthetic observable {observable_id}")
        if (
            observable_id != observable_replacement_id
            and observable_replacement_id in old_observable_ids
        ):
            raise RuntimeError(
                "could not create synthetic observables "
                f"since {observable_replacement_id} was "
                "already present in observable table"
            )

        mappings[observable_replacement_id] = observable_id

    return mappings



[docs]
def flatten_timepoint_specific_output_overrides(
    petab_problem: v2.Problem,
) -> None:
    """Flatten timepoint-specific output parameter overrides.

    If the PEtab problem definition has timepoint-specific
    `observableParameters` or `noiseParameters` for the same observable,
    replace those by replicating the respective observable.

    This is a helper function for some tools which may not support such
    timepoint-specific mappings. The observable table and measurement table
    are modified in place.

    :param petab_problem:
        PEtab problem to work on. Modified in place.
    """
    from petab.v1.core import (
        get_notnull_columns,
        get_observable_replacement_id,
    )

    # Update observables
    def create_new_observable(old_id, new_id) -> Observable:
        if old_id not in petab_problem.observable_df.index:
            raise ValueError(
                f"Observable {old_id} not found in observable table."
            )

        # copy original observable and update ID
        observable: Observable = copy.deepcopy(petab_problem[old_id])
        observable.id = new_id

        # update placeholders
        old_obs_placeholders = observable.observable_placeholders
        old_noise_placeholders = observable.noise_placeholders
        suffix = new_id.removeprefix(old_id)
        observable.observable_placeholders = [
            f"{sym.name}{suffix}" for sym in observable.observable_placeholders
        ]
        observable.noise_placeholders = [
            f"{sym.name}{suffix}" for sym in observable.noise_placeholders
        ]

        # placeholders in formulas
        subs = dict(
            zip(
                old_obs_placeholders,
                observable.observable_placeholders,
                strict=True,
            )
        )
        observable.formula = observable.formula.subs(subs)
        subs |= dict(
            zip(
                old_noise_placeholders,
                observable.noise_placeholders,
                strict=True,
            )
        )
        observable.noise_formula = observable.noise_formula.subs(subs)

        return observable

    mappings = _get_flattened_id_mappings(petab_problem)

    petab_problem.observable_tables = [
        v2.ObservableTable(
            [
                create_new_observable(old_id, new_id)
                for new_id, old_id in mappings.items()
            ]
        )
    ]

    # Update measurements
    groupvars = get_notnull_columns(
        petab_problem.measurement_df, _POSSIBLE_GROUPVARS_FLATTENED_PROBLEM
    )
    for measurement_table in petab_problem.measurement_tables:
        for measurement in measurement_table.measurements:
            # TODO: inefficient, but ok for a start
            group_vals = (
                v2.MeasurementTable([measurement])
                .to_df()
                .iloc[0][groupvars]
                .tolist()
            )
            new_obs_id = get_observable_replacement_id(groupvars, group_vals)
            measurement.observable_id = new_obs_id




[docs]
def unflatten_simulation_df(
    simulation_df: pd.DataFrame,
    petab_problem: v2.Problem,
) -> pd.DataFrame:
    """Unflatten simulations from a flattened PEtab problem.

    A flattened PEtab problem is the output of applying
    :func:`flatten_timepoint_specific_output_overrides` to a PEtab problem.

    :param simulation_df:
        The simulation dataframe. A dataframe in the same format as a PEtab
        measurements table, but with the ``measurement`` column switched
        with a ``simulation`` column.
    :param petab_problem:
        The unflattened PEtab problem.
    :returns:
        The simulation dataframe for the unflattened PEtab problem.
    """
    mappings = _get_flattened_id_mappings(petab_problem)
    original_observable_ids = simulation_df[v2.C.OBSERVABLE_ID].replace(
        mappings
    )
    unflattened_simulation_df = simulation_df.assign(
        **{
            v2.C.OBSERVABLE_ID: original_observable_ids,
        }
    )
    return unflattened_simulation_df



def _get_fixed_parameters_sbml(
    petab_problem: v2.Problem,
    non_estimated_parameters_as_constants=True,
) -> set[str]:
    """
    Determine, set and return fixed model parameters.

    :param petab_problem:
        The PEtab problem instance

    :param non_estimated_parameters_as_constants:
        Whether parameters marked as non-estimated in PEtab should be
        considered constant in AMICI. Setting this to ``True`` will reduce
        model size and simulation times. If sensitivities with respect to those
        parameters are required, this should be set to ``False``.

    :return:
        List of IDs of (AMICI) parameters that are not estimated.
    """
    if not petab_problem.model.type_id == MODEL_TYPE_SBML:
        raise ValueError("Not an SBML model.")

    if not non_estimated_parameters_as_constants:
        raise NotImplementedError(
            "Only non_estimated_parameters_as_constants=True is supported."
        )

    # For amici constants we select everything
    # 1) that is a parameter in AMICI
    # and
    # 2) that is not flagged as estimated in PEtab
    # and
    # 3) for which there is no condition, where this parameter occurs as a
    #    targetId where the targetValue expression contains any estimated
    #    parameters
    #    TODO: if we assume that condition table changes have been converted to
    #     events, we can skip this check. indicator variables are always
    #     literal numbers. right?

    sbml_model = petab_problem.model.sbml_model

    # What will be implemented as a parameter in the amici model?
    amici_parameters = {
        p.getId()
        for p in sbml_model.getListOfParameters()
        if p.getConstant() is True
        # TODO: IAs with literals can be ignored
        # TODO(performance): collect IAs once
        and sbml_model.getInitialAssignmentBySymbol(p.getId()) is None
    }

    estimated_parameters = set(petab_problem.x_free_ids)

    return amici_parameters - estimated_parameters


def _add_observation_model_pysb(petab_problem: v2.Problem, jax: bool = False):
    """Extend PySB model by observation model as defined in the PEtab
    observables table"""
    import pysb

    pysb_model: pysb.Model = petab_problem.model.model

    # add any required output parameters
    local_syms = {
        sp.Symbol(sp.Symbol.__str__(comp), real=True): comp
        for comp in pysb_model.components
        if isinstance(comp, sp.Symbol)
    }

    def process_formula(sym: sp.Basic):
        changed_formula = False
        sym = sym.subs(local_syms)
        for s in sym.free_symbols:
            if not isinstance(s, pysb.Component):
                if not isinstance(s, sp.Symbol):
                    raise AssertionError(
                        f"Unexpected symbol type in observable formula: {s}, "
                        f"{type(s)}"
                    )
                name = str(s)
                p = pysb.Parameter(name, 1.0, _export=False)
                pysb_model.add_component(p)

                # placeholders for multiple observables are mapped to the
                # same symbol, so only add to local_syms when necessary
                if name not in local_syms:
                    local_syms[sp.Symbol(name, real=True)] = p

                # replace placeholder with parameter
                if jax and name != str(s):
                    changed_formula = True
                    sym = sym.subs(s, local_syms[name])
        return sym, changed_formula

    for observable in petab_problem.observables:
        sym, changed_formula = process_formula(observable.formula)
        observable.formula = sym
        sym, changed_formula = process_formula(observable.noise_formula)
        observable.noise_formula = sym

    # add observables and sigmas to pysb model
    for observable in petab_problem.observables:
        # obs_symbol = sp.sympify(observable_formula, locals=local_syms)
        if observable.id in pysb_model.expressions.keys():
            obs_expr = pysb_model.expressions[observable.id]
        else:
            obs_expr = pysb.Expression(
                observable.id, observable.formula, _export=False
            )
            pysb_model.add_component(obs_expr)
        local_syms[sp.Symbol(observable.id, real=True)] = obs_expr

        sigma_id = f"{observable.id}_sigma"
        sigma_expr = pysb.Expression(
            sigma_id, observable.noise_formula.subs(local_syms), _export=False
        )
        observable.noise_formula = sp.Symbol(sigma_id, real=True)
        pysb_model.add_component(sigma_expr)
        local_syms[sp.Symbol(sigma_id, real=True)] = sigma_expr


class ExperimentsToPySBConverter:
    """
    Convert PEtab experiments to amici events and PySB initials.

    See :meth:`convert` for details.
    """

    #: ID of the parameter that indicates whether the model is in
    #  the pre-equilibration phase (1) or not (0).
    PREEQ_INDICATOR = "_petab_preequilibration_indicator"

    #: The condition ID of the condition that sets the
    #: pre-equilibration indicator to 1.
    CONDITION_ID_PREEQ_ON = "_petab_preequilibration_on"

    #: The condition ID of the condition that sets the
    #: pre-equilibration indicator to 0.
    CONDITION_ID_PREEQ_OFF = "_petab_preequilibration_off"

    def __init__(self, petab_problem: v2.Problem):
        """Initialize the converter.

        :param petab_problem:
            The PEtab problem to convert.
            This will not be modified by this class.
        """
        from petab.v2.models.pysb_model import PySBModel

        if len(petab_problem.models) > 1:
            #  https://github.com/PEtab-dev/libpetab-python/issues/392
            raise NotImplementedError(
                "Only single-model PEtab problems are supported."
            )
        if not isinstance(petab_problem.model, PySBModel):
            raise ValueError("Only SBML models are supported.")
        model = petab_problem.model.model
        compartment_ids = {c.name for c in model.compartments}
        if compartment_ids and any(
            change.target_id in compartment_ids
            for cond in petab_problem.conditions
            for change in cond.changes
        ):
            # BNG evaluates compartment sizes during network generation.
            #  Changing those values later on will lead to incorrect results.
            raise NotImplementedError(
                "Changes to compartment sizes are not supported for PySB "
                "models."
            )

        # For the moment, we only support changes that are time-constant
        #  expressions, i.e., that only contain numbers or pysb.Parameters.
        # Furthermore, we only support changing species and pysb.Expressions,
        #  but not pysb.Parameter. (Expressions can be easily changed, but
        #  we can't easily convert a Parameter to an Expression, because we
        #  can't remove components from a PySB model. This either
        #  requires deeper integration with `pysb2amici`, or we need to
        #  recreate the PySB model.)
        parameter_ids = set(petab_problem.x_ids) | {
            p.name for p in model.parameters
        }

        for cond in petab_problem.conditions:
            for change in cond.changes:
                if (
                    set(map(str, change.target_value.free_symbols))
                    - parameter_ids
                ):
                    # TODO: we can't just change Parameter to Expression in
                    #  this case.
                    #  Expressions are evaluated continuously during the
                    #  simulation. i.e., to only set the initial value, we need
                    #  to replace all dynamic constructs by their initials.
                    # TODO: we may have to convert some parameters and
                    #  expressions to state variables,
                    #  otherwise we can't use them as event targets.
                    #  This will require deeper integration of PEtab and PySB
                    #  import
                    raise NotImplementedError(
                        "Currently, only time-constant targetValue expressions"
                        f" are supported. Got {str(change.target_value)!r} "
                        f"for target {change.target_id!r}."
                    )
                if change.target_id in parameter_ids:
                    raise NotImplementedError(
                        "Currently, PySB parameters are not supported as "
                        "targets of condition table changes. Replace "
                        f"parameter {change.target_id!r} by a pysb.Expression."
                    )
        #: The PEtab problem to convert. Not modified by this class.
        self._petab_problem = petab_problem
        self._events: list[amici.de_model_components.Event] = []
        self._new_problem: v2.Problem | None = None

    @staticmethod
    def _get_experiment_indicator_condition_id(experiment_id: str) -> str:
        """Get the condition ID for the experiment indicator parameter."""
        return f"_petab_experiment_condition_{experiment_id}"

    def convert(
        self,
    ) -> tuple[v2.Problem, list[amici.de_model_components.Event]]:
        """Convert PEtab experiments to amici events and pysb initials.

        Generate events, add Initials, or convert Parameters to Expressions
        that implement the changes encoded in the PEtab v2
        experiment / condition table.
        This adds indicator variables to the PEtab problem and removes all
        condition changes that are implemented as events.

        :returns:
            A PEtab problem with only indicator parameters left in the
            condition table a maximum of two periods per experiment
            (pre-equilibration and main simulation), and a list of events
            to be passed to `pysb2amici`.
        """
        self._new_problem = copy.deepcopy(self._petab_problem)
        self._events: list[amici.de_model_components.Event] = []

        self._add_preequilibration_indicator()

        for experiment in self._new_problem.experiments:
            self._convert_experiment(experiment)

        self._add_indicators_to_conditions()

        validation_results = self._new_problem.validate()
        validation_results.log()

        return self._new_problem, self._events

    def _convert_experiment(self, experiment: v2.Experiment) -> None:
        """
        Convert a single experiment to SBML events or initial assignments.
        """
        import pysb

        model: pysb.Model = self._new_problem.model.model
        experiment.sort_periods()
        has_preequilibration = experiment.has_preequilibration
        # mapping table mappings
        self.map_petab_to_pysb = {
            mapping.petab_id: mapping.model_id
            for mapping in self._petab_problem.mappings
            if mapping.petab_id is not None and mapping.model_id is not None
        }
        self.map_pysb_to_petab = {
            mapping.model_id: mapping.petab_id
            for mapping in self._petab_problem.mappings
            if mapping.petab_id is not None and mapping.model_id is not None
        }

        # add experiment indicator
        exp_ind_id = self.get_experiment_indicator(experiment.id)
        if exp_ind_id in map(str, model.components):
            raise ValueError(
                f"The model has entity with ID `{exp_ind_id}`. "
                "IDs starting with `petab_` are reserved for "
                f"{self.__class__.__name__} and should not be used in the "
                "model."
            )
        self._add_parameter(exp_ind_id, 0)
        kept_periods: list[ExperimentPeriod] = []
        # Collect values for initial assignments for the different experiments.
        #  All expressions must be combined into a single initial assignment
        #  per target.
        # target_id -> [(experiment_indicator, target_value), ...]
        period0_assignments: dict[str, list[tuple[str, sp.Basic]]] = {}

        for i_period, period in enumerate(experiment.sorted_periods):
            if period.is_preequilibration:
                # pre-equilibration cannot be encoded as event,
                #  so we need to keep this period in the Problem.
                kept_periods.append(period)
            elif i_period == int(has_preequilibration):
                # we always keep the first non-pre-equilibration period
                #  to set the indicator parameters
                kept_periods.append(period)
            elif not period.condition_ids:
                # no condition, no changes, no need for an event,
                #  no need to keep the period unless it's the pre-equilibration
                #  or the only non-equilibration period (handled above)
                continue

            # Encode the period changes as events
            #  that trigger at the start of the period or,
            #  for the first period, as pysb.Initials.
            #  pysb.Initials are required for the first period,
            #  because other initial assignments may depend on
            #  the changed values.
            if i_period == 0:
                exp_ind_id = self.get_experiment_indicator(experiment.id)
                for change in self._new_problem.get_changes_for_period(period):
                    period0_assignments.setdefault(
                        change.target_id, []
                    ).append((exp_ind_id, change.target_value))
            else:
                self._create_period_start_event(
                    experiment=experiment,
                    i_period=i_period,
                    period=period,
                )

        # Create initials for the first period
        if period0_assignments:
            free_symbols_in_assignments = set()
            for target_id, changes in period0_assignments.items():
                # The initial value might only be changed for a subset of
                #  experiments. We need to keep the original initial value
                #  for all other experiments.
                target_entity = None
                try:
                    target_entity = next(
                        c
                        for c in model.components
                        if c.name
                        == self.map_petab_to_pysb.get(target_id, target_id)
                    )
                    if isinstance(target_entity, pysb.Parameter):
                        default = target_entity.value
                    elif isinstance(target_entity, pysb.Expression):
                        default = target_entity.expr
                    else:
                        raise AssertionError(target_id)
                except StopIteration:
                    # species pattern?
                    for initial in model.initials:
                        if str(initial.pattern) == self.map_petab_to_pysb.get(
                            target_id, target_id
                        ):
                            default = initial.value
                            break
                    else:
                        raise AssertionError(target_id)

                # Only create the initial assignment if there is
                #  actually something to change.
                if expr_cond_pairs := [
                    (target_value, sp.Symbol(exp_ind) > 0.5)
                    for exp_ind, target_value in changes
                    if target_value != default
                ]:
                    # Unlike events, we can't have different initial
                    #  assignments for different experiments, so we need to
                    #  combine all changes into a single piecewise
                    #  expression.
                    expr = sp.Piecewise(
                        *expr_cond_pairs,
                        (default, True),
                    )

                    # Update the target expression
                    if target_entity is not None and isinstance(
                        target_entity, pysb.Expression
                    ):
                        target_entity.value = expr
                    else:
                        # if the target is not an expression, it must be an
                        #  initial. the rest is excluded in __init__
                        # TODO (performance): It might be more efficient
                        #  to handle this as multi-model problem.
                        #  Individual models might result in smaller networks
                        #  than the superset model required here.
                        for initial in model.initials:
                            if str(
                                initial.pattern
                            ) == self.map_petab_to_pysb.get(
                                target_id, target_id
                            ):
                                # Initial.value needs to be parameter or
                                # expression, we can't use piecewise directly
                                expr_expr = pysb.Expression(
                                    f"_petab_initial_{target_id}",
                                    expr,
                                    _export=False,
                                )
                                model.add_component(expr_expr)
                                initial.value = expr_expr
                                break
                        else:
                            raise AssertionError(target_id, target_entity)
                    free_symbols_in_assignments |= expr.free_symbols

            # the target value may depend on parameters that are only
            #  introduced in the PEtab parameter table - those need
            #  to be added to the model
            for sym in free_symbols_in_assignments:
                if model.parameters.get(sym.name) is None:
                    self._add_parameter(sym.name, 0)

        if len(kept_periods) > 2:
            raise AssertionError("Expected at most two periods to be kept.")

        # add conditions that set the indicator parameters
        for period in kept_periods:
            period.condition_ids = [
                self._get_experiment_indicator_condition_id(experiment.id),
                self.CONDITION_ID_PREEQ_ON
                if period.is_preequilibration
                else self.CONDITION_ID_PREEQ_OFF,
            ]

        experiment.periods = kept_periods

    def _create_period_start_event(
        self,
        experiment: v2.Experiment,
        i_period: int,
        period: ExperimentPeriod,
    ):
        """Create an event that triggers at the start of a period."""
        exp_ind_id = self.get_experiment_indicator(experiment.id)
        exp_ind_sym = sp.Symbol(exp_ind_id)
        preeq_ind_sym = sp.Symbol(self.PREEQ_INDICATOR)

        # Create trigger expressions
        # Since handling of == and !=, and distinguishing < and <=
        # (and > and >=), is a bit tricky in terms of root-finding,
        # we use these slightly more convoluted expressions.
        # (assuming that the indicator parameters are {0, 1})
        if period.is_preequilibration:
            root_fun = sp.Min(exp_ind_sym - 0.5, preeq_ind_sym - 0.5)
        else:
            root_fun = sp.Min(
                exp_ind_sym - 0.5,
                0.5 - preeq_ind_sym,
                amici_time_symbol - period.time,
            )

        event_id = f"_petab_event_{experiment.id}_{i_period}"
        assignments: dict[sp.Symbol, sp.Expr] = {}
        model = self._new_problem.model.model
        for change in self._new_problem.get_changes_for_period(period):
            if change.target_id in model.parameters:
                assignments[sp.Symbol(change.target_id)] = change.target_value
                # add any missing parameters
                for sym in change.target_value.free_symbols:
                    if sym.name not in model.parameters:
                        self._add_parameter(sym.name, 0)
            else:
                raise AssertionError(change)

        event = amici.de_model_components.Event(
            identifier=sp.Symbol(event_id),
            name=event_id,
            value=root_fun,
            assignments=assignments,
            initial_value=False,
            use_values_from_trigger_time=False,
        )

        self._events.append(event)

    def _add_parameter(self, par_id: str, value: float) -> None:
        """Add a parameter to the PySB model."""
        import pysb

        p = pysb.Parameter(par_id, value, _export=False)
        self._new_problem.model.model.add_component(p)

    def _add_preequilibration_indicator(
        self,
    ) -> None:
        """Add an indicator parameter for the pre-equilibration to the SBML
        model."""
        par_id = self.PREEQ_INDICATOR
        if par_id in map(str, self._new_problem.model.model.components):
            raise ValueError(
                f"Entity with ID {par_id} already exists in the model."
            )

        # add the pre-steady-state indicator parameter
        self._add_parameter(par_id, 0.0)

    @staticmethod
    def get_experiment_indicator(experiment_id: str) -> str:
        """The ID of the experiment indicator parameter.

        The experiment indicator parameter is used to identify the
        experiment in the SBML model. It is a parameter that is set
        to 1 for the current experiment and 0 for all other
        experiments. The parameter is used in the event trigger
        to determine whether the event should be triggered.

        :param experiment_id: The ID of the experiment for which to create
            the experiment indicator parameter ID.
        """
        return f"_petab_experiment_indicator_{experiment_id}"

    def _add_indicators_to_conditions(self) -> None:
        """After converting the experiments to events, add the indicator
        parameters for the pre-equilibration period and for the different
        experiments to the remaining conditions.
        Then remove all other conditions."""
        from petab.v2 import Change, Condition, ConditionTable

        problem = self._new_problem

        # create conditions for indicator parameters
        problem += Condition(
            id=self.CONDITION_ID_PREEQ_ON,
            changes=[Change(target_id=self.PREEQ_INDICATOR, target_value=1)],
        )

        problem += Condition(
            id=self.CONDITION_ID_PREEQ_OFF,
            changes=[Change(target_id=self.PREEQ_INDICATOR, target_value=0)],
        )

        # add conditions for the experiment indicators
        for experiment in problem.experiments:
            cond_id = self._get_experiment_indicator_condition_id(
                experiment.id
            )
            changes = [
                Change(
                    target_id=self.get_experiment_indicator(experiment.id),
                    target_value=1,
                )
            ]
            problem += Condition(
                id=cond_id,
                changes=changes,
            )

        #  All changes have been encoded in event assignments and can be
        #  removed. Only keep the conditions setting our indicators.
        problem.condition_tables = [
            ConditionTable(
                [
                    condition
                    for condition in problem.conditions
                    if condition.id.startswith("_petab")
                ]
            )
        ]