Source code for amici.importers.petab._petab_importer

"""PEtab v2 import."""

from __future__ import annotations

import copy
import logging
import numbers
from collections.abc import Sequence
from pathlib import Path
from pprint import pprint
from typing import TYPE_CHECKING

import numpy as np
import pandas as pd
import sympy as sp
from petab import v1 as v1
from petab import v2 as v2
from petab.v2 import ExperimentPeriod, Observable
from petab.v2.converters import ExperimentsToSbmlConverter
from petab.v2.models import MODEL_TYPE_PYSB, MODEL_TYPE_SBML

import amici
from amici import get_model_dir
from amici._symbolic import DEModel, Event
from amici.importers.utils import MeasurementChannel, amici_time_symbol
from amici.logging import get_logger

from .v1._sbml_import import _add_global_parameter

if TYPE_CHECKING:
    import pysb

# Names exported by ``from ... import *``; this is the public API of the
# module.
__all__ = [
    "PetabImporter",
    "rdatas_to_measurement_df",
    "rdatas_to_simulation_df",
    "flatten_timepoint_specific_output_overrides",
    "unflatten_simulation_df",
    "has_timepoint_specific_overrides",
]
# Module-level logger, created with log level INFO.
logger = get_logger(__name__, log_level=logging.INFO)


#: Default experiment ID to be used for measurements without an experiment ID.
_DEFAULT_EXPERIMENT_ID = "__default__"

#: PEtab measurement table columns to consider for detecting timepoint-specific
#:  parameter overrides
_POSSIBLE_GROUPVARS_FLATTENED_PROBLEM = [
    v2.C.MODEL_ID,
    v2.C.EXPERIMENT_ID,
    v2.C.OBSERVABLE_ID,
    v2.C.OBSERVABLE_PARAMETERS,
    v2.C.NOISE_PARAMETERS,
]

# TODO: how to handle SBML vs PySB, jax vs sundials?
#  -> separate importers or subclasses?
# TODO: How to handle multi-model-problems?



[docs]
class PetabImporter:
    """
    Importer for PEtab v2 problems.

    This class is used to create an AMICI model from a PEtab problem.

    The underlying SBML or PySB model will be modified to encode the
    experiments defined in the PEtab problem as events or initial conditions.

    Be careful when using the imported model for anything other than the
    PEtab-encoded experiments.

    All PEtab experiments will be encoded in the model, independent of
    whether they have measurements. This is to make it easier to simulate
    the respective experiments with the resulting AMICI model.
    This may make the resulting model more bloated. If this is not desired,
    the problem should be simplified before import.

    :param petab_problem:
        The PEtab problem to import. The importer works on its own copy of
        the problem. The problem must not be changed after construction of
        the importer.
    """

    # TODO remove: extra debug output
    # If ``True``, the (pre-processed) PEtab problem and model are printed
    # to stdout at several stages of the import.
    _debug = False


[docs]
    def __init__(
        self,
        petab_problem: v2.Problem | v1.Problem,
        *,
        compile_: bool = None,
        validate: bool = True,
        module_name: str = None,
        # TODO: model_id for selecting the model in multi-model problems
        # model_id: str = None,
        output_dir: str | Path = None,
        jax: bool = False,
        output_parameter_defaults: dict[str, float] | None = None,
        verbose: int | bool = logging.INFO,
        non_estimated_parameters_as_constants: bool = True,
    ):
        """
        Set up an importer for the given PEtab problem.

        The problem is copied, optionally validated, and pre-processed
        according to its model type (SBML or PySB). No model code is
        generated here.

        :param petab_problem: The PEtab problem to import.
        :param compile_: Whether to compile the model extension after import.
            If ``None``, the model is compiled unless ``jax`` is ``True``.
        :param validate: Whether to validate the PEtab problem before import.
        :param module_name: The name of model module to generate.
            If not provided, it is derived from the problem ID and the
            model ID.
        :param output_dir:
            The output directory where the model files are written to.
        :param jax: Whether to generate a JAX model instead of a
            SUNDIALS model. Currently, only ``False`` is supported.
        :param output_parameter_defaults:
            Optional default parameter values for output parameters introduced
            in the PEtab observables table, in particular for placeholder
            parameters. A dictionary mapping parameter IDs to default values.
        :param verbose:
            The verbosity level. If ``True``, set to ``logging.INFO``.
            If ``False``, set to ``logging.WARNING``. Otherwise, use the given
            logging level.
        :param non_estimated_parameters_as_constants:
            Whether parameters marked as non-estimated in PEtab should be
            considered constant in AMICI. Setting this to ``True`` will reduce
            model size and simulation times. If sensitivities with respect to
            those parameters are required, this should be set to ``False``.
        :raises NotImplementedError:
            For multi-model problems and for model types other than SBML
            and PySB.
        :raises ValueError:
            If no module name can be determined, or if validation reports
            errors.
        """
        self.petab_problem: v2.Problem = self._upgrade_or_copy_if_needed(
            petab_problem
        )

        # Translate the boolean shortcuts to logging levels; any other value
        #  is taken as the logging level itself.
        if verbose is True:
            self._verbose = logging.INFO
        elif verbose is False:
            self._verbose = logging.WARNING
        else:
            self._verbose = verbose
        self._output_parameter_defaults = output_parameter_defaults

        if len(self.petab_problem.models) > 1:
            raise NotImplementedError(
                "PEtab v2 importer currently only supports single-model "
                "problems."
            )

        model = self.petab_problem.model
        model_type = model.type_id
        if model_type not in (MODEL_TYPE_SBML, MODEL_TYPE_PYSB):
            raise NotImplementedError(
                "PEtab v2 importer currently only supports SBML and PySB "
                f"models. Got {model_type!r}."
            )

        if self._debug:
            print("PetabImpoter.__init__: petab_problem:")
            pprint(self.petab_problem.model_dump())
            if model_type == MODEL_TYPE_SBML:
                print(model.to_antimony())
            elif model_type == MODEL_TYPE_PYSB:
                print(model.to_str())

        self._compile = compile_ if compile_ is not None else not jax
        self._sym_model: DEModel | None = None
        self._model_id = model.model_id

        # An explicit module name wins; otherwise combine problem and model
        #  ID, or fall back to the model ID alone.
        if module_name:
            self._module_name = module_name
        elif self.petab_problem.id:
            self._module_name = f"{self.petab_problem.id}_{self.model_id}"
        else:
            self._module_name = self.model_id
        if self._module_name is None:
            raise ValueError(
                "No `module_name` was provided and no model ID "
                "was specified in the PEtab problem."
            )

        self._output_dir: Path | None = (
            Path(output_dir).absolute() if output_dir is not None else None
        )
        self._jax = jax
        self._non_estimated_parameters_as_constants: bool = (
            non_estimated_parameters_as_constants
        )

        if validate:
            logger.info("Validating PEtab problem ...")
            validation_result = petab_problem.validate()
            if validation_result:
                validation_result.log()

            if validation_result.has_errors():
                raise ValueError(
                    "PEtab problem is not valid, see log messages for details."
                )

        # ensure each measurement has an experimentId to simplify processing
        _set_default_experiment(self.petab_problem)

        # Model-type-specific pre-processing.
        preprocess = {
            MODEL_TYPE_SBML: self._preprocess_sbml,
            MODEL_TYPE_PYSB: self._preprocess_pysb,
        }.get(model_type)
        if preprocess is None:
            raise AssertionError()
        preprocess()


    def _preprocess_sbml(self):
        """Prepare an SBML-based PEtab problem for the AMICI import.

        Replaces ``self.petab_problem`` by the problem returned from
        :class:`ExperimentsToSbmlConverter`.

        :raises ValueError: If the problem's model is not an SBML model.
        :raises NotImplementedError:
            If an experiment still has more than two periods after the
            conversion.
        """
        from petab.v2.models.sbml_model import SbmlModel

        if not isinstance(self.petab_problem.model, SbmlModel):
            raise ValueError("The PEtab problem must contain an SBML model.")

        # Convert petab experiments to events, because so far,
        #  AMICI only supports preequilibration/presimulation/simulation, but
        #  no arbitrary list of periods.
        # This will always create a copy of the problem.
        self.petab_problem = ExperimentsToSbmlConverter(
            self.petab_problem
        ).convert()

        # This should never trigger due to the conversion above
        if any(
            len(experiment.periods) > 2
            for experiment in self.petab_problem.experiments
        ):
            raise NotImplementedError(
                "AMICI currently does not support more than two periods."
            )

        if not self._debug:
            return

        print("PetabImpoter._preprocess_sbml: petab_problem:")
        pprint(self.petab_problem.model_dump())
        print(self.petab_problem.model.to_antimony())

    def _preprocess_pysb(self):
        """Prepare a PySB-based PEtab problem for the AMICI import.

        Adds the observation model to the PySB model, generates the model
        equations and converts the PEtab experiments. The converted problem
        and the resulting events are stored in ``self.petab_problem`` and
        ``self._events``.

        :raises ValueError: If the problem's model is not a PySB model.
        """
        import pysb
        from petab.v2.models.pysb_model import PySBModel

        if not isinstance(self.petab_problem.model, PySBModel):
            raise ValueError("The PEtab problem must contain a PySB model.")

        _add_observation_model_pysb(self.petab_problem, self._jax)
        # TODO: clarify in PEtab whether its allowed to set initial amounts
        #  for a species without a pysb.Initial.
        #  Currently, we fail in that case.
        #  If so add a test case for changing the initial amount for a species
        #  without a pysb.Initial
        #  fixed_parameters = _add_initialization_variables(pysb_model,
        #                                                 petab_problem)

        pysb.bng.generate_equations(self.petab_problem.model.model)

        # Convert PEtab v2 experiments/conditions to events
        converted_problem, events = ExperimentsToPySBConverter(
            self.petab_problem
        ).convert()
        self.petab_problem = converted_problem
        self._events = events

    def _upgrade_or_copy_if_needed(
        self, problem: v1.Problem | v2.Problem
    ) -> v2.Problem:
        """Return a deep copy of the given PEtab v2 problem.

        :param problem: The PEtab problem passed to the importer.
        :return: A deep copy of ``problem``.
        :raises NotImplementedError:
            If ``problem`` is not a :class:`petab.v2.Problem`. PEtab v1
            problem objects are not upgraded automatically.
        """
        if not isinstance(problem, v2.Problem):
            raise NotImplementedError(
                "'petab_problem' must be a `petab.v2.Problem`. "
                "`petab.v1.Problem` is not directly supported, but "
                "file-based PEtab v1 problems can be upgraded via "
                "`petab.v2.Problem.from_yaml(petab_v1_yaml_file)`."
            )

        return copy.deepcopy(problem)

    @property
    def model_id(self) -> str:
        """The model ID."""
        if self._model_id is None:
            self._model_id = self.petab_problem.model.model_id

        return self._model_id

    @property
    def output_dir(self) -> Path:
        """The output directory where the model files are written to."""
        if self._output_dir is None:
            self._output_dir = get_model_dir(self._module_name, jax=self._jax)
        return self._output_dir

    def _do_import_sbml(self):
        """Import the SBML model.

        Generate the symbolic model according to the given PEtab problem and
        generate the corresponding Python module.

        1. Encode all PEtab experiments as events and initial assignments
           in the SBML model.
           This leaves only (maybe) a pre-equilibration and a single
           simulation period.
        2. Add the observable parameters to the SBML model.

        :return: The ``amici.SbmlImporter`` used for the import.
        :raises NotImplementedError:
            If the PEtab problem has no observables.
        """
        logger.info(f"Importing model {self.model_id!r}...")

        if not self.petab_problem.observables:
            raise NotImplementedError(
                "PEtab import without observables table "
                "is currently not supported."
            )

        logger.info(
            f"Module name is '{self._module_name}'.\n"
            f"Writing model code to '{self.output_dir}'."
        )

        observation_model = self._get_observation_model()

        logger.info(f"#Observables: {len(observation_model)}")
        logger.debug(f"Observables: {observation_model}")

        self._workaround_observable_parameters_sbml(
            output_parameter_defaults=self._output_parameter_defaults,
        )

        # All indicator variables, i.e., all remaining targets after
        #  experiments-to-event in the PEtab problem must be converted
        #  to fixed parameters
        indicator_ids = set()
        for experiment in self.petab_problem.experiments:
            for period in experiment.periods:
                for condition_id in period.condition_ids:
                    for change in self.petab_problem[condition_id].changes:
                        indicator_ids.add(change.target_id)

        from .v1._sbml_import import show_model_info

        show_model_info(self.petab_problem.model.sbml_model)
        sbml_importer = amici.SbmlImporter(
            self.petab_problem.model.sbml_model, jax=self._jax
        )

        self._check_placeholders()

        fixed_parameters = sorted(
            indicator_ids
            | _get_fixed_parameters_sbml(
                petab_problem=self.petab_problem,
                non_estimated_parameters_as_constants=self._non_estimated_parameters_as_constants,
            )
        )
        logger.info(f"Number of fixed parameters: {len(fixed_parameters)}")
        logger.debug(f"Fixed parameters are {fixed_parameters}")

        # Create Python module from SBML model
        # Arguments shared by the JAX and the SUNDIALS code generation.
        shared_kwargs = dict(
            model_name=self._module_name,
            output_dir=self.output_dir,
            observation_model=observation_model,
            fixed_parameters=fixed_parameters,
            verbose=self._verbose,
        )
        if self._jax:
            sbml_importer.sbml2jax(**shared_kwargs)
        else:
            sbml_importer.sbml2amici(
                **shared_kwargs,
                # TODO:
                allow_reinit_fixpar_initcond=True,
                compile=self._compile,
                # FIXME: simplification takes ages for Smith_BMCSystBiol2013
                #  due to nested piecewises / Heavisides?!
                simplify=None,
            )
            # TODO check_model(amici_model=model, petab_problem=petab_problem)

        return sbml_importer

    def _do_import_pysb(
        self,
    ):
        """Import the PySB model.

        Generate the symbolic model according to the given PEtab problem and
        generate the corresponding Python module.

        The verbosity configured for this importer is passed on to the code
        generation of both backends.

        :raises NotImplementedError:
            If the PEtab problem has no observables.
        """
        logger.info(f"Importing PySB model {self.model_id!r}...")

        if not self.petab_problem.observables:
            raise NotImplementedError(
                "PEtab import without observables table "
                "is currently not supported."
            )

        logger.info(
            f"Module name is '{self._module_name}'.\n"
            f"Writing model code to '{self.output_dir}'."
        )

        observation_model = self._get_observation_model()

        logger.info(f"#Observables: {len(observation_model)}")
        logger.debug(f"Observables: {observation_model}")

        pysb_model = self.petab_problem.model.model

        # All indicator variables, i.e., all remaining targets after
        #  experiments-to-event in the PEtab problem must be converted
        #  to fixed parameters
        fixed_parameters = {
            change.target_id
            for experiment in self.petab_problem.experiments
            for period in experiment.periods
            for condition_id in period.condition_ids
            for change in self.petab_problem[condition_id].changes
        }
        # TODO: handle self._non_estimated_parameters_as_constants

        self._check_placeholders()
        # Sort for a reproducible parameter order.
        fixed_parameters = sorted(fixed_parameters)

        logger.info(f"Number of fixed parameters: {len(fixed_parameters)}")
        logger.debug(f"Fixed parameters are {fixed_parameters}")

        from amici.importers.pysb import pysb2amici, pysb2jax

        # Create Python module from PySB model
        if self._jax:
            pysb2jax(
                model=pysb_model,
                model_name=self._module_name,
                output_dir=self.output_dir,
                observation_model=observation_model,
                verbose=self._verbose,
                pysb_model_has_obs_and_noise=True,
                # TODO: events
                # **kwargs,
            )
            return
        else:
            pysb2amici(
                model=pysb_model,
                model_name=self._module_name,
                output_dir=self.output_dir,
                # Honor the verbosity requested by the user instead of
                #  always enabling verbose output.
                verbose=self._verbose,
                fixed_parameters=fixed_parameters,
                observation_model=observation_model,
                pysb_model_has_obs_and_noise=True,
                compile=self._compile,
                _events=self._events,
                # **kwargs,
            )

        if self._compile:
            # check that the model extension was compiled successfully
            _ = self.import_module()
            # model = model_module.getModel()
            # TODO check_model(amici_model=model, petab_problem=petab_problem)

        return

    def _check_placeholders(self):
        # check for time-point-specific placeholders
        #  for now, we only support:
        #  * observable placeholders that are replaced by the same expression
        #    for all measurements for a given experiment
        #  * noise placeholders that are replaced by the same expression
        #    for all measurements for a given experiment
        #  * noise placeholders if there is only a single placeholder which
        #    is replaced by literals for all measurements for a given
        #    experiment
        for experiment in self.petab_problem.experiments:
            measurements = self.petab_problem.get_measurements_for_experiment(
                experiment
            )
            observable_overrides = {}
            noise_overrides = {}
            for measurement in measurements:
                observable_overrides.setdefault(
                    measurement.observable_id, set()
                ).add(tuple(measurement.observable_parameters))
                noise_overrides.setdefault(
                    measurement.observable_id, set()
                ).add(tuple(measurement.noise_parameters))

            for observable_id, overrides in observable_overrides.items():
                if len(overrides) > 1:
                    raise NotImplementedError(
                        f"Observable {observable_id} has multiple "
                        "timepoint-specific mappings for observable "
                        "parameters. "
                        "This is not supported by AMICI."
                    )
            for observable_id, overrides in noise_overrides.items():
                if len(overrides) > 1:
                    if len(next(iter(overrides))) == 1 and all(
                        isinstance(p[0], numbers.Number) for p in overrides
                    ):
                        continue

                    raise NotImplementedError(
                        f"Observable {observable_id} has multiple "
                        "timepoint-specific mappings for noise parameters. "
                        "This is not supported by AMICI."
                    )
                if len(overrides) == 1 and next(iter(overrides)) == ():
                    # this is a single literal, which is fine
                    continue
            if self._debug:
                print(experiment.id)
                print(observable_overrides)
                print(noise_overrides)

    def _workaround_observable_parameters_sbml(
        self, output_parameter_defaults: dict[str, float] = None
    ) -> None:
        """
        Add the output parameters introduced via PEtab to the SBML model.

        This can be placeholder parameters or any other parameters that are
        introduced in observableFormula or noiseFormula in the observable
        table, or in observableParameters or noiseParameters in the measurement
        table.

        :param output_parameter_defaults:
            Optional mapping of output parameter IDs to the values to use for
            them in the model. Parameters without an entry get ``0.0``.
        :raises ValueError:
            If defaults are given for IDs that are not output parameters.
        """
        problem = self.petab_problem
        output_parameters = problem.get_output_parameters()

        logger.debug(
            "Adding output parameters to model: "
            f"{sorted(output_parameters)}"
        )

        defaults = output_parameter_defaults or {}
        extra_pars = set(defaults) - set(output_parameters)
        if extra_pars:
            raise ValueError(
                "Default output parameter values were given for "
                f"{extra_pars}, but they those are not output parameters."
            )

        for parameter_id in sorted(output_parameters):
            _add_global_parameter(
                sbml_model=problem.model.sbml_model,
                parameter_id=parameter_id,
                value=defaults.get(parameter_id, 0.0),
            )

    def _get_observation_model(
        self,
    ) -> list[MeasurementChannel]:
        """Get the observation model from the PEtab problem."""
        return [
            MeasurementChannel(
                id_=observable.id,
                name=observable.name or observable.id,
                formula=observable.formula,
                noise_distribution=observable.noise_distribution,
                sigma=observable.noise_formula,
            )
            for observable in self.petab_problem.observables or []
        ]


[docs]
    def import_module(self, force_import: bool = False) -> amici.ModelModule:
        """Import the generated model module.

        The model code is generated first if the output directory does not
        exist yet or if ``force_import`` is set.

        :param force_import:
            Whether to force re-import even if the model module already exists.
        :return: The imported model module.
        """
        must_generate = not self.output_dir.is_dir() or force_import
        if must_generate:
            is_sbml = self.petab_problem.model.type_id == MODEL_TYPE_SBML
            generate = (
                self._do_import_sbml if is_sbml else self._do_import_pysb
            )
            generate()

        if not self._jax:
            return amici.import_model_module(
                self._module_name,
                self.output_dir,
            )

        # JAX: module name and location are derived from the output directory
        return amici.import_model_module(
            Path(self.output_dir).stem, Path(self.output_dir).parent
        )



[docs]
    def create_model(self) -> amici.sim.sundials.Model:
        """
        Create a :class:`amici.sim.sundials.Model` instance from the imported
        model.
        """
        return self.import_module().get_model()



[docs]
    def create_simulator(
        self, force_import: bool = False
    ) -> amici.sim.sundials.petab.PetabSimulator | amici.sim.jax.JAXProblem:
        """
        Create a PEtab simulator for the imported model.

        For JAX models, a ``JAXProblem`` is returned; otherwise a
        ``PetabSimulator`` backed by an ``ExperimentManager``.

        :param force_import:
            Whether to force re-import even if the model module already exists.
        :return: The created PEtab simulator.
        """
        from amici.sim.sundials.petab import ExperimentManager, PetabSimulator

        model_module = self.import_module(force_import=force_import)

        if not self._jax:
            manager = ExperimentManager(
                model=model_module.get_model(),
                petab_problem=self.petab_problem,
            )
            return PetabSimulator(em=manager)

        jax_model = model_module.Model()

        from amici.sim.jax.petab import JAXProblem

        return JAXProblem(jax_model, self.petab_problem)




def _set_default_experiment(
    problem: v2.Problem, id_: str = _DEFAULT_EXPERIMENT_ID
) -> None:
    """Assign a dummy experiment to all measurements without experiment ID.

    If at least one measurement has no experiment ID, a new experiment with
    ID ``id_`` is added to the problem and referenced by those measurements.
    Otherwise, the problem is left untouched.

    :param problem: The PEtab problem. This will be modified in place.
    :param id_: The ID of the dummy experiment to create.
    """
    if all(m.experiment_id is not None for m in problem.measurements):
        # nothing to do
        return

    # create dummy experiment
    problem += v2.core.Experiment(id=id_)

    for measurement in problem.measurements:
        if measurement.experiment_id is not None:
            continue
        measurement.experiment_id = id_



[docs]
def rdatas_to_measurement_df(
    rdatas: Sequence[amici.sim.sundials.ReturnData],
    model: amici.sim.sundials.AmiciModel,
    petab_problem: v2.Problem,
) -> pd.DataFrame:
    """
    Create a PEtab measurement dataframe from simulation results.

    For every row of the problem's measurement table that belongs to the
    experiment of one of the ``rdatas``, the measurement value is replaced
    by the simulated value at the same timepoint and observable.

    :param rdatas:
        A sequence of :class:`amici.sim.sundials.ReturnData`.
    :param model:
        AMICI model used to generate ``rdatas``.
    :param petab_problem:
        The PEtab problem used to generate ``rdatas``.
    :return:
        A dataframe built from simulation results in `rdatas` in the format
        of the PEtab measurement table.
    """
    measurement_df = petab_problem.measurement_df
    observable_ids = model.get_observable_ids()

    simulated_rows = []
    # one rdata per experiment
    for rdata in rdatas:
        experiment_id = rdata.id
        # simulated observables
        simulated = rdata.y
        # output timepoints of the simulation
        timepoints = list(rdata.ts)

        # measurements belonging to this experiment
        experiment_mask = measurement_df[v2.C.EXPERIMENT_ID] == experiment_id

        # note: this way we only generate a dataframe entry for every
        # row that existed in the original dataframe. if we want to
        # e.g. have also timepoints non-existent in the original file,
        # we need to instead iterate over the rdata['y'] entries
        for _, measured_row in measurement_df[experiment_mask].iterrows():
            simulated_row = copy.deepcopy(measured_row)

            # look up the simulated value for this timepoint and observable
            i_time = timepoints.index(measured_row[v2.C.TIME])
            i_observable = observable_ids.index(
                measured_row[v2.C.OBSERVABLE_ID]
            )
            simulated_row[v2.C.MEASUREMENT] = simulated[i_time, i_observable]

            simulated_rows.append(simulated_row)

    return pd.DataFrame(simulated_rows)




[docs]
def rdatas_to_simulation_df(
    rdatas: Sequence[amici.sim.sundials.ReturnData],
    model: amici.sim.sundials.AmiciModel,
    petab_problem: v2.Problem,
) -> pd.DataFrame:
    """
    Create a PEtab simulation dataframe from simulation results.

    This is the result of :func:`rdatas_to_measurement_df` with the
    measurement column renamed to the simulation column, and with the
    default experiment ID replaced by NaN.

    :param rdatas:
        A sequence of :class:`amici.sim.sundials.ReturnData`.
    :param model:
        AMICI model used to generate ``rdatas``.
    :param petab_problem:
        The PEtab problem used to generate ``rdatas``.
    :return:
        A dataframe built from simulation results in `rdatas` in the format
        of the PEtab simulation table.
    """
    simulation_df = rdatas_to_measurement_df(
        rdatas, model, petab_problem
    ).rename(columns={v2.C.MEASUREMENT: v2.C.SIMULATION})

    # revert setting default experiment Id
    uses_default_experiment = (
        simulation_df[v2.C.EXPERIMENT_ID] == _DEFAULT_EXPERIMENT_ID
    )
    simulation_df.loc[uses_default_experiment, v2.C.EXPERIMENT_ID] = np.nan

    return simulation_df




[docs]
def has_timepoint_specific_overrides(
    petab_problem: v2.Problem,
    ignore_scalar_numeric_noise_parameters: bool = False,
    ignore_scalar_numeric_observable_parameters: bool = False,
) -> bool:
    """Check if the measurements have timepoint-specific observable or
    noise parameter overrides.

    The measurements are grouped once by model, experiment and observable,
    and once additionally by observable and noise parameters. If the second
    grouping yields more groups, some observable has differing overrides
    within the same experiment.

    :param petab_problem:
        PEtab problem to check.
    :param ignore_scalar_numeric_noise_parameters:
        ignore scalar numeric assignments to noiseParameter placeholders
    :param ignore_scalar_numeric_observable_parameters:
        ignore scalar numeric assignments to observableParameter
        placeholders
    :return: `True` if the problem has timepoint-specific overrides, `False`
        otherwise.
    """
    if not petab_problem.measurements:
        return False

    from petab.v1.core import get_notnull_columns
    from petab.v1.lint import is_scalar_float

    measurement_df = petab_problem.measurement_df

    # mask numeric values
    for col, allow_scalar_numeric in [
        (
            v2.C.OBSERVABLE_PARAMETERS,
            ignore_scalar_numeric_observable_parameters,
        ),
        (v2.C.NOISE_PARAMETERS, ignore_scalar_numeric_noise_parameters),
    ]:
        if col not in measurement_df:
            continue

        # compare overrides by their string representation
        measurement_df[col] = measurement_df[col].apply(str)

        if allow_scalar_numeric:
            # scalar numeric overrides shall not count as differing
            measurement_df.loc[
                measurement_df[col].apply(is_scalar_float), col
            ] = ""

    # grouping including the parameter overrides
    grouping_cols = get_notnull_columns(
        measurement_df,
        _POSSIBLE_GROUPVARS_FLATTENED_PROBLEM,
    )
    grouped_df = measurement_df.groupby(grouping_cols, dropna=False)

    # grouping without the parameter overrides
    grouping_cols = get_notnull_columns(
        measurement_df,
        [
            v2.C.MODEL_ID,
            v2.C.OBSERVABLE_ID,
            v2.C.EXPERIMENT_ID,
        ],
    )
    # Keep rows with missing IDs here as well. Otherwise, they would only
    # be counted in the grouping above, and the group counts would differ
    # although there are no overrides.
    grouped_df2 = measurement_df.groupby(grouping_cols, dropna=False)

    # data frame has timepoint specific overrides if grouping by noise
    # parameters and observable parameters in addition to observable and
    # experiment id yields more groups
    return len(grouped_df) != len(grouped_df2)



def _get_flattened_id_mappings(
    petab_problem: v2.Problem,
) -> dict[str, str]:
    """Map the observable IDs of the flattened problem to the original IDs.

    :param petab_problem:
        The unflattened PEtab problem.
    :returns:
        A mapping from flattened ID to original observable ID.
    :raises RuntimeError:
        If a newly generated observable ID is already used in the
        observable table.
    """
    from petab.v1.core import (
        get_notnull_columns,
        get_observable_replacement_id,
    )

    groupvars = get_notnull_columns(
        petab_problem.measurement_df, _POSSIBLE_GROUPVARS_FLATTENED_PROBLEM
    )
    existing_ids = {obs.id for obs in petab_problem.observables}
    groups = petab_problem.measurement_df.groupby(groupvars, dropna=False)

    flattened_to_original: dict[str, str] = {}
    for group_key, _ in groups:
        original_id = group_key[groupvars.index(v2.C.OBSERVABLE_ID)]
        flattened_id = get_observable_replacement_id(groupvars, group_key)

        logger.debug(f"Creating synthetic observable {original_id}")

        # a new ID must not clash with an existing observable
        is_new_id = original_id != flattened_id
        if is_new_id and flattened_id in existing_ids:
            raise RuntimeError(
                "could not create synthetic observables "
                f"since {flattened_id} was "
                "already present in observable table"
            )

        flattened_to_original[flattened_id] = original_id

    return flattened_to_original



[docs]
def flatten_timepoint_specific_output_overrides(
    petab_problem: v2.Problem,
) -> None:
    """Flatten timepoint-specific output parameter overrides.

    If the PEtab problem definition has timepoint-specific
    `observableParameters` or `noiseParameters` for the same observable,
    replace those by replicating the respective observable.

    This is a helper function for some tools which may not support such
    timepoint-specific mappings. The observable table and measurement table
    are modified in place.

    :param petab_problem:
        PEtab problem to work on. Modified in place.
    :raises ValueError:
        If a measurement group refers to an observable that is not defined
        in the problem.
    """
    from petab.v1.core import (
        get_notnull_columns,
        get_observable_replacement_id,
    )

    # IDs of the observables defined before flattening. Collected once
    #  instead of rebuilding the observable data frame for every lookup.
    known_observable_ids = {obs.id for obs in petab_problem.observables}

    # Update observables
    def create_new_observable(old_id, new_id) -> Observable:
        """Return a copy of observable ``old_id`` renamed to ``new_id``.

        The placeholders of the copy get the suffix that distinguishes
        ``new_id`` from ``old_id``, and both formulas are updated
        accordingly.
        """
        if old_id not in known_observable_ids:
            raise ValueError(
                f"Observable {old_id} not found in observable table."
            )

        # copy original observable and update ID
        observable: Observable = copy.deepcopy(petab_problem[old_id])
        observable.id = new_id

        # update placeholders
        old_obs_placeholders = observable.observable_placeholders
        old_noise_placeholders = observable.noise_placeholders
        suffix = new_id.removeprefix(old_id)
        observable.observable_placeholders = [
            f"{sym.name}{suffix}" for sym in observable.observable_placeholders
        ]
        observable.noise_placeholders = [
            f"{sym.name}{suffix}" for sym in observable.noise_placeholders
        ]

        # placeholders in formulas
        subs = dict(
            zip(
                old_obs_placeholders,
                observable.observable_placeholders,
                strict=True,
            )
        )
        observable.formula = observable.formula.subs(subs)
        # the noise formula may contain observable placeholders as well as
        #  noise placeholders, so both sets of replacements are applied
        subs |= dict(
            zip(
                old_noise_placeholders,
                observable.noise_placeholders,
                strict=True,
            )
        )
        observable.noise_formula = observable.noise_formula.subs(subs)

        return observable

    # computed from the still unmodified problem
    mappings = _get_flattened_id_mappings(petab_problem)

    petab_problem.observable_tables = [
        v2.ObservableTable(
            [
                create_new_observable(old_id, new_id)
                for new_id, old_id in mappings.items()
            ]
        )
    ]

    # Update measurements
    groupvars = get_notnull_columns(
        petab_problem.measurement_df, _POSSIBLE_GROUPVARS_FLATTENED_PROBLEM
    )
    for measurement_table in petab_problem.measurement_tables:
        for measurement in measurement_table.measurements:
            # TODO: inefficient, but ok for a start
            group_vals = (
                v2.MeasurementTable([measurement])
                .to_df()
                .iloc[0][groupvars]
                .tolist()
            )
            new_obs_id = get_observable_replacement_id(groupvars, group_vals)
            measurement.observable_id = new_obs_id




[docs]
def unflatten_simulation_df(
    simulation_df: pd.DataFrame,
    petab_problem: v2.Problem,
) -> pd.DataFrame:
    """Map simulations of a flattened PEtab problem back to the original.

    A flattened PEtab problem is the output of applying
    :func:`flatten_timepoint_specific_output_overrides` to a PEtab problem.

    :param simulation_df:
        The simulation dataframe. A dataframe in the same format as a PEtab
        measurements table, but with the ``measurement`` column switched
        with a ``simulation`` column.
    :param petab_problem:
        The unflattened PEtab problem.
    :returns:
        A new dataframe in which the flattened observable IDs are replaced
        by the observable IDs of the unflattened PEtab problem.
    """
    flat_to_original = _get_flattened_id_mappings(petab_problem)
    observable_col = v2.C.OBSERVABLE_ID
    restored_ids = simulation_df[observable_col].replace(flat_to_original)
    return simulation_df.assign(**{observable_col: restored_ids})



def _get_fixed_parameters_sbml(
    petab_problem: v2.Problem,
    non_estimated_parameters_as_constants=True,
) -> set[str]:
    """
    Determine the SBML parameters to be treated as constants in AMICI.

    :param petab_problem:
        The PEtab problem instance

    :param non_estimated_parameters_as_constants:
        Whether parameters marked as non-estimated in PEtab should be
        considered constant in AMICI. Setting this to ``True`` will reduce
        model size and simulation times. If sensitivities with respect to those
        parameters are required, this should be set to ``False``.
        Only ``True`` is currently implemented.

    :return:
        Set of IDs of constant SBML parameters without initial assignment
        that are not among the free (estimated) PEtab parameters.

    :raises ValueError:
        If the model of the problem is not an SBML model.
    :raises NotImplementedError:
        If ``non_estimated_parameters_as_constants`` is false.
    """
    if petab_problem.model.type_id != MODEL_TYPE_SBML:
        raise ValueError("Not an SBML model.")

    if not non_estimated_parameters_as_constants:
        raise NotImplementedError(
            "Only non_estimated_parameters_as_constants=True is supported."
        )

    # For amici constants we select everything
    # 1) that is a parameter in AMICI
    # and
    # 2) that is not flagged as estimated in PEtab
    # and
    # 3) for which there is no condition, where this parameter occurs as a
    #    targetId where the targetValue expression contains any estimated
    #    parameters
    #    TODO: if we assume that condition table changes have been converted to
    #     events, we can skip this check. indicator variables are always
    #     literal numbers. right?

    sbml_model = petab_problem.model.sbml_model

    # What will be implemented as a parameter in the amici model?
    candidate_ids: set[str] = set()
    for parameter in sbml_model.getListOfParameters():
        if parameter.getConstant() is not True:
            continue
        # TODO: IAs with literals can be ignored
        # TODO(performance): collect IAs once
        if sbml_model.getInitialAssignmentBySymbol(parameter.getId()) is None:
            candidate_ids.add(parameter.getId())

    return candidate_ids.difference(petab_problem.x_free_ids)


def _add_observation_model_pysb(petab_problem: v2.Problem, jax: bool = False):
    """Extend the PySB model by the PEtab observation model.

    For every observable of the PEtab problem, an expression named like
    the observable (unless an expression of that name already exists) and
    an expression ``<observableId>_sigma`` for its noise formula are added
    to the PySB model. Symbols in the formulas that are not model
    components yet are added to the model as parameters with value 1.0.

    Both the PySB model and the observables of ``petab_problem`` are
    modified in place; the noise formula of each observable is replaced by
    the symbol of its sigma expression.

    :param petab_problem:
        PEtab problem with a PySB model.
    :param jax:
        Currently has no effect; kept for backward compatibility.
    """
    import pysb

    pysb_model: pysb.Model = petab_problem.model.model

    # add any required output parameters
    # maps real-valued symbols to the model components of the same name
    local_syms = {
        sp.Symbol(sp.Symbol.__str__(comp), real=True): comp
        for comp in pysb_model.components
        if isinstance(comp, sp.Symbol)
    }

    def process_formula(sym: sp.Basic) -> sp.Basic:
        """Replace known symbols by model components and add a parameter
        for each remaining free symbol."""
        sym = sym.subs(local_syms)
        for s in sym.free_symbols:
            if isinstance(s, pysb.Component):
                continue
            if not isinstance(s, sp.Symbol):
                raise AssertionError(
                    f"Unexpected symbol type in observable formula: {s}, "
                    f"{type(s)}"
                )
            name = str(s)
            p = pysb.Parameter(name, 1.0, _export=False)
            pysb_model.add_component(p)
            # Register the new parameter, so that the same symbol in
            #  subsequently processed formulas is substituted by it
            #  instead of being added again.
            local_syms[sp.Symbol(name, real=True)] = p
        return sym

    for observable in petab_problem.observables:
        observable.formula = process_formula(observable.formula)
        observable.noise_formula = process_formula(observable.noise_formula)

    # add observables and sigmas to pysb model
    for observable in petab_problem.observables:
        if observable.id in pysb_model.expressions.keys():
            # reuse an existing expression with the ID of the observable
            obs_expr = pysb_model.expressions[observable.id]
        else:
            obs_expr = pysb.Expression(
                observable.id, observable.formula, _export=False
            )
            pysb_model.add_component(obs_expr)
        local_syms[sp.Symbol(observable.id, real=True)] = obs_expr

        sigma_id = f"{observable.id}_sigma"
        sigma_expr = pysb.Expression(
            sigma_id, observable.noise_formula.subs(local_syms), _export=False
        )
        # from now on, the noise model is referenced via the sigma expression
        observable.noise_formula = sp.Symbol(sigma_id, real=True)
        pysb_model.add_component(sigma_expr)
        local_syms[sp.Symbol(sigma_id, real=True)] = sigma_expr


class ExperimentsToPySBConverter:
    """
    Convert PEtab experiments to amici events and PySB initials.

    See :meth:`convert` for details.
    """

    #: ID of the parameter that indicates whether the model is in
    #  the pre-equilibration phase (1) or not (0).
    PREEQ_INDICATOR = "_petab_preequilibration_indicator"

    #: The condition ID of the condition that sets the
    #: pre-equilibration indicator to 1.
    CONDITION_ID_PREEQ_ON = "_petab_preequilibration_on"

    #: The condition ID of the condition that sets the
    #: pre-equilibration indicator to 0.
    CONDITION_ID_PREEQ_OFF = "_petab_preequilibration_off"

    def __init__(self, petab_problem: v2.Problem):
        """Initialize the converter.

        :param petab_problem:
            The PEtab problem to convert.
            This will not be modified by this class.
        :raises NotImplementedError:
            If the problem has more than one model, if a condition changes
            a compartment size, if a target value contains symbols other
            than PEtab or PySB parameters, or if a PEtab or PySB parameter
            is the target of a condition change.
        :raises ValueError:
            If the model of the problem is not a PySB model.
        """
        from petab.v2.models.pysb_model import PySBModel

        if len(petab_problem.models) > 1:
            #  https://github.com/PEtab-dev/libpetab-python/issues/392
            raise NotImplementedError(
                "Only single-model PEtab problems are supported."
            )
        if not isinstance(petab_problem.model, PySBModel):
            raise ValueError("Only PySB models are supported.")
        model = petab_problem.model.model
        compartment_ids = {c.name for c in model.compartments}
        if compartment_ids and any(
            change.target_id in compartment_ids
            for cond in petab_problem.conditions
            for change in cond.changes
        ):
            # BNG evaluates compartment sizes during network generation.
            #  Changing those values later on will lead to incorrect results.
            raise NotImplementedError(
                "Changes to compartment sizes are not supported for PySB "
                "models."
            )

        # For the moment, we only support changes that are time-constant
        #  expressions, i.e., that only contain numbers or pysb.Parameters.
        # Furthermore, we only support changing species and pysb.Expressions,
        #  but not pysb.Parameter. (Expressions can be easily changed, but
        #  we can't easily convert a Parameter to an Expression, because we
        #  can't remove components from a PySB model. This either
        #  requires deeper integration with `pysb2amici`, or we need to
        #  recreate the PySB model.)
        parameter_ids = set(petab_problem.x_ids) | {
            p.name for p in model.parameters
        }

        for cond in petab_problem.conditions:
            for change in cond.changes:
                if (
                    set(map(str, change.target_value.free_symbols))
                    - parameter_ids
                ):
                    # TODO: we can't just change Parameter to Expression in
                    #  this case.
                    #  Expressions are evaluated continuously during the
                    #  simulation. i.e., to only set the initial value, we need
                    #  to replace all dynamic constructs by their initials.
                    # TODO: we may have to convert some parameters and
                    #  expressions to state variables,
                    #  otherwise we can't use them as event targets.
                    #  This will require deeper integration of PEtab and PySB
                    #  import
                    raise NotImplementedError(
                        "Currently, only time-constant targetValue expressions"
                        f" are supported. Got {str(change.target_value)!r} "
                        f"for target {change.target_id!r}."
                    )
                if change.target_id in parameter_ids:
                    raise NotImplementedError(
                        "Currently, PySB parameters are not supported as "
                        "targets of condition table changes. Replace "
                        f"parameter {change.target_id!r} by a pysb.Expression."
                    )
        #: The PEtab problem to convert. Not modified by this class.
        self._petab_problem = petab_problem
        # events created by the most recent conversion
        self._events: list[Event] = []
        # the converted copy of the problem; set by `convert`
        self._new_problem: v2.Problem | None = None

    @staticmethod
    def _get_experiment_indicator_condition_id(experiment_id: str) -> str:
        """Get the condition ID for the experiment indicator parameter."""
        return f"_petab_experiment_condition_{experiment_id}"

    def convert(
        self,
    ) -> tuple[v2.Problem, list[Event]]:
        """Convert PEtab experiments to amici events and pysb initials.

        Works on a deep copy of the PEtab problem passed to the
        constructor: the pre-equilibration indicator is added to the model,
        every experiment is converted, and the condition table is reduced
        to the conditions that set the indicator parameters. The resulting
        problem is validated and the validation results are logged.

        :returns:
            A PEtab problem with only indicator parameters left in the
            condition table and a maximum of two periods per experiment
            (pre-equilibration and main simulation), and a list of events
            to be passed to `pysb2amici`.
        """
        # start from a clean state, so that repeated calls are independent
        self._events = []
        self._new_problem = copy.deepcopy(self._petab_problem)

        self._add_preequilibration_indicator()
        for current_experiment in self._new_problem.experiments:
            self._convert_experiment(current_experiment)
        self._add_indicators_to_conditions()

        self._new_problem.validate().log()

        return self._new_problem, self._events

    def _convert_experiment(self, experiment: v2.Experiment) -> None:
        """
        Convert a single experiment to amici events or PySB initials.

        An indicator parameter for the experiment is added to the model.
        Changes of the first period are turned into piecewise expressions
        that are gated by this indicator and fall back to the current
        value; they replace the respective PySB expression or the value of
        the respective initial. Changes of all later periods are encoded as
        events via :meth:`_create_period_start_event`.
        Finally, the periods of the experiment are reduced to the
        pre-equilibration period (if any) and the first other period, and
        their conditions are replaced by the indicator conditions.

        :param experiment:
            The experiment to convert. Modified in place.
        :raises ValueError:
            If the model already has a component named like the experiment
            indicator parameter.
        """
        import pysb

        model: pysb.Model = self._new_problem.model.model
        experiment.sort_periods()
        has_preequilibration = experiment.has_preequilibration
        # mapping table mappings
        self.map_petab_to_pysb = {
            mapping.petab_id: mapping.model_id
            for mapping in self._petab_problem.mappings
            if mapping.petab_id is not None and mapping.model_id is not None
        }
        self.map_pysb_to_petab = {
            mapping.model_id: mapping.petab_id
            for mapping in self._petab_problem.mappings
            if mapping.petab_id is not None and mapping.model_id is not None
        }

        # add experiment indicator
        exp_ind_id = self.get_experiment_indicator(experiment.id)
        if exp_ind_id in map(str, model.components):
            raise ValueError(
                f"The model has entity with ID `{exp_ind_id}`. "
                "IDs starting with `petab_` are reserved for "
                f"{self.__class__.__name__} and should not be used in the "
                "model."
            )
        self._add_parameter(exp_ind_id, 0)
        kept_periods: list[ExperimentPeriod] = []
        # Collect values for initial assignments for the different experiments.
        #  All expressions must be combined into a single initial assignment
        #  per target.
        # target_id -> [(experiment_indicator, target_value), ...]
        period0_assignments: dict[str, list[tuple[str, sp.Basic]]] = {}

        for i_period, period in enumerate(experiment.sorted_periods):
            if period.is_preequilibration:
                # pre-equilibration cannot be encoded as event,
                #  so we need to keep this period in the Problem.
                kept_periods.append(period)
            elif i_period == int(has_preequilibration):
                # we always keep the first non-pre-equilibration period
                #  to set the indicator parameters
                kept_periods.append(period)
            elif not period.condition_ids:
                # no condition, no changes, no need for an event,
                #  no need to keep the period unless it's the pre-equilibration
                #  or the only non-equilibration period (handled above)
                continue

            # Encode the period changes as events
            #  that trigger at the start of the period or,
            #  for the first period, as pysb.Initials.
            #  pysb.Initials are required for the first period,
            #  because other initial assignments may depend on
            #  the changed values.
            if i_period == 0:
                for change in self._new_problem.get_changes_for_period(period):
                    period0_assignments.setdefault(
                        change.target_id, []
                    ).append((exp_ind_id, change.target_value))
            else:
                self._create_period_start_event(
                    experiment=experiment,
                    i_period=i_period,
                    period=period,
                )

        # Create initials for the first period
        if period0_assignments:
            free_symbols_in_assignments = set()
            for target_id, changes in period0_assignments.items():
                # name of the target in the PySB model
                model_target_id = self.map_petab_to_pysb.get(
                    target_id, target_id
                )
                # The initial value might only be changed for a subset of
                #  experiments. We need to keep the original initial value
                #  for all other experiments.
                target_entity = None
                try:
                    target_entity = next(
                        c for c in model.components if c.name == model_target_id
                    )
                    if isinstance(target_entity, pysb.Parameter):
                        default = target_entity.value
                    elif isinstance(target_entity, pysb.Expression):
                        default = target_entity.expr
                    else:
                        raise AssertionError(target_id)
                except StopIteration:
                    # species pattern?
                    for initial in model.initials:
                        if str(initial.pattern) == model_target_id:
                            default = initial.value
                            break
                    else:
                        raise AssertionError(target_id)

                # Only create the initial assignment if there is
                #  actually something to change.
                if expr_cond_pairs := [
                    (target_value, sp.Symbol(exp_ind) > 0.5)
                    for exp_ind, target_value in changes
                    if target_value != default
                ]:
                    # Unlike events, we can't have different initial
                    #  assignments for different experiments, so we need to
                    #  combine all changes into a single piecewise
                    #  expression.
                    expr = sp.Piecewise(
                        *expr_cond_pairs,
                        (default, True),
                    )

                    # Update the target expression
                    if target_entity is not None and isinstance(
                        target_entity, pysb.Expression
                    ):
                        # The formula of a pysb.Expression is stored in
                        #  `expr` (this is also where the default was read
                        #  from above), so this is the attribute to update.
                        target_entity.expr = expr
                    else:
                        # if the target is not an expression, it must be an
                        #  initial. the rest is excluded in __init__
                        # TODO (performance): It might be more efficient
                        #  to handle this as multi-model problem.
                        #  Individual models might result in smaller networks
                        #  than the superset model required here.
                        for initial in model.initials:
                            if str(initial.pattern) == model_target_id:
                                # Initial.value needs to be parameter or
                                # expression, we can't use piecewise directly
                                expr_expr = pysb.Expression(
                                    f"_petab_initial_{target_id}",
                                    expr,
                                    _export=False,
                                )
                                model.add_component(expr_expr)
                                initial.value = expr_expr
                                break
                        else:
                            raise AssertionError(target_id, target_entity)
                    free_symbols_in_assignments |= expr.free_symbols

            # the target value may depend on parameters that are only
            #  introduced in the PEtab parameter table - those need
            #  to be added to the model
            for sym in free_symbols_in_assignments:
                if model.parameters.get(sym.name) is None:
                    self._add_parameter(sym.name, 0)

        if len(kept_periods) > 2:
            raise AssertionError("Expected at most two periods to be kept.")

        # add conditions that set the indicator parameters
        for period in kept_periods:
            period.condition_ids = [
                self._get_experiment_indicator_condition_id(experiment.id),
                self.CONDITION_ID_PREEQ_ON
                if period.is_preequilibration
                else self.CONDITION_ID_PREEQ_OFF,
            ]

        experiment.periods = kept_periods

    def _create_period_start_event(
        self,
        experiment: v2.Experiment,
        i_period: int,
        period: ExperimentPeriod,
    ):
        """Create the event that applies the changes of a period at its
        start and append it to the list of events.

        :param experiment: The experiment the period belongs to.
        :param i_period: Index of the period; used for the event ID.
        :param period: The period whose changes become event assignments.
        :raises AssertionError:
            If the target of a change is not contained in the parameters
            of the PySB model.
        """
        experiment_indicator = sp.Symbol(
            self.get_experiment_indicator(experiment.id)
        )
        preeq_indicator = sp.Symbol(self.PREEQ_INDICATOR)

        # Create trigger expressions
        # Since handling of == and !=, and distinguishing < and <=
        # (and > and >=), is a bit tricky in terms of root-finding,
        # we use these slightly more convoluted expressions.
        # (assuming that the indicator parameters are {0, 1})
        trigger_terms = (
            [experiment_indicator - 0.5, preeq_indicator - 0.5]
            if period.is_preequilibration
            else [
                experiment_indicator - 0.5,
                0.5 - preeq_indicator,
                amici_time_symbol - period.time,
            ]
        )
        root_fun = sp.Min(*trigger_terms)

        pysb_model = self._new_problem.model.model
        assignments: dict[sp.Symbol, sp.Expr] = {}
        for change in self._new_problem.get_changes_for_period(period):
            if change.target_id not in pysb_model.parameters:
                raise AssertionError(change)

            assignments[sp.Symbol(change.target_id)] = change.target_value
            # add any missing parameters
            for free_symbol in change.target_value.free_symbols:
                if free_symbol.name not in pysb_model.parameters:
                    self._add_parameter(free_symbol.name, 0)

        event_id = f"_petab_event_{experiment.id}_{i_period}"
        self._events.append(
            Event(
                symbol=sp.Symbol(event_id),
                name=event_id,
                value=root_fun,
                assignments=assignments,
                initial_value=False,
                use_values_from_trigger_time=False,
            )
        )

    def _add_parameter(self, par_id: str, value: float) -> None:
        """Create a PySB parameter and add it to the model of the converted
        problem.

        :param par_id: Name of the new parameter.
        :param value: Value of the new parameter.
        """
        import pysb

        new_parameter = pysb.Parameter(par_id, value, _export=False)
        pysb_model = self._new_problem.model.model
        pysb_model.add_component(new_parameter)

    def _add_preequilibration_indicator(
        self,
    ) -> None:
        """Add the pre-equilibration indicator parameter to the PySB model.

        The parameter is created with value 0.

        :raises ValueError:
            If the model already has a component with that ID.
        """
        par_id = self.PREEQ_INDICATOR
        components = self._new_problem.model.model.components
        if any(str(component) == par_id for component in components):
            raise ValueError(
                f"Entity with ID {par_id} already exists in the model."
            )

        # add the pre-steady-state indicator parameter
        self._add_parameter(par_id, 0.0)

    @staticmethod
    def get_experiment_indicator(experiment_id: str) -> str:
        """The ID of the experiment indicator parameter.

        The experiment indicator parameter is used to identify the
        experiment in the SBML model. It is a parameter that is set
        to 1 for the current experiment and 0 for all other
        experiments. The parameter is used in the event trigger
        to determine whether the event should be triggered.

        :param experiment_id: The ID of the experiment for which to create
            the experiment indicator parameter ID.
        """
        return f"_petab_experiment_indicator_{experiment_id}"

    def _add_indicators_to_conditions(self) -> None:
        """Replace the condition table by the indicator conditions.

        Adds one condition each for switching the pre-equilibration
        indicator on and off, and one condition per experiment that sets
        the respective experiment indicator to 1. Afterwards, all
        conditions whose ID does not start with ``_petab`` are removed.
        """
        from petab.v2 import Change, Condition, ConditionTable

        problem = self._new_problem

        def indicator_condition(condition_id, indicator_id, value):
            # a condition that assigns a single indicator parameter
            return Condition(
                id=condition_id,
                changes=[Change(target_id=indicator_id, target_value=value)],
            )

        # create conditions for indicator parameters
        problem += indicator_condition(
            self.CONDITION_ID_PREEQ_ON, self.PREEQ_INDICATOR, 1
        )
        problem += indicator_condition(
            self.CONDITION_ID_PREEQ_OFF, self.PREEQ_INDICATOR, 0
        )

        # add conditions for the experiment indicators
        for experiment in problem.experiments:
            problem += indicator_condition(
                self._get_experiment_indicator_condition_id(experiment.id),
                self.get_experiment_indicator(experiment.id),
                1,
            )

        #  All changes have been encoded in event assignments and can be
        #  removed. Only keep the conditions setting our indicators.
        indicator_conditions = [
            condition
            for condition in problem.conditions
            if condition.id.startswith("_petab")
        ]
        problem.condition_tables = [ConditionTable(indicator_conditions)]