# Source code for pybop.costs.base_cost

from typing import Optional, Union

import numpy as np
from SALib.analyze import sobol
from SALib.sample.sobol import sample

from pybop import BaseProblem
from pybop._utils import add_spaces
from pybop.parameters.parameter import Inputs, Parameters



class BaseCost:
    """
    Base class for defining cost functions.

    Parameters
    ----------
    problem : object
        A problem instance containing the data and functions necessary for
        evaluating the cost function.
    target : array-like
        An array containing the target data to fit.
    n_outputs : int
        The number of outputs in the model.
    has_separable_problem : bool
        If True, the problem is separable from the cost function and will be
        evaluated in advance of the call to self.compute() (default: False).
    _de : float
        The gradient of the cost function to use if an error occurs during
        evaluation. Defaults to 1.0.
    minimising : bool, optional
        If False, tells the optimiser to switch the sign of the cost and gradient
        to maximise by default rather than minimise (default: True).
    """


    class DeferredPrediction:
        """
        Sentinel type indicating that a prediction has not been made yet but is
        expected to be produced during the cost call.

        ``single_call`` hands this class to ``compute`` in place of the prediction
        (and of its sensitivities, when a gradient is requested) whenever the
        problem is not evaluated ahead of ``compute``.
        """


    def __init__(self, problem: Optional[BaseProblem] = None):
        """
        Initialise the cost and, if a problem is given, bind the cost to it.

        Parameters
        ----------
        problem : BaseProblem, optional
            The problem whose target, parameters, number of outputs and signal
            are adopted by this cost. If it is not a ``BaseProblem`` instance
            (e.g. None), only the default attributes below are set.
        """
        # Defaults that exist on every cost, with or without a problem
        self._parameters = Parameters()
        self.problem = problem
        self.verbose = False
        self._has_separable_problem = False
        self.y = None
        self.dy = None
        self._de = 1.0  # value used to fill the fail gradient
        self.minimising = True

        # NOTE: `_target`, `n_outputs`, `signal` and `grad_fail` are only defined
        # when a BaseProblem is supplied.
        if isinstance(self.problem, BaseProblem):
            self._target = self.problem.target
            self._parameters.join(self.problem.parameters)
            self.n_outputs = self.problem.n_outputs
            self.signal = self.problem.signal
            # The problem is evaluated in single_call() ahead of compute()
            self._has_separable_problem = True
            self.grad_fail = None
            # Size the fail gradient to the parameters joined above
            self.set_fail_gradient()


    def __call__(
        self,
        inputs: Union[Inputs, list, np.ndarray],
        calculate_grad: bool = False,
    ) -> Union[float, list, tuple[float, np.ndarray], list[tuple[float, np.ndarray]]]:
        """
        Compute cost and optional gradient for given input parameters.

        Parameters
        ----------
        inputs : Union[Inputs, list, np.ndarray]
            Input parameters for cost computation. Supports list-like evaluation of
            multiple input values, shaped [N,M] where N is the number of input positions
            to evaluate and M is the number of inputs for the underlying model (i.e. parameters).
        calculate_grad : bool, default=False
            If True, both the cost and gradient will be computed. Otherwise, only the
            cost is computed.

        Returns
        -------
        Union[float, list, tuple[float, np.ndarray], list[tuple[float, np.ndarray]]]
            - Single input, no gradient: float
            - Multiple inputs, no gradient: list[float]
            - Single input with gradient: tuple[float, np.ndarray]
            - Multiple inputs with gradient: list[tuple[float, np.ndarray]]
        """
        # Convert dict to list for sequential computations
        if isinstance(inputs, dict):
            inputs = list(inputs.values())
        inputs_list = np.atleast_2d(inputs)

        results = []
        for inputs in inputs_list:
            result = self.single_call(inputs, calculate_grad=calculate_grad)
            results.append(result)

        return results[0] if len(inputs_list) == 1 else results



    def single_call(
        self,
        inputs: Union[Inputs, np.ndarray],
        calculate_grad: bool,
    ) -> Union[float, tuple[float, np.ndarray]]:
        """Evaluate the cost and (optionally) the gradient for a single set of inputs."""
        model_inputs = self.parameters.verify(inputs)
        self.parameters.update(values=list(model_inputs.values()))

        y = self.DeferredPrediction
        dy = self.DeferredPrediction if calculate_grad else None

        if self._has_separable_problem:
            if calculate_grad:
                y, dy = self.problem.evaluateS1(self.problem.parameters.as_dict())
                return self.compute(y, dy=dy)

            y = self.problem.evaluate(self.problem.parameters.as_dict())

        return self.compute(y, dy=dy)



    def compute(self, y: dict, dy: Optional[np.ndarray]):
        """
        Compute the cost and, if dy is not None, its gradient with respect to the
        parameters.

        This method only computes the cost, without calling the `problem.evaluate()`.
        This method must be implemented by subclasses.

        Parameters
        ----------
        y : dict
            A dictionary of predictions with keys designating the signals for fitting.
        dy : np.ndarray, optional
            The corresponding gradient with respect to the parameters for each signal.

        Raises
        ------
        NotImplementedError
            If the method has not been implemented by the subclass.
        """
        raise NotImplementedError



    def sensitivity_analysis(self, n_samples: int = 256):
        """
        Compute the sensitivity of the cost function to each parameter using
        Sobol analysis from the SALib module [1].

        The parameter names and bounds of this cost define the SALib problem,
        SALib draws the sample positions, and the cost is evaluated at every
        sampled position before the results are analysed.

        Parameters
        ----------
        n_samples : int, optional
            Number of samples for the Sobol sensitivity analysis; performs best
            as a power of 2, i.e. 128, 256, etc.

        References
        ----------
        .. [1] Iwanaga, T., Usher, W., & Herman, J. (2022). Toward SALib 2.0:
               Advancing the accessibility and interpretability of global sensitivity
               analyses. Socio-Environmental Systems Modelling, 4, 18155. doi:10.18174/sesmo.18155

        Returns
        -------
        Sensitivities : dict
        """
        cost_parameters = self.parameters

        # Problem definition in the form expected by SALib
        salib_problem = {
            "names": cost_parameters.keys(),
            "bounds": cost_parameters.get_bounds_for_plotly(),
            "num_vars": len(cost_parameters.keys()),
        }

        sample_positions = sample(salib_problem, n_samples)

        # Evaluate the cost (without gradient) at every sampled position
        sampled_costs = np.asarray(self(sample_positions))
        return sobol.analyze(salib_problem, sampled_costs)



    def set_fail_gradient(self, de: float = 1.0):
        """
        Set the fail gradient to a specified value.

        The fail gradient is used if an error occurs during the calculation
        of the gradient. This method allows updating the default gradient value.

        Parameters
        ----------
        de : float
            The new fail gradient value to be used.
        """
        if not isinstance(de, float):
            de = float(de)
        self._de = de
        self.grad_fail = self._de * np.ones(self.n_parameters)



    def verify_prediction(self, y: dict):
        """
        Verify that the prediction matches the target data.

        Parameters
        ----------
        y : dict
            A dictionary of predictions with keys designating the signals for fitting.

        Returns
        -------
        bool
            True if the prediction matches the target data, otherwise False.
        """
        if any(
            len(y.get(key, [])) != len(self._target.get(key, [])) for key in self.signal
        ):
            return False

        return True



    def join_parameters(self, parameters):
        """
        Setter for joining parameters. This method sets the fail gradient if the join adds parameters.
        """
        original_n_params = self.n_parameters
        self._parameters.join(parameters)
        if original_n_params != self.n_parameters:
            self.set_fail_gradient()



    def stack_sensitivities(self, dy) -> np.ndarray:
        """
        Stack the sensitivities for each signal and parameter into a single array.

        Parameters
        ----------
        dict[str, dict[str, np.ndarray[np.float64]]]
            A dictionary of the sensitivities dy/dx(t) for each parameter x and signal y.

        Returns
        -------
        np.ndarray[np.float64]
            The combined sensitivities dy/dx(t) for each parameter and signal, with
            dimensions of (len(parameters), len(signal), len(domain_data)).
        """
        return np.stack(
            [
                np.row_stack([dy[key][signal] for signal in self.signal])
                for key in dy.keys()
            ],
            axis=0,
        )


    @property
    def name(self):
        """The class name of this cost, passed through ``add_spaces``."""
        return add_spaces(type(self).__name__)


    @property

[docs]
    def n_parameters(self):
        return len(self._parameters)


    @property

[docs]
    def has_separable_problem(self):
        return self._has_separable_problem


    @property

[docs]
    def target(self):
        return self._target


    @property

[docs]
    def parameters(self):
        return self._parameters


    @parameters.setter
    def parameters(self, parameters):
        self._parameters = parameters

    @property

[docs]
    def pybamm_solution(self):
        return self.problem.pybamm_solution if self.problem is not None else None