Add Hessian check for 2-parameter problems #363

Merged: 36 commits from 362-Hessian-check into develop, Dec 20, 2024
Changes from 23 commits
Commits (36)
4cb590c
Add Hessian check
NicolaCourtier Jun 14, 2024
2f5546a
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Jul 5, 2024
7dfe8df
Update test_classification.py
NicolaCourtier Jul 5, 2024
dcb05e3
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Jul 11, 2024
f15a2e5
Update to implicitly concatenated strings
NicolaCourtier Jul 11, 2024
1e465b1
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Jul 23, 2024
d857a7f
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Aug 1, 2024
1687e11
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Aug 22, 2024
9abb814
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Sep 18, 2024
acbb460
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Sep 18, 2024
7e01c8d
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Oct 11, 2024
21b6c77
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Nov 18, 2024
6004bd3
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Nov 20, 2024
2caf175
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 5, 2024
3845313
Update test_classification
NicolaCourtier Dec 5, 2024
7dec246
Add tests on insensitivity
NicolaCourtier Dec 6, 2024
3dbf32f
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 6, 2024
a8ab96b
Rename x_range
NicolaCourtier Dec 6, 2024
dcdb410
Update CHANGELOG.md
NicolaCourtier Dec 6, 2024
bdce4a8
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 6, 2024
94be059
Remove print(eigr)
NicolaCourtier Dec 6, 2024
e2198a9
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 6, 2024
7f1fea2
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 6, 2024
b2d59ff
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 17, 2024
53f0100
Fix typo
NicolaCourtier Dec 17, 2024
d61c77a
Remove print
NicolaCourtier Dec 17, 2024
2525716
Update input to OptimisationResult
NicolaCourtier Dec 18, 2024
55bad4c
Improve insensitivity tests
NicolaCourtier Dec 18, 2024
cc3dc84
Improve correlation checks
NicolaCourtier Dec 18, 2024
083f4a9
Merge branch 'develop' into 362-Hessian-check
NicolaCourtier Dec 18, 2024
e9c35bf
Update in line with OptimisationResult
NicolaCourtier Dec 18, 2024
c8ac039
Make one test a unit test
NicolaCourtier Dec 19, 2024
6ed9ab3
style: pre-commit fixes
pre-commit-ci[bot] Dec 19, 2024
14e00a2
Rename test file
NicolaCourtier Dec 19, 2024
c1c60ff
Update function name
NicolaCourtier Dec 20, 2024
bac1082
Check bounds proximity if infinite cost
NicolaCourtier Dec 20, 2024
1 change: 1 addition & 0 deletions CHANGELOG.md
@@ -2,6 +2,7 @@

## Features

- [#362](https://github.com/pybop-team/PyBOP/issues/362) - Adds the `classify_using_Hessian` functionality to classify the optimised result.
- [#571](https://github.com/pybop-team/PyBOP/pull/571) - Adds Multistart functionality to optimisers via initialisation arg `multistart`
- [#582](https://github.com/pybop-team/PyBOP/pull/582) - Fixes `population_size` arg for Pints' based optimisers, reshapes `parameters.rvs` to be parameter instances.
- [#570](https://github.com/pybop-team/PyBOP/pull/570) - Updates the contour and surface plots, adds mixed chain effective sample size computation, x0 to optim.log
117 changes: 117 additions & 0 deletions pybop/_classification.py
@@ -0,0 +1,117 @@
import numpy as np


def classify_using_Hessian(optim, x=None, epsilon=1e-2):
"""
A simple check for parameter correlations based on numerical approximation
of the Hessian matrix at the optimal point using central finite differences.

Paramters
NicolaCourtier marked this conversation as resolved.
Show resolved Hide resolved
---------
x : array-like, optional
The parameters values assumed to be the optimal point (default: optim.result.x).
epsilon : float, optional
A small positive value used to check proximity to the parameter bounds and as the
perturbation distance used in the finite difference calculations (default: 1e-2).
"""

    if x is None:
        x = optim.result.x
        final_cost = optim.result.final_cost
    else:
        final_cost = optim.cost(x)

    n = len(x)
    if n != 2:
        raise ValueError(
            "The function classify_using_Hessian currently only works"
            " in the case of 2 parameters."
        )

    # Get a list of parameter names for use in the output message
    names = list(optim.cost.parameters.keys())

    # Evaluate the cost for a grid of surrounding points
    dx = x * epsilon
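    # Note: the perturbation is relative, so any parameter whose optimal value
    # is exactly zero receives a zero perturbation and cannot vary on the grid.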
    costs = np.zeros((3, 3, 2))
    for i in range(3):
        for j in range(3):
            if i == j == 1:
                costs[1, 1, 0] = final_cost
                costs[1, 1, 1] = final_cost
            else:
                costs[i, j, 0] = optim.cost(x + np.multiply([i - 1, j - 1], dx))
                costs[i, j, 1] = optim.cost(x + np.multiply([i - 1, j - 1], 2 * dx))
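    # costs[i, j, k] now holds the cost at x + (i - 1, j - 1) * (k + 1) * dx,
    # i.e. a 3x3 grid of points at two perturbation scales (dx and 2 * dx).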

    # Classify the result
    if (optim.minimising and np.any(costs < final_cost)) or (
        not optim.minimising and np.any(costs > final_cost)
    ):
        message = "The optimiser has not converged to a stationary point."

        # Check proximity to bounds
        bounds = optim.cost.parameters.get_bounds()
        if bounds is not None:
            for i, value in enumerate(x):
                x_range = bounds["upper"][i] - bounds["lower"][i]
                if value > bounds["upper"][i] - epsilon * x_range:
                    message += f" The result is near the upper bound of {names[i]}."

                if value < bounds["lower"][i] + epsilon * x_range:
                    message += f" The result is near the lower bound of {names[i]}."
    else:
        # Estimate the Hessian using second-order accurate central finite differences
        # cfd_hessian = np.zeros((2, 2))
        # cfd_hessian[0, 0] = costs[2,1,0] - 2 * costs[1,1,0] + costs[0,1,0]
        # cfd_hessian[0, 1] = (costs[2,2,0] - costs[2,0,0] + costs[0,0,0] - costs[0,2,0]) / 4
        # cfd_hessian[1, 0] = cfd_hessian[0, 1]
        # cfd_hessian[1, 1] = costs[1,2,0] - 2 * costs[1,1,0] + costs[1,0,0]

        # Estimate the Hessian using fourth-order accurate central finite differences
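        # Five-point stencil for a fourth-order accurate second derivative:
        #   f''(x) ≈ (-f(x+2h) + 16 f(x+h) - 30 f(x) + 16 f(x-h) - f(x-2h)) / (12 h^2)
        # The 1/h^2 factor is not applied here, so each entry is a raw cost
        # variation at relative scale epsilon; the classification below compares
        # these entries against the matching tolerance epsilon**2 * final_cost.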
        cfd_hessian = np.zeros((2, 2))
        cfd_hessian[0, 0] = (
            -costs[2, 1, 1]
            + 16 * costs[2, 1, 0]
            - 30 * costs[1, 1, 0]
            + 16 * costs[0, 1, 0]
            - costs[0, 1, 1]
        ) / 12
        cfd_hessian[0, 1] = (
            -(costs[2, 2, 1] - costs[2, 0, 1] + costs[0, 0, 1] - costs[0, 2, 1])
            + 16 * (costs[2, 2, 0] - costs[2, 0, 0] + costs[0, 0, 0] - costs[0, 2, 0])
        ) / 48
        cfd_hessian[1, 0] = cfd_hessian[0, 1]
        cfd_hessian[1, 1] = (
            -costs[1, 2, 1]
            + 16 * costs[1, 2, 0]
            - 30 * costs[1, 1, 0]
            + 16 * costs[1, 0, 0]
            - costs[1, 0, 1]
        ) / 12

        # Compute the eigenvalues, returned in ascending order
        eigr = np.linalg.eigh(cfd_hessian)
        eigenvalues = eigr.eigenvalues

        # Classify the result
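        # The sign pattern of the eigenvalues determines the nature of the
        # stationary point: both positive implies a minimum, both negative a
        # maximum, and mixed signs a saddle point.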
        cost_tolerance = epsilon**2 * final_cost
        if np.all(eigenvalues > cost_tolerance):
            message = "The optimiser has located a minimum."
        elif np.all(eigenvalues < -cost_tolerance):
            message = "The optimiser has located a maximum."
        elif np.all(np.abs(eigenvalues) > cost_tolerance):
            message = "The optimiser has located a saddle point."

        else:
            # At least one eigenvalue is too small to classify with certainty
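            # A near-zero eigenvalue marks a direction in which the cost is
            # locally flat. If that direction aligns with a parameter axis, the
            # cost is insensitive to that parameter; otherwise the parameters
            # trade off against each other along it, suggesting a correlation.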
            if np.all(np.abs(eigenvalues) < cost_tolerance):
                message = "The cost is insensitive to these parameters."
            # Eigenvectors are returned as columns; column 0 corresponds to the
            # smallest eigenvalue
            elif np.allclose(eigr.eigenvectors[:, 0], np.array([1, 0])):
                message = f"The cost is insensitive to {names[0]}."
            elif np.allclose(eigr.eigenvectors[:, 0], np.array([0, 1])):
                message = f"The cost is insensitive to {names[1]}."
            else:
                message = "There may be a correlation between these parameters."

    print(message)
    return message
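For context, here is a minimal usage sketch of the new check, assuming a two-parameter fitting setup like the one in the tests below; model, parameters and dataset are placeholders for your own objects:

import pybop
from pybop._classification import classify_using_Hessian

# Build a two-parameter fitting problem (placeholder objects assumed above)
problem = pybop.FittingProblem(model, parameters, dataset)
cost = pybop.RootMeanSquaredError(problem)

# Run the optimiser, then classify the result at the optimised point
optim = pybop.XNES(cost=cost)
optim.run()
message = classify_using_Hessian(optim)  # e.g. "The optimiser has located a minimum."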
198 changes: 198 additions & 0 deletions tests/integration/test_classification.py
@@ -0,0 +1,198 @@
import numpy as np
import pytest
from pybamm import Parameter

import pybop
from pybop._classification import classify_using_Hessian


class TestClassification:
    """
    A class to test the classification of different optimisation results.
    """

    @pytest.fixture(
        params=[
            np.asarray([0.05, 0.05]),
            np.asarray([0.1, 0.05]),
            np.asarray([0.05, 0.01]),
        ]
    )
    def parameters(self, request):
        ground_truth = request.param
        return pybop.Parameters(
            pybop.Parameter(
                "R0 [Ohm]",
                prior=pybop.Gaussian(0.05, 0.01),
                bounds=[0.02, 0.08],
                true_value=ground_truth[0],
            ),
            pybop.Parameter(
                "R1 [Ohm]",
                prior=pybop.Gaussian(0.05, 0.01),
                bounds=[0.02, 0.08],
                true_value=ground_truth[1],
            ),
        )

    @pytest.fixture
    def parameter_set(self):
        parameter_set = pybop.ParameterSet(
            json_path="examples/parameters/initial_ecm_parameters.json"
        )
        parameter_set.import_parameters()
        parameter_set.params.update({"C1 [F]": 1000})
        return parameter_set

    @pytest.fixture
    def model(self, parameter_set, parameters):
        parameter_set.params.update(parameters.as_dict(parameters.true_value()))
        return pybop.empirical.Thevenin(parameter_set=parameter_set)

    @pytest.fixture
    def dataset(self, model):
        experiment = pybop.Experiment(
            [
                (
                    "Discharge at 0.5C for 2 minutes (4 seconds period)",
                    "Charge at 0.5C for 2 minutes (4 seconds period)",
                ),
            ]
        )
        solution = model.predict(experiment=experiment)
        return pybop.Dataset(
            {
                "Time [s]": solution["Time [s]"].data,
                "Current function [A]": solution["Current [A]"].data,
                "Voltage [V]": solution["Voltage [V]"].data,
            }
        )

    @pytest.fixture
    def problem(self, model, parameters, dataset):
        return pybop.FittingProblem(model, parameters, dataset)

    @pytest.mark.integration
    def test_classify_using_Hessian(self, problem):
        cost = pybop.RootMeanSquaredError(problem)
        optim = pybop.XNES(cost=cost)

        x = np.asarray(cost.parameters.true_value())
        bounds = cost.parameters.get_bounds()
        optim_x = np.clip(x, bounds["lower"], bounds["upper"])

        if np.all(x == np.asarray([0.05, 0.05])):
            message = classify_using_Hessian(optim, optim_x)
            assert message == "The optimiser has located a minimum."
        elif np.all(x == np.asarray([0.1, 0.05])):
            message = classify_using_Hessian(optim, optim_x)
            assert message == (
                "The optimiser has not converged to a stationary point."
                " The result is near the upper bound of R0 [Ohm]."
            )
        elif np.all(x == np.asarray([0.05, 0.01])):
            message = classify_using_Hessian(optim, optim_x)
            assert message == (
                "The optimiser has not converged to a stationary point."
                " The result is near the lower bound of R1 [Ohm]."
            )
        else:
            raise Exception("Please add a check for these values.")

        if np.all(x == np.asarray([0.05, 0.05])):
            cost = pybop.GaussianLogLikelihoodKnownSigma(problem, sigma0=0.002)
            optim = pybop.XNES(cost=cost)

            message = classify_using_Hessian(optim, x)
            assert message == "The optimiser has located a maximum."

            # message = classify_using_Hessian(optim, x)
            # assert message == "The optimiser has located a saddle point."

    @pytest.mark.integration
    def test_insensitive_classify_using_Hessian(self, parameter_set):
        param_R0 = pybop.Parameter(
            "R0 [Ohm]",
            bounds=[0, 0.002],
            true_value=0.001,
        )
        param_R0_mod = pybop.Parameter(
            "R0 modification [Ohm]",
            bounds=[-1e-4, 1e-4],
            true_value=0,
        )
        param_R1_mod = pybop.Parameter(
            "R1 modification [Ohm]",
            bounds=[-1e-4, 1e-4],
            true_value=0,
        )
        parameter_set.params.update(
            {
                "R0 modification [Ohm]": 0,
                "R1 modification [Ohm]": 0,
            },
            check_already_exists=False,
        )
        R0, R1 = parameter_set["R0 [Ohm]"], parameter_set["R1 [Ohm]"]
        parameter_set.params.update(
            {
                "R0 [Ohm]": R0 + Parameter("R0 modification [Ohm]"),
                "R1 [Ohm]": R1 + Parameter("R1 modification [Ohm]"),
            }
        )
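        # Each resistance now enters the model only through its sum with the
        # corresponding modification, so a pair such as (R0, R0 modification)
        # is perfectly correlated. The zero-valued modification parameters also
        # receive a zero relative perturbation in classify_using_Hessian, so
        # the cost registers as insensitive to them on their own.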
        model = pybop.empirical.Thevenin(parameter_set=parameter_set)

        experiment = pybop.Experiment(
            ["Discharge at 0.5C for 2 minutes (4 seconds period)"]
        )
        solution = model.predict(experiment=experiment)
        dataset = pybop.Dataset(
            {
                "Time [s]": solution["Time [s]"].data,
                "Current function [A]": solution["Current [A]"].data,
                "Voltage [V]": solution["Voltage [V]"].data,
            }
        )

        for i, parameters in enumerate(
            [
                pybop.Parameters(param_R0_mod, param_R1_mod),
                pybop.Parameters(param_R1_mod, param_R0),
                pybop.Parameters(param_R0, param_R1_mod),
            ]
        ):
            problem = pybop.FittingProblem(model, parameters, dataset)
            cost = pybop.SumofPower(problem, p=3)
            optim = pybop.XNES(cost=cost)

            x = np.asarray(cost.parameters.true_value())
            message = classify_using_Hessian(optim, x)

            if i == 0:
                assert message == "The cost is insensitive to these parameters."
            elif i == 1 or i == 2:
                assert message == "The cost is insensitive to R1 modification [Ohm]."

        parameters = pybop.Parameters(param_R0, param_R0_mod)
        problem = pybop.FittingProblem(model, parameters, dataset)
        cost = pybop.SumofPower(problem, p=3)
        optim = pybop.XNES(cost=cost)

        x = np.asarray(cost.parameters.true_value())
        message = classify_using_Hessian(optim, x)
        assert message == "There may be a correlation between these parameters."

    @pytest.mark.integration
    def test_classify_using_Hessian_invalid(self, model, parameters, dataset):
        parameters.remove("R0 [Ohm]")
        problem = pybop.FittingProblem(model, parameters, dataset)
        cost = pybop.SumSquaredError(problem)
        optim = pybop.SNES(cost=cost)
        optim.run()

        with pytest.raises(
            ValueError,
            match="The function classify_using_Hessian currently only works"
            " in the case of 2 parameters.",
        ):
            classify_using_Hessian(optim)
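These integration tests can be run with, e.g., `pytest tests/integration/test_classification.py -m integration` (assuming the repository's usual registration of the `integration` marker).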