From eebae51767a907df77d38c9a4e9dc895bdc452b3 Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Mon, 25 Nov 2024 17:51:08 +0000 Subject: [PATCH 1/7] feat: adds multi-dimensional learning rate gradient descent implementation --- examples/scripts/spm_descent.py | 11 +- pybop/__init__.py | 1 + pybop/optimisers/_gradient_descent.py | 132 +++++++++++++++++++++++ pybop/optimisers/base_pints_optimiser.py | 5 +- pybop/optimisers/pints_optimisers.py | 10 +- 5 files changed, 148 insertions(+), 11 deletions(-) create mode 100644 pybop/optimisers/_gradient_descent.py diff --git a/examples/scripts/spm_descent.py b/examples/scripts/spm_descent.py index 92332849f..41c47e876 100644 --- a/examples/scripts/spm_descent.py +++ b/examples/scripts/spm_descent.py @@ -12,11 +12,11 @@ parameters = pybop.Parameters( pybop.Parameter( "Negative electrode active material volume fraction", - prior=pybop.Gaussian(0.68, 0.05), + prior=pybop.Gaussian(0.6, 0.01), ), pybop.Parameter( "Positive electrode active material volume fraction", - prior=pybop.Gaussian(0.58, 0.05), + prior=pybop.Gaussian(0.6, 0.01), ), ) @@ -40,9 +40,9 @@ cost = pybop.RootMeanSquaredError(problem) optim = pybop.GradientDescent( cost, - sigma0=0.05, + sigma0=[0.6, 0.02], verbose=True, - max_iterations=125, + max_iterations=75, ) # Run optimisation @@ -58,4 +58,5 @@ pybop.plot.parameters(optim) # Plot the cost landscape with optimisation path -pybop.plot.surface(optim) +bounds = np.asarray([[0.5, 0.8], [0.4, 0.7]]) +pybop.plot.surface(optim, bounds=bounds) diff --git a/pybop/__init__.py b/pybop/__init__.py index 9eab3d5d6..c81b00893 100644 --- a/pybop/__init__.py +++ b/pybop/__init__.py @@ -123,6 +123,7 @@ from .optimisers._cuckoo import CuckooSearchImpl from .optimisers._adamw import AdamWImpl +from .optimisers._gradient_descent import GradientDescentImpl from .optimisers.base_optimiser import BaseOptimiser, OptimisationResult from .optimisers.base_pints_optimiser import BasePintsOptimiser from .optimisers.scipy_optimisers import ( diff --git a/pybop/optimisers/_gradient_descent.py b/pybop/optimisers/_gradient_descent.py new file mode 100644 index 000000000..35ad028d4 --- /dev/null +++ b/pybop/optimisers/_gradient_descent.py @@ -0,0 +1,132 @@ +import numpy as np +import pints + + +class GradientDescentImpl(pints.Optimiser): + """ + Gradient descent method with a fixed, per-dimension learning rate. + + Gradient descent updates the current position in the direction of the + steepest descent, as determined by the negative of the gradient of the + function. + + The update rule for each iteration is given by: + + x_{t+1} = x_t - \\eta * \nabla f(x_t) + + where: + - x_t are the current parameter values at iteration t, + - \nabla f(x_t) is the gradient of the function at x_t, + - \\eta is the learning rate, which controls the step size. + + Parameters + ---------- + x0 : array-like + Initial starting point for the optimisation. This should be a 1D array + representing the starting parameter values for the function being + optimised. + sigma0 : float or array-like, optional + Initial learning rate or rates for each dimension. If a scalar is + provided, the same learning rate is applied across all dimensions. + If an array is provided, each dimension will have its own learning + rate. Defaults to 0.02. + boundaries : pybop.Boundaries, optional + Boundaries for the parameters. This optimiser ignores boundaries and + operates as an unbounded method. Defaults to None. + + Attributes + ---------- + _x_best : array-like + The best parameter values (solution) found so far. + _f_best : float + The best function value (objective value) found so far. + _current : array-like + The current parameter values at the latest iteration. + _eta : array-like + The current learning rate(s). Can be a scalar or per-dimension array. + _running : bool + Indicates whether the optimisation process is running. + _ready_for_tell : bool + Indicates whether the optimiser is ready to receive feedback from + the objective function. + """ + + def __init__(self, x0, sigma0=0.02, boundaries=None): + super().__init__(x0, sigma0, boundaries) + + # Initialise state + self._x_best = self._current = self._x0 + self._f_best = np.inf + self._eta = np.asarray(sigma0, dtype=float) + + # State tracking + self._running = False + self._ready_for_tell = False + + def ask(self): + """Proposes the next point for evaluation.""" + self._ready_for_tell = True + self._running = True + return [self._current] + + def tell(self, reply): + """Updates optimiser with function evaluation results.""" + if not self._ready_for_tell: + raise RuntimeError("ask() must be called before tell().") + self._ready_for_tell = False + + fx, dfx = reply[0] + + # Update state + self._current_f, self._current_df = fx, dfx + self._current = self._current - self._eta * dfx + + # Track best solution + if fx < self._f_best: + self._f_best, self._x_best = fx, self._current + + def f_best(self): + """Returns the best objective value found.""" + return self._f_best + + def x_best(self): + """Returns the best solution found.""" + return self._x_best + + def learning_rate(self): + """Returns the learning rate(s).""" + return self._eta + + def set_learning_rate(self, eta): + """ + Sets the learning rate. Supports per-dimension rates. + + Parameters + ---------- + eta : float or array-like + New learning rate(s). + """ + eta = np.asarray(eta, dtype=float) + if np.any(eta <= 0): + raise ValueError("Learning rate(s) must be positive.") + self._eta = eta + + def needs_sensitivities(self): + """Indicates this optimiser requires gradient information.""" + return True + + def running(self): + """Returns whether the optimiser is running.""" + return self._running + + def name(self): + """Returns the name of the optimiser.""" + return "Gradient descent" + + def n_hyper_parameters(self): + """Returns the number of hyper-parameters (learning rate).""" + return self._eta.size if self._eta.ndim > 0 else 1 + + def set_hyper_parameters(self, x): + """Sets hyper-parameters (learning rate).""" + self.set_learning_rate(x) diff --git a/pybop/optimisers/base_pints_optimiser.py b/pybop/optimisers/base_pints_optimiser.py index f03fc7a19..982e19220 100644 --- a/pybop/optimisers/base_pints_optimiser.py +++ b/pybop/optimisers/base_pints_optimiser.py @@ -3,7 +3,6 @@ import numpy as np from pints import PSO as PintsPSO from pints import Adam as PintsAdam -from pints import GradientDescent as PintsGradientDescent from pints import NelderMead as PintsNelderMead from pints import Optimiser as PintsOptimiser from pints import ParallelEvaluator as PintsParallelEvaluator @@ -12,7 +11,7 @@ from pints import SequentialEvaluator as PintsSequentialEvaluator from pints import strfloat as PintsStrFloat -from pybop import BaseOptimiser, OptimisationResult +from pybop import BaseOptimiser, GradientDescentImpl, OptimisationResult class BasePintsOptimiser(BaseOptimiser): @@ -136,7 +135,7 @@ def _sanitise_inputs(self): # Convert bounds to PINTS boundaries if self.bounds is not None: - ignored_optimisers = (PintsGradientDescent, PintsAdam, PintsNelderMead) + ignored_optimisers = (GradientDescentImpl, PintsAdam, PintsNelderMead) if issubclass(self.optimiser, ignored_optimisers): print(f"NOTE: Boundaries ignored by {self.optimiser}") self.bounds = None diff --git a/pybop/optimisers/pints_optimisers.py b/pybop/optimisers/pints_optimisers.py index d4d89a6a4..ac19fab84 100644 --- a/pybop/optimisers/pints_optimisers.py +++ b/pybop/optimisers/pints_optimisers.py @@ -5,11 +5,15 @@ from pints import SNES as PintsSNES from pints import XNES as PintsXNES from pints import Adam as PintsAdam -from pints import GradientDescent as PintsGradientDescent from pints import IRPropMin as PintsIRPropMin from pints import NelderMead as PintsNelderMead -from pybop import AdamWImpl, BasePintsOptimiser, CuckooSearchImpl +from pybop import ( + AdamWImpl, + BasePintsOptimiser, + CuckooSearchImpl, + GradientDescentImpl, +) class GradientDescent(BasePintsOptimiser): @@ -69,7 +73,7 @@ def __init__( ): super().__init__( cost, - PintsGradientDescent, + GradientDescentImpl, max_iterations, min_iterations, max_unchanged_iterations, From e2086c759798e032ed8408e790c488b9e03a1ac0 Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Mon, 25 Nov 2024 10:34:36 +0000 Subject: [PATCH 2/7] fix: update prior bounds for mcmc integration tests --- tests/integration/test_monte_carlo_thevenin.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/integration/test_monte_carlo_thevenin.py b/tests/integration/test_monte_carlo_thevenin.py index a23df6094..a6c9738cf 100644 --- a/tests/integration/test_monte_carlo_thevenin.py +++ b/tests/integration/test_monte_carlo_thevenin.py @@ -58,12 +58,12 @@ def parameters(self): return pybop.Parameters( pybop.Parameter( "R0 [Ohm]", - prior=pybop.Uniform(1e-2, 8e-2), + prior=pybop.Uniform(1e-3, 9e-2), bounds=[1e-4, 1e-1], ), pybop.Parameter( "R1 [Ohm]", - prior=pybop.Uniform(1e-2, 8e-2), + prior=pybop.Uniform(1e-3, 9e-2), bounds=[1e-4, 1e-1], ), ) From abac1847e1b3781a85186e6f580b19704676fe05 Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Tue, 26 Nov 2024 10:06:08 +0000 Subject: [PATCH 3/7] tests: adds coverage, refactors optimisation unit tests --- pybop/optimisers/_adamw.py | 2 +- pybop/optimisers/_cuckoo.py | 3 + tests/unit/test_optimisation.py | 164 +++++++++++++++++--------------- 3 files changed, 91 insertions(+), 78 deletions(-) diff --git a/pybop/optimisers/_adamw.py b/pybop/optimisers/_adamw.py index 34c990206..92c4130f0 100644 --- a/pybop/optimisers/_adamw.py +++ b/pybop/optimisers/_adamw.py @@ -156,7 +156,7 @@ def tell(self, reply): # Check ask-tell pattern if not self._ready_for_tell: - raise RuntimeError("ask() not called before tell()") + raise RuntimeError("ask() must be called before tell().") self._ready_for_tell = False # Unpack reply diff --git a/pybop/optimisers/_cuckoo.py b/pybop/optimisers/_cuckoo.py index 346052728..dba591d7c 100644 --- a/pybop/optimisers/_cuckoo.py +++ b/pybop/optimisers/_cuckoo.py @@ -105,6 +105,9 @@ def tell(self, replies): previously specified by `self.ask()`, and updates the optimiser state accordingly. """ + if not self._ready_for_tell: + raise RuntimeError("ask() must be called before tell().") + # Update iteration count self._iterations += 1 diff --git a/tests/unit/test_optimisation.py b/tests/unit/test_optimisation.py index 36d1ed9ff..a10d62e8d 100644 --- a/tests/unit/test_optimisation.py +++ b/tests/unit/test_optimisation.py @@ -1,4 +1,5 @@ import io +import re import sys import warnings @@ -141,42 +142,48 @@ def test_no_optimisation_parameters(self, model, dataset): ) @pytest.mark.unit def test_optimiser_kwargs(self, cost, optimiser): - optim = optimiser(cost=cost, max_iterations=3, tol=1e-6) - cost_bounds = cost.parameters.get_bounds() + def assert_log_update(optim): + optim.log_update(x=[0.7], cost=[0.01]) + assert optim.log["x"][-1] == 0.7 + assert optim.log["cost"][-1] == 0.01 - # Check maximum iterations - results = optim.run() - assert results.n_iterations == 3 + def check_max_iterations(optim): + results = optim.run() + assert results.n_iterations == 3 - # Test BaseOptimiser.log_update - optim.log_update(x=[0.7], cost=[0.01]) + def check_incorrect_update(optim): + with pytest.raises( + TypeError, match="Input must be a list, tuple, or numpy array" + ): + optim.log_update(x="Incorrect") - assert optim.log["x"][-1] == 0.7 - assert optim.log["cost"][-1] == 0.01 + def check_bounds_handling(optim, expected_bounds, should_raise=False): + if should_raise: + with pytest.raises( + ValueError, match="Either all bounds or no bounds must be set" + ): + optim = optimiser(cost=cost, bounds=expected_bounds) + else: + assert optim.bounds == expected_bounds - # Test incorrect update - with pytest.raises( - TypeError, match="Input must be a list, tuple, or numpy array" - ): - optim.log_update(x="Incorrect") + optim = optimiser(cost=cost, max_iterations=3, tol=1e-6) + cost_bounds = cost.parameters.get_bounds() + + check_max_iterations(optim) + assert_log_update(optim) + check_incorrect_update(optim) if optimiser in [pybop.GradientDescent, pybop.Adam, pybop.NelderMead]: - # Ignored bounds optim = optimiser(cost=cost, bounds=cost_bounds) assert optim.bounds is None elif optimiser in [pybop.PSO]: - assert optim.bounds == cost_bounds - # Cannot accept infinite bounds - bounds = {"upper": [np.inf], "lower": [0.57]} - with pytest.raises( - ValueError, - match="Either all bounds or no bounds must be set", - ): - optim = optimiser(cost=cost, bounds=bounds) + check_bounds_handling(optim, cost_bounds) + check_bounds_handling( + optim, {"upper": [np.inf], "lower": [0.57]}, should_raise=True + ) else: - # Check and update bounds - assert optim.bounds == cost_bounds bounds = {"upper": [0.63], "lower": [0.57]} + check_bounds_handling(optim, cost_bounds) optim = optimiser(cost=cost, bounds=bounds) assert optim.bounds == bounds @@ -197,22 +204,20 @@ def test_optimiser_kwargs(self, cost, optimiser): match="Unrecognised keyword arguments: {'unrecognised': 10} will not be used.", ): warnings.simplefilter("always") - optim = optimiser(cost=cost, unrecognised=10) + optimiser(cost=cost, unrecognised=10) assert not optim.optimiser.running() else: - # Check bounds in list format and update tol - bounds = [ + bounds_list = [ (lower, upper) for lower, upper in zip(bounds["lower"], bounds["upper"]) ] - optim = optimiser(cost=cost, bounds=bounds, tol=1e-2) - assert optim.bounds == bounds + optim = optimiser(cost=cost, bounds=bounds_list, tol=1e-2) + assert optim.bounds == bounds_list if optimiser in [ pybop.SciPyMinimize, pybop.SciPyDifferentialEvolution, pybop.XNES, ]: - # Pass nested options optim = optimiser(cost=cost, options=dict(max_iterations=10)) with pytest.raises( Exception, @@ -223,67 +228,72 @@ def test_optimiser_kwargs(self, cost, optimiser): ) if optimiser in [pybop.SciPyDifferentialEvolution, pybop.SciPyMinimize]: - # Pass duplicate keywords with pytest.raises( - Exception, - match="option was passed in addition to the expected", + Exception, match="option was passed in addition to the expected" ): optimiser(cost=cost, maxiter=5, max_iterations=10) - if optimiser in [pybop.SciPyDifferentialEvolution]: - # Update population size, test maxiter arg + if optimiser == pybop.SciPyDifferentialEvolution: pop_maxiter_optim = optimiser(cost=cost, maxiter=3, popsize=5) assert pop_maxiter_optim._options["maxiter"] == 3 assert pop_maxiter_optim._options["popsize"] == 5 - # Test invalid bounds - with pytest.raises( - ValueError, match="Bounds must be specified for differential_evolution." - ): - optimiser(cost=cost, bounds=None) - with pytest.raises( - ValueError, match="Bounds must be specified for differential_evolution." - ): - optimiser(cost=cost, bounds=[(0, np.inf)]) - with pytest.raises( - ValueError, match="Bounds must be specified for differential_evolution." - ): - optimiser(cost=cost, bounds={"upper": [np.inf], "lower": [0.57]}) - - # Test AdamW hyperparameters - if optimiser in [pybop.AdamW]: - optim = optimiser(cost=cost, b1=0.9, b2=0.999, lam=0.1) - optim.optimiser.b1 = 0.9 - optim.optimiser.b2 = 0.9 - optim.optimiser.lam = 0.1 - - assert optim.optimiser.b1 == 0.9 - assert optim.optimiser.b2 == 0.9 - assert optim.optimiser.lam == 0.1 + invalid_bounds_cases = [ + None, + [(0, np.inf)], + {"upper": [np.inf], "lower": [0.57]}, + ] - # Incorrect values - for i, _match in (("Value", -1),): - with pytest.raises( - Exception, match="must be a numeric value between 0 and 1." - ): - optim.optimiser.b1 = i - with pytest.raises( - Exception, match="must be a numeric value between 0 and 1." - ): - optim.optimiser.b2 = i + for bounds_case in invalid_bounds_cases: with pytest.raises( - Exception, match="must be a numeric value between 0 and 1." + ValueError, + match="Bounds must be specified for differential_evolution.", ): - optim.optimiser.lam = i + optimiser(cost=cost, bounds=bounds_case) - # Check defaults - assert optim.optimiser.n_hyper_parameters() == 5 - assert optim.optimiser.x_guessed() == optim.optimiser._x0 - with pytest.raises(RuntimeError): + if optimiser in [pybop.AdamW, pybop.CuckooSearch, pybop.GradientDescent]: + optim = optimiser(cost) + with pytest.raises( + RuntimeError, match=re.escape("ask() must be called before tell().") + ): optim.optimiser.tell([0.1]) + if optimiser is pybop.GradientDescent: + assert optim.optimiser.learning_rate() == 0.02 + optim.optimiser.set_learning_rate(0.1) + assert optim.optimiser.learning_rate() == 0.1 + assert optim.optimiser.n_hyper_parameters() == 1 + optim.optimiser.set_hyper_parameters([0.1, 0.3]) + np.testing.assert_allclose(optim.optimiser.learning_rate(), [0.1, 0.3]) + + if optimiser is pybop.AdamW: + optim = optimiser(cost=cost, b1=0.9, b2=0.999, lam=0.1) + optim.optimiser.b1 = 0.9 + optim.optimiser.b2 = 0.9 + optim.optimiser.lam = 0.1 + + assert optim.optimiser.b1 == 0.9 + assert optim.optimiser.b2 == 0.9 + assert optim.optimiser.lam == 0.1 + + for i, _match in (("Value", -1),): + with pytest.raises( + Exception, match="must be a numeric value between 0 and 1." + ): + optim.optimiser.b1 = i + with pytest.raises( + Exception, match="must be a numeric value between 0 and 1." + ): + optim.optimiser.b2 = i + with pytest.raises( + Exception, match="must be a numeric value between 0 and 1." + ): + optim.optimiser.lam = i + + assert optim.optimiser.n_hyper_parameters() == 5 + assert optim.optimiser.x_guessed() == optim.optimiser._x0 + else: - # Check and update initial values x0 = cost.parameters.initial_value() assert optim.x0 == x0 x0_new = np.array([0.6]) From 7bd2ea1014d3472cb47def5a02cf84fd3b36d428 Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Tue, 26 Nov 2024 10:30:29 +0000 Subject: [PATCH 4/7] tests: adds missing coverage for negative learning rate ValueError --- tests/unit/test_optimisation.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/tests/unit/test_optimisation.py b/tests/unit/test_optimisation.py index a10d62e8d..137281608 100644 --- a/tests/unit/test_optimisation.py +++ b/tests/unit/test_optimisation.py @@ -266,6 +266,11 @@ def check_bounds_handling(optim, expected_bounds, should_raise=False): optim.optimiser.set_hyper_parameters([0.1, 0.3]) np.testing.assert_allclose(optim.optimiser.learning_rate(), [0.1, 0.3]) + with pytest.raises( + ValueError, match=re.escape("Learning rate(s) must be positive.") + ): + optim.optimiser.set_learning_rate(-0.1) + if optimiser is pybop.AdamW: optim = optimiser(cost=cost, b1=0.9, b2=0.999, lam=0.1) optim.optimiser.b1 = 0.9 From 78ebf9f3b1fe5a0efeff1f365605313890a252c5 Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Tue, 26 Nov 2024 11:27:31 +0000 Subject: [PATCH 5/7] docs: add Pints' reference to docstring --- pybop/optimisers/_gradient_descent.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/pybop/optimisers/_gradient_descent.py b/pybop/optimisers/_gradient_descent.py index 35ad028d4..5a340d245 100644 --- a/pybop/optimisers/_gradient_descent.py +++ b/pybop/optimisers/_gradient_descent.py @@ -19,6 +19,9 @@ class GradientDescentImpl(pints.Optimiser): - \nabla f(x_t) is the gradient of the function at x_t, - \\eta is the learning rate, which controls the step size. + This class reimplements the Pints' Gradient Descent, but with multidimensional, + fixed learning rates. Original creation and credit is attributed to Pints. + Parameters ---------- x0 : array-like From 898f1738d3526a650f9ce9bb2c631f8edd5e949a Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Tue, 26 Nov 2024 12:03:27 +0000 Subject: [PATCH 6/7] add changelog entry --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index bcfe6c905..6d662f24d 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -2,6 +2,7 @@ ## Features +- [#569](https://github.com/pybop-team/PyBOP/pull/569) - Adds parameter specific learning rate functionality to GradientDescent optimiser. - [#282](https://github.com/pybop-team/PyBOP/issues/282) - Restructures the examples directory. - [#396](https://github.com/pybop-team/PyBOP/issues/396) - Adds `ecm_with_tau.py` example script. - [#452](https://github.com/pybop-team/PyBOP/issues/452) - Extends `cell_mass` and `approximate_capacity` for half-cell models. From ea2c6e712e5f11c14cce2a425f1b56158dbe755e Mon Sep 17 00:00:00 2001 From: Brady Planden Date: Tue, 26 Nov 2024 13:19:15 +0000 Subject: [PATCH 7/7] docs: adds mathjax rendering to docstring --- pybop/optimisers/_gradient_descent.py | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/pybop/optimisers/_gradient_descent.py b/pybop/optimisers/_gradient_descent.py index 5a340d245..7042c927c 100644 --- a/pybop/optimisers/_gradient_descent.py +++ b/pybop/optimisers/_gradient_descent.py @@ -12,12 +12,14 @@ class GradientDescentImpl(pints.Optimiser): The update rule for each iteration is given by: - x_{t+1} = x_t - \\eta * \nabla f(x_t) + .. math:: + + x_{t+1} = x_t - \\eta * \\nabla f(x_t) where: - - x_t are the current parameter values at iteration t, - - \nabla f(x_t) is the gradient of the function at x_t, - - \\eta is the learning rate, which controls the step size. + - :math:`x_t` are the current parameter values at iteration t, + - :math:`\\nabla f(x_t)` is the gradient of the function at :math:`x_t`, + - :math:`\\eta` is the learning rate, which controls the step size. This class reimplements the Pints' Gradient Descent, but with multidimensional, fixed learning rates. Original creation and credit is attributed to Pints.