Adding Adam optimiser #1460

Merged · 7 commits · Aug 17, 2022
1 change: 1 addition & 0 deletions CHANGELOG.md
@@ -5,6 +5,7 @@ All notable changes to this project will be documented in this file.
## Unreleased

### Added
- [#1460](https://github.com/pints-team/pints/pull/1460) Added the `Adam` local optimiser.
- [#1459](https://github.com/pints-team/pints/pull/1459) Added the `iRprop-` local optimiser.
- [#1432](https://github.com/pints-team/pints/pull/1432) Added 2 new stochastic models: production and degradation model, Schlogl's system of chemical reactions. Moved the stochastic logistic model into `pints.stochastic` to take advantage of the `MarkovJumpModel`.
- [#1420](https://github.com/pints-team/pints/pull/1420) The `Optimiser` class now distinguishes between a best-visited point (`x_best`, with score `f_best`) and a best-guessed point (`x_guessed`, with approximate score `f_guessed`). For most optimisers, the two values are equivalent. The `OptimisationController` still tracks `x_best` and `f_best` by default, but this can be modified using the methods `set_f_guessed_tracking` and `f_guessed_tracking`.
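The CHANGELOG context above mentions the `x_best`/`x_guessed` split introduced in #1420 and the controller methods for switching between them. A rough sketch of how that switch might be used is below; only `set_f_guessed_tracking` and `f_guessed_tracking` are taken from the entry itself, the boolean-flag signature is an assumption, and the controller setup borrows the toy problem used in this PR's tests.

```python
import pints
import pints.toy

# Illustrative controller setup (toy problem as in this PR's tests)
controller = pints.OptimisationController(
    pints.toy.ParabolicError(), [0.1, 0.1], method=pints.Adam)

# Assumption: the setter takes a boolean flag. Switch the controller from
# tracking the best-visited point (x_best, f_best) to the best-guessed
# point (x_guessed, f_guessed) for logging and stopping criteria.
controller.set_f_guessed_tracking(True)
print(controller.f_guessed_tracking())  # expected: True
```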
8 changes: 8 additions & 0 deletions docs/source/optimisers/adam.rst
@@ -0,0 +1,8 @@
*********************************
Adam (adaptive moment estimation)
*********************************

.. currentmodule:: pints

.. autoclass:: Adam

1 change: 1 addition & 0 deletions docs/source/optimisers/index.rst
@@ -16,6 +16,7 @@ or the :class:`OptimisationController` class.
running
base_classes
convenience_methods
adam
cmaes_bare
cmaes
gradient_descent
1 change: 1 addition & 0 deletions examples/README.md
@@ -38,6 +38,7 @@ relevant code.
- [XNES](./optimisation/xnes.ipynb)

### Local optimisers
- [Adam](./optimisation/adam.ipynb)
- [Gradient descent](./optimisation/gradient-descent.ipynb)
- [iRprop-](./optimisation/irpropmin.ipynb)
- [Nelder-Mead](./optimisation/nelder-mead.ipynb)
975 changes: 975 additions & 0 deletions examples/optimisation/adam.ipynb

Large diffs are not rendered by default.

46 changes: 22 additions & 24 deletions examples/optimisation/irpropmin.ipynb

Large diffs are not rendered by default.

1 change: 1 addition & 0 deletions pints/__init__.py
@@ -173,6 +173,7 @@ def version(formatted=False):
Optimiser,
PopulationBasedOptimiser,
)
from ._optimisers._adam import Adam
from ._optimisers._cmaes import CMAES
from ._optimisers._cmaes_bare import BareCMAES
from ._optimisers._gradient_descent import GradientDescent
153 changes: 153 additions & 0 deletions pints/_optimisers/_adam.py
@@ -0,0 +1,153 @@
#
# Adam optimiser.
#
# This file is part of PINTS (https://github.com/pints-team/pints/) which is
# released under the BSD 3-clause license. See accompanying LICENSE.md for
# copyright notice and full license details.
#
import pints

import numpy as np


class Adam(pints.Optimiser):
"""
Adam optimiser (adaptive moment estimation), as described in [1]_.

    This method is a variation on gradient descent that maintains running
    estimates of the first and second moments of the gradient, allowing it
    to overshoot and move against the gradient for a short time. This
    property can make it more robust against noisy gradients. Full
    pseudo-code is given in [1]_ (Algorithm 1).

    This implementation uses a fixed step size, set as ``min(sigma0)``.
    Note that the adaptivity in this method comes from the changing moments,
    not the step size.

References
----------
.. [1] Adam: A method for stochastic optimization
           Kingma and Ba, 2017, arXiv (version v9)
https://doi.org/10.48550/arXiv.1412.6980
"""

def __init__(self, x0, sigma0=0.1, boundaries=None):
super().__init__(x0, sigma0, boundaries)

# Set optimiser state
self._running = False
self._ready_for_tell = False

# Best solution found
self._x_best = self._x0
self._f_best = np.inf

# Current point, score, and gradient
self._current = self._x0
self._current_f = np.inf
self._current_df = None

# Proposed next point (read-only, so can be passed to user)
self._proposed = self._x0
self._proposed.setflags(write=False)

# Moment vectors
self._m = np.zeros(self._x0.shape)
self._v = np.zeros(self._x0.shape)

# Exponential decay rates for the moment estimates
        self._b1 = 0.9    # 0 <= b1 < 1
        self._b2 = 0.999  # 0 <= b2 < 1

# Step size
self._alpha = np.min(self._sigma0)

# Small number added to avoid divide-by-zero
self._eps = 1e-8

# Powers of decay rates
self._b1t = 1
self._b2t = 1

def ask(self):
""" See :meth:`Optimiser.ask()`. """

# Running, and ready for tell now
self._ready_for_tell = True
self._running = True

# Return proposed points (just the one)
return [self._proposed]

def f_best(self):
""" See :meth:`Optimiser.f_best()`. """
return self._f_best

def f_guessed(self):
""" See :meth:`Optimiser.f_guessed()`. """
return self._current_f

def name(self):
""" See :meth:`Optimiser.name()`. """
return 'Adam'

def needs_sensitivities(self):
""" See :meth:`Optimiser.needs_sensitivities()`. """
return True

def n_hyper_parameters(self):
""" See :meth:`pints.TunableMethod.n_hyper_parameters()`. """
return 0

def running(self):
""" See :meth:`Optimiser.running()`. """
return self._running

def tell(self, reply):
""" See :meth:`Optimiser.tell()`. """

# Check ask-tell pattern
if not self._ready_for_tell:
raise Exception('ask() not called before tell()')
self._ready_for_tell = False

# Unpack reply
fx, dfx = reply[0]

# Update current point
self._current = self._proposed
self._current_f = fx
self._current_df = dfx

        # Update powers of the decay rates: b1^t and b2^t
self._b1t *= self._b1
self._b2t *= self._b2

# "Update biased first moment estimate"
self._m = self._b1 * self._m + (1 - self._b1) * dfx

# "Update biased secon raw moment estimate"
self._v = self._b2 * self._v + (1 - self._b2) * dfx**2

# "Compute bias-corrected first moment estimate"
m = self._m / (1 - self._b1t)

# "Compute bias-corrected second raw moment estimate"
v = self._v / (1 - self._b2t)

# Take step
self._proposed = (
self._current - self._alpha * m / (np.sqrt(v) + self._eps))

# Update x_best and f_best
if self._f_best > fx:
self._f_best = fx
self._x_best = self._current

def x_best(self):
""" See :meth:`Optimiser.x_best()`. """
return self._x_best

def x_guessed(self):
""" See :meth:`Optimiser.x_guessed()`. """
return self._current
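
As a quick sanity check of the new class, here is a minimal sketch of how `pints.Adam` can be driven through the existing `OptimisationController`. It mirrors the setup in `pints/tests/test_opt_adam.py` below (the toy problem, starting point and `sigma0` are taken from there); the exact iteration count and printed values will vary.

```python
import pints
import pints.toy

# Toy error measure with a known minimum of 0 at (0, 0)
error = pints.toy.ParabolicError()

# Starting point and initial spread; for Adam, min(sigma0) becomes the
# fixed step size alpha (the adaptivity comes from the moment estimates)
x0 = [0.1, 0.1]
sigma0 = 0.1

opt = pints.OptimisationController(
    error, x0, sigma0=sigma0, method=pints.Adam)
opt.set_log_to_screen(False)

x_found, f_found = opt.run()
print(x_found, f_found)  # expected to end up close to (0, 0) with error ~0
```

Because `needs_sensitivities()` returns `True`, the controller evaluates the error measure together with its gradient at every proposed point, which is what `tell()` unpacks as `(fx, dfx)`.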

6 changes: 2 additions & 4 deletions pints/_optimisers/_irpropmin.py
@@ -146,11 +146,9 @@ def tell(self, reply):

# First iteration
if self._current_df is None:
self._current = self._proposed
self._current_f = fx
self._current_df = dfx
self._f_best = fx
self._x_best = self._current
return

# Get product of new and previous gradient
dprod = dfx * self._current_df
@@ -174,7 +172,7 @@
# the step size set in the current iteration
dfx[dprod < 0] = 0

# "Accept" proposed point
# Update current position
self._current = self._proposed
self._current_f = fx
self._current_df = dfx
118 changes: 118 additions & 0 deletions pints/tests/test_opt_adam.py
@@ -0,0 +1,118 @@
#!/usr/bin/env python3
#
# Tests the API of the Adam optimiser.
#
# This file is part of PINTS (https://github.com/pints-team/pints/) which is
# released under the BSD 3-clause license. See accompanying LICENSE.md for
# copyright notice and full license details.
#
import unittest
import numpy as np

import pints
import pints.toy

from shared import StreamCapture


debug = False
method = pints.Adam


class TestAdam(unittest.TestCase):
"""
Tests the API of the Adam optimiser.
"""
def setUp(self):
""" Called before every test """
np.random.seed(1)

def problem(self):
""" Returns a test problem, starting point, and sigma. """
r = pints.toy.ParabolicError()
x = [0.1, 0.1]
s = 0.1
return r, x, s

def test_simple(self):
# Runs an optimisation
r, x, s = self.problem()

opt = pints.OptimisationController(r, x, sigma0=s, method=method)
opt.set_log_to_screen(debug)
found_parameters, found_solution = opt.run()

# True solution is (0, 0) with error 0
self.assertTrue(found_solution < 1e-9)
self.assertLess(abs(found_parameters[0]), 1e-8)
self.assertLess(abs(found_parameters[1]), 1e-8)

def test_ask_tell(self):
# Tests ask-and-tell related error handling.
r, x, s = self.problem()
opt = method(x)

# Stop called when not running
self.assertFalse(opt.running())
self.assertFalse(opt.stop())

# Best position and score called before run
self.assertEqual(list(opt.x_best()), list(x))
self.assertEqual(list(opt.x_guessed()), list(x))
self.assertEqual(opt.f_best(), float('inf'))
self.assertEqual(opt.f_guessed(), float('inf'))

# Tell before ask
self.assertRaisesRegex(
Exception, r'ask\(\) not called before tell\(\)', opt.tell, 5)

# Ask
opt.ask()

# Now we should be running
self.assertTrue(opt.running())

def test_hyper_parameter_interface(self):
# Tests the hyper parameter interface for this optimiser.
opt = method([0])
self.assertEqual(opt.n_hyper_parameters(), 0)

def test_logging(self):

# Test with logpdf
r, x, s = self.problem()
opt = pints.OptimisationController(r, x, s, method=method)
opt.set_log_to_screen(True)
opt.set_max_unchanged_iterations(None)
opt.set_max_iterations(2)
with StreamCapture() as c:
opt.run()
lines = c.text().splitlines()
self.assertEqual(lines[0], 'Minimising error measure')
self.assertEqual(
lines[1], 'Using Adam')
self.assertEqual(lines[2], 'Running in sequential mode.')
self.assertEqual(
lines[3],
'Iter. Eval. Best Current Time m:s')
self.assertEqual(
lines[4][:-3],
'0 1 0.02 0.02 0:0')
self.assertEqual(
lines[5][:-3],
'1 2 5e-17 5e-17 0:0')

def test_name(self):
# Test the name() method.
opt = method(np.array([0]))
self.assertEqual(opt.name(), 'Adam')
self.assertTrue(opt.needs_sensitivities())


if __name__ == '__main__':
print('Add -v for more debug output')
import sys
if '-v' in sys.argv:
debug = True
unittest.main()

6 changes: 3 additions & 3 deletions pints/tests/test_opt_irpropmin.py
@@ -43,7 +43,7 @@ def test_simple(self):
found_parameters, found_solution = opt.run()

# True solution is (0, 0) with error 0
self.assertTrue(found_solution < 1e-6)
self.assertTrue(found_solution < 1e-9)
self.assertLess(abs(found_parameters[0]), 1e-4)
self.assertLess(abs(found_parameters[1]), 1e-4)

@@ -97,10 +97,10 @@ def test_logging(self):
'Iter. Eval. Best Current Min. step Max. step Time m:s')
self.assertEqual(
lines[4][:-3],
'0 1 0.02 0.02 0.1 0.1 0:0')
'0 1 0.02 0.02 0.12 0.12 0:0')
self.assertEqual(
lines[5][:-3],
'1 2 0.02 0.02 0.12 0.12 0:0')
'1 2 0.0008 0.0008 0.06 0.06 0:0')

def test_name(self):
# Test the name() method.