From 1e4f2bba06fd6e5208f252d6cd6ef15641e900c8 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 11:19:24 +0000
Subject: [PATCH 01/15] Work with ISTA and FISTA and new default

---
 .../cil/optimisation/algorithms/FISTA.py      | 13 +++++-
 .../optimisation/utilities/StepSizeMethods.py |  9 +++-
 Wrappers/Python/test/test_stepsizes.py        | 46 +++++++++++++++----
 3 files changed, 58 insertions(+), 10 deletions(-)

diff --git a/Wrappers/Python/cil/optimisation/algorithms/FISTA.py b/Wrappers/Python/cil/optimisation/algorithms/FISTA.py
index b507e42f04..b7ba923011 100644
--- a/Wrappers/Python/cil/optimisation/algorithms/FISTA.py
+++ b/Wrappers/Python/cil/optimisation/algorithms/FISTA.py
@@ -213,8 +213,19 @@ def update_objective(self):

         .. math:: f(x) + g(x)

         """
-        self.loss.append(self.f(self.x_old) + self.g(self.x_old))
+        self.loss.append(self.objective_function(self.x_old))

+    def objective_function(self, x):
+        """ Calculates the objective
+
+        .. math:: f(x) + g(x)
+
+        Parameters
+        ----------
+        x : DataContainer
+
+        """
+        return self.f(x) + self.g(x)

 class FISTA(ISTA):

diff --git a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
index ea5ca0ebdb..c015c0c4b7 100644
--- a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
+++ b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
@@ -83,6 +83,9 @@ class ArmijoStepSizeRule(StepSizeRule):
         The amount the step_size is reduced if the criterion is not met
     max_iterations: integer, optional, default is numpy.ceil (2 * numpy.log10(alpha) / numpy.log10(2))
         The maximum number of iterations to find a suitable step size
+    warmstart: Boolean, default is True
+        If `warmstart = True` the initial step size at each Armijo iteration is the calculated step size from the last iteration. If `warmstart = False` at each Armijo iteration, the initial step size is reset to the original, large `alpha`.
+        In the case of *well-behaved* convex functions, `warmstart = True` is likely to be computationally less expensive. In the case of non-convex functions, or particularly tricky functions, setting `warmstart = False` may be beneficial.

     Reference
     ---------
@@ -91,7 +94,7 @@ class ArmijoStepSizeRule(StepSizeRule):

     """

-    def __init__(self, alpha=1e6, beta=0.5, max_iterations=None):
+    def __init__(self, alpha=1e6, beta=0.5, max_iterations=None, warmstart=True):
         '''Initialises the step size rule
         '''

@@ -106,6 +109,8 @@ def __init__(self, alpha=1e6, beta=0.5, max_iterations=None):
         self.max_iterations = max_iterations
         if self.max_iterations is None:
             self.max_iterations = numpy.ceil(2 * numpy.log10(self.alpha_orig) / numpy.log10(2))
+
+        self.warmstart=warmstart

     def get_step_size(self, algorithm):
         """
@@ -137,4 +142,6 @@ def get_step_size(self, algorithm):
         if k == self.max_iterations:
             raise ValueError(
                 'Could not find a proper step_size in {} loops. Consider increasing alpha or max_iterations.'.format(self.max_iterations))
+        if self.warmstart:
+            self.alpha_orig= self.alpha
         return self.alpha

diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index be601eb7ac..0e7acfd2fa 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -41,17 +41,30 @@ def test_step_sizes_called(self):
         alg.run(5)
         self.assertEqual(len(step_size_test.get_step_size.mock_calls), 5)

+class TestStepSizeConstant(CCPiTestClass):
     def test_constant(self):
         test_stepsize = ConstantStepSize(0.3)
         self.assertEqual(test_stepsize.step_size, 0.3)

+class TestStepSizeArmijo(CCPiTestClass):
+
+    def setUp(self):
+        self.ig = VectorGeometry(2)
+        self.data = self.ig.allocate('random')
+        self.data.fill(np.array([3.5, 3.5]))
+        self.A = MatrixOperator(np.diag([1., 1.]))
+        self.f = LeastSquares(self.A, self.data)
+
     def test_armijo_init(self):
-        test_stepsize = ArmijoStepSizeRule(alpha=1e3, beta=0.4, max_iterations=40)
+        test_stepsize = ArmijoStepSizeRule(alpha=1e3, beta=0.4, max_iterations=40, warmstart=False)
+        self.assertFalse(test_stepsize.warmstart)
         self.assertEqual(test_stepsize.alpha_orig, 1e3)
         self.assertEqual(test_stepsize.beta, 0.4)
         self.assertEqual(test_stepsize.max_iterations, 40)

         test_stepsize = ArmijoStepSizeRule()
+        self.assertTrue(test_stepsize.warmstart)
         self.assertEqual(test_stepsize.alpha_orig, 1e6)
         self.assertEqual(test_stepsize.beta, 0.5)
         self.assertEqual(test_stepsize.max_iterations, np.ceil(
@@ -59,14 +72,10 @@ def test_armijo_init(self):
             2 * np.log10(1e6) / np.log10(2)))

     def test_armijo_calculation(self):
         test_stepsize = ArmijoStepSizeRule(alpha=8, beta=0.5, max_iterations=100)
-        ig = VectorGeometry(2)
-        data = ig.allocate('random')
-        data.fill(np.array([3.5, 3.5]))
-        A = MatrixOperator(np.diag([1., 1.]))
-        f = LeastSquares(A, data)
-        alg = GD(initial=ig.allocate(0), objective_function=f,
+
+        alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
                  max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
-        alg.gradient_update = ig.allocate(-1)
+        alg.gradient_update = self.ig.allocate(-1)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 4)

@@ -77,3 +86,24 @@ def test_armijo_calculation(self):
         alg.gradient_update = ig.allocate(-.5)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 8)

         alg.gradient_update = ig.allocate(-2)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 2)
+
+    def test_warmstart_true(self):
+
+        rule = ArmijoStepSizeRule(warmstart=True, alpha=5000)
+        self.assertTrue(rule.warmstart)
+        self.assertTrue(rule.alpha_orig == 5000)
+        alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
+                 max_iteration=100, update_objective_interval=1, step_size=rule)
+        alg.update()
+        self.assertFalse(rule.alpha_orig == 5000)
+        self.assertTrue(rule.alpha_orig == rule.alpha)
+
+    def test_warmstart_false(self):
+        rule = ArmijoStepSizeRule(warmstart=False, alpha=5000)
+        self.assertFalse(rule.warmstart)
+        self.assertTrue(rule.alpha_orig == 5000)
+        alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
+                 max_iteration=100, update_objective_interval=1, step_size=rule)
+        alg.update()
+        self.assertTrue(rule.alpha_orig == 5000)
+        self.assertFalse(rule.alpha_orig == rule.alpha)
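For readers following the warmstart change in PATCH 01, a minimal usage sketch (not part of the patch series; it assumes the public import paths used by the CIL tests, e.g. `ArmijoStepSizeRule` from `cil.optimisation.utilities`, and mirrors the toy problem in `TestStepSizeArmijo.setUp`):

import numpy as np
from cil.framework import VectorGeometry
from cil.optimisation.operators import MatrixOperator
from cil.optimisation.functions import LeastSquares
from cil.optimisation.algorithms import GD
from cil.optimisation.utilities import ArmijoStepSizeRule

# Least-squares toy problem matching the TestStepSizeArmijo setUp above.
ig = VectorGeometry(2)
data = ig.allocate('random')
data.fill(np.array([3.5, 3.5]))
f = LeastSquares(MatrixOperator(np.diag([1., 1.])), data)

# warmstart=True (the new default): each call to get_step_size starts the
# backtracking search from the step size accepted at the previous iteration,
# so later iterations typically need far fewer objective evaluations.
rule = ArmijoStepSizeRule(alpha=1e6, beta=0.5, warmstart=True)
alg = GD(initial=ig.allocate(0), objective_function=f, step_size=rule)
alg.run(10, verbose=0)

# warmstart=False recovers the old behaviour: every iteration restarts the
# backtracking search from the original, large alpha.
rule_reset = ArmijoStepSizeRule(alpha=1e6, beta=0.5, warmstart=False)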
From 9a6d8cea70d93c51117332f1a10b2687d6948385 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 11:58:11 +0000
Subject: [PATCH 02/15] Indentation error

---
 Wrappers/Python/test/test_stepsizes.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index d523da95b9..81a7de7f58 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -109,7 +109,7 @@ def test_warmstart_false(self):
         self.assertTrue(rule.alpha_orig == 5000)
         self.assertFalse(rule.alpha_orig == rule.alpha)

-    class TestStepSizeBB(CCPiTestClass):
+class TestStepSizeBB(CCPiTestClass):
     def test_bb(self):
         n = 10
         m = 5

From 36ea51543ea73c77a20f4c318b8d4abceb7f8b93 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 12:08:54 +0000
Subject: [PATCH 03/15] Try again with tests

---
 Wrappers/Python/test/test_algorithms.py | 2 +-
 Wrappers/Python/test/test_stepsizes.py  | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/Wrappers/Python/test/test_algorithms.py b/Wrappers/Python/test/test_algorithms.py
index e3f6302d78..c25da7f2cc 100644
--- a/Wrappers/Python/test/test_algorithms.py
+++ b/Wrappers/Python/test/test_algorithms.py
@@ -240,7 +240,7 @@ def test_gd_armijo_rosen(self):
         gd = GD(initial=self.initial, objective_function=self.f, step_size=armj,
                 max_iteration=2500, update_objective_interval=500)
-        gd.run(2500,verbose=0)
+        gd.run(3000,verbose=0)
         np.testing.assert_allclose(
             gd.solution.array[0], self.scipy_opt_high.x[0], atol=1e-2)
         np.testing.assert_allclose(
diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index 81a7de7f58..b952c44820 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -79,11 +79,11 @@ def test_armijo_calculation(self):
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 4)

-        alg.gradient_update = ig.allocate(-.5)
+        alg.gradient_update = self.ig.allocate(-.5)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 8)

-        alg.gradient_update = ig.allocate(-2)
+        alg.gradient_update = self.ig.allocate(-2)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 2)

From c2553de4d7d07cb10ad7bd4e351cc66c4d3332f3 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 12:27:54 +0000
Subject: [PATCH 04/15] Kill max_iteration

---
 Wrappers/Python/test/test_algorithms.py | 136 ++++++++++--------------
 Wrappers/Python/test/test_stepsizes.py  |   4 +-
 2 files changed, 59 insertions(+), 81 deletions(-)

diff --git a/Wrappers/Python/test/test_algorithms.py b/Wrappers/Python/test/test_algorithms.py
index c25da7f2cc..56561d6901 100644
--- a/Wrappers/Python/test/test_algorithms.py
+++ b/Wrappers/Python/test/test_algorithms.py
@@ -105,13 +105,10 @@ def test_GD(self):
         alg = GD(initial=initial, objective_function=norm2sq, step_size=step_size,
                  atol=1e-9, rtol=1e-6)
-        alg.max_iteration = 1000
         alg.run(1000,verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())
         alg = GD(initial=initial, objective_function=norm2sq, step_size=step_size,
-                 atol=1e-9, rtol=1e-6, max_iteration=20, update_objective_interval=2)
-        alg.max_iteration = 20
-        self.assertTrue(alg.max_iteration == 20)
+                 atol=1e-9, rtol=1e-6, update_objective_interval=2)
         self.assertTrue(alg.update_objective_interval == 2)
         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())
@@ -132,7 +129,6 @@ def test_update_interval_0(self):
         norm2sq = LeastSquares(identity, b)

         alg = GD(initial=initial, objective_function=norm2sq,
-                 max_iteration=20,
                  update_objective_interval=0,
                  atol=1e-9, rtol=1e-6)
         self.assertTrue(alg.update_objective_interval == 0)
@@ -176,7 +172,6 @@ def test_gd_constant_step_size_init(self):
     def test_gd_fixed_step_size_rosen(self):
         gd = GD(initial=self.initial, objective_function=self.f, step_size=0.002,
-                max_iteration=3000,
                 update_objective_interval=500)
         gd.run(3000, verbose=0)
         np.testing.assert_allclose(
@@ -224,21 +219,16 @@ def test_GDArmijo(self):
         norm2sq = LeastSquares(identity, b)

         alg = GD(initial=initial, objective_function=norm2sq)
-        alg.max_iteration = 100
         alg.run(100, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())
-        alg = GD(initial=initial, objective_function=norm2sq,
-                 max_iteration=20, update_objective_interval=2)
-        # alg.max_iteration = 20
-        self.assertTrue(alg.max_iteration == 20)
+        alg = GD(initial=initial, objective_function=norm2sq, update_objective_interval=2)
         self.assertTrue(alg.update_objective_interval==2)
         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

     def test_gd_armijo_rosen(self):
-        armj = ArmijoStepSizeRule(alpha=50, max_iterations=150)
+        armj = ArmijoStepSizeRule(alpha=50)
         gd = GD(initial=self.initial, objective_function=self.f, step_size=armj,
-                max_iteration=2500,
                 update_objective_interval=500)
         gd.run(3000,verbose=0)
         np.testing.assert_allclose(
@@ -262,31 +252,26 @@ def test_FISTA(self):
         log.info("initial objective %s", norm2sq(initial))
         alg = FISTA(initial=initial, f=norm2sq, g=ZeroFunction())
-        alg.max_iteration = 2
         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

         alg = FISTA(initial=initial, f=norm2sq, g=ZeroFunction(),
-                    max_iteration=2, update_objective_interval=2)
+                    update_objective_interval=2)

-        self.assertTrue(alg.max_iteration == 2)
         self.assertTrue(alg.update_objective_interval == 2)

         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

         # Testing g=None
-        alg = FISTA(initial=initial, f=norm2sq, g=None,
-                    max_iteration=2, update_objective_interval=2)
-        self.assertTrue(alg.max_iteration == 2)
+        alg = FISTA(initial=initial, f=norm2sq, g=None, update_objective_interval=2)
         self.assertTrue(alg.update_objective_interval == 2)
         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

         # Testing f=None
         alg = FISTA(initial=initial, f=None, g=L1Norm(b=b),
-                    max_iteration=2, update_objective_interval=2)
-        self.assertTrue(alg.max_iteration == 2)
+                    update_objective_interval=2)
         self.assertTrue(alg.update_objective_interval == 2)
         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())
@@ -294,7 +279,7 @@ def test_FISTA(self):
         # Testing f and g is None
         with self.assertRaises(ValueError):
             alg = FISTA(initial=initial, f=None, g=None,
-                        max_iteration=2, update_objective_interval=2)
+                        update_objective_interval=2)

     def test_FISTA_update(self):

@@ -319,7 +304,7 @@ def test_FISTA_update(self):
         # ista run 10 iteration
         tmp_initial = ig.allocate()
-        fista = FISTA(initial=tmp_initial, f=f, g=g, max_iteration=1)
+        fista = FISTA(initial=tmp_initial, f=f, g=g)
         fista.run(1)

         # fista update method
@@ -348,11 +333,11 @@ def test_FISTA_update(self):
         self.assertTrue(res1 == res2)

         tmp_initial = ig.allocate()
-        fista1 = FISTA(initial=tmp_initial, f=f, g=g, max_iteration=1)
+        fista1 = FISTA(initial=tmp_initial, f=f, g=g)
         self.assertTrue(fista1.is_provably_convergent())

         fista1 = FISTA(initial=tmp_initial, f=f, g=g,
-                       max_iteration=1, step_size=30.0)
+                       step_size=30.0)
         self.assertFalse(fista1.is_provably_convergent())

     def test_FISTA_Norm2Sq(self):
@@ -367,13 +352,11 @@ def test_FISTA_Norm2Sq(self):
         opt = {'tol': 1e-4, 'memopt': False}
         log.info("initial objective %s", norm2sq(initial))
         alg = FISTA(initial=initial, f=norm2sq, g=ZeroFunction())
-        alg.max_iteration = 2
         alg.run(20, verbose=0)
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

         alg = FISTA(initial=initial, f=norm2sq, g=ZeroFunction(),
-                    max_iteration=2, update_objective_interval=3)
-        self.assertTrue(alg.max_iteration == 2)
+                    update_objective_interval=3)
         self.assertTrue(alg.update_objective_interval == 3)

         alg.run(20, verbose=0)
@@ -419,7 +402,6 @@ def test_FISTA_Denoising(self):
         initial = ig.allocate()
         fista = FISTA(initial=initial, f=reg, g=fid)
-        fista.max_iteration = 3000
         fista.update_objective_interval = 500
         fista.run(3000, verbose=0)
         rmse = (fista.get_output() - data).norm() / data.as_array().size
@@ -483,7 +465,7 @@ def test_update(self):
         # ista run 10 iteration
         tmp_initial = self.ig.allocate()
-        ista = ISTA(initial=tmp_initial, f=self.f, g=self.g, max_iteration=1)
+        ista = ISTA(initial=tmp_initial, f=self.f, g=self.g)
         ista.run(1)

         x = tmp_initial.copy()
@@ -505,7 +487,7 @@ def test_update_g_none(self):
         # ista run 10 iteration
         tmp_initial = self.ig.allocate()
-        ista = ISTA(initial=tmp_initial, f=self.f, g=None, max_iteration=1)
+        ista = ISTA(initial=tmp_initial, f=self.f, g=None)
         ista.run(1)

         x = tmp_initial.copy()
@@ -526,7 +508,7 @@ def test_update_f_none(self):
         # ista run 1 iteration
         tmp_initial = self.ig.allocate()
-        ista = ISTA(initial=tmp_initial, f=None, g=self.h, max_iteration=1)
+        ista = ISTA(initial=tmp_initial, f=None, g=self.h)
         ista.run(1)

         x = tmp_initial.copy()
@@ -546,23 +528,23 @@ def test_update_f_none(self):
     def test_f_and_g_none(self):
         tmp_initial = self.ig.allocate()
         with self.assertRaises(ValueError):
-            ista = ISTA(initial=tmp_initial, f=None, g=None, max_iteration=1)
+            ista = ISTA(initial=tmp_initial, f=None, g=None)

     def test_provable_condition(self):
         tmp_initial = self.ig.allocate()
-        ista1 = ISTA(initial=tmp_initial, f=self.f, g=self.g, max_iteration=10)
+        ista1 = ISTA(initial=tmp_initial, f=self.f, g=self.g)
         self.assertTrue(ista1.is_provably_convergent())

         ista1 = ISTA(initial=tmp_initial, f=self.f, g=self.g,
-                     max_iteration=10, step_size=30.0)
+                     step_size=30.0)
         self.assertFalse(ista1.is_provably_convergent())

     @unittest.skipUnless(has_cvxpy, "CVXpy not installed")
     def test_with_cvxpy(self):
         ista = ISTA(initial=self.initial, f=self.f,
-                    g=self.g, max_iteration=2000)
+                    g=self.g)
         ista.run(2000, verbose=0)

         u_cvxpy = cvxpy.Variable(self.ig.shape[0])
@@ -738,7 +720,6 @@ def setup(data, dnoise):
         # Setup and run the PDHG algorithm
         pdhg1 = PDHG(f=f1, g=g, operator=operator, tau=tau, sigma=sigma)
-        pdhg1.max_iteration = 2000
         pdhg1.update_objective_interval = 200
         pdhg1.run(1000, verbose=0)

@@ -763,7 +744,7 @@ def setup(data, dnoise):
         # Setup and run the PDHG algorithm
         pdhg1 = PDHG(f=f1, g=g, operator=operator, tau=tau, sigma=sigma,
-                     max_iteration=2000, update_objective_interval=200)
+                     update_objective_interval=200)

         pdhg1.run(1000, verbose=0)

@@ -788,7 +769,6 @@ def setup(data, dnoise):
         # Setup and run the PDHG algorithm
         pdhg1 = PDHG(f=f1, g=g, operator=operator, tau=tau, sigma=sigma)
-        pdhg1.max_iteration = 2000
         pdhg1.update_objective_interval = 200
         pdhg1.run(1000, verbose=0)

@@ -805,28 +785,28 @@ def test_PDHG_step_sizes(self):
         operator = 3*IdentityOperator(ig)

         # check if sigma, tau are None
-        pdhg = PDHG(f=f, g=g, operator=operator, max_iteration=10)
+        pdhg = PDHG(f=f, g=g, operator=operator)
         self.assertAlmostEqual(pdhg.sigma, 1./operator.norm())
         self.assertAlmostEqual(pdhg.tau, 1./operator.norm())

         # check if sigma is negative
         with self.assertRaises(ValueError):
             pdhg = PDHG(f=f, g=g, operator=operator,
-                        max_iteration=10, sigma=-1)
+                        sigma=-1)

         # check if tau is negative
         with self.assertRaises(ValueError):
-            pdhg = PDHG(f=f, g=g, operator=operator, max_iteration=10, tau=-1)
+            pdhg = PDHG(f=f, g=g, operator=operator,tau=-1)

         # check if tau is None
         sigma = 3.0
-        pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, max_iteration=10)
+        pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma)
         self.assertAlmostEqual(pdhg.sigma, sigma)
         self.assertAlmostEqual(pdhg.tau, 1./(sigma * operator.norm()**2))

         # check if sigma is None
         tau = 3.0
-        pdhg = PDHG(f=f, g=g, operator=operator, tau=tau, max_iteration=10)
+        pdhg = PDHG(f=f, g=g, operator=operator, tau=tau)
         self.assertAlmostEqual(pdhg.tau, tau)
         self.assertAlmostEqual(pdhg.sigma, 1./(tau * operator.norm()**2))

@@ -834,7 +814,7 @@ def test_PDHG_step_sizes(self):
         tau = 1.0
         sigma = 1.0
         pdhg = PDHG(f=f, g=g, operator=operator, tau=tau,
-                    sigma=sigma, max_iteration=10)
+                    sigma=sigma)
         self.assertAlmostEqual(pdhg.tau, tau)
         self.assertAlmostEqual(pdhg.sigma, sigma)

@@ -843,29 +823,29 @@ def test_PDHG_step_sizes(self):
         sigma = ig1.allocate()
         with self.assertRaises(ValueError):
             pdhg = PDHG(f=f, g=g, operator=operator,
-                        sigma=sigma, max_iteration=10)
+                        sigma=sigma)

         # check sigma/tau as arrays, tau wrong shape
         tau = ig1.allocate()
         with self.assertRaises(ValueError):
-            pdhg = PDHG(f=f, g=g, operator=operator, tau=tau, max_iteration=10)
+            pdhg = PDHG(f=f, g=g, operator=operator, tau=tau)

         # check sigma not Number or object with correct shape
         with self.assertRaises(AttributeError):
             pdhg = PDHG(f=f, g=g, operator=operator,
-                        sigma="sigma", max_iteration=10)
+                        sigma="sigma")

         # check tau not Number or object with correct shape
         with self.assertRaises(AttributeError):
             pdhg = PDHG(f=f, g=g, operator=operator,
-                        tau="tau", max_iteration=10)
+                        tau="tau")

         # check warning message if condition is not satisfied
         sigma = 4
         tau = 1/3
         with self.assertWarnsRegex(UserWarning, "Convergence criterion"):
             pdhg = PDHG(f=f, g=g, operator=operator, tau=tau,
-                        sigma=sigma, max_iteration=10)
+                        sigma=sigma)

     def test_PDHG_strongly_convex_gamma_g(self):
         ig = ImageGeometry(3, 3)
@@ -880,7 +860,7 @@ def test_PDHG_strongly_convex_gamma_g(self):
         tau = 1.0

         pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, tau=tau,
-                    max_iteration=5, gamma_g=0.5)
+                    gamma_g=0.5)
         pdhg.run(1, verbose=0)
         self.assertAlmostEqual(
             pdhg.theta, 1.0 / np.sqrt(1 + 2 * pdhg.gamma_g * tau))
@@ -893,12 +873,12 @@ def test_PDHG_strongly_convex_gamma_g(self):
         # check negative strongly convex constant
         with self.assertRaises(ValueError):
             pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, tau=tau,
-                        max_iteration=5, gamma_g=-0.5)
+                        gamma_g=-0.5)

         # check strongly convex constant not a number
         with self.assertRaises(ValueError):
             pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, tau=tau,
-                        max_iteration=5, gamma_g="-0.5")
+                        gamma_g="-0.5")

     def test_PDHG_strongly_convex_gamma_fcong(self):
         ig = ImageGeometry(3, 3)
@@ -913,7 +893,7 @@ def test_PDHG_strongly_convex_gamma_fcong(self):
         tau = 1.0

         pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, tau=tau,
-                    max_iteration=5, gamma_fconj=0.5)
+                    gamma_fconj=0.5)
         pdhg.run(1, verbose=0)
         self.assertEqual(pdhg.theta, 1.0 /
                          np.sqrt(1 + 2 * pdhg.gamma_fconj * sigma))
@@ -926,14 +906,14 @@ def test_PDHG_strongly_convex_gamma_fcong(self):
         # check negative strongly convex constant
         try:
             pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, tau=tau,
-                        max_iteration=5, gamma_fconj=-0.5)
+                        gamma_fconj=-0.5)
         except ValueError as ve:
             log.info(str(ve))

         # check strongly convex constant not a number
         try:
             pdhg = PDHG(f=f, g=g, operator=operator, sigma=sigma, tau=tau,
-                        max_iteration=5, gamma_fconj="-0.5")
+                        gamma_fconj="-0.5")
         except ValueError as ve:
             log.info(str(ve))

@@ -947,7 +927,7 @@ def test_PDHG_strongly_convex_both_fconj_and_g(self):
         operator = IdentityOperator(ig)

         try:
-            pdhg = PDHG(f=f, g=g, operator=operator, max_iteration=10,
+            pdhg = PDHG(f=f, g=g, operator=operator,
                         gamma_g=0.5, gamma_fconj=0.5)
             pdhg.run(verbose=0)
         except ValueError as err:
@@ -1031,7 +1011,7 @@ def test_update(self):
         # sirt run 5 iterations
         tmp_initial = self.ig.allocate()
         sirt = SIRT(initial=tmp_initial, operator=self.Aop,
-                    data=self.bop, max_iteration=5)
+                    data=self.bop)
         sirt.run(5)

         x = tmp_initial.copy()
@@ -1046,22 +1026,22 @@ def test_update(self):
     def test_update_constraints(self):
         alg = SIRT(initial=self.initial2, operator=self.A2,
-                   data=self.b2, max_iteration=20)
+                   data=self.b2)
         alg.run(20,verbose=0)
         np.testing.assert_array_almost_equal(alg.x.array, self.b2.array)

         alg = SIRT(initial=self.initial2, operator=self.A2,
-                   data=self.b2, max_iteration=20, upper=0.3)
+                   data=self.b2, upper=0.3)
         alg.run(20,verbose=0)
         np.testing.assert_almost_equal(alg.solution.max(), 0.3)

         alg = SIRT(initial=self.initial2, operator=self.A2,
-                   data=self.b2, max_iteration=20, lower=0.7)
+                   data=self.b2, lower=0.7)
         alg.run(20,verbose=0)
         np.testing.assert_almost_equal(alg.solution.min(), 0.7)

         alg = SIRT(initial=self.initial2, operator=self.A2, data=self.b2,
-                   max_iteration=20, constraint=IndicatorBox(lower=0.1, upper=0.3))
+                   constraint=IndicatorBox(lower=0.1, upper=0.3))
         alg.run(20,verbose=0)
         np.testing.assert_almost_equal(alg.solution.max(), 0.3)
         np.testing.assert_almost_equal(alg.solution.min(), 0.1)
@@ -1069,7 +1049,7 @@ def test_SIRT_relaxation_parameter(self):
         tmp_initial = self.ig.allocate()
         alg = SIRT(initial=tmp_initial, operator=self.Aop,
-                   data=self.bop, max_iteration=5)
+                   data=self.bop)

         with self.assertRaises(ValueError):
             alg.set_relaxation_parameter(0)
@@ -1078,7 +1058,7 @@ def test_SIRT_relaxation_parameter(self):
             alg.set_relaxation_parameter(2)

         alg = SIRT(initial=self.initial2, operator=self.A2,
-                   data=self.b2, max_iteration=20)
+                   data=self.b2)
         alg.set_relaxation_parameter(0.5)
         self.assertEqual(alg.relaxation_parameter, 0.5)

@@ -1095,7 +1075,7 @@ def test_SIRT_nan_inf_values(self):
         tmp_initial = self.ig.allocate()
         sirt = SIRT(initial=tmp_initial, operator=Aop_nan_inf,
-                    data=self.bop, max_iteration=5)
+                    data=self.bop)

         self.assertFalse(np.any(sirt.M == np.inf))
         self.assertFalse(np.any(sirt.D == np.inf))
@@ -1117,7 +1097,7 @@ def test_SIRT_remove_nan_or_inf_with_BlockDataContainer(self):
         tmp_initial = ig.allocate()
         sirt = SIRT(initial=tmp_initial, operator=Aop,
-                    data=bop, max_iteration=5)
+                    data=bop)

         for el in sirt.M.containers:
             self.assertFalse(np.any(el == np.inf))
@@ -1127,13 +1107,13 @@ def test_SIRT_with_TV(self):
         data = dataexample.SIMPLE_PHANTOM_2D.get(size=(128, 128))
         ig = data.geometry
         A = IdentityOperator(ig)
-        constraint = TotalVariation(warm_start=False, max_iteration=100)
+        constraint = TotalVariation(warm_start=False)
         initial = ig.allocate('random', seed=5)
         sirt = SIRT(initial=initial, operator=A, data=data,
-                    max_iteration=2, constraint=constraint)
+                    constraint=constraint)
         sirt.run(2, verbose=0)
         f = LeastSquares(A, data, c=0.5)
-        fista = FISTA(initial=initial, f=f, g=constraint, max_iteration=1000)
+        fista = FISTA(initial=initial, f=f, g=constraint)
         fista.run(100, verbose=0)
         self.assertNumpyArrayAlmostEqual(fista.x.as_array(), sirt.x.as_array())
@@ -1141,10 +1121,10 @@ def test_SIRT_with_TV_warm_start(self):
         data = dataexample.SIMPLE_PHANTOM_2D.get(size=(128, 128))
         ig = data.geometry
         A = IdentityOperator(ig)
-        constraint = 1e6*TotalVariation(warm_start=True, max_iteration=100)
+        constraint = 1e6*TotalVariation(warm_start=True)
         initial = ig.allocate('random', seed=5)
         sirt = SIRT(initial=initial, operator=A, data=data,
-                    max_iteration=150, constraint=constraint)
+                    constraint=constraint)
         sirt.run(25, verbose=0)

         self.assertNumpyArrayAlmostEqual(
@@ -1470,11 +1450,11 @@ def do_test_with_fidelity(self, fidelity):
         F = self.F

         admm = LADMM(f=G, g=F, operator=K, tau=self.tau, sigma=self.sigma,
-                     max_iteration=100, update_objective_interval=10)
+                     update_objective_interval=10)
         admm.run(1, verbose=0)

         admm_noaxpby = LADMM(f=G, g=F, operator=K, tau=self.tau, sigma=self.sigma,
-                             max_iteration=100, update_objective_interval=10)
+                             update_objective_interval=10)
         admm_noaxpby.run(1, verbose=0)
         np.testing.assert_array_almost_equal(
             admm.solution.as_array(), admm_noaxpby.solution.as_array())
@@ -1506,14 +1486,14 @@ def test_compare_with_PDHG(self):
         tau = 1./normK

         pdhg = PDHG(f=F, g=G, operator=K, tau=tau, sigma=sigma,
-                    max_iteration=500, update_objective_interval=10)
+                    update_objective_interval=10)
         pdhg.run(500,verbose=0)

         sigma = 1
         tau = sigma/normK**2

         admm = LADMM(f=G, g=F, operator=K, tau=tau, sigma=sigma,
-                     max_iteration=500, update_objective_interval=10)
+                     update_objective_interval=10)
         admm.run(500,verbose=0)
         np.testing.assert_almost_equal(
             admm.solution.array, pdhg.solution.array, decimal=3)
@@ -1564,8 +1544,7 @@ def test_PD3O_PDHG_denoising_1_iteration(self):
         G = 0.5 * L2NormSquared(b=self.data)
         sigma = 1./norm_op
         tau = 1./norm_op
-        pdhg = PDHG(f=F, g=G, operator=operator, tau=tau, sigma=sigma, update_objective_interval = 100,
-                    max_iteration = 2000)
+        pdhg = PDHG(f=F, g=G, operator=operator, tau=tau, sigma=sigma, update_objective_interval = 100)
         pdhg.run(1)

         # setup PD3O denoising  (F=ZeroFunction)
@@ -1576,8 +1555,7 @@ def test_PD3O_PDHG_denoising_1_iteration(self):
         delta = 1./norm_op

         pd3O = PD3O(f=F, g=G, h=H, operator=operator, gamma=gamma, delta=delta,
-                    update_objective_interval = 100,
-                    max_iteration = 2000)
+                    update_objective_interval = 100)
         pd3O.run(1)

         # PD3O vs pdhg
diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index b952c44820..4a36dc26de 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -71,7 +71,7 @@ def test_armijo_init(self):
             2 * np.log10(1e6) / np.log10(2)))

     def test_armijo_calculation(self):
-        test_stepsize = ArmijoStepSizeRule(alpha=8, beta=0.5, max_iterations=100)
+        test_stepsize = ArmijoStepSizeRule(alpha=8, beta=0.5, max_iterations=100, warmstart=False)

         alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
                  max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
@@ -250,7 +250,7 @@ def test_bb_converge(self):
         initial = ig.allocate()
         f = LeastSquares(Aop, b=bop, c=2)

-        ss_rule=ArmijoStepSizeRule(max_iterations=40)
+        ss_rule=ArmijoStepSizeRule(max_iterations=40, warmstart=False)
         alg_true = GD(initial=initial, objective_function=f, step_size=ss_rule)
         alg_true .run(300, verbose=0)

From 785cbbe0b6a1113608bffdbfab08584cc94c228b Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 12:39:32 +0000
Subject: [PATCH 05/15] Don't kill all max_iteration

---
 Wrappers/Python/test/test_algorithms.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Wrappers/Python/test/test_algorithms.py b/Wrappers/Python/test/test_algorithms.py
index 56561d6901..61d285c58b 100644
--- a/Wrappers/Python/test/test_algorithms.py
+++ b/Wrappers/Python/test/test_algorithms.py
@@ -227,7 +227,7 @@ def test_GDArmijo(self):
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

     def test_gd_armijo_rosen(self):
-        armj = ArmijoStepSizeRule(alpha=50)
+        armj = ArmijoStepSizeRule(alpha=50, max_iterations=50)
         gd = GD(initial=self.initial, objective_function=self.f, step_size=armj,
                 update_objective_interval=500)
         gd.run(3000,verbose=0)
@@ -1121,7 +1121,7 @@ def test_SIRT_with_TV_warm_start(self):
         data = dataexample.SIMPLE_PHANTOM_2D.get(size=(128, 128))
         ig = data.geometry
         A = IdentityOperator(ig)
-        constraint = 1e6*TotalVariation(warm_start=True)
+        constraint = 1e6*TotalVariation(warm_start=True, max_iteration=100)
         initial = ig.allocate('random', seed=5)
         sirt = SIRT(initial=initial, operator=A, data=data,
                     constraint=constraint)

From 5b385dbc6efa1454b5690eb643547a7d754be012 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 12:45:51 +0000
Subject: [PATCH 06/15] Broken ROsen

---
 Wrappers/Python/test/test_algorithms.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Wrappers/Python/test/test_algorithms.py b/Wrappers/Python/test/test_algorithms.py
index 61d285c58b..36a8e10847 100644
--- a/Wrappers/Python/test/test_algorithms.py
+++ b/Wrappers/Python/test/test_algorithms.py
@@ -230,7 +230,7 @@ def test_gd_armijo_rosen(self):
         armj = ArmijoStepSizeRule(alpha=50, max_iterations=50)
         gd = GD(initial=self.initial, objective_function=self.f, step_size=armj,
                 update_objective_interval=500)
-        gd.run(3000,verbose=0)
+        gd.run(5000,verbose=0)
         np.testing.assert_allclose(
             gd.solution.array[0], self.scipy_opt_high.x[0], atol=1e-2)
         np.testing.assert_allclose(
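For context on why patches 05-07 keep retuning the iteration budget of `test_gd_armijo_rosen`: the test names suggest that `self.f` here is the standard two-dimensional Rosenbrock objective (an assumption, since its setup lies outside this diff),

.. math:: f(x_1, x_2) = (1 - x_1)^2 + 100\,(x_2 - x_1^2)^2,

whose minimiser sits at the end of a long, narrowly curved valley. A backtracking line search only accepts small steps inside the valley, so the number of gradient-descent iterations needed to hit the `atol=1e-2` tolerance is sensitive to the Armijo parameters (`alpha`, `max_iterations`, and now `warmstart`), which is why the `gd.run(...)` budget moves between 2500, 3000, 5000 and 3500 across these commits.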
From af4e5d6cfcb39c846d6f9a71d00d1a921abbcb6c Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 12:53:11 +0000
Subject: [PATCH 07/15] Try again

---
 Wrappers/Python/test/test_algorithms.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Wrappers/Python/test/test_algorithms.py b/Wrappers/Python/test/test_algorithms.py
index 36a8e10847..845b5a44ce 100644
--- a/Wrappers/Python/test/test_algorithms.py
+++ b/Wrappers/Python/test/test_algorithms.py
@@ -227,10 +227,10 @@ def test_GDArmijo(self):
         self.assertNumpyArrayAlmostEqual(alg.x.as_array(), b.as_array())

     def test_gd_armijo_rosen(self):
-        armj = ArmijoStepSizeRule(alpha=50, max_iterations=50)
+        armj = ArmijoStepSizeRule(alpha=50, max_iterations=50, warmstart=False)
         gd = GD(initial=self.initial, objective_function=self.f, step_size=armj,
                 update_objective_interval=500)
-        gd.run(5000,verbose=0)
+        gd.run(3500,verbose=0)
         np.testing.assert_allclose(
             gd.solution.array[0], self.scipy_opt_high.x[0], atol=1e-2)
         np.testing.assert_allclose(

From 284b45adbdfc0f6f23ffb0a75e12557effd3e66c Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 13:02:30 +0000
Subject: [PATCH 08/15] ISTA and FISTA tests

---
 Wrappers/Python/test/test_stepsizes.py | 30 ++++++++++++++++++++++++++
 1 file changed, 30 insertions(+)

diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index 4a36dc26de..4276931945 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -87,6 +87,36 @@ def test_armijo_calculation(self):
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 2)

+    def test_armijo_ISTA_and_FISTA(self):
+        test_stepsize = ArmijoStepSizeRule(alpha=8, beta=0.5, max_iterations=100, warmstart=False)
+
+        alg = ISTA(initial=self.ig.allocate(0), f=self.f, g=IndicatorBox(lower=0),
+                   max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
+        alg.gradient_update = self.ig.allocate(-1)
+        step_size = test_stepsize.get_step_size(alg)
+        self.assertAlmostEqual(step_size, 4)
+
+        alg.gradient_update = self.ig.allocate(-.5)
+        step_size = test_stepsize.get_step_size(alg)
+        self.assertAlmostEqual(step_size, 8)
+
+        alg.gradient_update = self.ig.allocate(-2)
+        step_size = test_stepsize.get_step_size(alg)
+        self.assertAlmostEqual(step_size, 2)
+
+        alg = FISTA(initial=self.ig.allocate(0), f=self.f, g=IndicatorBox(lower=0),
+                    max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
+        alg.gradient_update = self.ig.allocate(-1)
+        step_size = test_stepsize.get_step_size(alg)
+        self.assertAlmostEqual(step_size, 4)
+
+        alg.gradient_update = self.ig.allocate(-.5)
+        step_size = test_stepsize.get_step_size(alg)
+        self.assertAlmostEqual(step_size, 8)
+
+        alg.gradient_update = self.ig.allocate(-2)
+        step_size = test_stepsize.get_step_size(alg)
+        self.assertAlmostEqual(step_size, 2)

     def test_warmstart_true(self):
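A quick check of the expected values in these Armijo tests (assuming CIL's `LeastSquares` default scaling `c = 1`, so that `f(x) = ||Ax - b||_2^2` with `A = I` and `b = (3.5, 3.5)` from `setUp`): the rule accepts the first `alpha` satisfying

.. math:: f(x - \alpha g) - f(x) \le -\frac{\alpha}{2}\|g\|_2^2,

where `g` is the forced `gradient_update`. Starting from `x = 0`, so `f(x) = 2 \times 3.5^2 = 24.5`, with `alpha=8`, `beta=0.5` and `g = (-1, -1)`: at `alpha = 8`, `f((8, 8)) - f(x) = 40.5 - 24.5 = 16 > -8`, so the step is rejected and halved; at `alpha = 4`, `f((4, 4)) - f(x) = 0.5 - 24.5 = -24 \le -4`, so the step is accepted and the tests expect a step size of 4. The same arithmetic gives 8 for `g = (-0.5, -0.5)` and 2 for `g = (-2, -2)`.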
From 373a4486336523e5053d52001ecdcbafd82e9e54 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Tue, 24 Sep 2024 13:12:39 +0000
Subject: [PATCH 09/15] Kill max_iteration from test_stepsizes.py

---
 Wrappers/Python/test/test_stepsizes.py | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index 4276931945..76e0634f94 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -21,7 +21,7 @@ def test_step_sizes_called(self):
         step_size_test.get_step_size = MagicMock(return_value=.1)
         f = LeastSquares(A=A, b=data, c=0.5)
         alg = GD(initial=ig.allocate('random', seed=10), objective_function=f, step_size=step_size_test,
-                 max_iteration=100, update_objective_interval=1)
+                 update_objective_interval=1)

         alg.run(5)

@@ -30,14 +30,14 @@ def test_step_sizes_called(self):
         step_size_test = ConstantStepSize(3)
         step_size_test.get_step_size = MagicMock(return_value=.1)
         alg = ISTA(initial=ig.allocate('random', seed=10), f=f, g=IndicatorBox(lower=0), step_size=step_size_test,
-                   max_iteration=100, update_objective_interval=1)
+                   update_objective_interval=1)
         alg.run(5)
         self.assertEqual(len(step_size_test.get_step_size.mock_calls), 5)

         step_size_test = ConstantStepSize(3)
         step_size_test.get_step_size = MagicMock(return_value=.1)
         alg = FISTA(initial=ig.allocate('random', seed=10), f=f, g=IndicatorBox(lower=0), step_size=step_size_test,
-                    max_iteration=100, update_objective_interval=1)
+                    update_objective_interval=1)
         alg.run(5)
         self.assertEqual(len(step_size_test.get_step_size.mock_calls), 5)

@@ -74,7 +74,7 @@ def test_armijo_calculation(self):
         test_stepsize = ArmijoStepSizeRule(alpha=8, beta=0.5, max_iterations=100, warmstart=False)

         alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
-                 max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
+                 update_objective_interval=1, step_size=test_stepsize)
         alg.gradient_update = self.ig.allocate(-1)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 4)
@@ -91,7 +91,7 @@ def test_armijo_ISTA_and_FISTA(self):
         test_stepsize = ArmijoStepSizeRule(alpha=8, beta=0.5, max_iterations=100, warmstart=False)

         alg = ISTA(initial=self.ig.allocate(0), f=self.f, g=IndicatorBox(lower=0),
-                   max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
+                   update_objective_interval=1, step_size=test_stepsize)
         alg.gradient_update = self.ig.allocate(-1)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 4)
@@ -105,7 +105,7 @@ def test_armijo_ISTA_and_FISTA(self):
         alg = FISTA(initial=self.ig.allocate(0), f=self.f, g=IndicatorBox(lower=0),
-                    max_iteration=100, update_objective_interval=1, step_size=test_stepsize)
+                    update_objective_interval=1, step_size=test_stepsize)
         alg.gradient_update = self.ig.allocate(-1)
         step_size = test_stepsize.get_step_size(alg)
         self.assertAlmostEqual(step_size, 4)
@@ -124,7 +124,7 @@ def test_warmstart_true(self):
         self.assertTrue(rule.warmstart)
         self.assertTrue(rule.alpha_orig == 5000)
         alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
-                 max_iteration=100, update_objective_interval=1, step_size=rule)
+                 update_objective_interval=1, step_size=rule)
         alg.update()
         self.assertFalse(rule.alpha_orig == 5000)
         self.assertTrue(rule.alpha_orig == rule.alpha)
@@ -134,7 +134,7 @@ def test_warmstart_false(self):
         self.assertFalse(rule.warmstart)
         self.assertTrue(rule.alpha_orig == 5000)
         alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
-                 max_iteration=100, update_objective_interval=1, step_size=rule)
+                 update_objective_interval=1, step_size=rule)
         alg.update()
         self.assertTrue(rule.alpha_orig == 5000)
         self.assertFalse(rule.alpha_orig == rule.alpha)

From aae69726e68a8983fdf29654e2db68d600b570fe Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Wed, 25 Sep 2024 12:45:04 +0000
Subject: [PATCH 10/15] Changes from Casper's comments

---
 .../Python/cil/optimisation/utilities/StepSizeMethods.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
index 8a31d6c20e..17d24358e5 100644
--- a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
+++ b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
@@ -101,7 +101,7 @@ def __init__(self, alpha=1e6, beta=0.5, max_iterations=None, warmstart=True):
         self.alpha_orig = alpha
         if self.alpha_orig is None:  # Can be removed when alpha and beta are deprecated in GD
             self.alpha_orig = 1e6
-
+        self.alpha = self.alpha_orig
         self.beta = beta
         if self.beta is None:  # Can be removed when alpha and beta are deprecated in GD
             self.beta = 0.5
@@ -122,7 +122,7 @@ def get_step_size(self, algorithm):

         """
         k = 0
-        self.alpha = self.alpha_orig
+
         f_x = algorithm.objective_function(algorithm.solution)

         self.x_armijo = algorithm.solution.copy()
@@ -142,8 +142,8 @@ def get_step_size(self, algorithm):
         if k == self.max_iterations:
             raise ValueError(
                 'Could not find a proper step_size in {} loops. Consider increasing alpha or max_iterations.'.format(self.max_iterations))
-        if self.warmstart:
-            self.alpha_orig= self.alpha
+        if not self.warmstart:
+            self.alpha = self.alpha_orig
         return self.alpha

From 79f54f17c7daf3e9e68b64ec157ccfdb8a78a321 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Wed, 25 Sep 2024 15:45:04 +0000
Subject: [PATCH 11/15] Changes from Casper's comments - attempt 2

---
 .../Python/cil/optimisation/utilities/StepSizeMethods.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
index 17d24358e5..a249c4a2db 100644
--- a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
+++ b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
@@ -101,7 +101,7 @@ def __init__(self, alpha=1e6, beta=0.5, max_iterations=None, warmstart=True):
         self.alpha_orig = alpha
         if self.alpha_orig is None:  # Can be removed when alpha and beta are deprecated in GD
             self.alpha_orig = 1e6
-        self.alpha = self.alpha_orig
+        self.alpha = self.alpha_orig.copy()
         self.beta = beta
         if self.beta is None:  # Can be removed when alpha and beta are deprecated in GD
             self.beta = 0.5
@@ -122,6 +122,8 @@ def get_step_size(self, algorithm):

         """
         k = 0
+        if not self.warmstart:
+            self.alpha = self.alpha_orig

         f_x = algorithm.objective_function(algorithm.solution)

@@ -142,8 +144,7 @@ def get_step_size(self, algorithm):
         if k == self.max_iterations:
             raise ValueError(
                 'Could not find a proper step_size in {} loops. Consider increasing alpha or max_iterations.'.format(self.max_iterations))
-        if not self.warmstart:
-            self.alpha = self.alpha_orig
+
         return self.alpha

From 238fc2827c561469f94b8904f84fdf59353bad9a Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Wed, 25 Sep 2024 15:50:45 +0000
Subject: [PATCH 12/15] Changes from Casper's comments - attempt 3

---
 Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
index a249c4a2db..605b1ea731 100644
--- a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
+++ b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
@@ -101,7 +101,7 @@ def __init__(self, alpha=1e6, beta=0.5, max_iterations=None, warmstart=True):
         self.alpha_orig = alpha
         if self.alpha_orig is None:  # Can be removed when alpha and beta are deprecated in GD
             self.alpha_orig = 1e6
-        self.alpha = self.alpha_orig.copy()
+        self.alpha = self.alpha_orig
         self.beta = beta
         if self.beta is None:  # Can be removed when alpha and beta are deprecated in GD
             self.beta = 0.5

From 3725bd8636f07261ad39f8351e4201760629dae5 Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Wed, 25 Sep 2024 16:19:10 +0000
Subject: [PATCH 13/15] Attempt 4

---
 Wrappers/Python/test/test_stepsizes.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/Wrappers/Python/test/test_stepsizes.py b/Wrappers/Python/test/test_stepsizes.py
index 76e0634f94..1ef0fc145c 100644
--- a/Wrappers/Python/test/test_stepsizes.py
+++ b/Wrappers/Python/test/test_stepsizes.py
@@ -126,8 +126,7 @@ def test_warmstart_true(self):
         alg = GD(initial=self.ig.allocate(0), objective_function=self.f,
                  update_objective_interval=1, step_size=rule)
         alg.update()
-        self.assertFalse(rule.alpha_orig == 5000)
-        self.assertTrue(rule.alpha_orig == rule.alpha)
+        self.assertFalse(rule.alpha == 5000)

     def test_warmstart_false(self):
         rule = ArmijoStepSizeRule(warmstart=False, alpha=5000)

From 2912262f969e1b0eb411c1f90d9ce604f98c6dbe Mon Sep 17 00:00:00 2001
From: Margaret Duff
Date: Thu, 26 Sep 2024 11:14:07 +0000
Subject: [PATCH 14/15] Changes after discussion with Gemma

---
 .../cil/optimisation/algorithms/FISTA.py      |  6 ++---
 .../Python/cil/optimisation/algorithms/GD.py  | 23 ++++++++++++++++---
 .../optimisation/utilities/StepSizeMethods.py | 13 ++++++++---
 3 files changed, 33 insertions(+), 9 deletions(-)

diff --git a/Wrappers/Python/cil/optimisation/algorithms/FISTA.py b/Wrappers/Python/cil/optimisation/algorithms/FISTA.py
index b7ba923011..05143e8157 100644
--- a/Wrappers/Python/cil/optimisation/algorithms/FISTA.py
+++ b/Wrappers/Python/cil/optimisation/algorithms/FISTA.py
@@ -213,10 +213,10 @@ def update_objective(self):

         .. math:: f(x) + g(x)

         """
-        self.loss.append(self.objective_function(self.x_old))
+        self.loss.append(self.calculate_objective_function_at_point(self.x_old))

-    def objective_function(self, x):
-        """ Calculates the objective
+    def calculate_objective_function_at_point(self, x):
+        """ Calculates the objective at a given point x

         .. math:: f(x) + g(x)

         Parameters
         ----------
         x : DataContainer

diff --git a/Wrappers/Python/cil/optimisation/algorithms/GD.py b/Wrappers/Python/cil/optimisation/algorithms/GD.py
index 22e1adcc78..9d3fdbee70 100644
--- a/Wrappers/Python/cil/optimisation/algorithms/GD.py
+++ b/Wrappers/Python/cil/optimisation/algorithms/GD.py
@@ -84,7 +84,7 @@ def set_up(self, initial, objective_function, step_size, preconditioner):
         log.info("%s setting up", self.__class__.__name__)

         self.x = initial.copy()
-        self.objective_function = objective_function
+        self._objective_function = objective_function

         if step_size is None:
             self.step_size_rule = ArmijoStepSizeRule(
@@ -106,7 +106,7 @@ def set_up(self, initial, objective_function, step_size, preconditioner):
     def update(self):
         '''Performs a single iteration of the gradient descent algorithm'''
-        self.objective_function.gradient(self.x, out=self.gradient_update)
+        self._objective_function.gradient(self.x, out=self.gradient_update)

         if self.preconditioner is not None:
             self.preconditioner.apply(
@@ -117,7 +117,7 @@ def update(self):
         self.x.sapyb(1.0, self.gradient_update, -step_size, out=self.x)

     def update_objective(self):
-        self.loss.append(self.objective_function(self.solution))
+        self.loss.append(self._objective_function(self.solution))

     def should_stop(self):
         '''Stopping criterion for the gradient descent algorithm '''
@@ -132,3 +132,20 @@ def step_size(self):
         else:
             raise TypeError(
                 "There is not a constant step size, it is set by a step-size rule")
+
+    def calculate_objective_function_at_point(self, x):
+        """ Calculates the objective at a given point x
+
+        .. math:: f(x) + g(x)
+
+        Parameters
+        ----------
+        x : DataContainer
+
+        """
+        return self._objective_function(x)
+
+    @property
+    def objective_function(self):
+        warn('The attribute `objective_function` will be deprecated in the future. Please use `calculate_objective_function_at_point` instead.', DeprecationWarning, stacklevel=2)
+        return self._objective_function
\ No newline at end of file

diff --git a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
index 605b1ea731..a680bd24d7 100644
--- a/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
+++ b/Wrappers/Python/cil/optimisation/utilities/StepSizeMethods.py
@@ -19,6 +19,9 @@
 from abc import ABC, abstractmethod
 import numpy
 from numbers import Number
+import logging
+
+log = logging.getLogger(__name__)

 class StepSizeRule(ABC):
     """
@@ -125,21 +128,25 @@ def get_step_size(self, algorithm):
         if not self.warmstart:
             self.alpha = self.alpha_orig

-        f_x = algorithm.objective_function(algorithm.solution)
+        f_x = algorithm.calculate_objective_function_at_point(algorithm.solution)

         self.x_armijo = algorithm.solution.copy()
-
+
+        log.debug("Starting Armijo backtracking with initial step size: %f", self.alpha)
+
         while k < self.max_iterations:

             algorithm.gradient_update.multiply(self.alpha, out=self.x_armijo)
             algorithm.solution.subtract(self.x_armijo, out=self.x_armijo)

-            f_x_a = algorithm.objective_function(self.x_armijo)
+            f_x_a = algorithm.calculate_objective_function_at_point(self.x_armijo)
             sqnorm = algorithm.gradient_update.squared_norm()
             if f_x_a - f_x <= - (self.alpha/2.) * sqnorm:
                 break
             k += 1.
             self.alpha *= self.beta
+
+        log.info("Armijo rule took %d iterations to find step size", k)

         if k == self.max_iterations:
             raise ValueError(

From 6cc35143ef6a32b61635103d7874d04d5238a37b Mon Sep 17 00:00:00 2001
From: Margaret Duff <43645617+MargaretDuff@users.noreply.github.com>
Date: Tue, 8 Oct 2024 14:49:34 +0100
Subject: [PATCH 15/15] Update CHANGELOG.md

Signed-off-by: Margaret Duff <43645617+MargaretDuff@users.noreply.github.com>
---
 CHANGELOG.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 4afe8479ce..fc0be4e350 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -28,8 +28,10 @@
   - Make Binner accept accelerated=False (#1887)
   - Added checks on memory allocations within `FiniteDifferenceLibrary.cpp` and verified the status of the return in `GradientOperator` (#1929)
   - Build release version of `cilacc.dll` for Windows. Previously was defaulting to the debug build (#1928)
+  - Armijo step size rule now by default initialises the search for a step size from the previously calculated step size (#1934)
 - Changes that break backwards compatibility:
   - CGLS will no longer automatically stop iterations once a default tolerance is reached. The option to pass `tolerance` will be deprecated to be replaced by `optimisation.utilities.callbacks` (#1892)
+
 * 24.1.0
 - New Features:
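A minimal sketch of how the renamed API from PATCH 14 behaves from user code (an illustration, not part of the patch series; it assumes a CIL build containing these commits and mirrors the toy problem used in the tests above):

import warnings
import numpy as np
from cil.framework import VectorGeometry
from cil.optimisation.operators import MatrixOperator
from cil.optimisation.functions import LeastSquares
from cil.optimisation.algorithms import GD

ig = VectorGeometry(2)
data = ig.allocate(0)
data.fill(np.array([3.5, 3.5]))
f = LeastSquares(MatrixOperator(np.diag([1., 1.])), data)
alg = GD(initial=ig.allocate(0), objective_function=f, step_size=0.1)

x = ig.allocate(1.0)

# New, preferred spelling: evaluates the objective at an arbitrary point.
val = alg.calculate_objective_function_at_point(x)

# Old attribute access still works, but it now goes through a property that
# emits a DeprecationWarning before returning the wrapped function.
with warnings.catch_warnings(record=True) as caught:
    warnings.simplefilter("always")
    same_val = alg.objective_function(x)
assert any(issubclass(w.category, DeprecationWarning) for w in caught)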