From 916a3f9d31078a93e0aed8025e77a7fd27a2a8b5 Mon Sep 17 00:00:00 2001
From: Jacek
Date: Fri, 28 Jan 2022 13:47:10 +0100
Subject: [PATCH] Add basic version of parallelized Nelder-Mead (#276)

---
 ..._to_specify_algorithm_and_algo_options.rst |  36 ++
 environment.yml                               |   1 -
 src/estimagic/optimization/__init__.py        |   7 +-
 src/estimagic/optimization/neldermead.py      | 397 ++++++++++++++++++
 tests/optimization/test_neldermead.py         | 139 ++++++
 5 files changed, 578 insertions(+), 2 deletions(-)
 create mode 100644 src/estimagic/optimization/neldermead.py
 create mode 100644 tests/optimization/test_neldermead.py

diff --git a/docs/source/how_to_guides/optimization/how_to_specify_algorithm_and_algo_options.rst b/docs/source/how_to_guides/optimization/how_to_specify_algorithm_and_algo_options.rst
index a934d182d..1057b3017 100644
--- a/docs/source/how_to_guides/optimization/how_to_specify_algorithm_and_algo_options.rst
+++ b/docs/source/how_to_guides/optimization/how_to_specify_algorithm_and_algo_options.rst
@@ -518,6 +518,42 @@ noisy criterion functions.
    evaluations. Default is 1.
 
 
+.. dropdown:: neldermead_parallel
+
+    Minimize a function using the neldermead_parallel algorithm.
+
+    This is a parallel Nelder-Mead algorithm following Lee D., Wiswall M., A
+    parallel implementation of the simplex function minimization routine,
+    Computational Economics, 2007.
+
+    The algorithm was implemented by Jacek Barszczewski.
+
+    The algorithm supports the following options:
+
+    - **init_simplex_method** (string or callable): Name of the method used to
+      create the initial simplex, or a callable that takes the initial parameter
+      vector as its argument and returns the initial simplex as a (j + 1) x j
+      array, where j is the length of x. The default is "gao_han".
+
+    - **n_cores** (int): Degree of parallelization. The default is 1
+      (no parallelization).
+
+    - **adaptive** (bool): Adjust the parameters of the Nelder-Mead algorithm to
+      account for the simplex size. The default is True.
+
+    - **stopping.max_iterations** (int): Maximum number of algorithm iterations.
+      The default is STOPPING_MAX_ITERATIONS.
+
+    - **convergence.absolute_criterion_tolerance** (float): Maximal difference
+      between the function values evaluated at the simplex points. The default
+      is CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE.
+
+    - **convergence.absolute_params_tolerance** (float): Maximal distance
+      between the points of the simplex. The default is
+      CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE.
+
+    - **batch_evaluator** (string or callable): See :ref:`batch_evaluators` for
+      details. The default is "joblib".
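+
+    A minimal usage sketch (illustrative; ``sphere`` and ``start_params`` are
+    placeholders, and the call assumes the ``minimize`` interface described in
+    this guide):
+
+    .. code-block:: python
+
+        from estimagic import minimize
+
+        res = minimize(
+            criterion=sphere,
+            params=start_params,
+            algorithm="neldermead_parallel",
+            algo_options={"n_cores": 2, "init_simplex_method": "nash"},
+        )
+
+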
 .. _tao_algorithms:
 
 Optimizers from the Toolkit for Advanced Optimization (TAO)

diff --git a/environment.yml b/environment.yml
index 62fc4cbac..a1d501efc 100644
--- a/environment.yml
+++ b/environment.yml
@@ -25,7 +25,6 @@ dependencies:
   - numpy
   - pandas
   - pdbpp
-  - petsc4py>=3.16.1
   - pygmo
   - pytest
   - pytest-cov
diff --git a/src/estimagic/optimization/__init__.py b/src/estimagic/optimization/__init__.py
index 73b6d1c2d..308240265 100644
--- a/src/estimagic/optimization/__init__.py
+++ b/src/estimagic/optimization/__init__.py
@@ -14,6 +14,7 @@
 from estimagic.optimization import pygmo_optimizers
 from estimagic.optimization import scipy_optimizers
 from estimagic.optimization import tao_optimizers
+from estimagic.optimization.neldermead import neldermead_parallel
 from estimagic.optimization.pounders import pounders
 
 
@@ -32,7 +33,11 @@
 )  # drop private and helper functions
 
-AVAILABLE_ALGORITHMS = {"pounders": pounders}
+AVAILABLE_ALGORITHMS = {
+    "pounders": pounders,
+    "neldermead_parallel": neldermead_parallel,
+}
+
 PUBLIC_HELPERS = [
     "calculate_trustregion_initial_radius",
     "get_scipy_bounds",
diff --git a/src/estimagic/optimization/neldermead.py b/src/estimagic/optimization/neldermead.py
new file mode 100644
index 000000000..9ef7a3ae5
--- /dev/null
+++ b/src/estimagic/optimization/neldermead.py
@@ -0,0 +1,397 @@
+"""Implementation of a parallelized Nelder-Mead algorithm."""
+from functools import partial
+
+import numpy as np
+from estimagic import batch_evaluators
+from estimagic.optimization.algo_options import (
+    CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE,
+)
+from estimagic.optimization.algo_options import (
+    CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE,
+)
+from estimagic.optimization.algo_options import STOPPING_MAX_ITERATIONS
+
+
+def neldermead_parallel(
+    criterion_and_derivative,
+    x,
+    *,
+    init_simplex_method="gao_han",
+    n_cores=1,
+    adaptive=True,
+    stopping_max_iterations=STOPPING_MAX_ITERATIONS,
+    convergence_absolute_criterion_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE,  # noqa: E501
+    convergence_absolute_params_tolerance=CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE,  # noqa: E501
+    batch_evaluator="joblib",
+):
+    """Parallel Nelder-Mead algorithm following Lee D., Wiswall M., A parallel
+    implementation of the simplex function minimization routine,
+    Computational Economics, 2007.
+
+    Parameters
+    ----------
+    criterion_and_derivative (callable): A function that takes a numpy
+        array_like as its argument and returns a scalar floating point number
+        or a :class:`numpy.ndarray`.
+
+    x (array_like): 1-D array of initial parameter values.
+
+    init_simplex_method (string or callable): Name of the method used to create
+        the initial simplex, or a callable that takes the initial parameter
+        vector as its argument and returns the initial simplex as a (j + 1) x j
+        array, where j is the length of x. The default is "gao_han".
+
+    n_cores (int): Degree of parallelization. The default is 1
+        (no parallelization).
+
+    adaptive (bool): Adjust the parameters of the Nelder-Mead algorithm to
+        account for the simplex size. The default is True.
+
+    stopping_max_iterations (int): Maximum number of algorithm iterations.
+        The default is STOPPING_MAX_ITERATIONS.
+
+    convergence_absolute_criterion_tolerance (float): Maximal difference between
+        the function values evaluated at the simplex points. The default is
+        CONVERGENCE_SECOND_BEST_ABSOLUTE_CRITERION_TOLERANCE.
+
+    convergence_absolute_params_tolerance (float): Maximal distance between the
+        points of the simplex.
+        The default is CONVERGENCE_SECOND_BEST_ABSOLUTE_PARAMS_TOLERANCE.
+
+    batch_evaluator (string or callable): See :ref:`batch_evaluators` for
+        details. The default is "joblib".
+
+    Returns
+    -------
+    dict: A result dictionary containing the solution parameters
+        ("solution_x"), the criterion value at the solution
+        ("solution_criterion"), the number of iterations ("n_iterations"),
+        a success flag ("success"), and the reason the algorithm stopped
+        ("reached_convergence_criterion").
+
+    """
+    algo_info = {
+        "primary_criterion_entry": "value",
+        "parallelizes": True,
+        "needs_scaling": True,
+        "name": "parallel_neldermead",
+    }
+    criterion = partial(
+        criterion_and_derivative,
+        task="criterion",
+        algorithm_info=algo_info,
+    )
+
+    if x.ndim >= 1:
+        x = x.ravel()  # make sure the initial parameters are a flat 1-D array
+
+    j = len(x)  # size of the parameter vector
+
+    if n_cores <= 1:
+        p = 1  # no parallelization if at most one core is requested
+    else:
+        if n_cores >= j:  # the degree of parallelization cannot exceed
+            # the number of parameters minus one
+            p = int(j - 1)
+        else:
+            p = int(n_cores)
+
+    # set the parameters of the Nelder-Mead algorithm
+    # for a discussion of the Nelder-Mead parameters see Gao F., Han L.,
+    # Implementing the Nelder-Mead simplex algorithm with adaptive parameters,
+    # Computational Optimization and Applications, 2012
+    alpha, gamma, beta, tau = _init_algo_params(adaptive, j)
+
+    # construct the initial simplex using one of the feasible methods
+    # see Wessing, Simon, Proper initialization is crucial for
+    # the Nelder-Mead simplex search, Optimization Letters, 2019,
+    # for a discussion of the choice of initialization
+    if not callable(init_simplex_method):
+        s = globals()["_" + init_simplex_method](x)
+    else:
+        s = init_simplex_method(x)
+
+    # resolve the batch evaluator if it was passed by name
+    if not callable(batch_evaluator):
+        batch_evaluator = getattr(
+            batch_evaluators, f"{batch_evaluator}_batch_evaluator"
+        )
+
+    # calculate criterion values for the initial simplex
+    f_s = np.array(batch_evaluator(func=criterion, arguments=s, n_cores=n_cores))[
+        :, None
+    ]
+
+    # function executed in parallel: one Nelder-Mead step for a single vertex
+    def func_parallel(args):
+
+        criterion, s_j, s_j_r, f_s_0, f_s_j, f_s_j_1, m = args  # read arguments
+
+        f_s_j_r = criterion(
+            s_j_r
+        )  # calculate the value of the criterion at the reflection point
+
+        if f_s_j_r < f_s_0:  # if the reflection point is better than the best
+            # point
+
+            s_j_e = m + gamma * (s_j_r - m)  # calculate the expansion point
+            f_s_j_e = criterion(
+                s_j_e
+            )  # calculate the value of the criterion at the expansion point
+
+            if f_s_j_e < f_s_0:  # if the expansion point is better than the
+                # best point
+
+                return np.hstack(
+                    [s_j_e, f_s_j_e, 0]
+                )  # return the expansion point as the new point
+
+            else:  # if the expansion point is worse than the best point
+
+                return np.hstack(
+                    [s_j_r, f_s_j_r, 0]
+                )  # return the reflection point as the new point
+
+        elif (
+            f_s_j_r < f_s_j_1
+        ):  # if the reflection point is better than the next-worst point
+
+            return np.hstack(
+                [s_j_r, f_s_j_r, 0]
+            )  # return the reflection point as the new point
+
+        else:  # if the reflection point is worse than the next-worst point
+
+            if (
+                f_s_j_r < f_s_j
+            ):  # if the value of the criterion at the reflection point is
+                # better than the value of the criterion at the initial point
+                s_j_c = m + beta * (s_j_r - m)  # calculate the outside
+                # contraction point
+            else:
+                s_j_c = m - beta * (s_j_r - m)  # calculate the inside
+                # contraction point
+
+            f_s_j_c = criterion(
+                s_j_c
+            )  # calculate the value of the criterion at the contraction point
+
+            if f_s_j_c < np.minimum(
+                f_s_j, f_s_j_r
+            ):  # if the value of the criterion at the contraction point is
+                # better than at the original and reflection points
+
+                return np.hstack(
+                    [s_j_c, f_s_j_c, 0]
+                )  # return the contraction point as the new point
+
+            else:
+                if f_s_j_r < f_s_j:
+
+                    return np.hstack(
+                        [s_j_r, f_s_j_r, 1]
+                    )  # return the reflection point as the new point
+
+                else:  # if the value of the criterion at the contraction point
+                    # is worse than the values of the criterion at the
+                    # reflection and the initial points
+                    return np.hstack(
+                        [s_j, f_s_j, 1]
+                    )  # return the old point as the new point
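+
+    # Summary of func_parallel: each of the p workers receives one of the p
+    # worst vertices and applies one Nelder-Mead step to it, returning a
+    # reflection, expansion, or contraction point together with a shrink flag.
+    # The flag is 1 only when the contraction step fails to improve on the
+    # reflection and original points; the simplex is shrunk below when all
+    # p workers raise the flag.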
+
+    optimal = False  # optimization flag; if True, stop the algorithm
+    iterations = 0  # iteration counter
+
+    while not optimal:
+
+        iterations += 1  # new iteration
+
+        # sort the simplex points by their criterion values in increasing order
+        row = np.argsort(f_s.ravel())
+        s = np.take(s, row, axis=0)
+        f_s = np.take(f_s, row, axis=0)
+
+        # calculate the centroid of the j + 1 - p best points
+        m = (s[:-p, :].sum(axis=0)) / (j - p + 1)
+
+        # calculate the reflection points
+        s_j_r = m + alpha * (m - s[-p:, :])
+
+        # calculate the new simplex points in parallel
+        s[-p:, :], f_s[-p:, :], shrink_count = np.split(
+            np.vstack(
+                batch_evaluator(
+                    func=func_parallel,
+                    arguments=tuple(
+                        (
+                            criterion,
+                            s[j + 1 - p + i, :],
+                            s_j_r[i, :],
+                            f_s[0, :],
+                            f_s[j + 1 - p + i, :],
+                            f_s[j - p + i, :],
+                            m,
+                        )
+                        for i in range(p)
+                    ),
+                    n_cores=p,
+                )
+            ),
+            [-2, -1],
+            axis=1,
+        )
+
+        # shrink the simplex if no process produced an improvement
+        if shrink_count.sum() == p:
+            s = (
+                tau * s[0:1, :] + (1 - tau) * s
+            )  # the new simplex is a linear combination of the best point
+            # and the remaining points
+            # evaluate the criterion at the new simplex
+            f_s = np.array(
+                batch_evaluator(
+                    func=criterion,
+                    arguments=s,
+                    n_cores=n_cores,
+                )
+            )[:, None]
+
+        # termination criteria
+        if (
+            np.max(np.abs(f_s[0, :] - f_s[1:, :]))
+            <= convergence_absolute_criterion_tolerance
+            and np.max(
+                np.abs(
+                    s[0, :]
+                    - s[
+                        1:,
+                    ]
+                )
+            )
+            <= convergence_absolute_params_tolerance
+        ):
+            optimal = True
+            converge = True
+            reason_to_stop = "Termination condition satisfied"
+        elif (
+            iterations >= stopping_max_iterations
+        ):  # if the maximum number of iterations is exceeded
+            optimal = True
+            converge = False
+            reason_to_stop = "Maximum number of iterations exceeded"
+        continue
+
+    # save the results
+    result = {
+        "solution_x": s[np.nonzero(f_s == f_s.min())[0][0], :],
+        "solution_criterion": f_s.min(),
+        "n_iterations": iterations,
+        "success": converge,
+        "reached_convergence_criterion": reason_to_stop,
+    }
+    return result
+
+
+# set the parameters of the Nelder-Mead algorithm
+# for a discussion of the Nelder-Mead parameters see Gao F., Han L.,
+# Implementing the Nelder-Mead simplex algorithm with adaptive parameters,
+# Computational Optimization and Applications, 2012
+def _init_algo_params(adaptive, j):
+
+    if adaptive:
+        # algorithm parameters a la Gao-Han (adaptive); the tuple is
+        # (alpha, gamma, beta, tau) =
+        # (reflection, expansion, contraction, shrinkage)
+        return (
+            1,
+            1 + 2 / j,
+            0.75 - 1 / (2 * j),
+            1 - 1 / j,
+        )
+    else:
+        # standard setting of Nelder-Mead
+        return (
+            1,
+            2,
+            0.5,
+            0.5,
+        )
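+
+
+# Illustrative values: for j = 4 parameters the adaptive variant returns
+# (alpha, gamma, beta, tau) = (1, 1.5, 0.625, 0.75), while the non-adaptive
+# variant always returns (1, 2, 0.5, 0.5).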
+
+
+# initial structure of the simplex: j + 1 identical rows, each equal to x
+def _init_simplex(x):
+
+    s = np.vstack(
+        [
+            x,
+        ]
+        * (len(x) + 1)
+    ).astype(np.float64)
+
+    return s
+
+
+# initialization due to L. Pfeffer at Stanford (MATLAB fminsearch and SciPy
+# default option)
+def _pfeffer(x):
+
+    s = _init_simplex(x)
+
+    # method parameters
+    c_p = 1.05
+
+    # initial simplex
+    np.fill_diagonal(s[1:, :], x * c_p * (x != 0) + 0.00025 * (x == 0))
+
+    return s
+
+
+# adapted from Nash (R default option)
+# see Nash, J.C.: Compact numerical methods for computers: linear algebra and
+# function minimisation, 2nd edn. Adam Hilger Ltd., Bristol (1990) for details
+def _nash(x):
+
+    s = _init_simplex(x)
+
+    # method parameters
+    c_n = 0.1
+
+    # initial simplex
+    np.fill_diagonal(s[1:, :], (x != 0) * (np.max(x) * c_n + x) + c_n * (x == 0))
+    return s
+
+
+# adapted from Gao F., Han L., Implementing the Nelder-Mead simplex algorithm
+# with adaptive parameters, Computational Optimization and Applications, 2012
+def _gao_han(x):
+
+    s = _init_simplex(x)
+
+    # method parameters
+    c_h = np.minimum(np.maximum(np.max(x), 1), 10)
+    j = len(x)
+
+    # initial simplex
+    s = (
+        s
+        + np.vstack(
+            [
+                np.array([[(1 - (j + 1) ** 0.5) / j]]) * np.ones([1, j]),
+                np.eye(j),
+            ]
+        )
+        * c_h
+    )
+
+    return s
+
+
+# adapted from Varadhan and Borchers' R package dfoptim
+# see Varadhan, R., Borchers, H.W.: Dfoptim: derivative-free optimization (2016).
+# https://CRAN.R-project.org/package=dfoptim, R package version 2016.7-1,
+# for details
+def _varadhan_borchers(x):
+
+    s = _init_simplex(x)
+
+    # method parameters
+    j = len(x)
+    c_s = np.maximum(1, ((x ** 2).sum()) ** 0.5)
+    beta1 = c_s / (j * 2 ** 0.5) * ((j + 1) ** 0.5 + j - 1)
+    beta2 = c_s / (j * 2 ** 0.5) * ((j + 1) ** 0.5 - 1)
+
+    # initial simplex
+    s[1:, :] = s[1:, :] + np.full([j, j], beta2) + np.eye(j) * (beta1 - beta2)
+
+    return s
diff --git a/tests/optimization/test_neldermead.py b/tests/optimization/test_neldermead.py
new file mode 100644
index 000000000..ea128c248
--- /dev/null
+++ b/tests/optimization/test_neldermead.py
@@ -0,0 +1,139 @@
+import numpy as np
+import pytest
+from estimagic.optimization.neldermead import _gao_han
+from estimagic.optimization.neldermead import _init_algo_params
+from estimagic.optimization.neldermead import _init_simplex
+from estimagic.optimization.neldermead import _nash
+from estimagic.optimization.neldermead import _pfeffer
+from estimagic.optimization.neldermead import _varadhan_borchers
+from estimagic.optimization.neldermead import neldermead_parallel
+
+
+# criterion function used in the tests
+def sphere(x, *args, **kwargs):
+
+    return (x ** 2).sum()
+
+
+# unit tests
+def test_init_algo_params():
+
+    # test setting
+    j = 2
+    adaptive = True
+
+    # outcome
+    result = _init_algo_params(adaptive, j)
+
+    # expected outcome; for j = 2 the adaptive parameters coincide with the
+    # standard ones
+    expected = (1, 2, 0.5, 0.5)
+
+    assert result == expected
+
+
+def test_init_simplex():
+
+    # test setting
+    x = np.array([1, 2, 3])
+
+    # outcome
+    result = _init_simplex(x)
+
+    # expected outcome
+    expected = np.array([[1, 2, 3], [1, 2, 3], [1, 2, 3], [1, 2, 3]])
+
+    assert (result == expected).all()
+
+
+def test_pfeffer():
+
+    # test setting
+    x = np.array([1, 0, 1])
+
+    # outcome
+    result = _pfeffer(x)
+
+    # expected outcome
+    expected = np.array([[1, 0, 1], [1.05, 0, 1], [1, 0.00025, 1], [1, 0, 1.05]])
+
+    assert (result == expected).all()
+
+
+def test_nash():
+
+    # test setting
+    x = np.array([1, 0, 1])
+
+    # outcome
+    result = _nash(x)
+
+    # expected outcome
+    expected = np.array([[1, 0, 1], [1.1, 0, 1], [1, 0.1, 1], [1, 0, 1.1]])
+
+    assert (result == expected).all()
+
+
+def test_gao_han():
+
+    # test setting
+    x = np.array([1, 0, 1])
+
+    # outcome
+    result = _gao_han(x)
+
+    # expected outcome
+    expected = np.array([[0.66667, -0.33333, 0.66667], [2, 0, 1], [1, 1, 1], [1, 0, 2]])
+
+    np.testing.assert_allclose(result, expected, atol=1e-3)
+
+
+def test_varadhan_borchers():
+
+    # test setting
+    x = np.array([1, 0, 1])
+
+    # outcome
+    result = _varadhan_borchers(x)
+
+    # expected outcome
+    expected = np.array(
+        [
+            [1, 0, 1],
+            [2.3333, 0.3333, 1.3333],
+            [1.3333, 1.3333, 1.3333],
+            [1.3333, 0.3333, 2.3333],
+        ]
+    )
+
+    np.testing.assert_allclose(result, expected, atol=1e-3)
+
+
+# general parameter tests
+test_cases = [
+    {},
+    {"adaptive": False},
+    {"init_simplex_method": "nash"},
+    {"init_simplex_method": "pfeffer"},
+    {"init_simplex_method": "varadhan_borchers"},
+]
+
+
+@pytest.mark.parametrize("algo_options", test_cases)
+def test_neldermead_correct_algo_options(algo_options):
+    res = neldermead_parallel(
+        criterion_and_derivative=sphere,
+        x=np.array([1, -5, 3]),
+        **algo_options,
+    )
+    np.testing.assert_allclose(res["solution_x"], np.zeros(3), atol=5e-4)
+
+
+# test that the maximum number of iterations terminates the algorithm
+def test_neldermead_stop_after_one_iteration():
+    res = neldermead_parallel(
+        criterion_and_derivative=sphere,
+        x=np.array([1, -5, 3]),
+        stopping_max_iterations=1,
+    )
+    assert not res["success"]
+    assert res["n_iterations"] == 1
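+
+
+# Illustrative sketch (not part of the original test suite): the
+# init_simplex_method argument also accepts a custom callable that maps the
+# start vector to a (len(x) + 1) x len(x) simplex array.
+def test_neldermead_custom_init_simplex_callable():
+    def unit_simplex(x):
+        # the start point plus one vertex shifted by 1 along each coordinate
+        return np.vstack([x, x + np.eye(len(x))])
+
+    res = neldermead_parallel(
+        criterion_and_derivative=sphere,
+        x=np.array([1.0, -5.0, 3.0]),
+        init_simplex_method=unit_simplex,
+    )
+    np.testing.assert_allclose(res["solution_x"], np.zeros(3), atol=5e-4)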