Skip to content


Merge pull request #3088 from js850/benchmarks
Browse files Browse the repository at this point in the history
ENH: optimize: Add a benchmark framework for the optimizers

This adds a framework for benchmarking the optimizers, along with 8 or
so benchmarks on different functions.
  • Loading branch information
pv committed Nov 28, 2013
2 parents 73c631b + c432b00 commit 0e7eb52
Show file tree
Hide file tree
Showing 2 changed files with 306 additions and 0 deletions.
204 changes: 204 additions & 0 deletions scipy/optimize/benchmarks/
Original file line number Diff line number Diff line change
@@ -0,0 +1,204 @@
import time
from collections import defaultdict

import numpy as np
from numpy.testing import Tester, TestCase

import scipy.optimize
from scipy.optimize.optimize import rosen, rosen_der, rosen_hess
import test_functions as funcs

class _BenchOptimizers(object):
    """a framework for benchmarking the optimizer

    Each call to `bench_run` minimizes `fun` from one starting point with
    every applicable ``scipy.optimize.minimize`` method and stores the timed
    result.  `print_results` then reports per-method averages.

    Parameters
    ----------
    function_name : string
        label printed in the report header
    fun : callable
        the objective function handed to the minimizers
    der : callable
        function that returns the derivative (jacobian, gradient) of fun
    hess : callable
        function that returns the hessian of fun
    minimizer_kwargs : kwargs
        additional keywords passed to the minimizer.  e.g. tol, maxiter
        ``tol`` is set to 1e-4 when the caller does not supply it.
    """

    def __init__(self, function_name, fun, der=None, hess=None,
                 **minimizer_kwargs):
        self.function_name = function_name
        self.fun = fun
        self.der = der
        self.hess = hess
        # every benchmark runs with a tolerance, even when none is requested
        minimizer_kwargs.setdefault("tol", 1e-4)
        self.minimizer_kwargs = minimizer_kwargs

        self.results = []

    def reset(self):
        """discard all results recorded so far"""
        self.results = []

    def add_result(self, result, t, name):
        """add a result to the list

        `result` is annotated in place with the elapsed time `t` and the
        optimizer `name`.  Missing ``njev`` / ``nhev`` counters are set to 0
        so that the averaging code can treat all results uniformly.
        """
        result.time = t
        result.name = name
        if not hasattr(result, "njev"):
            result.njev = 0
        if not hasattr(result, "nhev"):
            result.nhev = 0
        self.results.append(result)

    def print_results(self):
        """print the current list of results

        Rows are sorted by number of failures first, then by mean run time.
        """
        results = sorted(self.average_results(),
                         key=lambda x: (x.nfail, x.mean_time))
        print("Optimizer benchmark: %s" % (self.function_name))
        if not results:
            # nothing recorded yet: results[0] below would raise IndexError
            print("no results recorded")
            return
        print("dimensions: %d, extra kwargs: %s" % (results[0].ndim, str(self.minimizer_kwargs)))
        print("averaged over %d starting configurations" % (results[0].ntrials))
        print(" Optimizer nfail nfev njev nhev time")
        for res in results:
            print("%11s | %4d | %4d | %4d | %4d | %.6g" %
                  (res.name, res.nfail, res.mean_nfev, res.mean_njev, res.mean_nhev, res.mean_time))

    def average_results(self):
        """group the results by minimizer and average over the runs

        Returns a list with one result object per optimizer name carrying
        ``name``, ``mean_nfev``, ``mean_njev``, ``mean_nhev``, ``mean_time``,
        ``ntrials``, ``nfail`` and ``ndim``.
        """
        grouped_results = defaultdict(list)
        for res in self.results:
            grouped_results[res.name].append(res)

        # ``scipy.optimize.Result`` was renamed ``OptimizeResult`` in later
        # SciPy releases; support both spellings.
        result_type = getattr(scipy.optimize, "OptimizeResult", None)
        if result_type is None:
            result_type = scipy.optimize.Result

        averaged_results = dict()
        for name, result_list in grouped_results.items():
            newres = result_type()
            newres.name = name
            newres.mean_nfev = np.mean([r.nfev for r in result_list])
            newres.mean_njev = np.mean([r.njev for r in result_list])
            newres.mean_nhev = np.mean([r.nhev for r in result_list])
            newres.mean_time = np.mean([r.time for r in result_list])
            newres.ntrials = len(result_list)
            newres.nfail = len([r for r in result_list if not r.success])
            try:
                newres.ndim = len(result_list[0].x)
            except TypeError:
                # ``x`` has no len() (e.g. a scalar): report one dimension
                newres.ndim = 1
            averaged_results[name] = newres
        return list(averaged_results.values())

    def _run_methods(self, methods, x0, **kwargs):
        """time one ``minimize`` call per method from x0 and record it"""
        for method in methods:
            t0 = time.time()
            res = scipy.optimize.minimize(self.fun, x0, method=method,
                                          **kwargs)
            t1 = time.time()
            self.add_result(res, t1-t0, method)

    def bench_run(self, x0, **minimizer_kwargs):
        """do an optimization test starting at x0 for all the optimizers

        Keywords given here override, for this call only, the ones passed to
        the constructor.  Gradient based methods run only when `der` was
        supplied, Hessian based methods only when `hess` was supplied.
        """
        kwargs = dict(self.minimizer_kwargs)
        kwargs.update(minimizer_kwargs)

        fonly_methods = ["COBYLA", 'Powell']
        self._run_methods(fonly_methods, x0, **kwargs)

        gradient_methods = ['L-BFGS-B', 'BFGS', 'CG', 'TNC', 'SLSQP']
        if self.der is not None:
            self._run_methods(gradient_methods, x0, jac=self.der, **kwargs)

        hessian_methods = ["Newton-CG", 'dogleg', 'trust-ncg']
        if self.hess is not None:
            self._run_methods(hessian_methods, x0,
                              jac=self.der, hess=self.hess, **kwargs)

class BenchSmoothUnbounded(TestCase):
    """Benchmark the optimizers with smooth, unbounded, functions"""

    # NOTE(review): in the copy of this file under review the body of every
    # ``for i in range(10):`` loop, the ``fun=`` arguments and the extra
    # keyword of ``bench_rosenbrock_tight`` were missing.  They are
    # reconstructed below.  The starting-point ranges and the tight ``tol``
    # are assumptions -- confirm against the upstream file.

    def _run_and_report(self, bench, low, high, ndim, ntrials=10):
        """run `bench` from `ntrials` uniform random starts, then print"""
        for _ in range(ntrials):
            bench.bench_run(np.random.uniform(low, high, ndim))
        bench.print_results()

    def bench_rosenbrock(self):
        b = _BenchOptimizers("Rosenbrock function",
                             fun=rosen, der=rosen_der, hess=rosen_hess)
        self._run_and_report(b, -3, 3, 3)

    def bench_rosenbrock_tight(self):
        # same problem as bench_rosenbrock with a tighter tolerance
        b = _BenchOptimizers("Rosenbrock function",
                             fun=rosen, der=rosen_der, hess=rosen_hess,
                             tol=1e-8)
        self._run_and_report(b, -3, 3, 3)

    def bench_simple_quadratic(self):
        s = funcs.SimpleQuadratic()
        b = _BenchOptimizers("simple quadratic function",
                             fun=s.fun, der=s.der, hess=s.hess)
        self._run_and_report(b, -2, 2, 3)

    def bench_asymetric_quadratic(self):
        s = funcs.AsymmetricQuadratic()
        b = _BenchOptimizers("function sum(x**2) + x[0]",
                             fun=s.fun, der=s.der, hess=s.hess)
        self._run_and_report(b, -2, 2, 3)

    def bench_sin_1d(self):
        def fun(x):
            return np.sin(x[0])

        def der(x):
            return np.array([np.cos(x[0])])

        b = _BenchOptimizers("1d sin function",
                             fun=fun, der=der, hess=None)
        self._run_and_report(b, -2, 2, 1)

    def bench_booth(self):
        s = funcs.Booth()
        b = _BenchOptimizers("Booth's function",
                             fun=s.fun, der=s.der, hess=None)
        # Booth.fun unpacks exactly two coordinates
        self._run_and_report(b, 0, 10, 2)

    def bench_beale(self):
        s = funcs.Beale()
        b = _BenchOptimizers("Beale's function",
                             fun=s.fun, der=s.der, hess=None)
        # Beale.fun unpacks exactly two coordinates
        self._run_and_report(b, 0, 10, 2)

    def bench_LJ(self):
        s = funcs.LJ()
        natoms = 4
        b = _BenchOptimizers("%d atom Lennard Jones potential" % (natoms),
                             fun=s.get_energy, der=s.get_gradient, hess=None)
        # three cartesian coordinates per atom
        self._run_and_report(b, -2, 2, 3 * natoms)

# NOTE(review): the statement guarded below was missing from the copy of this
# file under review.  ``Tester().bench()`` is reconstructed from the otherwise
# unused ``Tester`` import at the top of the file -- confirm against upstream.
# The commented-out ``main()`` that used to sit here called module-level
# ``bench_*`` functions that do not exist (they are methods of
# BenchSmoothUnbounded), so it was removed.
if __name__ == "__main__":
    Tester().bench()
102 changes: 102 additions & 0 deletions scipy/optimize/benchmarks/test_functions.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,102 @@
import numpy as np

class SimpleQuadratic(object):
    """The quadratic ``f(x) = dot(x, x)`` with its gradient and Hessian.

    All methods take a 1-D array (or sequence) of coordinates.
    """

    def fun(self, x):
        """Return ``dot(x, x)``, i.e. the sum of the squared coordinates."""
        return np.dot(x, x)

    def der(self, x):
        """Return the gradient ``2 * x``."""
        return 2. * np.asarray(x)

    def hess(self, x):
        """Return the Hessian, ``2 * I`` with one row per coordinate of x."""
        return 2. * np.eye(np.asarray(x).size)

class AsymmetricQuadratic(object):
    """The function ``f(x) = dot(x, x) + x[0]`` with gradient and Hessian.

    All methods take a 1-D array (or sequence) of coordinates.
    """

    def fun(self, x):
        """Return ``dot(x, x) + x[0]``."""
        return np.dot(x, x) + x[0]

    def der(self, x):
        """Return the gradient: ``2 * x`` with 1 added to the first entry."""
        # 2. * x allocates a new array, so the caller's x is not modified
        d = 2. * np.asarray(x)
        d[0] += 1
        return d

    def hess(self, x):
        """Return the Hessian, ``2 * I`` with one row per coordinate of x."""
        return 2. * np.eye(np.asarray(x).size)

class LJ(object):
    """Lennard-Jones pairwise potential energy

    The total energy is the sum over all atom pairs of

        V(r) = 4 * eps * ((sig / r)**12 - (sig / r)**6)

    where r is the distance between the two atoms.  Coordinates are passed
    as a flat sequence that is reshaped to ``(natoms, 3)``.
    """

    def __init__(self, eps=1.0, sig=1.0):
        """ simple lennard jones potential"""
        self.sig = sig
        self.eps = eps

    def vij(self, r):
        """Return the pair potential V(r) at separation r."""
        return 4.*self.eps * ((self.sig/r)**12 - (self.sig/r)**6)

    def dvij(self, r):
        """Return dV/dr, the derivative of `vij` with respect to r."""
        return 4.*self.eps * (-12./self.sig*(self.sig/r)**13 + 6./self.sig*(self.sig/r)**7)

    def get_energy(self, coords):
        """Return the total energy, summed over every pair of atoms."""
        coords = np.reshape(coords, [-1, 3])
        natoms = coords.shape[0]
        # start the accumulator explicitly; with fewer than two atoms the
        # loops never run and the energy is 0
        energy = 0.
        for i in range(natoms):
            for j in range(i+1, natoms):
                dr = coords[j, :] - coords[i, :]
                r = np.linalg.norm(dr)
                energy += self.vij(r)
        return energy

    def get_energy_gradient(self, coords):
        """Return ``(energy, gradient)``.

        The gradient is a flat array of length ``3 * natoms`` laid out like
        the flattened coordinates.
        """
        coords = np.reshape(coords, [-1, 3])
        natoms = coords.shape[0]
        energy = 0.
        V = np.zeros([natoms, 3])
        for i in range(natoms):
            for j in range(i+1, natoms):
                dr = coords[j, :] - coords[i, :]
                r = np.linalg.norm(dr)
                energy += self.vij(r)
                g = self.dvij(r)
                # r grows when atom j moves along dr and shrinks when atom i
                # does, hence the opposite signs
                V[i, :] += -g * dr/r
                V[j, :] += g * dr/r
        V = V.reshape([natoms*3])
        return energy, V

    def get_gradient(self, coords):
        """Return only the gradient part of `get_energy_gradient`."""
        e, g = self.get_energy_gradient(coords)
        return g

class Booth(object):
    """Booth's function of two variables, with its gradient.

        f(x, y) = (x + 2*y - 7)**2 + (2*x + y - 5)**2
    """
    # value and location of the minimum; fun(target_coords) == target_E
    target_E = 0.
    target_coords = np.array([1., 3.])
    # presumably the bounds of the usual search domain -- TODO confirm
    # (an alternative lower bound, np.array([0., 0.]), was also noted here)
    xmin = np.array([-10., -10.])
    xmax = np.array([10., 10.])

    def fun(self, coords):
        """Return f(x, y) for ``coords = (x, y)``."""
        x, y = coords
        return (x + 2.*y - 7.)**2 + (2.*x + y - 5.)**2

    def der(self, coords):
        """Return the gradient ``[df/dx, df/dy]`` at ``coords = (x, y)``."""
        x, y = coords
        # the two residuals that are squared in fun()
        r1 = x + 2.*y - 7.
        r2 = 2.*x + y - 5.
        dx = 2.*r1 + 4.*r2
        dy = 4.*r1 + 2.*r2
        return np.array([dx, dy])

class Beale(object):
    """Beale's function of two variables, with its gradient.

        f(x, y) = (1.5 - x + x*y)**2 + (2.25 - x + x*y**2)**2
                  + (2.625 - x + x*y**3)**2
    """
    # value and location of the minimum; fun(target_coords) == target_E
    target_E = 0.
    target_coords = np.array([3., 0.5])
    # presumably the bounds of the usual search domain -- TODO confirm
    # (an alternative lower bound, np.array([0., 0.]), was also noted here)
    xmin = np.array([-4.5, -4.5])
    xmax = np.array([4.5, 4.5])

    def fun(self, coords):
        """Return f(x, y) for ``coords = (x, y)``."""
        x, y = coords
        return (1.5 - x + x*y)**2 + (2.25 - x + x * y**2)**2 + (2.625 - x + x * y**3)**2

    def der(self, coords):
        """Return the gradient ``[df/dx, df/dy]`` at ``coords = (x, y)``."""
        x, y = coords
        # the three residuals that are squared in fun()
        r1 = 1.5 - x + x*y
        r2 = 2.25 - x + x * y**2
        r3 = 2.625 - x + x * y**3
        dx = 2. * r1 * (-1. + y) + 2. * r2 * (-1. + y**2) + 2. * r3 * (-1. + y**3)
        dy = 2. * r1 * (x) + 2. * r2 * (2. * y * x) + 2. * r3 * (3. * x * y**2)
        return np.array([dx, dy])

0 comments on commit 0e7eb52

Please sign in to comment.