made SCG work nicely with the optimization framework

2026-05-21 14:05:14 +02:00 · 2013-03-12 14:01:14 +00:00 · 2013-03-12 14:01:14 +00:00 · c4d190e0fd
commit c4d190e0fd
parent 0503d0e3f5
2 changed files with 36 additions and 31 deletions
--- a/GPy/inference/SCG.py
+++ b/GPy/inference/SCG.py
@ -24,7 +24,7 @@

 import numpy as np

-def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-6):
+def SCG(f, gradf, x, optargs=(), maxiters=500, max_f_eval=500, display=True, xtol=1e-6, ftol=1e-6):
    """
    Optimisation through Scaled Conjugate Gradients (SCG)

@ -35,13 +35,12 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-
    Returns
    x the optimal value for x
    flog : a list of all the objective values
-    pointlog : a list of the x values tried
-    scalelog : a list of the scales used in optimisation (beta)

    """

    sigma0 = 1.0e-4
    fold = f(x, *optargs)	# Initial function value.
+    function_eval = 1
    fnow = fold
    gradnew = gradf(x, *optargs)	# Initial gradient.
    gradold = gradnew.copy()
@ -51,10 +50,9 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-
    beta = 1.0				# Initial scale parameter.
    betamin = 1.0e-15 			# Lower bound on scale.
    betamax = 1.0e100			# Upper bound on scale.
+    status = "Not converged"

    flog = [fold]
-    pointlog = [x.copy()]
-    scalelog = [beta]

    iteration = 0

@ -68,8 +66,6 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-
                d = -gradnew
                mu = np.dot(d, gradnew)
            kappa = np.dot(d, d)
-            #if kappa < eps():
-                #return x, flog, pointlog, scalelog
            sigma = sigma0/np.sqrt(kappa)
            xplus = x + sigma*d
            gplus = gradf(xplus, *optargs)
@ -86,6 +82,12 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-
        # Calculate the comparison ratio.
        xnew = x + alpha*d
        fnew = f(xnew, *optargs)
+        function_eval += 1
+
+        if function_eval >= max_f_eval:
+            status = "Maximum number of function evaluations exceeded"
+            return x, flog, function_eval, status
+
        Delta = 2.*(fnew - fold)/(alpha*mu)
        if Delta  >= 0.:
            success = True
@ -98,8 +100,6 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-

        # Store relevant variables
        flog.append(fnow)		# Current function value
-        pointlog.append(x)           # Current position
-        scalelog.append(beta)    # current scale parameter

        iteration += 1
        if display:
@ -108,7 +108,7 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-
        if success:
            # Test for termination
            if np.max(np.abs(alpha*d)) < xtol or np.max(np.abs(fnew-fold)) < ftol:
-                return x, flog, pointlog, scalelog
+                return x, flog, function_eval, status

            else:
                # Update variables for new position
@ -117,7 +117,7 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-
                gradnew = gradf(x, *optargs)
                # If the gradient is zero then we are done.
                if np.dot(gradnew,gradnew) == 0:
-                    return x, flog, pointlog, scalelog
+                    return x, flog, function_eval, status

        # Adjust beta according to comparison ratio.
        if Delta < 0.25:
@ -136,7 +136,6 @@ def SCG(f, gradf, x, optargs=(), maxiters=500, display=True, xtol=1e-6, ftol=1e-

    # If we get here, then we haven't terminated in the given number of
    # iterations.
-    if display:
-        print "maxiter exceeded"
+    status = "maxiter exceeded"

-    return x, flog, pointlog, scalelog
+    return x, flog, function_eval, status
--- a/GPy/inference/optimization.py
+++ b/GPy/inference/optimization.py
@ -1,18 +1,18 @@
 # Copyright (c) 2012, GPy authors (see AUTHORS.txt).
 # Licensed under the BSD 3-clause license (see LICENSE.txt)

-
+import pdb
+import pylab as pb
+import datetime as dt
 from scipy import optimize
+import numpy as np

 try:
    import rasmussens_minimize as rasm
    rasm_available = True
 except ImportError:
    rasm_available = False
-
-import pdb
-import pylab as pb
-import datetime as dt
+from SCG import SCG

 class Optimizer():
    """
@ -29,7 +29,7 @@ class Optimizer():
    :rtype: optimizer object.

    """
-    def __init__(self, x_init, messages=False, model = None, max_f_eval=1e4, ftol=None, gtol=None, xtol=None):
+    def __init__(self, x_init, messages=False, model = None, max_f_eval=1e4, max_iters = 1e3, ftol=None, gtol=None, xtol=None):
        self.opt_name = None
        self.x_init = x_init
        self.messages = messages
@ -38,6 +38,7 @@ class Optimizer():
        self.funct_eval = None
        self.status = None
        self.max_f_eval = int(max_f_eval)
+        self.max_iters = int(max_iters)
        self.trace = None
        self.time = "Not available"
        self.xtol = xtol
@ -63,12 +64,13 @@ class Optimizer():
            pb.xlabel('Iteration')
            pb.ylabel('f(x)')

-    def diagnostics(self):
-        print "Optimizer: \t\t\t\t %s" % self.opt_name
-        print "f(x_opt): \t\t\t\t %.3f" % self.f_opt
-        print "Number of function evaluations: \t %d" % self.funct_eval
-        print "Optimization status: \t\t\t %s" % self.status
-        print "Time elapsed: \t\t\t\t %s" % self.time
+    def __str__(self):
+        diagnostics = "Optimizer: \t\t\t\t %s\n" % self.opt_name
+        diagnostics += "f(x_opt): \t\t\t\t %.3f\n" % self.f_opt
+        diagnostics += "Number of function evaluations: \t %d\n" % self.funct_eval
+        diagnostics += "Optimization status: \t\t\t %s\n" % self.status
+        diagnostics += "Time elapsed: \t\t\t\t %s\n" % self.time
+        return diagnostics

 class opt_tnc(Optimizer):
    def __init__(self, *args, **kwargs):
@ -161,7 +163,6 @@ class opt_simplex(Optimizer):
        self.f_opt = opt_result[1]
        self.funct_eval = opt_result[3]
        self.status = statuses[opt_result[4]]
-
        self.trace = None


@ -196,7 +197,7 @@ class opt_rasm(Optimizer):

        self.trace = opt_result[1]

-class opt_scg(Optimizer):
+class opt_SCG(Optimizer):
    def __init__(self, *args, **kwargs):
        Optimizer.__init__(self, *args, **kwargs)
        self.opt_name = "Scaled Conjugate Gradients"
@ -204,15 +205,20 @@ class opt_scg(Optimizer):
    def opt(self, f_fp = None, f = None, fp = None):
        assert not f is None
        assert not fp is None
-        opt_result = SCG (f,fp,self.x_init, display=self.messages)
+        opt_result = SCG(f,fp,self.x_init, display=self.messages, maxiters=self.max_iters, max_f_eval=self.max_f_eval, xtol=self.xtol, ftol=self.ftol)
+        self.x_opt = opt_result[0]
+        self.trace = opt_result[1]
+        self.f_opt = self.trace[-1]
+        self.funct_eval = opt_result[2]
+        self.status = opt_result[3]

 def get_optimizer(f_min):
-    # import rasmussens_minimize as rasm
    from SGD import opt_SGD
-    
+
    optimizers = {'fmin_tnc': opt_tnc,
          'simplex': opt_simplex,
          'lbfgsb': opt_lbfgsb,
+          'scg': opt_SCG,
          'sgd': opt_SGD}

    if rasm_available: