GPy/python/likelihoods/Laplace.py

import numpy as np
import scipy as sp
import GPy
from GPy.util.linalg import jitchol
from functools import partial
from GPy.likelihoods.likelihood import likelihood
from GPy.util.linalg import pdinv,mdot
from scipy.stats import norm


class Laplace(likelihood):
    """Laplace approximation to a posterior.

    Usage, as far as this class shows: construct with the observations and a
    likelihood object, then call ``fit_full(K)`` with a covariance matrix.
    ``fit_full`` stores ``f_hat``, ``hess_hat`` and ``height_unnormalised`` on
    the instance and then calls ``_compute_GP_variables``, which stores ``Z``.
    """

    def __init__(self, data, likelihood_function):
        r"""
        Laplace Approximation

        First find the mode \hat{f} and the hessian at this point (using Newton-Raphson)
        then find the z^{prime} which allows this to be a normalised gaussian instead of a
        non-normalised gaussian

        Finally we must compute the GP variables (i.e. generate some Y^{squiggle} and z^{squiggle})
        which make a gaussian the same as the laplace approximation

        Arguments
        ---------

        :data: 2-D array of observations; its ``shape`` is unpacked into (N, D)
        :likelihood_function: object providing ``link_function``, ``link_grad`` and
                              ``link_hess``, each called as ``method(data, f)`` with ``f``
                              an (N, 1) column vector

        """
        self.data = data
        self.likelihood_function = likelihood_function

        # Initial values: data must be exactly 2-D for this unpacking to succeed
        self.N, self.D = self.data.shape

    def _compute_GP_variables(self):
        """
        Generates data Y which would give the normal distribution identical to the laplace approximation

        GPy expects a likelihood to be gaussian, so need to calculate the points Y^{squiggle} and Z^{squiggle}
        that make the posterior match that found by a laplace approximation to a non-gaussian likelihood

        Reads ``self.f_hat``, ``self.hess_hat`` and ``self.height_unnormalised`` (all set by
        ``fit_full``) and stores the result in ``self.Z``. Returns None.
        """
        # Intended quantity: z_hat = N(f_hat|f_hat, hess_hat) / self.height_unnormalised
        # NOTE(review): scipy.stats.norm is a univariate distribution whose `scale` is a
        # standard deviation, whereas hess_hat is the Hessian matrix returned by obj_hess
        # in fit_full. As written the pdf is broadcast element-wise over that matrix; a
        # multivariate density with covariance inv(hess_hat) is probably what is wanted.
        # Confirm before relying on self.Z.
        normalised_approx = norm(loc=self.f_hat, scale=self.hess_hat)
        self.Z = normalised_approx.pdf(self.f_hat) / self.height_unnormalised
        # TODO: still to be computed here: self.Y, self.YYT, self.covariance_matrix,
        # self.precision

    def fit_full(self, K):
        """
        The laplace approximation algorithm
        For nomenclature see Rasmussen & Williams 2006

        :K: Covariance matrix (passed to ``pdinv``, so presumably positive definite - TODO confirm)
        :returns: whatever ``_compute_GP_variables`` returns (currently None); the useful
                  results are the attributes ``f_hat``, ``hess_hat``, ``height_unnormalised``
                  and ``Z`` set on the instance
        """
        # Starting point for the optimiser; fmin_ncg flattens it to 1-D internally
        f = np.zeros((self.N, 1))
        # Only the first and fourth entries returned by pdinv are used; from the names they
        # are taken to be the inverse of K and its log-determinant - TODO confirm
        (Ki, _, _, log_Kdet) = pdinv(K)
        # Terms of the objective that do not depend on f.
        # NOTE(review): if log_Kdet is log|K|, the gaussian prior's log-normaliser is
        # -0.5*log|K|, so the sign of the first term looks inverted. It cannot change
        # f_hat (it is constant in f) but it does change height_unnormalised. Confirm
        # against R&W eq. 3.12.
        obj_constant = (0.5 * log_Kdet) - ((0.5 * self.N) * np.log(2 * np.pi))

        #Find \hat(f) using a newton raphson optimizer for example
        #TODO: Add newton-raphson as subclass of optimizer class

        # The optimiser hands each callback a flat 1-D vector, while the expressions
        # below work on an (N, 1) column, hence the reshape at the top of each one.
        #FIXME: Can we get rid of this horrible reshaping?
        def obj(f):
            """Objective to minimise: -(link_function - 0.5 f^T Ki f + obj_constant), as a float."""
            f = f[:, None]
            res = -1 * (self.likelihood_function.link_function(self.data, f) - 0.5 * mdot(f.T, (Ki, f)) + obj_constant)
            return float(res)

        def obj_grad(f):
            """Gradient of ``obj`` with respect to f, squeezed back to the optimiser's flat shape."""
            f = f[:, None]
            res = -1 * (self.likelihood_function.link_grad(self.data, f) - mdot(Ki, f))
            return np.squeeze(res)

        def obj_hess(f):
            """Hessian of ``obj`` with respect to f."""
            f = f[:, None]
            # NOTE(review): np.diag builds a diagonal matrix only from a 1-D input; given a
            # 2-D input it extracts the diagonal instead. This assumes link_hess returns a
            # 1-D array of per-point second derivatives - TODO confirm.
            res = -1 * (np.diag(self.likelihood_function.link_hess(self.data, f)) - Ki)
            return np.squeeze(res)

        self.f_hat = sp.optimize.fmin_ncg(obj, f, fprime=obj_grad, fhess=obj_hess)
        # Debug output kept from the original; the parenthesised single-argument form
        # prints the same thing on Python 2 and Python 3.
        print(self.f_hat)

        #At this point get the hessian matrix
        self.hess_hat = obj_hess(self.f_hat)

        #Need to add the constant as we previously were trying to avoid computing it (seems like a small overhead though...)
        # NOTE(review): obj returns the NEGATED objective value at f_hat (a negative log
        # quantity, not an exponentiated height), which is what the original FIXME asks about.
        self.height_unnormalised = obj(self.f_hat) #FIXME: Is it -1?

        return self._compute_GP_variables()
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`import numpy as np`
			`import scipy as sp`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`import GPy`
			`from GPy.util.linalg import jitchol`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`from functools import partial`
			`from GPy.likelihoods.likelihood import likelihood`
			`from GPy.util.linalg import pdinv,mdot`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`from scipy.stats import norm`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00

			`class Laplace(likelihood):`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`"""Laplace approximation to a posterior"""`

Trying to 'debug' 2013-03-14 15:30:22 +00:00			`def __init__(self, data, likelihood_function):`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`"""`
			`Laplace Approximation`

			`First find the moments \hat{f} and the hessian at this point (using Newton-Raphson)`
			`then find the z^{prime} which allows this to be a normalised gaussian instead of a`
			`non-normalized gaussian`

			`Finally we must compute the GP variables (i.e. generate some Y^{squiggle} and z^{squiggle}`
			`which makes a gaussian the same as the laplace approximation`

			`Arguments`
			`---------`

			`:data: @todo`
			`:likelihood_function: @todo`

			`"""`
			`self.data = data`
			`self.likelihood_function = likelihood_function`

			`#Inital values`
			`self.N, self.D = self.data.shape`

			`def _compute_GP_variables(self):`
			`"""`
			`Generates data Y which would give the normal distribution identical to the laplace approximation`

			`GPy expects a likelihood to be gaussian, so need to caluclate the points Y^{squiggle} and Z^{squiggle}`
			`that makes the posterior match that found by a laplace approximation to a non-gaussian likelihood`
			`"""`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`#z_hat = N(f_hat\|f_hat, hess_hat) / self.height_unnormalised`
			`normalised_approx = norm(loc=self.f_hat, scale=self.hess_hat)`
			`self.Z = normalised_approx.pdf(self.f_hat)/self.height_unnormalised`
			`#self.Y =`
			`#self.YYT =`
			`#self.covariance_matrix =`
			`#self.precision =`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00
			`def fit_full(self, K):`
			`"""`
			`The laplace approximation algorithm`
			`For nomenclature see Rasmussen & Williams 2006`
			`:K: Covariance matrix`
			`"""`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`f = np.zeros((self.N, 1))`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`#K = np.diag(np.ones(self.N))`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`(Ki, _, _, log_Kdet) = pdinv(K)`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`obj_constant = (0.5 * log_Kdet) - ((0.5 * self.N) * np.log(2 * np.pi))`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00
			`#Find \hat(f) using a newton raphson optimizer for example`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`#TODO: Add newton-raphson as subclass of optimizer class`

			`#FIXME: Can we get rid of this horrible reshaping?`
			`def obj(f):`
			`f = f[:, None]`
			`res = -1 * (self.likelihood_function.link_function(self.data, f) - 0.5 * mdot(f.T, (Ki, f)) + obj_constant)`
			`return float(res)`

			`def obj_grad(f):`
			`f = f[:, None]`
			`res = -1 * (self.likelihood_function.link_grad(self.data, f) - mdot(Ki, f))`
			`return np.squeeze(res)`

			`def obj_hess(f):`
			`f = f[:, None]`
			`res = -1 * (np.diag(self.likelihood_function.link_hess(self.data, f)) - Ki)`
			`return np.squeeze(res)`

			`self.f_hat = sp.optimize.fmin_ncg(obj, f, fprime=obj_grad, fhess=obj_hess)`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`print self.f_hat`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00
			`#At this point get the hessian matrix`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`self.hess_hat = obj_hess(self.f_hat)`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00
			`#Need to add the constant as we previously were trying to avoid computing it (seems like a small overhead though...)`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`self.height_unnormalised = obj(self.f_hat) #FIXME: Is it -1?`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`return self._compute_GP_variables()`