GPy/python/examples/laplace_approximations.py

import GPy
import numpy as np
import matplotlib.pyplot as plt
from scipy.stats import t, norm
from coxGP.python.likelihoods.Laplace import Laplace
from coxGP.python.likelihoods.likelihood_function import student_t


def student_t_approx():
    """
    Example of regressing with a student t likelihood
    """
    #Start a function, any function
    X = np.sort(np.random.uniform(0, 15, 100))[:, None]
    Y = np.sin(X)

    #Add student t random noise to datapoints
    deg_free = 2.5
    t_rv = t(deg_free, loc=5, scale=1)
    noise = t_rv.rvs(size=Y.shape)
    Y += noise

    # Kernel object
    print X.shape
    kernel = GPy.kern.rbf(X.shape[1])

    #A GP should completely break down due to the points as they get a lot of weight
    # create simple GP model
    m = GPy.models.GP_regression(X, Y, kernel=kernel)

    # optimize
    m.ensure_default_constraints()
    m.optimize()
    # plot
    #m.plot()
    print m

    #with a student t distribution, since it has heavy tails it should work well
    likelihood_function = student_t(deg_free, sigma=1)
    lap = Laplace(Y, likelihood_function)
    cov = kernel.K(X)
    lap.fit_full(cov)
    #Get one sample (just look at a single Y
    mode = float(lap.f_hat[0])
    variance = float((deg_free/(deg_free-2))) #BUG: Not convinced this is giving reasonable variables
    #variance = float((deg_free/(deg_free-2)) + np.diagonal(lap.hess_hat)[0]) #BUG: Not convinced this is giving reasonable variables
    normalised_approx = norm(loc=mode, scale=variance)
    print "Normal with mode %f, and variance %f" % (mode, variance)
    print lap.height_unnormalised

    test_range = np.arange(0, 10, 0.1)
    print np.diagonal(lap.hess_hat)
    plt.plot(test_range, t_rv.pdf(test_range))
    plt.plot(test_range, normalised_approx.pdf(test_range))
    plt.show()


def noisy_laplace_approx():
    """
    Example of regressing with a student t likelihood
    """
    #Start a function, any function
    X = np.sort(np.random.uniform(0, 15, 70))[:, None]
    Y = np.sin(X)

    #Add some extreme value noise to some of the datapoints
    percent_corrupted = 0.05
    corrupted_datums = int(np.round(Y.shape[0] * percent_corrupted))
    indices = np.arange(Y.shape[0])
    np.random.shuffle(indices)
    corrupted_indices = indices[:corrupted_datums]
    print corrupted_indices
    noise = np.random.uniform(-10, 10, (len(corrupted_indices), 1))
    Y[corrupted_indices] += noise

    #A GP should completely break down due to the points as they get a lot of weight
    # create simple GP model
    m = GPy.models.GP_regression(X, Y)

    # optimize
    m.ensure_default_constraints()
    m.optimize()
    # plot
    m.plot()
    print m

    #with a student t distribution, since it has heavy tails it should work well
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`import GPy`
			`import numpy as np`
			`import matplotlib.pyplot as plt`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`from scipy.stats import t, norm`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`from coxGP.python.likelihoods.Laplace import Laplace`
			`from coxGP.python.likelihoods.likelihood_function import student_t`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00

			`def student_t_approx():`
			`"""`
			`Example of regressing with a student t likelihood`
			`"""`
			`#Start a function, any function`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`X = np.sort(np.random.uniform(0, 15, 100))[:, None]`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`Y = np.sin(X)`

Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`#Add student t random noise to datapoints`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`deg_free = 2.5`
			`t_rv = t(deg_free, loc=5, scale=1)`
			`noise = t_rv.rvs(size=Y.shape)`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`Y += noise`

			`# Kernel object`
			`print X.shape`
			`kernel = GPy.kern.rbf(X.shape[1])`

			`#A GP should completely break down due to the points as they get a lot of weight`
			`# create simple GP model`
			`m = GPy.models.GP_regression(X, Y, kernel=kernel)`

			`# optimize`
			`m.ensure_default_constraints()`
			`m.optimize()`
			`# plot`
			`#m.plot()`
			`print m`

			`#with a student t distribution, since it has heavy tails it should work well`
			`likelihood_function = student_t(deg_free, sigma=1)`
			`lap = Laplace(Y, likelihood_function)`
			`cov = kernel.K(X)`
			`lap.fit_full(cov)`
Trying to 'debug' 2013-03-14 15:30:22 +00:00			`#Get one sample (just look at a single Y`
			`mode = float(lap.f_hat[0])`
			`variance = float((deg_free/(deg_free-2))) #BUG: Not convinced this is giving reasonable variables`
			`#variance = float((deg_free/(deg_free-2)) + np.diagonal(lap.hess_hat)[0]) #BUG: Not convinced this is giving reasonable variables`
			`normalised_approx = norm(loc=mode, scale=variance)`
			`print "Normal with mode %f, and variance %f" % (mode, variance)`
			`print lap.height_unnormalised`

			`test_range = np.arange(0, 10, 0.1)`
			`print np.diagonal(lap.hess_hat)`
			`plt.plot(test_range, t_rv.pdf(test_range))`
			`plt.plot(test_range, normalised_approx.pdf(test_range))`
			`plt.show()`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00

			`def noisy_laplace_approx():`
			`"""`
			`Example of regressing with a student t likelihood`
			`"""`
			`#Start a function, any function`
			`X = np.sort(np.random.uniform(0, 15, 70))[:, None]`
			`Y = np.sin(X)`

Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`#Add some extreme value noise to some of the datapoints`
			`percent_corrupted = 0.05`
			`corrupted_datums = int(np.round(Y.shape[0] * percent_corrupted))`
			`indices = np.arange(Y.shape[0])`
			`np.random.shuffle(indices)`
			`corrupted_indices = indices[:corrupted_datums]`
			`print corrupted_indices`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`noise = np.random.uniform(-10, 10, (len(corrupted_indices), 1))`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00			`Y[corrupted_indices] += noise`

			`#A GP should completely break down due to the points as they get a lot of weight`
			`# create simple GP model`
Got most of laplace approximation working 2013-03-13 17:55:41 +00:00			`m = GPy.models.GP_regression(X, Y)`
Initial commit, setting up the laplace approximation for a student t 2013-03-12 17:42:00 +00:00
			`# optimize`
			`m.ensure_default_constraints()`
			`m.optimize()`
			`# plot`
			`m.plot()`
			`print m`

			`#with a student t distribution, since it has heavy tails it should work well`