GPy/GPy/models/mrd.py

312 lines
12 KiB
Python
Raw Normal View History

2013-04-11 15:02:26 +01:00
'''
Created on 10 Apr 2013
@author: Max Zwiessele
'''
from GPy.core import model
from GPy.models.Bayesian_GPLVM import Bayesian_GPLVM
from GPy.models.sparse_GP import sparse_GP
2013-04-16 11:25:51 +01:00
from GPy.util.linalg import PCA
from scipy import linalg
import numpy
2013-04-11 15:02:26 +01:00
import itertools
2013-04-11 15:47:18 +01:00
import pylab
2013-05-22 17:14:54 +01:00
from GPy.kern.kern import kern
2013-04-11 15:02:26 +01:00
class MRD(model):
"""
Do MRD on given Datasets in Ylist.
2013-05-20 16:22:43 +01:00
All Ys in likelihood_list are in [N x Dn], where Dn can be different per Yn,
2013-04-11 15:02:26 +01:00
N must be shared across datasets though.
2013-05-20 16:22:43 +01:00
:param likelihood_list...: likelihoods of observed datasets
2013-05-22 17:14:54 +01:00
:type likelihood_list: [GPy.likelihood] | [Y1..Yy]
2013-04-11 15:02:26 +01:00
:param names: names for different gplvm models
:type names: [str]
2013-04-12 13:30:28 +01:00
:param Q: latent dimensionality (will raise
2013-04-11 15:02:26 +01:00
:type Q: int
2013-04-16 11:25:51 +01:00
:param initx: initialisation method for the latent space
:type initx: 'PCA'|'random'
:param initz: initialisation method for inducing inputs
:type initz: 'permute'|'random'
2013-04-11 15:02:26 +01:00
:param X:
Initial latent space
:param X_variance:
Initial latent space variance
:param init: [PCA|random]
initialization method to use
:param M:
number of inducing inputs to use
:param Z:
initial inducing inputs
2013-05-22 17:14:54 +01:00
:param kernels: list of kernels or kernel shared for all BGPLVMS
:type kernels: [GPy.kern.kern] | GPy.kern.kern | None (default)
2013-04-11 15:02:26 +01:00
"""
2013-05-22 17:14:54 +01:00
def __init__(self, likelihood_or_Y_list, Q, M=10, names=None,
kernels=None, initx='PCA',
initz='permute', _debug=False, **kwargs):
2013-05-22 10:13:02 +01:00
if names is None:
2013-05-22 17:14:54 +01:00
self.names = ["{}".format(i + 1) for i in range(len(likelihood_or_Y_list))]
2013-05-22 10:13:02 +01:00
2013-05-22 17:14:54 +01:00
# sort out the kernels
2013-05-22 10:13:02 +01:00
if kernels is None:
2013-05-22 17:14:54 +01:00
kernels = [None] * len(likelihood_or_Y_list)
elif isinstance(kernels, kern):
kernels = [kernels.copy() for i in range(len(likelihood_or_Y_list))]
2013-05-22 10:13:02 +01:00
else:
2013-05-22 17:14:54 +01:00
assert len(kernels) == len(likelihood_or_Y_list), "need one kernel per output"
assert all([isinstance(k, kern) for k in kernels]), "invalid kernel object detected!"
2013-05-22 10:13:02 +01:00
self.Q = Q
self.M = M
2013-05-22 17:14:54 +01:00
self._debug = _debug
2013-05-22 10:13:02 +01:00
self._init = True
2013-05-22 17:14:54 +01:00
X = self._init_X(initx, likelihood_or_Y_list)
2013-05-22 10:13:02 +01:00
Z = self._init_Z(initz, X)
2013-05-22 17:14:54 +01:00
self.bgplvms = [Bayesian_GPLVM(l, k, X=X, Z=Z, M=self.M, **kwargs) for l, k in zip(likelihood_or_Y_list, kernels)]
2013-04-15 10:57:27 +01:00
del self._init
2013-04-12 13:30:28 +01:00
2013-04-11 15:02:26 +01:00
self.gref = self.bgplvms[0]
nparams = numpy.array([0] + [sparse_GP._get_params(g).size - g.Z.size for g in self.bgplvms])
self.nparams = nparams.cumsum()
2013-04-12 13:30:28 +01:00
2013-04-11 15:02:26 +01:00
self.N = self.gref.N
self.NQ = self.N * self.Q
self.MQ = self.M * self.Q
2013-05-14 11:47:19 +01:00
model.__init__(self) # @UndefinedVariable
2013-04-11 15:02:26 +01:00
2013-04-15 10:57:27 +01:00
@property
def X(self):
return self.gref.X
@X.setter
def X(self, X):
try:
self.propagate_param(X=X)
except AttributeError:
if not self._init:
raise AttributeError("bgplvm list not initialized")
@property
2013-04-16 11:25:51 +01:00
def Z(self):
return self.gref.Z
@Z.setter
def Z(self, Z):
try:
self.propagate_param(Z=Z)
except AttributeError:
if not self._init:
raise AttributeError("bgplvm list not initialized")
@property
def X_variance(self):
return self.gref.X_variance
@X_variance.setter
def X_variance(self, X_var):
try:
self.propagate_param(X_variance=X_var)
except AttributeError:
if not self._init:
raise AttributeError("bgplvm list not initialized")
@property
2013-05-20 16:22:43 +01:00
def likelihood_list(self):
2013-04-15 10:57:27 +01:00
return [g.likelihood.Y for g in self.bgplvms]
2013-05-20 16:22:43 +01:00
@likelihood_list.setter
def likelihood_list(self, likelihood_list):
for g, Y in itertools.izip(self.bgplvms, likelihood_list):
2013-04-15 10:57:27 +01:00
g.likelihood.Y = Y
@property
def auto_scale_factor(self):
"""
set auto_scale_factor for all gplvms
:param b: auto_scale_factor
:type b:
"""
return self.gref.auto_scale_factor
@auto_scale_factor.setter
def auto_scale_factor(self, b):
self.propagate_param(auto_scale_factor=b)
def propagate_param(self, **kwargs):
for key, val in kwargs.iteritems():
for g in self.bgplvms:
g.__setattr__(key, val)
2013-04-16 11:25:51 +01:00
def randomize(self, initx='concat', initz='permute', *args, **kw):
super(MRD, self).randomize(*args, **kw)
2013-05-20 16:22:43 +01:00
self._init_X(initx, self.likelihood_list)
2013-04-16 11:25:51 +01:00
self._init_Z(initz, self.X)
2013-04-11 15:02:26 +01:00
def _get_param_names(self):
# X_names = sum([['X_%i_%i' % (n, q) for q in range(self.Q)] for n in range(self.N)], [])
# S_names = sum([['X_variance_%i_%i' % (n, q) for q in range(self.Q)] for n in range(self.N)], [])
n1 = self.gref._get_param_names()
n1var = n1[:self.NQ * 2 + self.MQ]
map_names = lambda ns, name: map(lambda x: "{1}_{0}".format(*x),
itertools.izip(ns,
itertools.repeat(name)))
return list(itertools.chain(n1var, *(map_names(\
sparse_GP._get_param_names(g)[self.MQ:], n) \
for g, n in zip(self.bgplvms, self.names))))
def _get_params(self):
"""
return parameter list containing private and shared parameters as follows:
=================================================================
| mu | S | Z || theta1 | theta2 | .. | thetaN |
=================================================================
"""
2013-04-12 13:30:28 +01:00
X = self.gref.X.ravel()
X_var = self.gref.X_variance.ravel()
Z = self.gref.Z.ravel()
2013-04-11 15:02:26 +01:00
thetas = [sparse_GP._get_params(g)[g.Z.size:] for g in self.bgplvms]
params = numpy.hstack([X, X_var, Z, numpy.hstack(thetas)])
return params
2013-04-16 11:25:51 +01:00
# def _set_var_params(self, g, X, X_var, Z):
# g.X = X.reshape(self.N, self.Q)
# g.X_variance = X_var.reshape(self.N, self.Q)
# g.Z = Z.reshape(self.M, self.Q)
#
# def _set_kern_params(self, g, p):
# g.kern._set_params(p[:g.kern.Nparam])
# g.likelihood._set_params(p[g.kern.Nparam:])
2013-04-11 15:02:26 +01:00
def _set_params(self, x):
start = 0; end = self.NQ
2013-04-15 10:57:27 +01:00
X = x[start:end]
2013-04-11 15:02:26 +01:00
start = end; end += start
2013-04-15 10:57:27 +01:00
X_var = x[start:end]
2013-04-11 15:02:26 +01:00
start = end; end += self.MQ
2013-04-15 10:57:27 +01:00
Z = x[start:end]
2013-04-11 15:02:26 +01:00
thetas = x[end:]
2013-04-12 13:30:28 +01:00
# set params for all:
2013-04-11 15:02:26 +01:00
for g, s, e in itertools.izip(self.bgplvms, self.nparams, self.nparams[1:]):
2013-04-15 10:57:27 +01:00
g._set_params(numpy.hstack([X, X_var, Z, thetas[s:e]]))
# self._set_var_params(g, X, X_var, Z)
# self._set_kern_params(g, thetas[s:e].copy())
# g._compute_kernel_matrices()
# if self.auto_scale_factor:
# g.scale_factor = numpy.sqrt(g.psi2.sum(0).mean() * g.likelihood.precision)
# # self.scale_factor = numpy.sqrt(self.psi2.sum(0).mean() * self.likelihood.precision)
# g._computations()
2013-04-11 15:02:26 +01:00
2013-05-22 17:14:54 +01:00
def update_likelihood_approximation(self): # TODO: object oriented vs script base
2013-05-20 16:22:43 +01:00
for bgplvm in self.bgplvms:
bgplvm.update_likelihood_approximation()
2013-04-11 15:02:26 +01:00
def log_likelihood(self):
2013-04-12 13:30:28 +01:00
ll = -self.gref.KL_divergence()
2013-04-11 15:02:26 +01:00
for g in self.bgplvms:
2013-04-12 13:30:28 +01:00
ll += sparse_GP.log_likelihood(g)
return ll
2013-04-11 15:02:26 +01:00
def _log_likelihood_gradients(self):
dLdmu, dLdS = reduce(lambda a, b: [a[0] + b[0], a[1] + b[1]], (g.dL_dmuS() for g in self.bgplvms))
dKLmu, dKLdS = self.gref.dKL_dmuS()
dLdmu -= dKLmu
dLdS -= dKLdS
dLdmuS = numpy.hstack((dLdmu.flatten(), dLdS.flatten())).flatten()
dldzt1 = reduce(lambda a, b: a + b, (sparse_GP._log_likelihood_gradients(g)[:self.MQ] for g in self.bgplvms))
return numpy.hstack((dLdmuS,
2013-04-11 15:02:26 +01:00
dldzt1,
numpy.hstack([numpy.hstack([g.dL_dtheta(),
g.likelihood._gradients(\
partial=g.partial_for_likelihood)]) \
for g in self.bgplvms])))
2013-05-20 16:22:43 +01:00
def _init_X(self, init='PCA', likelihood_list=None):
if likelihood_list is None:
likelihood_list = self.likelihood_list
2013-05-22 17:14:54 +01:00
Ylist = []
for likelihood_or_Y in likelihood_list:
if type(likelihood_or_Y) is numpy.ndarray:
Ylist.append(likelihood_or_Y)
else:
Ylist.append(likelihood_or_Y.Y)
del likelihood_list
2013-04-15 10:57:27 +01:00
if init in "PCA_single":
2013-05-22 17:14:54 +01:00
X = numpy.zeros((Ylist[0].shape[0], self.Q))
for qs, Y in itertools.izip(numpy.array_split(numpy.arange(self.Q), len(Ylist)), Ylist):
X[:, qs] = PCA(Y, len(qs))[0]
2013-04-15 10:57:27 +01:00
elif init in "PCA_concat":
2013-05-22 17:14:54 +01:00
X = PCA(numpy.hstack(Ylist), self.Q)[0]
2013-05-14 11:47:19 +01:00
else: # init == 'random':
2013-05-22 17:14:54 +01:00
X = numpy.random.randn(Ylist[0].shape[0], self.Q)
2013-04-15 10:57:27 +01:00
self.X = X
2013-04-12 13:30:28 +01:00
return X
2013-04-16 11:25:51 +01:00
def _init_Z(self, init="permute", X=None):
if X is None:
X = self.X
if init in "permute":
Z = numpy.random.permutation(X.copy())[:self.M]
elif init in "random":
Z = numpy.random.randn(self.M, self.Q) * X.var()
self.Z = Z
return Z
def _handle_plotting(self, fig_num, axes, plotf):
if axes is None:
2013-05-10 11:21:19 +01:00
fig = pylab.figure(num=fig_num, figsize=(4 * len(self.bgplvms), 3))
for i, g in enumerate(self.bgplvms):
if axes is None:
ax = fig.add_subplot(1, len(self.bgplvms), i + 1)
else:
ax = axes[i]
plotf(i, g, ax)
pylab.draw()
if axes is None:
fig.tight_layout()
return fig
else:
return pylab.gcf()
def plot_X_1d(self):
return self.gref.plot_X_1d()
def plot_X(self, fig_num="MRD Predictions", axes=None):
fig = self._handle_plotting(fig_num, axes, lambda i, g, ax: ax.imshow(g.X))
return fig
2013-05-20 16:22:43 +01:00
def plot_predict(self, fig_num="MRD Predictions", axes=None, **kwargs):
2013-05-22 17:14:54 +01:00
fig = self._handle_plotting(fig_num, axes, lambda i, g, ax: ax.imshow(g.predict(g.X)[0], **kwargs))
return fig
2013-04-11 15:02:26 +01:00
def plot_scales(self, fig_num="MRD Scales", axes=None, *args, **kwargs):
fig = self._handle_plotting(fig_num, axes, lambda i, g, ax: g.kern.plot_ARD(ax=ax, *args, **kwargs))
return fig
def plot_latent(self, fig_num="MRD Latent Spaces", axes=None, *args, **kwargs):
fig = self._handle_plotting(fig_num, axes, lambda i, g, ax: g.plot_latent(ax=ax, *args, **kwargs))
return fig
2013-04-12 13:30:28 +01:00
def _debug_plot(self):
2013-04-15 15:58:33 +01:00
self.plot_X_1d()
fig = pylab.figure("MRD DEBUG PLOT", figsize=(4 * len(self.bgplvms), 9))
fig.clf()
axes = [fig.add_subplot(3, len(self.bgplvms), i + 1) for i in range(len(self.bgplvms))]
self.plot_X(axes=axes)
axes = [fig.add_subplot(3, len(self.bgplvms), i + len(self.bgplvms) + 1) for i in range(len(self.bgplvms))]
self.plot_latent(axes=axes)
axes = [fig.add_subplot(3, len(self.bgplvms), i + 2 * len(self.bgplvms) + 1) for i in range(len(self.bgplvms))]
self.plot_scales(axes=axes)
pylab.draw()
fig.tight_layout()
2013-04-12 13:30:28 +01:00
def _debug_optimize(self, opt='scg', maxiters=5000, itersteps=10):
2013-04-12 13:30:28 +01:00
iters = 0
2013-04-15 10:57:27 +01:00
optstep = lambda: self.optimize(opt, messages=1, max_f_eval=itersteps)
2013-04-12 13:30:28 +01:00
self._debug_plot()
raw_input("enter to start debug")
while iters < maxiters:
optstep()
self._debug_plot()
iters += itersteps