merged plotting and input_dim

Max Zwiessele 2013-06-05 11:34:58 +01:00
commit 4b4af86e5b
26 changed files with 312 additions and 317 deletions

View file

@@ -22,13 +22,13 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 :param Y: observed data (np.ndarray) or GPy.likelihood
 :type Y: np.ndarray | GPy.likelihood instance
-:param Q: latent dimensionality
-:type Q: int
+:param input_dim: latent dimensionality
+:type input_dim: int
 :param init: initialisation method for the latent space
 :type init: 'PCA'|'random'
 """
-def __init__(self, likelihood_or_Y, Q, X=None, X_variance=None, init='PCA', M=10,
+def __init__(self, likelihood_or_Y, input_dim, X=None, X_variance=None, init='PCA', M=10,
 Z=None, kernel=None, oldpsave=10, _debug=False,
 **kwargs):
 if type(likelihood_or_Y) is np.ndarray:
@@ -37,7 +37,7 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 likelihood = likelihood_or_Y
 if X is None:
-X = self.initialise_latent(init, Q, likelihood.Y)
+X = self.initialise_latent(init, input_dim, likelihood.Y)
 self.init = init
 if X_variance is None:
@@ -48,7 +48,7 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 assert Z.shape[1] == X.shape[1]
 if kernel is None:
-kernel = kern.rbf(Q) + kern.white(Q)
+kernel = kern.rbf(input_dim) + kern.white(input_dim)
 self.oldpsave = oldpsave
 self._oldps = []
@@ -78,8 +78,8 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 self._oldps.insert(0, p.copy())
 def _get_param_names(self):
-X_names = sum([['X_%i_%i' % (n, q) for q in range(self.Q)] for n in range(self.N)], [])
-S_names = sum([['X_variance_%i_%i' % (n, q) for q in range(self.Q)] for n in range(self.N)], [])
+X_names = sum([['X_%i_%i' % (n, q) for q in range(self.input_dim)] for n in range(self.N)], [])
+S_names = sum([['X_variance_%i_%i' % (n, q) for q in range(self.input_dim)] for n in range(self.N)], [])
 return (X_names + S_names + sparse_GP._get_param_names(self))
 def _get_params(self):
@@ -101,10 +101,10 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 def _set_params(self, x, save_old=True, save_count=0):
 # try:
 x = self._clipped(x)
-N, Q = self.N, self.Q
-self.X = x[:self.X.size].reshape(N, Q).copy()
-self.X_variance = x[(N * Q):(2 * N * Q)].reshape(N, Q).copy()
-sparse_GP._set_params(self, x[(2 * N * Q):])
+N, input_dim = self.N, self.input_dim
+self.X = x[:self.X.size].reshape(N, input_dim).copy()
+self.X_variance = x[(N * input_dim):(2 * N * input_dim)].reshape(N, input_dim).copy()
+sparse_GP._set_params(self, x[(2 * N * input_dim):])
 # self.oldps = x
 # except (LinAlgError, FloatingPointError, ZeroDivisionError):
 # print "\rWARNING: Caught LinAlgError, continuing without setting "
@@ -131,7 +131,7 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 def KL_divergence(self):
 var_mean = np.square(self.X).sum()
 var_S = np.sum(self.X_variance - np.log(self.X_variance))
-return 0.5 * (var_mean + var_S) - 0.5 * self.Q * self.N
+return 0.5 * (var_mean + var_S) - 0.5 * self.input_dim * self.N
 def log_likelihood(self):
 ll = sparse_GP.log_likelihood(self)
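
An aside not part of the commit itself: the `KL_divergence` shown here is the standard KL term between the factorised Gaussian variational posterior over the latent points (means in `self.X`, variances in `self.X_variance`) and a unit-Gaussian prior,

$$\mathrm{KL}\big(q(\mathbf{X})\,\|\,\mathcal{N}(\mathbf{0},\mathbf{I})\big) = \frac{1}{2}\sum_{n=1}^{N}\sum_{q=1}^{\mathrm{input\_dim}}\big(\mu_{nq}^{2} + s_{nq} - \log s_{nq} - 1\big)$$

which matches `0.5 * (var_mean + var_S) - 0.5 * self.input_dim * self.N` term for term.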
@@ -196,16 +196,16 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 """
 assert not self.likelihood.is_heteroscedastic
 N_test = Y.shape[0]
-Q = self.Z.shape[1]
-means = np.zeros((N_test, Q))
-covars = np.zeros((N_test, Q))
+input_dim = self.Z.shape[1]
+means = np.zeros((N_test, input_dim))
+covars = np.zeros((N_test, input_dim))
 dpsi0 = -0.5 * self.D * self.likelihood.precision
 dpsi2 = self.dL_dpsi2[0][None, :, :] # TODO: this may change if we ignore het. likelihoods
 V = self.likelihood.precision * Y
 dpsi1 = np.dot(self.Cpsi1V, V.T)
-start = np.zeros(self.Q * 2)
+start = np.zeros(self.input_dim * 2)
 for n, dpsi1_n in enumerate(dpsi1.T[:, :, None]):
 args = (self.kern, self.Z, dpsi0, dpsi1_n, dpsi2)
@@ -222,12 +222,12 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 """
 Plot latent space X in 1D:
--if fig is given, create Q subplots in fig and plot in these
--if ax is given plot Q 1D latent space plots of X into each `axis`
+-if fig is given, create input_dim subplots in fig and plot in these
+-if ax is given plot input_dim 1D latent space plots of X into each `axis`
 -if neither fig nor ax is given create a figure with fignum and plot in there
 colors:
-colors of different latent space dimensions Q
+colors of different latent space dimensions input_dim
 """
 import pylab
 if ax is None:
@@ -245,7 +245,7 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 elif isinstance(ax, (tuple, list)):
 a = ax[i]
 else:
-raise ValueError("Need one ax per latent dimension Q")
+raise ValueError("Need one ax per latent dimension input_dim")
 a.plot(self.X, c='k', alpha=.3)
 plots.extend(a.plot(x, self.X.T[i], c=colors.next(), label=r"$\mathbf{{X_{{{}}}}}$".format(i)))
 a.fill_between(x,
@@ -262,7 +262,7 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 return fig
 def __getstate__(self):
-return (self.likelihood, self.Q, self.X, self.X_variance,
+return (self.likelihood, self.input_dim, self.X, self.X_variance,
 self.init, self.M, self.Z, self.kern,
 self.oldpsave, self._debug)
@@ -271,12 +271,12 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 def _debug_filter_params(self, x):
 start, end = 0, self.X.size,
-X = x[start:end].reshape(self.N, self.Q)
+X = x[start:end].reshape(self.N, self.input_dim)
 start, end = end, end + self.X_variance.size
-X_v = x[start:end].reshape(self.N, self.Q)
-start, end = end, end + (self.M * self.Q)
-Z = x[start:end].reshape(self.M, self.Q)
-start, end = end, end + self.Q
+X_v = x[start:end].reshape(self.N, self.input_dim)
+start, end = end, end + (self.M * self.input_dim)
+Z = x[start:end].reshape(self.M, self.input_dim)
+start, end = end, end + self.input_dim
 theta = x[start:]
 return X, X_v, Z, theta
@@ -414,24 +414,24 @@ class Bayesian_GPLVM(sparse_GP, GPLVM):
 # caxkmmdl = divider.append_axes("right", "5%", pad="1%")
 # cbarkmmdl = pylab.colorbar(imkmmdl, cax=caxkmmdl)
-# Qleg = ax1.legend(Xlatentplts, [r"$Q_{}$".format(i + 1) for i in range(self.Q)],
-# loc=3, ncol=self.Q, bbox_to_anchor=(0, 1.15, 1, 1.15),
+# input_dimleg = ax1.legend(Xlatentplts, [r"$input_dim_{}$".format(i + 1) for i in range(self.input_dim)],
+# loc=3, ncol=self.input_dim, bbox_to_anchor=(0, 1.15, 1, 1.15),
 # borderaxespad=0, mode="expand")
-ax2.legend(Xlatentplts, [r"$Q_{}$".format(i + 1) for i in range(self.Q)],
-loc=3, ncol=self.Q, bbox_to_anchor=(0, 1.1, 1, 1.1),
+ax2.legend(Xlatentplts, [r"$input_dim_{}$".format(i + 1) for i in range(self.input_dim)],
+loc=3, ncol=self.input_dim, bbox_to_anchor=(0, 1.1, 1, 1.1),
 borderaxespad=0, mode="expand")
-ax3.legend(Xlatentplts, [r"$Q_{}$".format(i + 1) for i in range(self.Q)],
-loc=3, ncol=self.Q, bbox_to_anchor=(0, 1.1, 1, 1.1),
+ax3.legend(Xlatentplts, [r"$input_dim_{}$".format(i + 1) for i in range(self.input_dim)],
+loc=3, ncol=self.input_dim, bbox_to_anchor=(0, 1.1, 1, 1.1),
 borderaxespad=0, mode="expand")
-ax4.legend(Xlatentplts, [r"$Q_{}$".format(i + 1) for i in range(self.Q)],
-loc=3, ncol=self.Q, bbox_to_anchor=(0, 1.1, 1, 1.1),
+ax4.legend(Xlatentplts, [r"$input_dim_{}$".format(i + 1) for i in range(self.input_dim)],
+loc=3, ncol=self.input_dim, bbox_to_anchor=(0, 1.1, 1, 1.1),
 borderaxespad=0, mode="expand")
-ax5.legend(Xlatentplts, [r"$Q_{}$".format(i + 1) for i in range(self.Q)],
-loc=3, ncol=self.Q, bbox_to_anchor=(0, 1.1, 1, 1.1),
+ax5.legend(Xlatentplts, [r"$input_dim_{}$".format(i + 1) for i in range(self.input_dim)],
+loc=3, ncol=self.input_dim, bbox_to_anchor=(0, 1.1, 1, 1.1),
 borderaxespad=0, mode="expand")
 Lleg = ax1.legend()
 Lleg.draggable()
-# ax1.add_artist(Qleg)
+# ax1.add_artist(input_dimleg)
 indicatorKL, = ax1.plot(kllls[self.showing, 0], kllls[self.showing, 2], 'o', c=KL.get_color())
 indicatorLL, = ax1.plot(kllls[self.showing, 0], kllls[self.showing, 1] - kllls[self.showing, 2], 'o', c=LL.get_color())
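
For downstream code, everything in this file reduces to a keyword rename. A minimal sketch of the updated call site follows; the import path and the toy data are illustrative assumptions, not part of the commit:

import numpy as np
from GPy.models import Bayesian_GPLVM  # assumed import path for this tree

Y = np.random.randn(50, 12)  # toy (N, D) observations, illustration only

# before this commit: Bayesian_GPLVM(Y, Q=3, M=10)
m = Bayesian_GPLVM(Y, input_dim=3, M=10)  # the latent-size keyword is now input_dim

# per _set_params above, the flat parameter vector is laid out as
# [X (N*input_dim), X_variance (N*input_dim), sparse_GP parameters]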

View file

@@ -20,35 +20,35 @@ class GPLVM(GP):
 :param Y: observed data
 :type Y: np.ndarray
-:param Q: latent dimensionality
-:type Q: int
+:param input_dim: latent dimensionality
+:type input_dim: int
 :param init: initialisation method for the latent space
 :type init: 'PCA'|'random'
 """
-def __init__(self, Y, Q, init='PCA', X = None, kernel=None, normalize_Y=False):
+def __init__(self, Y, input_dim, init='PCA', X = None, kernel=None, normalize_Y=False):
 if X is None:
-X = self.initialise_latent(init, Q, Y)
+X = self.initialise_latent(init, input_dim, Y)
 if kernel is None:
-kernel = kern.rbf(Q, ARD=Q>1) + kern.bias(Q, np.exp(-2)) + kern.white(Q, np.exp(-2))
+kernel = kern.rbf(input_dim, ARD=input_dim>1) + kern.bias(input_dim, np.exp(-2)) + kern.white(input_dim, np.exp(-2))
 likelihood = Gaussian(Y, normalize=normalize_Y)
 GP.__init__(self, X, likelihood, kernel, normalize_X=False)
 self._set_params(self._get_params())
-def initialise_latent(self, init, Q, Y):
+def initialise_latent(self, init, input_dim, Y):
 if init == 'PCA':
-return PCA(Y, Q)[0]
+return PCA(Y, input_dim)[0]
 else:
-return np.random.randn(Y.shape[0], Q)
+return np.random.randn(Y.shape[0], input_dim)
 def _get_param_names(self):
-return sum([['X_%i_%i'%(n,q) for q in range(self.Q)] for n in range(self.N)],[]) + GP._get_param_names(self)
+return sum([['X_%i_%i'%(n,q) for q in range(self.input_dim)] for n in range(self.N)],[]) + GP._get_param_names(self)
 def _get_params(self):
 return np.hstack((self.X.flatten(), GP._get_params(self)))
 def _set_params(self,x):
-self.X = x[:self.N*self.Q].reshape(self.N,self.Q).copy()
+self.X = x[:self.N*self.input_dim].reshape(self.N,self.input_dim).copy()
 GP._set_params(self, x[self.X.size:])
 def _log_likelihood_gradients(self):
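
The same rename applies to the plain GPLVM; a hedged usage sketch (import path and data again invented for illustration):

import numpy as np
from GPy.models import GPLVM  # assumed import path for this tree

Y = np.random.randn(40, 8)  # toy observations

# before: GPLVM(Y, Q=2); the keyword is now input_dim
m = GPLVM(Y, input_dim=2, init='PCA')
# with no kernel passed, the default constructed above is
# kern.rbf(input_dim, ARD=input_dim>1) + kern.bias(input_dim, np.exp(-2)) + kern.white(input_dim, np.exp(-2))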

View file

@@ -20,15 +20,15 @@ class generalized_FITC(sparse_GP):
 Naish-Guzman, A. and Holden, S. (2008) implementation of EP with FITC.
 :param X: inputs
-:type X: np.ndarray (N x Q)
+:type X: np.ndarray (N x input_dim)
 :param likelihood: a likelihood instance, containing the observed data
 :type likelihood: GPy.likelihood.(Gaussian | EP)
 :param kernel: the kernel/covariance function. See link kernels
 :type kernel: a GPy kernel
 :param X_variance: The variance in the measurements of X (Gaussian variance)
-:type X_variance: np.ndarray (N x Q) | None
+:type X_variance: np.ndarray (N x input_dim) | None
 :param Z: inducing inputs (optional, see note)
-:type Z: np.ndarray (M x Q) | None
+:type Z: np.ndarray (M x input_dim) | None
 :param M: Number of inducing points (optional, default 10. Ignored if Z is not None)
 :type M: int
 :param normalize_(X|Y): whether to normalize the data before computing (predictions will be in original scales)
@@ -44,7 +44,7 @@ class generalized_FITC(sparse_GP):
 self._set_params(self._get_params())
 def _set_params(self, p):
-self.Z = p[:self.M*self.Q].reshape(self.M, self.Q)
+self.Z = p[:self.M*self.input_dim].reshape(self.M, self.input_dim)
 self.kern._set_params(p[self.Z.size:self.Z.size+self.kern.Nparam])
 self.likelihood._set_params(p[self.Z.size+self.kern.Nparam:])
 self._compute_kernel_matrices()
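
`_set_params` here peels one flat vector into the model's blocks. A standalone sketch of that layout; the helper name and arguments are hypothetical, only the slicing mirrors the code above:

import numpy as np

def split_fitc_params(p, M, input_dim, n_kern_params):
    # inducing inputs Z come first, as an (M, input_dim) block
    Z = p[:M * input_dim].reshape(M, input_dim)
    # then the kernel's own parameters ...
    kern_params = p[M * input_dim:M * input_dim + n_kern_params]
    # ... and whatever remains belongs to the likelihood
    lik_params = p[M * input_dim + n_kern_params:]
    return Z, kern_params, lik_params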

View file

@@ -23,8 +23,8 @@ class MRD(model):
 :type likelihood_list: [GPy.likelihood] | [Y1..Yy]
 :param names: names for different gplvm models
 :type names: [str]
-:param Q: latent dimensionality (will raise
-:type Q: int
+:param input_dim: latent dimensionality (will raise
+:type input_dim: int
 :param initx: initialisation method for the latent space
 :type initx: 'PCA'|'random'
 :param initz: initialisation method for inducing inputs
@@ -45,7 +45,7 @@ class MRD(model):
 :param kernels: list of kernels or kernel shared for all BGPLVMS
 :type kernels: [GPy.kern.kern] | GPy.kern.kern | None (default)
 """
-def __init__(self, likelihood_or_Y_list, Q, M=10, names=None,
+def __init__(self, likelihood_or_Y_list, input_dim, M=10, names=None,
 kernels=None, initx='PCA',
 initz='permute', _debug=False, **kw):
 if names is None:
@@ -61,14 +61,14 @@ class MRD(model):
 assert all([isinstance(k, kern) for k in kernels]), "invalid kernel object detected!"
 assert not ('kernel' in kw), "pass kernels through `kernels` argument"
-self.Q = Q
+self.input_dim = input_dim
 self.M = M
 self._debug = _debug
 self._init = True
 X = self._init_X(initx, likelihood_or_Y_list)
 Z = self._init_Z(initz, X)
-self.bgplvms = [Bayesian_GPLVM(l, Q=Q, kernel=k, X=X, Z=Z, M=self.M, **kw) for l, k in zip(likelihood_or_Y_list, kernels)]
+self.bgplvms = [Bayesian_GPLVM(l, input_dim=input_dim, kernel=k, X=X, Z=Z, M=self.M, **kw) for l, k in zip(likelihood_or_Y_list, kernels)]
 del self._init
 self.gref = self.bgplvms[0]
@@ -76,8 +76,8 @@ class MRD(model):
 self.nparams = nparams.cumsum()
 self.N = self.gref.N
-self.NQ = self.N * self.Q
-self.MQ = self.M * self.Q
+self.NQ = self.N * self.input_dim
+self.MQ = self.M * self.input_dim
 model.__init__(self) # @UndefinedVariable
 self._set_params(self._get_params())
@@ -143,8 +143,8 @@ class MRD(model):
 self._init_Z(initz, self.X)
 def _get_param_names(self):
-# X_names = sum([['X_%i_%i' % (n, q) for q in range(self.Q)] for n in range(self.N)], [])
-# S_names = sum([['X_variance_%i_%i' % (n, q) for q in range(self.Q)] for n in range(self.N)], [])
+# X_names = sum([['X_%i_%i' % (n, q) for q in range(self.input_dim)] for n in range(self.N)], [])
+# S_names = sum([['X_variance_%i_%i' % (n, q) for q in range(self.input_dim)] for n in range(self.N)], [])
 n1 = self.gref._get_param_names()
 n1var = n1[:self.NQ * 2 + self.MQ]
 map_names = lambda ns, name: map(lambda x: "{1}_{0}".format(*x),
@@ -170,9 +170,9 @@ class MRD(model):
 return params
 # def _set_var_params(self, g, X, X_var, Z):
-# g.X = X.reshape(self.N, self.Q)
-# g.X_variance = X_var.reshape(self.N, self.Q)
-# g.Z = Z.reshape(self.M, self.Q)
+# g.X = X.reshape(self.N, self.input_dim)
+# g.X_variance = X_var.reshape(self.N, self.input_dim)
+# g.Z = Z.reshape(self.M, self.input_dim)
 #
 # def _set_kern_params(self, g, p):
 # g.kern._set_params(p[:g.kern.Nparam])
@@ -235,13 +235,13 @@ class MRD(model):
 Ylist.append(likelihood_or_Y.Y)
 del likelihood_list
 if init in "PCA_concat":
-X = PCA(numpy.hstack(Ylist), self.Q)[0]
+X = PCA(numpy.hstack(Ylist), self.input_dim)[0]
 elif init in "PCA_single":
-X = numpy.zeros((Ylist[0].shape[0], self.Q))
-for qs, Y in itertools.izip(numpy.array_split(numpy.arange(self.Q), len(Ylist)), Ylist):
+X = numpy.zeros((Ylist[0].shape[0], self.input_dim))
+for qs, Y in itertools.izip(numpy.array_split(numpy.arange(self.input_dim), len(Ylist)), Ylist):
 X[:, qs] = PCA(Y, len(qs))[0]
 else: # init == 'random':
-X = numpy.random.randn(Ylist[0].shape[0], self.Q)
+X = numpy.random.randn(Ylist[0].shape[0], self.input_dim)
 self.X = X
 return X
@@ -252,7 +252,7 @@ class MRD(model):
 if init in "permute":
 Z = numpy.random.permutation(X.copy())[:self.M]
 elif init in "random":
-Z = numpy.random.randn(self.M, self.Q) * X.var()
+Z = numpy.random.randn(self.M, self.input_dim) * X.var()
 self.Z = Z
 return Z
@@ -265,7 +265,7 @@ class MRD(model):
 elif isinstance(axes, (tuple, list)):
 ax = axes[i]
 else:
-raise ValueError("Need one axis per latent dimension Q")
+raise ValueError("Need one axis per latent dimension input_dim")
 plotf(i, g, ax)
 pylab.draw()
 if axes is None:
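
MRD shares one latent space of size `input_dim` across all of its internal Bayesian_GPLVM models, so the rename surfaces in its constructor too. A usage sketch under the same assumptions (import path and data invented for illustration):

import numpy as np
from GPy.models import MRD  # assumed import path for this tree

Y1 = np.random.randn(30, 6)  # two toy views of the same 30 points
Y2 = np.random.randn(30, 9)

# before this commit: MRD([Y1, Y2], Q=4, M=10)
m = MRD([Y1, Y2], input_dim=4, M=10, initx='PCA', initz='permute')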

View file

@@ -17,25 +17,25 @@ class sparse_GPLVM(sparse_GP_regression, GPLVM):
 :param Y: observed data
 :type Y: np.ndarray
-:param Q: latent dimensionality
-:type Q: int
+:param input_dim: latent dimensionality
+:type input_dim: int
 :param init: initialisation method for the latent space
 :type init: 'PCA'|'random'
 """
-def __init__(self, Y, Q, kernel=None, init='PCA', M=10):
-X = self.initialise_latent(init, Q, Y)
+def __init__(self, Y, input_dim, kernel=None, init='PCA', M=10):
+X = self.initialise_latent(init, input_dim, Y)
 sparse_GP_regression.__init__(self, X, Y, kernel=kernel,M=M)
 def _get_param_names(self):
-return (sum([['X_%i_%i'%(n,q) for q in range(self.Q)] for n in range(self.N)],[])
+return (sum([['X_%i_%i'%(n,q) for q in range(self.input_dim)] for n in range(self.N)],[])
 + sparse_GP_regression._get_param_names(self))
 def _get_params(self):
 return np.hstack((self.X.flatten(), sparse_GP_regression._get_params(self)))
 def _set_params(self,x):
-self.X = x[:self.X.size].reshape(self.N,self.Q).copy()
+self.X = x[:self.X.size].reshape(self.N,self.input_dim).copy()
 sparse_GP_regression._set_params(self, x[self.X.size:])
 def log_likelihood(self):
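
To close, the naming scheme in `_get_param_names` enumerates latent coordinates with the dimension index running fastest; a self-contained re-implementation for illustration (not the class method itself):

def latent_names(N, input_dim):
    # mirrors the comprehension in _get_param_names above
    return sum([['X_%i_%i' % (n, q) for q in range(input_dim)] for n in range(N)], [])

print(latent_names(2, 2))  # ['X_0_0', 'X_0_1', 'X_1_0', 'X_1_1']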