utils

2026-05-03 16:52:39 +02:00 · 2012-11-29 16:26:21 +00:00 · 2012-11-29 16:26:21 +00:00 · aa13e095a9
commit aa13e095a9
parent e1b766a8dd
7 changed files with 619 additions and 0 deletions
--- a/GPy/util/linalg.py
+++ b/GPy/util/linalg.py
@ -0,0 +1,150 @@
+import numpy as np
+from scipy import linalg, optimize
+import pylab as pb
+import Tango
+import sys
+import re
+import pdb
+import cPickle
+import types
+import scipy.lib.lapack.flapack
+import scipy as sp
+
+def mdot(*args):
+   """Multiply all the arguments using matrix product rules.
+
+   The output is equivalent to multiplying the arguments one by one
+   from left to right using dot().
+   Precedence can be controlled by creating tuples of arguments,
+   for instance mdot(a,((b,c),d)) computes a*((b*c)*d).
+   Note that this means the output of dot(a,b) and mdot(a,b) will differ if
+   a or b is a pure tuple of numbers.
+
+   A single argument is returned unchanged, without any multiplication.
+   """
+   count = len(args)
+   if count == 1:
+       return args[0]
+   if count == 2:
+       left, right = args
+       return _mdot_r(left, right)
+   # Three or more factors: hand everything but the last one over as a
+   # tuple, which _mdot_r reduces first, then multiply by the last factor.
+   return _mdot_r(args[:-1], args[-1])
+
+def _mdot_r(a,b):
+   """Recursive helper for mdot.
+
+   Each operand that is a tuple is first collapsed into a single value:
+   a tuple with several entries is multiplied out with mdot(), a tuple with
+   one entry is simply unwrapped. The two resulting values are then combined
+   with np.dot().
+
+   :param a: left operand, or a tuple of operands
+   :param b: right operand, or a tuple of operands
+   :rtype: np.dot of the two (collapsed) operands
+   """
+   # isinstance() instead of comparing against types.TupleType: that name
+   # only exists on Python 2, and isinstance also accepts tuple subclasses.
+   if isinstance(a, tuple):
+       a = mdot(*a) if len(a)>1 else a[0]
+   if isinstance(b, tuple):
+       b = mdot(*b) if len(b)>1 else b[0]
+   return np.dot(a,b)
+
+def jitchol(A,maxtries=5):
+    """
+    Cholesky factorisation that retries with diagonal jitter on failure.
+
+    Arguments
+    ---------
+    A : An almost pd square matrix
+    maxtries : maximum number of jittered attempts after the plain one fails
+
+    Returns
+    -------
+    The lower triangular Cholesky factor of A, or of A + jitter*I when the
+    plain factorisation fails.
+
+    Raises
+    ------
+    linalg.LinAlgError if A has negative diagonal elements, or if it is still
+    not positive definite after maxtries jittered attempts.
+
+    Notes
+    -----
+    Adds jitter to A, to enforce positive-definiteness. The jitter starts at
+    1e-6 times the mean of the diagonal and grows tenfold on every retry.
+    if stuff breaks, please check:
+    np.allclose(sp.linalg.cholesky(XXT, lower = True), np.triu(sp.linalg.cho_factor(XXT)[0]).T)
+    """
+    try:
+        return linalg.cholesky(A, lower = True)
+    except linalg.LinAlgError:
+        pass
+
+    diagA = np.diag(A)
+    if np.any(diagA<0.):
+        raise linalg.LinAlgError("not pd: negative diagonal elements")
+
+    jitter = diagA.mean()*1e-6
+    identity = np.eye(A.shape[0])
+    for _ in range(maxtries):
+        print('Warning: adding jitter of '+str(jitter))
+        try:
+            return linalg.cholesky(A+identity*jitter, lower = True)
+        except linalg.LinAlgError:
+            # Only a failed factorisation warrants a retry; anything else
+            # (e.g. KeyboardInterrupt) must propagate.
+            jitter *= 10
+
+    raise linalg.LinAlgError("not positive definite, even with jitter.")
+
+def pdinv(A):
+    """
+    Invert a positive definite matrix through its Cholesky factor.
+
+    Arguments
+    ---------
+    :param A: A DxD pd numpy array
+
+    Returns
+    -------
+    inv : the inverse of A
+    hld: 0.5* the log of the determinant of A
+
+    Notes
+    -----
+    The factorisation is done by jitchol, so if A needed jitter to become
+    positive definite both results refer to the jittered matrix.
+    """
+    L = jitchol(A)
+    # det(A) = prod(diag(L))**2, hence half the log-determinant is the sum of
+    # the logs of the diagonal of L.
+    hld = np.sum(np.log(np.diag(L)))
+
+    # jitchol returns a *lower* factor, so say so explicitly; the routine is
+    # reached through scipy.linalg.lapack because scipy.lib.lapack is gone
+    # from current SciPy releases.
+    inv = linalg.lapack.dpotri(L, lower = 1)[0]
+    # dpotri only fills the requested (lower) triangle: mirror it to obtain
+    # the full symmetric inverse.
+    inv = np.tril(inv)+np.tril(inv,-1).T
+
+    return inv, hld
+
+
+def chol_inv(L):
+    """
+    Inverts a Cholesky lower triangular matrix
+
+    :param L: lower triangular matrix
+    :rtype: inverse of L
+
+    """
+    # LAPACK's triangular inverse, reached through scipy.linalg.lapack
+    # (the old scipy.linalg.flapack module no longer exists in SciPy).
+    # dtrtri returns (inverse, info); only the inverse is handed back.
+    return linalg.lapack.dtrtri(L, lower = True)[0]
+
+
+def multiple_pdinv(A):
+    """
+    Invert a stack of positive definite matrices, one slice at a time.
+
+    Arguments
+    ---------
+    :param A: A DxDxN numpy array (each A[:,:,i] is pd)
+
+    Returns
+    -------
+    invs : the inverses of A
+    hld: 0.5* the log of the determinants of A
+    """
+    N = A.shape[-1]
+    # jitchol hands back the lower factor itself (not a (factor, flag) pair
+    # like cho_factor), so each entry of chols is used directly.
+    chols = [jitchol(A[:,:,i]) for i in range(N)]
+    halflogdets = [np.sum(np.log(np.diag(L))) for L in chols]
+    invs = [linalg.lapack.dpotri(L, lower = 1)[0] for L in chols]
+    # dpotri fills only the lower triangle; mirror it to get full matrices.
+    invs = [np.tril(I)+np.tril(I,-1).T for I in invs]
+    return np.dstack(invs),np.array(halflogdets)
+
+
+def PCA(Y, Q):
+    """
+    Principal component analysis: maximum likelihood solution by SVD
+
+    Arguments
+    ---------
+    :param Y: NxD np.array of data
+    :param Q: int, dimension of projection
+
+    Returns
+    -------
+    X - NxQ np.array of dimensionality reduced data
+    W - QxD mapping from X to Y
+
+    Notes
+    -----
+    Y itself is never modified: if it is not zero mean, a centred copy is
+    used for the decomposition.
+    """
+    if not np.allclose(Y.mean(axis=0), 0.0):
+        print("Y is not zero mean, centering it locally (GPy.util.linalg.PCA)")
+        # Out-of-place subtraction: leaves the caller's array untouched and
+        # also works for integer input.
+        Y = Y - Y.mean(axis=0)
+
+    U, s, Vt = linalg.svd(Y, full_matrices = False)
+    X = U[:,0:Q]
+    # Rescale the latent coordinates to unit standard deviation and fold the
+    # inverse scaling into W, so that np.dot(X, W) is unaffected.
+    v = X.std(axis=0)
+    X = X/v
+    # Row q of W is the q-th right singular vector times s[q]*v[q]; scaling
+    # the rows directly avoids building a full diag(s) matrix.
+    W = Vt[0:Q]*(s[0:Q]*v)[:,None]
+    return X, W