Merge branch 'devel-cythonchol' of git://github.com/Dapid/GPy into Dapid-devel-cythonchol

2026-05-11 21:12:38 +02:00 · 2015-08-17 13:05:30 +01:00 · 2015-08-17 13:05:30 +01:00 · 8a7191c395
commit 8a7191c395
parent e3fd7885bf 629e57257f
5 changed files with 5783 additions and 4155 deletions
--- a/GPy/util/choleskies_cython.c
+++ b/GPy/util/choleskies_cython.c
--- a/GPy/util/choleskies_cython.pyx
+++ b/GPy/util/choleskies_cython.pyx
@ -7,8 +7,9 @@
 import numpy as np
 from cython.parallel import prange, parallel
 cimport numpy as np
+cimport scipy.linalg.cython_blas as cblas

-def flat_to_triang(np.ndarray[double, ndim=2] flat, int M):
+def flat_to_triang(double[:, :] flat, int M):
    """take a matrix N x D and return a D X M x M array where

    N = M(M+1)/2
@ -18,8 +19,9 @@ def flat_to_triang(np.ndarray[double, ndim=2] flat, int M):
    cdef int D = flat.shape[1]
    cdef int N = flat.shape[0]
    cdef int count = 0
-    cdef np.ndarray[double, ndim=3] ret = np.zeros((D, M, M))
+    cdef double[:, :, ::1] ret = np.zeros((D, M, M))
    cdef int d, m, mm
+    with nogil:
        for d in range(D):
            count = 0
            for m in range(M):
@ -28,13 +30,14 @@ def flat_to_triang(np.ndarray[double, ndim=2] flat, int M):
                    count += 1
    return ret

-def triang_to_flat(np.ndarray[double, ndim=3] L):
+def triang_to_flat(double[:, :, :] L):
    cdef int D = L.shape[0]
    cdef int M = L.shape[1]
    cdef int N = M*(M+1)/2
    cdef int count = 0
-    cdef np.ndarray[double, ndim=2] flat = np.empty((N, D))
+    cdef double[:, ::1] flat = np.empty((N, D))
    cdef int d, m, mm
+    with nogil:
        for d in range(D):
            count = 0
            for m in range(M):
@ -43,11 +46,11 @@ def triang_to_flat(np.ndarray[double, ndim=3] L):
                    count += 1
    return flat

-
-def backprop_gradient(np.ndarray[double, ndim=2] dL, np.ndarray[double, ndim=2] L):
-    cdef np.ndarray[double, ndim=2] dL_dK = np.tril(dL).copy()
+def backprop_gradient(double[:, :] dL, double[:, :] L):
+    cdef double[:, ::1] dL_dK = np.tril(dL)
    cdef int N = L.shape[0]
    cdef int k, j, i
+    with nogil:
        for k in range(N - 1, -1, -1):
            for j in range(k + 1, N):
                for i in range(j, N):
@ -60,11 +63,12 @@ def backprop_gradient(np.ndarray[double, ndim=2] dL, np.ndarray[double, ndim=2]
    return dL_dK

 def backprop_gradient_par(double[:,:] dL, double[:,:] L):
-    cdef double[:,:] dL_dK = np.tril(dL).copy()
+    cdef double[:,::1] dL_dK = np.tril(dL)
    cdef int N = L.shape[0]
    cdef int k, j, i
+    with nogil:
        for k in range(N - 1, -1, -1):
-        with nogil, parallel():
+            with parallel():
                for i in prange(k + 1, N):
                    for j in range(k+1, i+1):
                        dL_dK[i, k] -= dL_dK[i, j] * L[j, k]
@ -76,32 +80,35 @@ def backprop_gradient_par(double[:,:] dL, double[:,:] L):
            dL_dK[k, k] /= (2. * L[k, k])
    return dL_dK

-#here's a pure C version...
-cdef extern from "cholesky_backprop.h" nogil:
-    void chol_backprop(int N, double* dL, double* L)
+cdef void chol_backprop(int N, double[:, ::1] dL, double[:, ::1] L) nogil:
+    cdef int i, k, n

-def backprop_gradient_par_c(np.ndarray[double, ndim=2] dL, np.ndarray[double, ndim=2] L):
-    cdef np.ndarray[double, ndim=2] dL_dK = np.tril(dL) # makes a copy, c-contig
+    # DSYMV required constant arguments
+    cdef double alpha=-1, beta=1
+    cdef int incx=1
+
+    # DSCAL required arguments
+    cdef double scale
+
+    dL[N - 1, N - 1] /= (2. * L[N - 1, N - 1])
+    for k in range(N-2, -1, -1):
+        n = N-k-1
+        cblas.dsymv(uplo='l', n=&n, alpha=&alpha, a=&dL[k + 1, k + 1], lda=&N, x=&L[k, k + 1], incx=&incx,
+                    beta=&beta, y=&dL[k + 1, k], incy=&N)
+
+        for i in xrange(0, N - k - 1):
+            dL[k + 1 + i, k] -= dL[k + i+ 1, k + i + 1] * L[k, k + 1 + i]
+
+        scale = 1.0 / L[k, k]
+        cblas.dscal(&n, &scale , &dL[k + 1, k], &N)
+
+        dL[k, k] -= cblas.ddot(&n, &dL[k + 1, k], &N, &L[k, k], &incx)
+        dL[k, k] /= (2.0 * L[k, k])
+
+def backprop_gradient_par_c(double[:, :] dL, double[:, :] L):
+    cdef double[:, ::1] dL_dK = np.tril(dL) # makes a copy, c-contig
+    cdef double[:, ::1] L_cont = np.ascontiguousarray(L)
    cdef int N = L.shape[0]
    with nogil:
-        chol_backprop(N, <double*> dL_dK.data, <double*> L.data)
-    return dL_dK
-
-cdef extern from "cholesky_backprop.h" nogil:
-    void old_chol_backprop(int N, double* dL, double* L)
-
-def backprop_gradient_par_c_old(np.ndarray[double, ndim=2] dL, np.ndarray[double, ndim=2] L):
-    cdef np.ndarray[double, ndim=2] dL_dK = np.tril(dL) # makes a copy, c-contig
-    cdef int N = L.shape[0]
-    with nogil:
-        old_chol_backprop(N, <double*> dL_dK.data, <double*> L.data)
-    return dL_dK
-
-
-
-
-
-
-
-
-
+        chol_backprop(N, dL_dK, L_cont)
+    return np.asarray(dL_dK)
--- a/GPy/util/cholesky_backprop.c
+++ b/GPy/util/cholesky_backprop.c
@ -1,51 +0,0 @@
-#include <cblas.h>
-void chol_backprop(int N, double* dL, double* L){
-    //at the input to this fn, dL is df_dL. after this fn is complet, dL is df_dK
-    int i,k;
-
-    dL[N*N - 1] /= (2. * L[N*N - 1]);
-    for(k=N-2;k>(-1);k--){
-        cblas_dsymv(CblasRowMajor, CblasLower,
-	            N-k-1, -1,
-		    &dL[(N*(k+1) + k+1)],N,
-		    &L[k*N+k+1],1,
-		    1, &dL[N*(k+1)+k], N);
-        for(i=0;i<(N-k-1); i++){
-		dL[N*(k+1+i)+k] -= dL[N*(k+1)+k+i*(N+1)+1] * L[k*N+k+1+i];
-	}
-
-	cblas_dscal(N-k-1, 1.0/L[k*N+k], &dL[(k+1)*N+k], N);
-        dL[k*N + k] -= cblas_ddot(N-k-1, &dL[(k+1)*N+k], N, &L[k*N+k+1], 1);
-        dL[k*N + k] /= (2.0 * L[k*N + k]);
-    }
-}
-
-double mydot(int n, double* a,  int stride_a, double* b, int stride_b){
-    double ret = 0;	
-    for(int i=0; i<n; i++){
-	ret += a[i*stride_a]*b[i*stride_b];
-    }
-    return ret;
-}
-void old_chol_backprop(int N, double* dL, double* U){
-    //at the input to this fn, dL is df_dL. after this fn is complet, dL is df_dK
-    int iN, kN,i,j,k;
-    dL[N*N-1] /= (2. * U[N*N-1]);
-    for(k=N-2;k>(-1);k--){
-	kN = k*N;
-        #pragma omp parallel for private(i,iN)
-        for(i=k+1; i<N; i++){
-	    iN = i*N;
-	    dL[iN+k] -= mydot(i-k, &dL[iN+k+1], 1, &U[kN+k+1], 1);
-	    dL[iN+k] -= mydot(N-i, &dL[iN+i], N, &U[kN+i],  1);
-
-	}
-        for(i=(k + 1); i<N; i++){
-	    iN = i*N;
-            dL[iN + k] /= U[kN + k];
-            dL[kN + k] -= U[kN + i] * dL[iN + k];
-	}
-        dL[kN + k] /= (2. * U[kN + k]);
-    }
-}
-
--- a/GPy/util/cholesky_backprop.h
+++ b/GPy/util/cholesky_backprop.h
@ -1,5 +0,0 @@
-#include <cblas.h>
-
-void dsymv(int N, double*A, double*b, double*y);
-double mydot(int n, double* a,  int stride_a, double* b, int stride_b);
-void chol_backprop(int N, double* dL, double* L);
--- a/setup.py
+++ b/setup.py
@ -21,9 +21,9 @@ ext_mods = [Extension(name='GPy.kern._src.stationary_cython',
                      extra_compile_args=compile_flags,
                      extra_link_args = ['-lgomp']),
            Extension(name='GPy.util.choleskies_cython',
-                      sources=['GPy/util/choleskies_cython.c', 'GPy/util/cholesky_backprop.c'],
+                      sources=['GPy/util/choleskies_cython.c'],
                      include_dirs=[np.get_include()]+(['/System/Library/Frameworks/Accelerate.framework/Versions/Current/Frameworks/vecLib.framework/Versions/Current/Headers'] if sys.platform=='darwin' else []),
-                      extra_link_args = ['-lgomp', '-lblas'],
+                      extra_link_args = ['-lgomp'],
                      extra_compile_args=compile_flags+['-std=c99']),
            Extension(name='GPy.util.linalg_cython',
                      sources=['GPy/util/linalg_cython.c'],
@ -64,7 +64,7 @@ setup(name = 'GPy',
      py_modules = ['GPy.__init__'],
      test_suite = 'GPy.testing',
      long_description=read('README.md'),
-      install_requires=['numpy>=1.7', 'scipy>=0.12'],
+      install_requires=['numpy>=1.7', 'scipy>=0.16', 'cython>=0.22'],
      extras_require = {'docs':['matplotlib >=1.3','Sphinx','IPython']},
      classifiers=['License :: OSI Approved :: BSD License',
                   'Natural Language :: English',