Added negative binomial likelihood based on symbolic.

2026-06-11 15:15:15 +02:00 · 2014-04-01 07:03:01 +01:00 · 2014-04-01 07:03:01 +01:00 · f5b8989ef5
commit f5b8989ef5
parent 292e076a9a
7 changed files with 318 additions and 219 deletions
--- a/GPy/kern/_src/symbolic.py
+++ b/GPy/kern/_src/symbolic.py
@ -13,7 +13,7 @@ from ...core.parameterization.transformations import Logexp

 class Symbolic(Kern):
    """
-    A kernel object, where all the hard work in done by sympy.
+    A kernel object, where all the hard work is done by sympy.

    :param k: the covariance function
    :type k: a positive definite sympy function of x_0, z_0, x_1, z_1, x_2, z_2...
--- a/GPy/likelihoods/init.py
+++ b/GPy/likelihoods/init.py
@ -7,3 +7,4 @@ from student_t import StudentT
 from likelihood import Likelihood
 from mixed_noise import MixedNoise
 from symbolic import Symbolic
+from negative_binomial import Negative_binomial
--- a/GPy/likelihoods/link_functions.py
+++ b/GPy/likelihoods/link_functions.py
@ -71,6 +71,7 @@ class Probit(GPTransformation):

        g(f) = \\Phi^{-1} (mu)

+    
    """
    def transf(self,f):
        return std_norm_cdf(f)
--- a/GPy/likelihoods/negative_binomial.py
+++ b/GPy/likelihoods/negative_binomial.py
@ -0,0 +1,46 @@
+# Copyright (c) 2014 The GPy authors (see AUTHORS.txt)
+# Licensed under the BSD 3-clause license (see LICENSE.txt)
+
+
+try:
+    import sympy as sym
+    sympy_available=True
+    from sympy.utilities.lambdify import lambdify
+    from GPy.util.symbolic import gammaln, ln_cum_gaussian, cum_gaussian
+except ImportError:
+    sympy_available=False
+
+import numpy as np
+from ..util.univariate_Gaussian import std_norm_pdf, std_norm_cdf
+import link_functions
+from symbolic import Symbolic
+from scipy import stats
+
+if sympy_available:
+    class Negative_binomial(Symbolic):
+        """
+        Negative binomial
+
+        .. math::
+            p(y_{i}|\pi(f_{i})) = \left(\frac{r}{r+f_i}\right)^r \frac{\Gamma(r+y_i)}{y_i!\Gamma(r)}\left(\frac{f_i}{r+f_i}\right)^{y_i}
+
+        .. Note::
+            Y takes non-negative integer values.
+            link function should have a positive domain, e.g. log (default).
+
+        .. seealso::
+            symbolic.py, for the parent class
+        """
+        def __init__(self, gp_link=None):
+            if gp_link is None:
+                gp_link = link_functions.Log()
+
+            dispersion = sym.Symbol('dispersion', positive=True, real=True)
+            y = sym.Symbol('y', nonnegative=True, integer=True)
+            f = sym.Symbol('f', positive=True, real=True) 
+            log_pdf=dispersion*sym.log(dispersion) - (dispersion+y)*sym.log(dispersion+f) + gammaln(y+dispersion) - gammaln(y+1) - gammaln(dispersion) + y*sym.log(f)  
+            super(Negative_binomial, self).__init__(log_pdf=log_pdf, gp_link=gp_link, name='Negative_binomial')
+
+            # TODO: Check this.
+            self.log_concave = False
+
--- a/GPy/likelihoods/symbolic.py
+++ b/GPy/likelihoods/symbolic.py
@ -1,245 +1,260 @@
 # Copyright (c) 2014 GPy Authors
 # Licensed under the BSD 3-clause license (see LICENSE.txt)

+try:
+    import sympy as sym
+    sympy_available=True
+    from sympy.utilities.lambdify import lambdify
+except ImportError:
+    sympy_available=False
+
 import numpy as np
-import sympy as sym
-from sympy.utilities.lambdify import lambdify
 import link_functions
 from scipy import stats, integrate
 from scipy.special import gammaln, gamma, erf, polygamma
+from GPy.util.functions import cum_gaussian, ln_cum_gaussian
 from likelihood import Likelihood
 from ..core.parameterization import Param
-from ..core.parameterization.transformations import Logexp

-func_modules = ['numpy', {'gamma':gamma, 'gammaln':gammaln, 'erf':erf,'polygamma':polygamma}]
+func_modules = ['numpy', {'gamma':gamma, 'gammaln':gammaln, 'erf':erf,'polygamma':polygamma, 'cum_gaussian':cum_gaussian, 'ln_cum_gaussian':ln_cum_gaussian}]

-class Symbolic(Likelihood):
-    """
-    Symbolic likelihood.
-
-    Likelihood where the form of the likelihood is provided by a sympy expression.
-
-    """
-    def __init__(self, likelihood=None, log_likelihood=None, cdf=None, logZ=None, gp_link=None, name='symbolic', log_concave=False, param=None):
-        if gp_link is None:
-            gp_link = link_functions.Identity()
-
-        if likelihood is None and log_likelihood is None and cdf is None:
-            raise ValueError, "You must provide an argument for the likelihood or the log likelihood."
-
-        super(Symbolic, self).__init__(gp_link, name=name)
-
-        if likelihood is None and log_likelihood:
-            self._sp_likelihood = sym.exp(log_likelihood).simplify()
-            self._sp_log_likelihood = log_likelihood
-
-        if log_likelihood is None and likelihood:
-            self._sp_likelihood = likelihood
-            self._sp_log_likelihood = sym.log(likelihood).simplify()
-
-        # TODO: build likelihood and log likelihood from CDF or
-        # compute CDF given likelihood/log-likelihood. Also check log
-        # likelihood, likelihood and CDF are consistent.
-
-        # pull the variable names out of the symbolic likelihood
-        sp_vars = [e for e in self._sp_likelihood.atoms() if e.is_Symbol]
-        self._sp_f = [e for e in sp_vars if e.name=='f']
-        if not self._sp_f:
-            raise ValueError('No variable f in likelihood or log likelihood.')
-        self._sp_y = [e for e in sp_vars if e.name=='y']
-        if not self._sp_f:
-            raise ValueError('No variable y in likelihood or log likelihood.')
-        self._sp_theta = sorted([e for e in sp_vars if not (e.name=='f' or e.name=='y')],key=lambda e:e.name, reverse=True)
-
-        # These are all the arguments need to compute likelihoods.
-        self.arg_list = self._sp_y + self._sp_f + self._sp_theta
-
-        # these are arguments for computing derivatives.
-        derivative_arguments = self._sp_f + self._sp_theta
-        
-        # Do symbolic work to compute derivatives.
-        self._log_likelihood_derivatives = {theta.name : sym.diff(self._sp_log_likelihood,theta).simplify() for theta in derivative_arguments}
-        self._log_likelihood_second_derivatives = {theta.name : sym.diff(self._log_likelihood_derivatives['f'],theta).simplify() for theta in derivative_arguments}
-        self._log_likelihood_third_derivatives = {theta.name : sym.diff(self._log_likelihood_second_derivatives['f'],theta).simplify() for theta in derivative_arguments}
-
-        # Add parameters to the model.
-        for theta in self._sp_theta:
-            val = 1.0
-            # TODO: need to decide how to handle user passing values for the se parameter vectors.
-            if param is not None:
-                if param.has_key(theta):
-                    val = param[theta]
-            setattr(self, theta.name, Param(theta.name, val, None))
-            self.add_parameters(getattr(self, theta.name))
-
-
-        # Is there some way to check whether the likelihood is log
-        # concave? For the moment, need user to specify.
-        self.log_concave = log_concave
-
-        # initialise code arguments
-        self._arguments = {} 
-
-        # generate the code for the likelihood and derivatives
-        self._gen_code()
-
-    def _gen_code(self):
-        """Generate the code from the symbolic parts that will be used for likleihod computation."""
-        # TODO: Check here whether theano is available and set up
-        # functions accordingly.
-        self._likelihood_function = lambdify(self.arg_list, self._sp_likelihood, func_modules)
-        self._log_likelihood_function = lambdify(self.arg_list, self._sp_log_likelihood, func_modules)
-
-        # compute code for derivatives (for implicit likelihood terms
-        # we need up to 3rd derivatives)
-        setattr(self, '_first_derivative_code', {key: lambdify(self.arg_list, self._log_likelihood_derivatives[key], func_modules) for key in self._log_likelihood_derivatives.keys()})
-        setattr(self, '_second_derivative_code', {key: lambdify(self.arg_list, self._log_likelihood_second_derivatives[key], func_modules) for key in self._log_likelihood_second_derivatives.keys()})
-        setattr(self, '_third_derivative_code', {key: lambdify(self.arg_list, self._log_likelihood_third_derivatives[key], func_modules) for key in self._log_likelihood_third_derivatives.keys()})
-            
-        # TODO: compute EP code parts based on logZ. We need dlogZ/dmu, d2logZ/dmu2 and dlogZ/dtheta
-
-    def parameters_changed(self):
-        pass
-
-    def update_gradients(self, grads):
+if sympy_available:
+    class Symbolic(Likelihood):
        """
-        Pull out the gradients, be careful as the order must match the order
-        in which the parameters are added
-        """
-        # The way the Laplace approximation is run requires the
-        # covariance function to compute the true gradient (because it
-        # is dependent on the mode). This means we actually compute
-        # the gradient outside this object. This function would
-        # normally ask the object to update its gradients internally,
-        # but here it provides them externally, because they are
-        # computed in the inference code. TODO: Thought: How does this
-        # effect EP? Shouldn't this be done by a separate
-        # Laplace-approximation specific call?
-        for grad, theta in zip(grads, self._sp_theta):
-            parameter = getattr(self, theta.name)
-            setattr(parameter, 'gradient', grad)
+        Symbolic likelihood.

-    def _arguments_update(self, f, y):
-        """Set up argument lists for the derivatives."""
-        # If we do make use of Theano, then at this point we would
-        # need to do a lot of precomputation to ensure that the
-        # likelihoods and gradients are computed together, then check
-        # for parameter changes before updating.
-        for i, fvar in enumerate(self._sp_f):
-            self._arguments[fvar.name] =  f
-        for i, yvar in enumerate(self._sp_y):
-            self._arguments[yvar.name] = y
-        for theta in self._sp_theta:
-            self._arguments[theta.name] = np.asarray(getattr(self, theta.name))
-
-    def pdf_link(self, inv_link_f, y, Y_metadata=None):
-        """
-        Likelihood function given inverse link of f.
-
-        :param inv_link_f: inverse link of latent variables.
-        :type inv_link_f: Nx1 array
-        :param y: data
-        :type y: Nx1 array
-        :param Y_metadata: Y_metadata which is not used in student t distribution
-        :returns: likelihood evaluated for this point
-        :rtype: float
-        """
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape
-        self._arguments_update(inv_link_f, y)
-        l = self._likelihood_function(**self._arguments)
-        return np.prod(l)
-
-    def logpdf_link(self, inv_link_f, y, Y_metadata=None):
-        """
-        Log Likelihood Function given inverse link of latent variables.
-
-        :param inv_inv_link_f: latent variables (inverse link of f)
-        :type inv_inv_link_f: Nx1 array
-        :param y: data
-        :type y: Nx1 array
-        :param Y_metadata: Y_metadata 
-        :returns: likelihood evaluated for this point
-        :rtype: float
+        Likelihood where the form of the likelihood is provided by a sympy expression.

        """
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape
-        self._arguments_update(inv_link_f, y)
-        ll = self._log_likelihood_function(**self._arguments)
-        return np.sum(ll)
+        def __init__(self, pdf=None, log_pdf=None, cdf=None, logZ=None, gp_link=None, name='symbolic', log_concave=False, param=None):
+            if gp_link is None:
+                gp_link = link_functions.Identity()

-    def dlogpdf_dlink(self, inv_link_f, y, Y_metadata=None):
-        """
-        Gradient of log likelihood with respect to the inverse link function.
+            if pdf is None and log_pdf is None and cdf is None:
+                raise ValueError, "You must provide an argument for the pdf or the log pdf."

-        :param inv_inv_link_f: latent variables (inverse link of f)
-        :type inv_inv_link_f: Nx1 array
-        :param y: data
-        :type y: Nx1 array
-        :param Y_metadata: Y_metadata 
-        :returns: gradient of likelihood with respect to each point.
-        :rtype: Nx1 array
+            super(Symbolic, self).__init__(gp_link, name=name)

-        """
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
-        self._arguments_update(inv_link_f, y)
-        return self._first_derivative_code['f'](**self._arguments)
+            if pdf is None and log_pdf:
+                self._sp_pdf = sym.exp(log_pdf).simplify()
+                self._sp_log_pdf = log_pdf

-    def d2logpdf_dlink2(self, inv_link_f, y, Y_metadata=None):
-        """
-        Hessian of log likelihood given inverse link of latent variables with respect to that inverse link.
-        i.e. second derivative logpdf at y given inv_link(f_i) and inv_link(f_j)  w.r.t inv_link(f_i) and inv_link(f_j).
+            if log_pdf is None and pdf:
+                self._sp_pdf = pdf
+                self._sp_log_pdf = sym.log(pdf).simplify()
+
+            # TODO: build pdf and log pdf from CDF or
+            # compute CDF given pdf/log-pdf. Also check log
+            # pdf, pdf and CDF are consistent.
+
+            # pull the variable names out of the symbolic pdf
+            sp_vars = [e for e in self._sp_pdf.atoms() if e.is_Symbol]
+            self._sp_f = [e for e in sp_vars if e.name=='f']
+            if not self._sp_f:
+                raise ValueError('No variable f in pdf or log pdf.')
+            self._sp_y = [e for e in sp_vars if e.name=='y']
+            if not self._sp_f:
+                raise ValueError('No variable y in pdf or log pdf.')
+            self._sp_theta = sorted([e for e in sp_vars if not (e.name=='f' or e.name=='y')],key=lambda e:e.name)
+
+            # These are all the arguments needed to compute likelihoods.
+            self.arg_list = self._sp_y + self._sp_f + self._sp_theta
+
+            # these are arguments for computing derivatives.
+            derivative_arguments = self._sp_f + self._sp_theta
+
+            # Do symbolic work to compute derivatives.
+            self._log_pdf_derivatives = {theta.name : sym.diff(self._sp_log_pdf,theta).simplify() for theta in derivative_arguments}
+            self._log_pdf_second_derivatives = {theta.name : sym.diff(self._log_pdf_derivatives['f'],theta).simplify() for theta in derivative_arguments}
+            self._log_pdf_third_derivatives = {theta.name : sym.diff(self._log_pdf_second_derivatives['f'],theta).simplify() for theta in derivative_arguments}
+
+            # Add parameters to the model.
+            for theta in self._sp_theta:
+                val = 1.0
+                # TODO: need to decide how to handle user passing values for these parameter vectors.
+                if param is not None:
+                    if param.has_key(theta):
+                        val = param[theta]
+                setattr(self, theta.name, Param(theta.name, val, None))
+                self.add_parameters(getattr(self, theta.name))


-        :param inv_link_f: inverse link of the latent variables.
-        :type inv_link_f: Nx1 array
-        :param y: data
-        :type y: Nx1 array
-        :param Y_metadata: Y_metadata which is not used in student t distribution
-        :returns: Diagonal of Hessian matrix (second derivative of likelihood evaluated at points f)
-        :rtype: Nx1 array
+            # Is there some way to check whether the pdf is log
+            # concave? For the moment, need user to specify.
+            self.log_concave = log_concave

-        .. Note::
-            Returns diagonal of Hessian, since every where else it is
-            0, as the likelihood factorizes over cases (the
-            distribution for y_i depends only on link(f_i) not on
-            link(f_(j!=i))
-        """
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
-        self._arguments_update(inv_link_f, y)
-        return self._second_derivative_code['f'](**self._arguments)
+            # initialise code arguments
+            self._arguments = {} 

-    def d3logpdf_dlink3(self, inv_link_f, y, Y_metadata=None):
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
-        self._arguments_update(inv_link_f, y)
-        return self._third_derivative_code['f'](**self._arguments)
-        raise NotImplementedError
+            # generate the code for the pdf and derivatives
+            self._gen_code()

-    def dlogpdf_link_dtheta(self, inv_link_f, y, Y_metadata=None):
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
-        self._arguments_update(inv_link_f, y)
-        return np.hstack([self._first_derivative_code[theta.name](**self._arguments) for theta in self._sp_theta]).sum(0)
-            
-    def dlogpdf_dlink_dtheta(self, inv_link_f, y, Y_metadata=None):
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
-        self._arguments_update(inv_link_f, y)
-        return np.hstack([self._second_derivative_code[theta.name](**self._arguments) for theta in self._sp_theta])
+        def _gen_code(self):
+            """Generate the code from the symbolic parts that will be used for likelihood computation."""
+            # TODO: Check here whether theano is available and set up
+            # functions accordingly.
+            self._pdf_function = lambdify(self.arg_list, self._sp_pdf, func_modules)
+            self._log_pdf_function = lambdify(self.arg_list, self._sp_log_pdf, func_modules)

-    def d2logpdf_dlink2_dtheta(self, inv_link_f, y, Y_metadata=None):
-        assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
-        self._arguments_update(inv_link_f, y)
-        return np.hstack([self._third_derivative_code[theta.name](**self._arguments) for theta in self._sp_theta])
+            # compute code for derivatives (for implicit likelihood terms
+            # we need up to 3rd derivatives)
+            setattr(self, '_first_derivative_code', {key: lambdify(self.arg_list, self._log_pdf_derivatives[key], func_modules) for key in self._log_pdf_derivatives.keys()})
+            setattr(self, '_second_derivative_code', {key: lambdify(self.arg_list, self._log_pdf_second_derivatives[key], func_modules) for key in self._log_pdf_second_derivatives.keys()})
+            setattr(self, '_third_derivative_code', {key: lambdify(self.arg_list, self._log_pdf_third_derivatives[key], func_modules) for key in self._log_pdf_third_derivatives.keys()})

-    def predictive_mean(self, mu, sigma, Y_metadata=None):
-        raise NotImplementedError
+            # TODO: compute EP code parts based on logZ. We need dlogZ/dmu, d2logZ/dmu2 and dlogZ/dtheta

-    def predictive_variance(self, mu,variance, predictive_mean=None, Y_metadata=None):
-        raise NotImplementedError
+        def parameters_changed(self):
+            pass

-    def conditional_mean(self, gp):
-        raise NotImplementedError
+        def update_gradients(self, grads):
+            """
+            Pull out the gradients, be careful as the order must match the order
+            in which the parameters are added
+            """
+            # The way the Laplace approximation is run requires the
+            # covariance function to compute the true gradient (because it
+            # is dependent on the mode). This means we actually compute
+            # the gradient outside this object. This function would
+            # normally ask the object to update its gradients internally,
+            # but here it provides them externally, because they are
+            # computed in the inference code. TODO: Thought: How does this
+            # affect EP? Shouldn't this be done by a separate
+            # Laplace-approximation specific call?
+            for grad, theta in zip(grads, self._sp_theta):
+                parameter = getattr(self, theta.name)
+                setattr(parameter, 'gradient', grad)

-    def conditional_variance(self, gp):
-        raise NotImplementedError
+        def _arguments_update(self, f, y):
+            """Set up argument lists for the derivatives."""
+            # If we do make use of Theano, then at this point we would
+            # need to do a lot of precomputation to ensure that the
+            # likelihoods and gradients are computed together, then check
+            # for parameter changes before updating.
+            for i, fvar in enumerate(self._sp_f):
+                self._arguments[fvar.name] =  f
+            for i, yvar in enumerate(self._sp_y):
+                self._arguments[yvar.name] = y
+            for theta in self._sp_theta:
+                self._arguments[theta.name] = np.asarray(getattr(self, theta.name))

-    def samples(self, gp, Y_metadata=None):
-        raise NotImplementedError
+        def pdf_link(self, inv_link_f, y, Y_metadata=None):
+            """
+            Likelihood function given inverse link of f.
+
+            :param inv_link_f: inverse link of latent variables.
+            :type inv_link_f: Nx1 array
+            :param y: data
+            :type y: Nx1 array
+            :param Y_metadata: Y_metadata, which is not used by this likelihood
+            :returns: likelihood evaluated for this point
+            :rtype: float
+            """
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape
+            self._arguments_update(inv_link_f, y)
+            l = self._pdf_function(**self._arguments)
+            return np.prod(l)
+
+        def logpdf_link(self, inv_link_f, y, Y_metadata=None):
+            """
+            Log Likelihood Function given inverse link of latent variables.
+
+            :param inv_link_f: latent variables (inverse link of f)
+            :type inv_link_f: Nx1 array
+            :param y: data
+            :type y: Nx1 array
+            :param Y_metadata: Y_metadata 
+            :returns: likelihood evaluated for this point
+            :rtype: float
+
+            """
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape
+            self._arguments_update(inv_link_f, y)
+            ll = self._log_pdf_function(**self._arguments)
+            return np.sum(ll)
+
+        def dlogpdf_dlink(self, inv_link_f, y, Y_metadata=None):
+            """
+            Gradient of log likelihood with respect to the inverse link function.
+
+            :param inv_link_f: latent variables (inverse link of f)
+            :type inv_link_f: Nx1 array
+            :param y: data
+            :type y: Nx1 array
+            :param Y_metadata: Y_metadata 
+            :returns: gradient of likelihood with respect to each point.
+            :rtype: Nx1 array
+
+            """
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
+            self._arguments_update(inv_link_f, y)
+            return self._first_derivative_code['f'](**self._arguments)
+
+        def d2logpdf_dlink2(self, inv_link_f, y, Y_metadata=None):
+            """
+            Hessian of log likelihood given inverse link of latent variables with respect to that inverse link.
+            i.e. second derivative logpdf at y given inv_link(f_i) and inv_link(f_j)  w.r.t inv_link(f_i) and inv_link(f_j).
+
+
+            :param inv_link_f: inverse link of the latent variables.
+            :type inv_link_f: Nx1 array
+            :param y: data
+            :type y: Nx1 array
+            :param Y_metadata: Y_metadata, which is not used by this likelihood
+            :returns: Diagonal of Hessian matrix (second derivative of likelihood evaluated at points f)
+            :rtype: Nx1 array
+
+            .. Note::
+                Returns diagonal of Hessian, since everywhere else it is
+                0, as the likelihood factorizes over cases (the
+                distribution for y_i depends only on link(f_i), not on
+                link(f_(j!=i))).
+            """
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
+            self._arguments_update(inv_link_f, y)
+            return self._second_derivative_code['f'](**self._arguments)
+
+        def d3logpdf_dlink3(self, inv_link_f, y, Y_metadata=None):
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
+            self._arguments_update(inv_link_f, y)
+            return self._third_derivative_code['f'](**self._arguments)
+            raise NotImplementedError
+
+        def dlogpdf_link_dtheta(self, inv_link_f, y, Y_metadata=None):
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
+            self._arguments_update(inv_link_f, y)
+            g = np.zeros((y.shape[0], len(self._sp_theta)))
+            for i, theta in enumerate(self._sp_theta):
+                g[:, i:i+1] = self._first_derivative_code[theta.name](**self._arguments)
+            return g.sum(0)
+
+        def dlogpdf_dlink_dtheta(self, inv_link_f, y, Y_metadata=None):
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
+            self._arguments_update(inv_link_f, y)
+            g = np.zeros((y.shape[0], len(self._sp_theta)))
+            for i, theta in enumerate(self._sp_theta):
+                g[:, i:i+1] = self._second_derivative_code[theta.name](**self._arguments)
+            return g
+
+        def d2logpdf_dlink2_dtheta(self, inv_link_f, y, Y_metadata=None):
+            assert np.atleast_1d(inv_link_f).shape == np.atleast_1d(y).shape 
+            self._arguments_update(inv_link_f, y)
+            g = np.zeros((y.shape[0], len(self._sp_theta)))
+            for i, theta in enumerate(self._sp_theta):
+                g[:, i:i+1] = self._third_derivative_code[theta.name](**self._arguments)
+            return g
+
+        def predictive_mean(self, mu, sigma, Y_metadata=None):
+            raise NotImplementedError
+
+        def predictive_variance(self, mu,variance, predictive_mean=None, Y_metadata=None):
+            raise NotImplementedError
+
+        def conditional_mean(self, gp):
+            raise NotImplementedError
+
+        def conditional_variance(self, gp):
+            raise NotImplementedError
+
+        def samples(self, gp, Y_metadata=None):
+            raise NotImplementedError
--- a/GPy/util/datasets.py
+++ b/GPy/util/datasets.py
@ -331,7 +331,7 @@ def football_data(season='1314', data_set='football_data'):

 # This will be for downloading google trends data.
 def google_trends(query_terms=['big data', 'machine learning', 'data science'], data_set='google_trends'):
-    """Data downloaded from Google trends for given query terms."""
+    """Data downloaded from Google trends for given query terms. Warning, if you use this function multiple times in a row you get blocked due to terms of service violations."""
    # Inspired by this notebook:
    # http://nbviewer.ipython.org/github/sahuguet/notebooks/blob/master/GoogleTrends%20meet%20Notebook.ipynb

--- a/GPy/util/symbolic.py
+++ b/GPy/util/symbolic.py
@ -1,12 +1,48 @@
-from sympy import Function, S, oo, I, cos, sin, asin, log, erf, pi, exp, sqrt, sign, gamma
+from sympy import Function, S, oo, I, cos, sin, asin, log, erf, pi, exp, sqrt, sign, gamma,polygamma

 class gammaln(Function):
    nargs = 1
+
+    def fdiff(self, argindex=1):
+        x=self.args[0]
+        return polygamma(0, x)
+
    @classmethod
    def eval(cls, x):
-        return log(gamma(x))
+        if x.is_Number:
+            return log(gamma(x))
    

+class ln_cum_gaussian(Function):
+    nargs = 1
+
+    def fdiff(self, argindex=1):
+        x = self.args[0]
+        return 1/cum_gaussian(x)*gaussian(x)
+
+    @classmethod
+    def eval(cls, x):
+        if x.is_Number:
+            return log(cum_gaussian(x))
+
+class cum_gaussian(Function):
+    nargs = 1
+    def fdiff(self, argindex=1):
+        x = self.args[0]
+        return gaussian(x)
+
+    @classmethod
+    def eval(cls, x):
+        if x.is_Number:
+            return 0.5*(1+erf(sqrt(2)/2*x))
+
+class gaussian(Function):
+    nargs = 1
+    @classmethod
+    def eval(cls, x):
+        return 1/sqrt(2*pi)*exp(-0.5*x*x)
+
+
 class ln_diff_erf(Function):
    nargs = 2