GPy/GPy/kern/_src/kern.py

228 lines
9.1 KiB
Python
Raw Normal View History

2014-02-19 15:00:48 +00:00
# Copyright (c) 2012, GPy authors (see AUTHORS.txt).
# Licensed under the BSD 3-clause license (see LICENSE.txt)
import sys
2014-03-11 10:24:15 +00:00
import numpy as np
2014-03-11 16:24:09 +00:00
from ...core.parameterization.parameterized import Parameterized
from kernel_slice_operations import KernCallsViaSlicerMeta
from ...util.caching import Cache_this
2014-02-19 15:00:48 +00:00
2014-03-11 16:24:09 +00:00
2014-03-11 10:24:15 +00:00
2014-02-19 15:00:48 +00:00
class Kern(Parameterized):
    #===========================================================================
    # This adds input slice support. The rather ugly code for slicing can be
    # found in kernel_slice_operations
    __metaclass__ = KernCallsViaSlicerMeta
    #===========================================================================
    _debug = False

    def __init__(self, input_dim, active_dims, name, *a, **kw):
        """
        The base class for a kernel: a positive definite function
        which forms of a covariance function (kernel).

        :param int input_dim: the number of input dimensions to the function
        :param array-like|slice active_dims: list of indices of the dimensions
            this kernel works on, or a slice over them. If None, the kernel
            works on the first input_dim dimensions.
        :param str name: the name of this kernel

        Do not instantiate.
        """
        super(Kern, self).__init__(name=name, *a, **kw)
        # Default to all input dimensions when no active_dims are given.
        self.active_dims = active_dims if active_dims is not None else slice(0, input_dim)
        self.input_dim = input_dim
        assert isinstance(self.active_dims, (slice, list, tuple, np.ndarray)), 'active_dims needs to be an array-like or slice object over dimensions, {} given'.format(self.active_dims.__class__)
        if isinstance(self.active_dims, slice):
            # Normalize the slice so start, stop and step are always concrete ints.
            self.active_dims = slice(self.active_dims.start or 0, self.active_dims.stop or self.input_dim, self.active_dims.step or 1)
            active_dim_size = int(np.round((self.active_dims.stop - self.active_dims.start) / self.active_dims.step))
        elif isinstance(self.active_dims, np.ndarray):
            assert self.active_dims.ndim == 1, 'only flat indices allowed, given active_dims.shape={}, provide only indexes to the dimensions of the input'.format(self.active_dims.shape)
            active_dim_size = self.active_dims.size
        else:
            active_dim_size = len(self.active_dims)
        # The number of active dimensions must match the declared input_dim.
        assert active_dim_size == self.input_dim, "input_dim={} does not match len(active_dim)={}, active_dims={}".format(self.input_dim, active_dim_size, self.active_dims)
        self._sliced_X = 0

    @Cache_this(limit=10)
    def _slice_X(self, X):
        # Select only the columns this kernel works on. Cached, since the
        # same X is typically sliced repeatedly during inference.
        return X[:, self.active_dims]

    def K(self, X, X2):
        """
        Compute the kernel function.

        :param X: the first set of inputs to the kernel
        :param X2: (optional) the second set of arguments to the kernel. If X2
                   is None, this is passed through to the 'part' object, which
                   handles this as X2 == X.
        """
        raise NotImplementedError

    def Kdiag(self, X):
        """Compute the diagonal of the kernel matrix K(X, X)."""
        raise NotImplementedError

    def psi0(self, Z, variational_posterior):
        """Expectation of Kdiag under the variational posterior q(X)."""
        raise NotImplementedError

    def psi1(self, Z, variational_posterior):
        """Expectation of K(X, Z) under the variational posterior q(X)."""
        raise NotImplementedError

    def psi2(self, Z, variational_posterior):
        """Expectation of K(Z, X)K(X, Z) under the variational posterior q(X)."""
        raise NotImplementedError

    def gradients_X(self, dL_dK, X, X2):
        """Compute the gradient of the objective wrt X, chain-ruling via dL_dK."""
        raise NotImplementedError

    def gradients_X_diag(self, dL_dKdiag, X):
        """Compute the gradient of the objective wrt X, using only the diagonal of K."""
        raise NotImplementedError

    def update_gradients_diag(self, dL_dKdiag, X):
        """ update the gradients of all parameters when using only the diagonal elements of the covariance matrix"""
        raise NotImplementedError

    def update_gradients_full(self, dL_dK, X, X2):
        """Set the gradients of all parameters when doing full (N) inference."""
        raise NotImplementedError

    def update_gradients_expectations(self, dL_dpsi0, dL_dpsi1, dL_dpsi2, Z, variational_posterior):
        """
        Set the gradients of all parameters when doing inference with
        uncertain inputs, using expectations of the kernel.

        The essential maths is

        dL_d{theta_i} = dL_dpsi0 * dpsi0_d{theta_i} +
                        dL_dpsi1 * dpsi1_d{theta_i} +
                        dL_dpsi2 * dpsi2_d{theta_i}
        """
        raise NotImplementedError

    def gradients_Z_expectations(self, dL_dpsi1, dL_dpsi2, Z, variational_posterior):
        """
        Returns the derivative of the objective wrt Z, using the chain rule
        through the expectation variables.
        """
        raise NotImplementedError

    def gradients_qX_expectations(self, dL_dpsi0, dL_dpsi1, dL_dpsi2, Z, variational_posterior):
        """
        Compute the gradients wrt the parameters of the variational
        distruibution q(X), chain-ruling via the expectations of the kernel
        """
        raise NotImplementedError

    def plot(self, *args, **kwargs):
        """
        See GPy.plotting.matplot_dep.plot
        """
        assert "matplotlib" in sys.modules, "matplotlib package has not been imported."
        from ...plotting.matplot_dep import kernel_plots
        # Forward keyword arguments too; they were silently dropped before.
        kernel_plots.plot(self, *args, **kwargs)

    def plot_ARD(self, *args, **kw):
        """
        See :class:`~GPy.plotting.matplot_dep.kernel_plots`
        """
        # sys is already imported at module level; no local import needed.
        assert "matplotlib" in sys.modules, "matplotlib package has not been imported."
        from ...plotting.matplot_dep import kernel_plots
        return kernel_plots.plot_ARD(self, *args, **kw)

    def input_sensitivity(self):
        """
        Returns the sensitivity for each dimension of this kernel.
        """
        return np.zeros(self.input_dim)

    def __add__(self, other):
        """ Overloading of the '+' operator. for more control, see self.add """
        return self.add(other)

    def add(self, other, name='add'):
        """
        Add another kernel to this one.

        :param other: the other kernel to be added
        :type other: GPy.kern
        :param str name: the name of the resulting Add kernel
        """
        assert isinstance(other, Kern), "only kernels can be added to kernels..."
        from add import Add
        return Add([self, other], name=name)

    def __mul__(self, other):
        """ Here we overload the '*' operator. See self.prod for more information"""
        return self.prod(other)

    def __pow__(self, other):
        """
        Shortcut for tensor `prod`: shifts `other` onto the dimensions after
        this kernel's input dimensions and multiplies the two kernels.
        """
        # NOTE(fix): the former comparison `active_dims == range(input_dim)`
        # could never hold for slices (always False) and raised ValueError for
        # numpy index arrays; compare as index arrays instead (np.r_ expands
        # slices to explicit indices).
        assert np.array_equal(np.r_[self.active_dims], np.arange(self.input_dim)), "Can only use kernels, which have their input_dims defined from 0"
        assert np.array_equal(np.r_[other.active_dims], np.arange(other.input_dim)), "Can only use kernels, which have their input_dims defined from 0"
        # Slices do not support '+=', so convert to an index array before shifting.
        other.active_dims = np.r_[other.active_dims] + self.input_dim
        return self.prod(other)

    def prod(self, other, name='mul'):
        """
        Multiply two kernels (either on the same space, or on the tensor
        product of the input space).

        :param other: the other kernel to be multiplied
        :type other: GPy.kern
        :param str name: the name of the resulting Prod kernel
        """
        assert isinstance(other, Kern), "only kernels can be multiplied with kernels..."
        from prod import Prod
        return Prod([self, other], name)

    def _getstate(self):
        """
        Get the current state of the class,
        here just all the indices, rest can get recomputed
        """
        return super(Kern, self)._getstate() + [
                self.active_dims,
                self.input_dim,
                self._sliced_X]

    def _setstate(self, state):
        # Pop in reverse order of _getstate's append order.
        self._sliced_X = state.pop()
        self.input_dim = state.pop()
        self.active_dims = state.pop()
        super(Kern, self)._setstate(state)
2014-03-11 10:24:15 +00:00
class CombinationKernel(Kern):
    """
    Abstract super class for combination kernels.
    A combination kernel combines (a list of) kernels and works on those.
    Examples are the HierarchicalKernel or Add and Prod kernels.
    """
    def __init__(self, kernels, name, extra_dims=None):
        """
        Abstract super class for combination kernels.
        A combination kernel combines (a list of) kernels and works on those.
        Examples are the HierarchicalKernel or Add and Prod kernels.

        :param list kernels: List of kernels to combine (can be only one element)
        :param str name: name of the combination kernel
        :param array-like|slice extra_dims: if needed extra dimensions for the combination kernel to work on
        """
        assert all(isinstance(k, Kern) for k in kernels)
        # Give a clear error early: active_dims.max() below would otherwise
        # fail with an opaque numpy error on an empty list.
        assert len(kernels) > 0, "need at least one kernel to combine"
        # NOTE(fix): the default used to be the mutable literal [], which is
        # shared across calls; use None as the default and convert here.
        extra_dims = [] if extra_dims is None else extra_dims
        # The union of all dimensions the parts act on (np.r_ expands slices).
        active_dims = reduce(np.union1d, (np.r_[x.active_dims] for x in kernels), np.array([], dtype=int))
        input_dim = active_dims.max() + 1 + len(extra_dims)
        # The combination kernel itself works on the full input range.
        active_dims = slice(input_dim)
        # initialize the kernel with the full input_dim
        super(CombinationKernel, self).__init__(input_dim, active_dims, name)
        self.extra_dims = extra_dims
        self.add_parameters(*kernels)

    @property
    def parts(self):
        # The combined sub-kernels, stored as this kernel's parameters.
        return self._parameters_

    def input_sensitivity(self):
        """
        Returns one row of sensitivities per part, over the full input_dim;
        dimensions a part does not act on stay zero.
        """
        in_sen = np.zeros((self.num_params, self.input_dim))
        for i, p in enumerate(self.parts):
            in_sen[i, p.active_dims] = p.input_sensitivity()
        return in_sen