mirror of
https://github.com/SheffieldML/GPy.git
synced 2026-05-09 20:12:38 +02:00
[statespace] make predict comply to gpy standards (no confidence interval)
This commit is contained in:
parent
5f3956478f
commit
d6ccccc7e4
1 changed files with 76 additions and 84 deletions
|
|
@ -15,52 +15,43 @@
|
|||
#
|
||||
|
||||
import numpy as np
|
||||
from scipy import linalg
|
||||
from scipy import stats
|
||||
from ..core import Model
|
||||
from .. import kern
|
||||
#from GPy.plotting.matplot_dep.models_plots import gpplot
|
||||
#from GPy.plotting.matplot_dep.base_plots import x_frame1D
|
||||
#from GPy.plotting.matplot_dep import Tango
|
||||
#import pylab as pb
|
||||
from GPy.core.parameterization.param import Param
|
||||
|
||||
import GPy
|
||||
from .. import likelihoods
|
||||
|
||||
#from . import state_space_setup as ss_setup
|
||||
from ..core import Model
|
||||
from . import state_space_main as ssm
|
||||
from . import state_space_setup as ss_setup
|
||||
|
||||
class StateSpace(Model):
|
||||
def __init__(self, X, Y, kernel=None, noise_var=1.0, kalman_filter_type = 'regular', use_cython = False, name='StateSpace'):
|
||||
super(StateSpace, self).__init__(name=name)
|
||||
|
||||
|
||||
if len(X.shape) == 1:
|
||||
X = np.atleast_2d(X).T
|
||||
self.num_data, input_dim = X.shape
|
||||
|
||||
self.num_data, self.input_dim = X.shape
|
||||
|
||||
if len(Y.shape) == 1:
|
||||
Y = np.atleast_2d(Y).T
|
||||
|
||||
assert input_dim==1, "State space methods are only for 1D data"
|
||||
|
||||
|
||||
assert self.input_dim==1, "State space methods are only for 1D data"
|
||||
|
||||
if len(Y.shape)==2:
|
||||
num_data_Y, self.output_dim = Y.shape
|
||||
ts_number = None
|
||||
elif len(Y.shape)==3:
|
||||
num_data_Y, self.output_dim, ts_number = Y.shape
|
||||
|
||||
|
||||
self.ts_number = ts_number
|
||||
|
||||
|
||||
assert num_data_Y == self.num_data, "X and Y data don't match"
|
||||
assert self.output_dim == 1, "State space methods are for single outputs only"
|
||||
|
||||
self.kalman_filter_type = kalman_filter_type
|
||||
#self.kalman_filter_type = 'svd' # temp test
|
||||
ss_setup.use_cython = use_cython
|
||||
|
||||
|
||||
#import pdb; pdb.set_trace()
|
||||
|
||||
|
||||
global ssm
|
||||
#from . import state_space_main as ssm
|
||||
if (ssm.cython_code_available) and (ssm.use_cython != ss_setup.use_cython):
|
||||
|
|
@ -72,13 +63,13 @@ class StateSpace(Model):
|
|||
|
||||
# Noise variance
|
||||
self.likelihood = likelihoods.Gaussian(variance=noise_var)
|
||||
|
||||
|
||||
# Default kernel
|
||||
if kernel is None:
|
||||
raise ValueError("State-Space Model: the kernel must be provided.")
|
||||
else:
|
||||
self.kern = kernel
|
||||
|
||||
|
||||
self.link_parameter(self.kern)
|
||||
self.link_parameter(self.likelihood)
|
||||
self.posterior = None
|
||||
|
|
@ -92,14 +83,14 @@ class StateSpace(Model):
|
|||
"""
|
||||
Parameters have now changed
|
||||
"""
|
||||
|
||||
|
||||
#np.set_printoptions(16)
|
||||
#print(self.param_array)
|
||||
#import pdb; pdb.set_trace()
|
||||
|
||||
|
||||
# Get the model matrices from the kernel
|
||||
(F,L,Qc,H,P_inf, P0, dFt,dQct,dP_inft, dP0t) = self.kern.sde()
|
||||
|
||||
|
||||
# necessary parameters
|
||||
measurement_dim = self.output_dim
|
||||
grad_params_no = dFt.shape[2]+1 # we also add measurement noise as a parameter
|
||||
|
|
@ -109,30 +100,30 @@ class StateSpace(Model):
|
|||
dQc = np.zeros([dQct.shape[0],dQct.shape[1],grad_params_no])
|
||||
dP_inf = np.zeros([dP_inft.shape[0],dP_inft.shape[1],grad_params_no])
|
||||
dP0 = np.zeros([dP0t.shape[0],dP0t.shape[1],grad_params_no])
|
||||
|
||||
|
||||
# Assign the values for the kernel function
|
||||
dF[:,:,:-1] = dFt
|
||||
dQc[:,:,:-1] = dQct
|
||||
dP_inf[:,:,:-1] = dP_inft
|
||||
dP0[:,:,:-1] = dP0t
|
||||
|
||||
|
||||
# The sigma2 derivative
|
||||
dR = np.zeros([measurement_dim,measurement_dim,grad_params_no])
|
||||
dR[:,:,-1] = np.eye(measurement_dim)
|
||||
|
||||
# Balancing
|
||||
#(F,L,Qc,H,P_inf,P0, dF,dQc,dP_inf,dP0) = ssm.balance_ss_model(F,L,Qc,H,P_inf,P0, dF,dQc,dP_inf, dP0)
|
||||
|
||||
# Use the Kalman filter to evaluate the likelihood
|
||||
|
||||
# Use the Kalman filter to evaluate the likelihood
|
||||
grad_calc_params = {}
|
||||
grad_calc_params['dP_inf'] = dP_inf
|
||||
grad_calc_params['dF'] = dF
|
||||
grad_calc_params['dQc'] = dQc
|
||||
grad_calc_params['dR'] = dR
|
||||
grad_calc_params['dP_init'] = dP0
|
||||
|
||||
|
||||
kalman_filter_type = self.kalman_filter_type
|
||||
|
||||
|
||||
# The following code is required because sometimes the shapes of self.Y
|
||||
# becomes 3D even though is must be 2D. The reason is undescovered.
|
||||
Y = self.Y
|
||||
|
|
@ -140,63 +131,63 @@ class StateSpace(Model):
|
|||
Y.shape = (self.num_data,1)
|
||||
else:
|
||||
Y.shape = (self.num_data,1,self.ts_number)
|
||||
|
||||
(filter_means, filter_covs, log_likelihood,
|
||||
|
||||
(filter_means, filter_covs, log_likelihood,
|
||||
grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(F,L,Qc,H,
|
||||
float(self.Gaussian_noise.variance),P_inf,self.X,Y,m_init=None,
|
||||
P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
|
||||
calc_grad_log_likelihood=True,
|
||||
grad_params_no=grad_params_no,
|
||||
P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
|
||||
calc_grad_log_likelihood=True,
|
||||
grad_params_no=grad_params_no,
|
||||
grad_calc_params=grad_calc_params)
|
||||
|
||||
|
||||
if np.any( np.isfinite(log_likelihood) == False):
|
||||
#import pdb; pdb.set_trace()
|
||||
print("State-Space: NaN valkues in the log_likelihood")
|
||||
|
||||
|
||||
if np.any( np.isfinite(grad_log_likelihood) == False):
|
||||
#import pdb; pdb.set_trace()
|
||||
print("State-Space: NaN valkues in the grad_log_likelihood")
|
||||
#print(grad_log_likelihood)
|
||||
|
||||
|
||||
grad_log_likelihood_sum = np.sum(grad_log_likelihood,axis=1)
|
||||
grad_log_likelihood_sum.shape = (grad_log_likelihood_sum.shape[0],1)
|
||||
self._log_marginal_likelihood = np.sum( log_likelihood,axis=1 )
|
||||
self.likelihood.update_gradients(grad_log_likelihood_sum[-1,0])
|
||||
|
||||
|
||||
self.kern.sde_update_gradient_full(grad_log_likelihood_sum[:-1,0])
|
||||
|
||||
|
||||
def log_likelihood(self):
|
||||
return self._log_marginal_likelihood
|
||||
|
||||
def _raw_predict(self, Xnew=None, Ynew=None, filteronly=False):
|
||||
def _raw_predict(self, Xnew=None, Ynew=None, filteronly=False, **kw):
|
||||
"""
|
||||
Performs the actual prediction for new X points.
|
||||
Inner function. It is called only from inside this class.
|
||||
|
||||
|
||||
Input:
|
||||
---------------------
|
||||
|
||||
|
||||
Xnews: vector or (n_points,1) matrix
|
||||
New time points where to evaluate predictions.
|
||||
|
||||
|
||||
Ynews: (n_train_points, ts_no) matrix
|
||||
This matrix can substitude the original training points (in order
|
||||
This matrix can substitude the original training points (in order
|
||||
to use only the parameters of the model).
|
||||
|
||||
|
||||
filteronly: bool
|
||||
Use only Kalman Filter for prediction. In this case the output does
|
||||
not coincide with corresponding Gaussian process.
|
||||
|
||||
|
||||
Output:
|
||||
--------------------
|
||||
|
||||
|
||||
m: vector
|
||||
Mean prediction
|
||||
|
||||
|
||||
V: vector
|
||||
Variance in every point
|
||||
"""
|
||||
|
||||
|
||||
# Set defaults
|
||||
if Ynew is None:
|
||||
Ynew = self.Y
|
||||
|
|
@ -209,8 +200,8 @@ class StateSpace(Model):
|
|||
else:
|
||||
X = self.X
|
||||
Y = Ynew
|
||||
predict_only_training = True
|
||||
|
||||
predict_only_training = True
|
||||
|
||||
# Sort the matrix (save the order)
|
||||
_, return_index, return_inverse = np.unique(X,True,True)
|
||||
X = X[return_index] # TODO they are not used
|
||||
|
|
@ -218,37 +209,37 @@ class StateSpace(Model):
|
|||
|
||||
# Get the model matrices from the kernel
|
||||
(F,L,Qc,H,P_inf, P0, dF,dQc,dP_inf,dP0) = self.kern.sde()
|
||||
state_dim = F.shape[0]
|
||||
|
||||
state_dim = F.shape[0]
|
||||
|
||||
#Y = self.Y[:, 0,0]
|
||||
# Run the Kalman filter
|
||||
#import pdb; pdb.set_trace()
|
||||
kalman_filter_type = self.kalman_filter_type
|
||||
|
||||
|
||||
(M, P, log_likelihood,
|
||||
grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(
|
||||
F,L,Qc,H,float(self.Gaussian_noise.variance),P_inf,X,Y,m_init=None,
|
||||
P_init=P0, p_kalman_filter_type = kalman_filter_type,
|
||||
calc_log_likelihood=False,
|
||||
P_init=P0, p_kalman_filter_type = kalman_filter_type,
|
||||
calc_log_likelihood=False,
|
||||
calc_grad_log_likelihood=False)
|
||||
|
||||
# (filter_means, filter_covs, log_likelihood,
|
||||
|
||||
# (filter_means, filter_covs, log_likelihood,
|
||||
# grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(F,L,Qc,H,
|
||||
# float(self.Gaussian_noise.variance),P_inf,self.X,self.Y,m_init=None,
|
||||
# P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
|
||||
# calc_grad_log_likelihood=True,
|
||||
# grad_params_no=grad_params_no,
|
||||
# P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
|
||||
# calc_grad_log_likelihood=True,
|
||||
# grad_params_no=grad_params_no,
|
||||
# grad_calc_params=grad_calc_params)
|
||||
|
||||
|
||||
# Run the Rauch-Tung-Striebel smoother
|
||||
if not filteronly:
|
||||
(M, P) = ssm.ContDescrStateSpace.cont_discr_rts_smoother(state_dim, M, P,
|
||||
(M, P) = ssm.ContDescrStateSpace.cont_discr_rts_smoother(state_dim, M, P,
|
||||
p_dynamic_callables=SmootherMatrObject, X=X, F=F,L=L,Qc=Qc)
|
||||
|
||||
# remove initial values
|
||||
|
||||
# remove initial values
|
||||
M = M[1:,:,:]
|
||||
P = P[1:,:,:]
|
||||
|
||||
P = P[1:,:,:]
|
||||
|
||||
# Put the data back in the original order
|
||||
M = M[return_inverse,:,:]
|
||||
P = P[return_inverse,:,:]
|
||||
|
|
@ -257,40 +248,41 @@ class StateSpace(Model):
|
|||
if not predict_only_training:
|
||||
M = M[self.num_data:,:,:]
|
||||
P = P[self.num_data:,:,:]
|
||||
|
||||
|
||||
# Calculate the mean and variance
|
||||
# after einsum m has dimension in 3D (sample_num, dim_no,time_series_no)
|
||||
m = np.einsum('ijl,kj', M, H)# np.dot(M,H.T)
|
||||
m.shape = (m.shape[0], m.shape[1]) # remove the third dimension
|
||||
|
||||
|
||||
V = np.einsum('ij,ajk,kl', H, P, H.T)
|
||||
|
||||
|
||||
V.shape = (V.shape[0], V.shape[1]) # remove the third dimension
|
||||
|
||||
# Return the posterior of the state
|
||||
return (m, V)
|
||||
|
||||
def predict(self, Xnew=None, filteronly=False):
|
||||
def predict(self, Xnew=None, filteronly=False, include_likelihood=True, **kw):
|
||||
|
||||
# Run the Kalman filter to get the state
|
||||
(m, V) = self._raw_predict(Xnew,filteronly=filteronly)
|
||||
|
||||
# Add the noise variance to the state variance
|
||||
V += float(self.Gaussian_noise.variance)
|
||||
if include_likelihood:
|
||||
V += float(self.likelihood.variance)
|
||||
|
||||
# Lower and upper bounds
|
||||
lower = m - 2*np.sqrt(V)
|
||||
upper = m + 2*np.sqrt(V)
|
||||
#lower = m - 2*np.sqrt(V)
|
||||
#upper = m + 2*np.sqrt(V)
|
||||
|
||||
# Return mean and variance
|
||||
return (m, V, lower, upper)
|
||||
|
||||
def predict_quantiles(self, Xnew=None, quantiles=(2.5, 97.5)):
|
||||
return m, V
|
||||
|
||||
def predict_quantiles(self, Xnew=None, quantiles=(2.5, 97.5), **kw):
|
||||
mu, var = self._raw_predict(Xnew)
|
||||
#import pdb; pdb.set_trace()
|
||||
return [stats.norm.ppf(q/100.)*np.sqrt(var + float(self.Gaussian_noise.variance)) + mu for q in quantiles]
|
||||
|
||||
|
||||
|
||||
|
||||
# def plot(self, plot_limits=None, levels=20, samples=0, fignum=None,
|
||||
# ax=None, resolution=None, plot_raw=False, plot_filter=False,
|
||||
# linecol=Tango.colorsHex['darkBlue'],fillcol=Tango.colorsHex['lightBlue']):
|
||||
|
|
@ -399,8 +391,8 @@ class StateSpace(Model):
|
|||
#
|
||||
# # Return trajectory
|
||||
# return Y
|
||||
#
|
||||
#
|
||||
#
|
||||
#
|
||||
# def simulate(self,F,L,Qc,Pinf,X,size=1):
|
||||
# # Simulate a trajectory using the state space model
|
||||
#
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue