[statespace] make predict comply with GPy standards (no confidence interval)

2026-05-09 20:12:38 +02:00 · 2016-04-04 15:37:51 +01:00 · 2016-04-04 15:37:51 +01:00 · d6ccccc7e4
commit d6ccccc7e4
parent 5f3956478f
1 changed files with 76 additions and 84 deletions
--- a/GPy/models/state_space_model.py
+++ b/GPy/models/state_space_model.py
@ -15,52 +15,43 @@
 #

 import numpy as np
-from scipy import linalg
 from scipy import stats
-from ..core import Model
-from .. import kern
-#from GPy.plotting.matplot_dep.models_plots import gpplot
-#from GPy.plotting.matplot_dep.base_plots import x_frame1D
-#from GPy.plotting.matplot_dep import Tango
-#import pylab as pb
-from GPy.core.parameterization.param import Param
-
-import GPy
 from .. import likelihoods
-
+#from . import state_space_setup as ss_setup
+from ..core import Model
 from . import state_space_main as ssm
 from . import state_space_setup as ss_setup

 class StateSpace(Model):
    def __init__(self, X, Y, kernel=None, noise_var=1.0, kalman_filter_type = 'regular', use_cython = False, name='StateSpace'):
        super(StateSpace, self).__init__(name=name)
-        
+
        if len(X.shape) == 1:
            X = np.atleast_2d(X).T
-        self.num_data, input_dim = X.shape
-        
+        self.num_data, self.input_dim = X.shape
+
        if len(Y.shape) == 1:
            Y = np.atleast_2d(Y).T
-                
-        assert input_dim==1, "State space methods are only for 1D data"
-        
+
+        assert self.input_dim==1, "State space methods are only for 1D data"
+
        if len(Y.shape)==2:
            num_data_Y, self.output_dim = Y.shape
            ts_number = None
        elif len(Y.shape)==3:
            num_data_Y, self.output_dim, ts_number = Y.shape
-        
+
        self.ts_number = ts_number
-        
+
        assert num_data_Y == self.num_data, "X and Y data don't match"
        assert self.output_dim == 1, "State space methods are for single outputs only"

        self.kalman_filter_type = kalman_filter_type
        #self.kalman_filter_type = 'svd' # temp test
        ss_setup.use_cython = use_cython
-        
+
        #import pdb; pdb.set_trace()
-        
+
        global ssm
        #from . import state_space_main as ssm
        if (ssm.cython_code_available) and (ssm.use_cython != ss_setup.use_cython):
@ -72,13 +63,13 @@ class StateSpace(Model):

        # Noise variance
        self.likelihood = likelihoods.Gaussian(variance=noise_var)
-        
+
        # Default kernel
        if kernel is None:
            raise ValueError("State-Space Model: the kernel must be provided.")
        else:
            self.kern = kernel
-            
+
        self.link_parameter(self.kern)
        self.link_parameter(self.likelihood)
        self.posterior = None
@ -92,14 +83,14 @@ class StateSpace(Model):
        """
        Parameters have now changed
        """
-    
+
        #np.set_printoptions(16)
        #print(self.param_array)
        #import pdb; pdb.set_trace()
-        
+
        # Get the model matrices from the kernel
        (F,L,Qc,H,P_inf, P0, dFt,dQct,dP_inft, dP0t) = self.kern.sde()
-        
+
        # necessary parameters
        measurement_dim = self.output_dim
        grad_params_no = dFt.shape[2]+1 # we also add measurement noise as a parameter
@ -109,30 +100,30 @@ class StateSpace(Model):
        dQc   = np.zeros([dQct.shape[0],dQct.shape[1],grad_params_no])
        dP_inf = np.zeros([dP_inft.shape[0],dP_inft.shape[1],grad_params_no])
        dP0 = np.zeros([dP0t.shape[0],dP0t.shape[1],grad_params_no])
-        
+
        # Assign the values for the kernel function
        dF[:,:,:-1] = dFt
        dQc[:,:,:-1] = dQct
        dP_inf[:,:,:-1] = dP_inft
        dP0[:,:,:-1] = dP0t
-        
+
        # The sigma2 derivative
        dR = np.zeros([measurement_dim,measurement_dim,grad_params_no])
        dR[:,:,-1] = np.eye(measurement_dim)

        # Balancing
        #(F,L,Qc,H,P_inf,P0, dF,dQc,dP_inf,dP0) = ssm.balance_ss_model(F,L,Qc,H,P_inf,P0, dF,dQc,dP_inf, dP0)
-        
-        # Use the Kalman filter to evaluate the likelihood        
+
+        # Use the Kalman filter to evaluate the likelihood
        grad_calc_params = {}
        grad_calc_params['dP_inf'] = dP_inf
        grad_calc_params['dF'] = dF
        grad_calc_params['dQc'] = dQc
        grad_calc_params['dR'] = dR
        grad_calc_params['dP_init'] = dP0
-        
+
        kalman_filter_type = self.kalman_filter_type
-             
+
        # The following code is required because sometimes the shapes of self.Y
        # becomes 3D even though is must be 2D. The reason is undescovered.
        Y = self.Y
@ -140,63 +131,63 @@ class StateSpace(Model):
            Y.shape = (self.num_data,1)
        else:
            Y.shape = (self.num_data,1,self.ts_number)
-            
-        (filter_means, filter_covs, log_likelihood, 
+
+        (filter_means, filter_covs, log_likelihood,
         grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(F,L,Qc,H,
                                      float(self.Gaussian_noise.variance),P_inf,self.X,Y,m_init=None,
-                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True, 
-                                      calc_grad_log_likelihood=True, 
-                                      grad_params_no=grad_params_no, 
+                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
+                                      calc_grad_log_likelihood=True,
+                                      grad_params_no=grad_params_no,
                                      grad_calc_params=grad_calc_params)
-            
+
        if np.any( np.isfinite(log_likelihood) == False):
            #import pdb; pdb.set_trace()
            print("State-Space: NaN valkues in the log_likelihood")
-        
+
        if np.any( np.isfinite(grad_log_likelihood) == False):
            #import pdb; pdb.set_trace()
            print("State-Space: NaN valkues in the grad_log_likelihood")
        #print(grad_log_likelihood)
-        
+
        grad_log_likelihood_sum = np.sum(grad_log_likelihood,axis=1)
        grad_log_likelihood_sum.shape = (grad_log_likelihood_sum.shape[0],1)
        self._log_marginal_likelihood = np.sum( log_likelihood,axis=1 )
        self.likelihood.update_gradients(grad_log_likelihood_sum[-1,0])
-        
+
        self.kern.sde_update_gradient_full(grad_log_likelihood_sum[:-1,0])
-        
+
    def log_likelihood(self):
        return self._log_marginal_likelihood

-    def _raw_predict(self, Xnew=None, Ynew=None, filteronly=False):
+    def _raw_predict(self, Xnew=None, Ynew=None, filteronly=False, **kw):
        """
        Performs the actual prediction for new X points.
        Inner function. It is called only from inside this class.
-        
+
        Input:
        ---------------------
-        
+
        Xnews: vector or (n_points,1) matrix
            New time points where to evaluate predictions.
-            
+
        Ynews: (n_train_points, ts_no) matrix
-            This matrix can substitude the original training points (in order 
+            This matrix can substitute the original training points (in order
            to use only the parameters of the model).
-            
+
        filteronly: bool
            Use only Kalman Filter for prediction. In this case the output does
            not coincide with corresponding Gaussian process.
-            
+
        Output:
        --------------------
-        
+
        m: vector
            Mean prediction
-        
+
        V: vector
            Variance in every point
        """
-        
+
        # Set defaults
        if Ynew is None:
            Ynew = self.Y
@ -209,8 +200,8 @@ class StateSpace(Model):
        else:
            X = self.X
            Y = Ynew
-            predict_only_training = True            
-            
+            predict_only_training = True
+
        # Sort the matrix (save the order)
        _, return_index, return_inverse = np.unique(X,True,True)
        X = X[return_index] # TODO they are not used
@ -218,37 +209,37 @@ class StateSpace(Model):

        # Get the model matrices from the kernel
        (F,L,Qc,H,P_inf, P0, dF,dQc,dP_inf,dP0) = self.kern.sde()
-        state_dim = F.shape[0]        
-        
+        state_dim = F.shape[0]
+
        #Y = self.Y[:, 0,0]
        # Run the Kalman filter
        #import pdb; pdb.set_trace()
        kalman_filter_type = self.kalman_filter_type
-        
+
        (M, P, log_likelihood,
         grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(
                                      F,L,Qc,H,float(self.Gaussian_noise.variance),P_inf,X,Y,m_init=None,
-                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, 
-                                      calc_log_likelihood=False, 
+                                      P_init=P0, p_kalman_filter_type = kalman_filter_type,
+                                      calc_log_likelihood=False,
                                      calc_grad_log_likelihood=False)
-                                                                   
-#        (filter_means, filter_covs, log_likelihood, 
+
+#        (filter_means, filter_covs, log_likelihood,
 #         grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(F,L,Qc,H,
 #                                      float(self.Gaussian_noise.variance),P_inf,self.X,self.Y,m_init=None,
-#                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True, 
-#                                      calc_grad_log_likelihood=True, 
-#                                      grad_params_no=grad_params_no, 
+#                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
+#                                      calc_grad_log_likelihood=True,
+#                                      grad_params_no=grad_params_no,
 #                                      grad_calc_params=grad_calc_params)
-                                      
+
        # Run the Rauch-Tung-Striebel smoother
        if not filteronly:
-            (M, P) = ssm.ContDescrStateSpace.cont_discr_rts_smoother(state_dim, M, P, 
+            (M, P) = ssm.ContDescrStateSpace.cont_discr_rts_smoother(state_dim, M, P,
                                p_dynamic_callables=SmootherMatrObject, X=X, F=F,L=L,Qc=Qc)
-        
-        # remove initial values        
+
+        # remove initial values
        M = M[1:,:,:]
-        P = P[1:,:,:]        
-        
+        P = P[1:,:,:]
+
        # Put the data back in the original order
        M = M[return_inverse,:,:]
        P = P[return_inverse,:,:]
@ -257,40 +248,41 @@ class StateSpace(Model):
        if not predict_only_training:
            M = M[self.num_data:,:,:]
            P = P[self.num_data:,:,:]
-        
+
        # Calculate the mean and variance
        # after einsum m has dimension in 3D (sample_num, dim_no,time_series_no)
        m = np.einsum('ijl,kj', M, H)# np.dot(M,H.T)
        m.shape = (m.shape[0], m.shape[1]) # remove the third dimension
-        
+
        V = np.einsum('ij,ajk,kl', H, P, H.T)
-        
+
        V.shape = (V.shape[0], V.shape[1]) # remove the third dimension

        # Return the posterior of the state
        return (m, V)

-    def predict(self, Xnew=None, filteronly=False):
+    def predict(self, Xnew=None, filteronly=False, include_likelihood=True, **kw):

        # Run the Kalman filter to get the state
        (m, V) = self._raw_predict(Xnew,filteronly=filteronly)

        # Add the noise variance to the state variance
-        V += float(self.Gaussian_noise.variance)
+        if include_likelihood:
+            V += float(self.likelihood.variance)

        # Lower and upper bounds
-        lower = m - 2*np.sqrt(V)
-        upper = m + 2*np.sqrt(V)
+        #lower = m - 2*np.sqrt(V)
+        #upper = m + 2*np.sqrt(V)

        # Return mean and variance
-        return (m, V, lower, upper)
-        
-    def predict_quantiles(self, Xnew=None, quantiles=(2.5, 97.5)):
+        return m, V
+
+    def predict_quantiles(self, Xnew=None, quantiles=(2.5, 97.5), **kw):
        mu, var = self._raw_predict(Xnew)
        #import pdb; pdb.set_trace()
        return  [stats.norm.ppf(q/100.)*np.sqrt(var + float(self.Gaussian_noise.variance)) + mu for q in quantiles]
-        
-        
+
+
 #    def plot(self, plot_limits=None, levels=20, samples=0, fignum=None,
 #            ax=None, resolution=None, plot_raw=False, plot_filter=False,
 #            linecol=Tango.colorsHex['darkBlue'],fillcol=Tango.colorsHex['lightBlue']):
@ -399,8 +391,8 @@ class StateSpace(Model):
 #
 #        # Return trajectory
 #        return Y
-#        
-#        
+#
+#
 #    def simulate(self,F,L,Qc,Pinf,X,size=1):
 #        # Simulate a trajectory using the state space model
 #