diff --git a/GPy/models/state_space_model.py b/GPy/models/state_space_model.py
index 241cfe73..5d22c0fc 100644
--- a/GPy/models/state_space_model.py
+++ b/GPy/models/state_space_model.py
@@ -15,52 +15,43 @@
 #
 
 import numpy as np
-from scipy import linalg
 from scipy import stats
-from ..core import Model
-from .. import kern
-#from GPy.plotting.matplot_dep.models_plots import gpplot
-#from GPy.plotting.matplot_dep.base_plots import x_frame1D
-#from GPy.plotting.matplot_dep import Tango
-#import pylab as pb
-from GPy.core.parameterization.param import Param
-
-import GPy
 from .. import likelihoods
-
+#from . import state_space_setup as ss_setup
+from ..core import Model
 from . import state_space_main as ssm
 from . import state_space_setup as ss_setup
 
 class StateSpace(Model):
     def __init__(self, X, Y, kernel=None, noise_var=1.0, kalman_filter_type = 'regular', use_cython = False, name='StateSpace'):
         super(StateSpace, self).__init__(name=name)
-        
+
         if len(X.shape) == 1:
             X = np.atleast_2d(X).T
-        self.num_data, input_dim = X.shape
-        
+        self.num_data, self.input_dim = X.shape
+
         if len(Y.shape) == 1:
             Y = np.atleast_2d(Y).T
-                
-        assert input_dim==1, "State space methods are only for 1D data"
-        
+
+        assert self.input_dim==1, "State space methods are only for 1D data"
+
         if len(Y.shape)==2:
             num_data_Y, self.output_dim = Y.shape
             ts_number = None
         elif len(Y.shape)==3:
             num_data_Y, self.output_dim, ts_number = Y.shape
-        
+
         self.ts_number = ts_number
-        
+
         assert num_data_Y == self.num_data, "X and Y data don't match"
         assert self.output_dim == 1, "State space methods are for single outputs only"
 
         self.kalman_filter_type = kalman_filter_type
         #self.kalman_filter_type = 'svd' # temp test
         ss_setup.use_cython = use_cython
-        
+
         #import pdb; pdb.set_trace()
-        
+
         global ssm
         #from . import state_space_main as ssm
         if (ssm.cython_code_available) and (ssm.use_cython != ss_setup.use_cython):
@@ -72,13 +63,13 @@ class StateSpace(Model):
 
         # Noise variance
         self.likelihood = likelihoods.Gaussian(variance=noise_var)
-        
+
         # Default kernel
         if kernel is None:
             raise ValueError("State-Space Model: the kernel must be provided.")
         else:
             self.kern = kernel
-            
+
         self.link_parameter(self.kern)
         self.link_parameter(self.likelihood)
         self.posterior = None
@@ -92,14 +83,14 @@ class StateSpace(Model):
         """
         Parameters have now changed
         """
-    
+
         #np.set_printoptions(16)
         #print(self.param_array)
         #import pdb; pdb.set_trace()
-        
+
         # Get the model matrices from the kernel
         (F,L,Qc,H,P_inf, P0, dFt,dQct,dP_inft, dP0t) = self.kern.sde()
-        
+
         # necessary parameters
         measurement_dim = self.output_dim
         grad_params_no = dFt.shape[2]+1 # we also add measurement noise as a parameter
@@ -109,30 +100,30 @@ class StateSpace(Model):
         dQc   = np.zeros([dQct.shape[0],dQct.shape[1],grad_params_no])
         dP_inf = np.zeros([dP_inft.shape[0],dP_inft.shape[1],grad_params_no])
         dP0 = np.zeros([dP0t.shape[0],dP0t.shape[1],grad_params_no])
-        
+
         # Assign the values for the kernel function
         dF[:,:,:-1] = dFt
         dQc[:,:,:-1] = dQct
         dP_inf[:,:,:-1] = dP_inft
         dP0[:,:,:-1] = dP0t
-        
+
         # The sigma2 derivative
         dR = np.zeros([measurement_dim,measurement_dim,grad_params_no])
         dR[:,:,-1] = np.eye(measurement_dim)
 
         # Balancing
         #(F,L,Qc,H,P_inf,P0, dF,dQc,dP_inf,dP0) = ssm.balance_ss_model(F,L,Qc,H,P_inf,P0, dF,dQc,dP_inf, dP0)
-        
-        # Use the Kalman filter to evaluate the likelihood        
+
+        # Use the Kalman filter to evaluate the likelihood
         grad_calc_params = {}
         grad_calc_params['dP_inf'] = dP_inf
         grad_calc_params['dF'] = dF
         grad_calc_params['dQc'] = dQc
         grad_calc_params['dR'] = dR
         grad_calc_params['dP_init'] = dP0
-        
+
         kalman_filter_type = self.kalman_filter_type
-             
+
         # The following code is required because sometimes the shapes of self.Y
         # becomes 3D even though is must be 2D. The reason is undescovered.
         Y = self.Y
@@ -140,63 +131,63 @@ class StateSpace(Model):
             Y.shape = (self.num_data,1)
         else:
             Y.shape = (self.num_data,1,self.ts_number)
-            
-        (filter_means, filter_covs, log_likelihood, 
+
+        (filter_means, filter_covs, log_likelihood,
          grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(F,L,Qc,H,
                                       float(self.Gaussian_noise.variance),P_inf,self.X,Y,m_init=None,
-                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True, 
-                                      calc_grad_log_likelihood=True, 
-                                      grad_params_no=grad_params_no, 
+                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
+                                      calc_grad_log_likelihood=True,
+                                      grad_params_no=grad_params_no,
                                       grad_calc_params=grad_calc_params)
-            
+
         if np.any( np.isfinite(log_likelihood) == False):
             #import pdb; pdb.set_trace()
             print("State-Space: NaN valkues in the log_likelihood")
-        
+
         if np.any( np.isfinite(grad_log_likelihood) == False):
             #import pdb; pdb.set_trace()
             print("State-Space: NaN valkues in the grad_log_likelihood")
         #print(grad_log_likelihood)
-        
+
         grad_log_likelihood_sum = np.sum(grad_log_likelihood,axis=1)
         grad_log_likelihood_sum.shape = (grad_log_likelihood_sum.shape[0],1)
         self._log_marginal_likelihood = np.sum( log_likelihood,axis=1 )
         self.likelihood.update_gradients(grad_log_likelihood_sum[-1,0])
-        
+
         self.kern.sde_update_gradient_full(grad_log_likelihood_sum[:-1,0])
-        
+
     def log_likelihood(self):
         return self._log_marginal_likelihood
 
-    def _raw_predict(self, Xnew=None, Ynew=None, filteronly=False):
+    def _raw_predict(self, Xnew=None, Ynew=None, filteronly=False, **kw):
         """
         Performs the actual prediction for new X points.
         Inner function. It is called only from inside this class.
-        
+
         Input:
         ---------------------
-        
+
         Xnews: vector or (n_points,1) matrix
             New time points where to evaluate predictions.
-            
+
         Ynews: (n_train_points, ts_no) matrix
-            This matrix can substitude the original training points (in order 
+            This matrix can substitude the original training points (in order
             to use only the parameters of the model).
-            
+
         filteronly: bool
             Use only Kalman Filter for prediction. In this case the output does
             not coincide with corresponding Gaussian process.
-            
+
         Output:
         --------------------
-        
+
         m: vector
             Mean prediction
-        
+
         V: vector
             Variance in every point
         """
-        
+
         # Set defaults
         if Ynew is None:
             Ynew = self.Y
@@ -209,8 +200,8 @@ class StateSpace(Model):
         else:
             X = self.X
             Y = Ynew
-            predict_only_training = True            
-            
+            predict_only_training = True
+
         # Sort the matrix (save the order)
         _, return_index, return_inverse = np.unique(X,True,True)
         X = X[return_index] # TODO they are not used
@@ -218,37 +209,37 @@ class StateSpace(Model):
 
         # Get the model matrices from the kernel
         (F,L,Qc,H,P_inf, P0, dF,dQc,dP_inf,dP0) = self.kern.sde()
-        state_dim = F.shape[0]        
-        
+        state_dim = F.shape[0]
+
         #Y = self.Y[:, 0,0]
         # Run the Kalman filter
         #import pdb; pdb.set_trace()
         kalman_filter_type = self.kalman_filter_type
-        
+
         (M, P, log_likelihood,
          grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(
                                       F,L,Qc,H,float(self.Gaussian_noise.variance),P_inf,X,Y,m_init=None,
-                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, 
-                                      calc_log_likelihood=False, 
+                                      P_init=P0, p_kalman_filter_type = kalman_filter_type,
+                                      calc_log_likelihood=False,
                                       calc_grad_log_likelihood=False)
-                                                                   
-#        (filter_means, filter_covs, log_likelihood, 
+
+#        (filter_means, filter_covs, log_likelihood,
 #         grad_log_likelihood,SmootherMatrObject) = ssm.ContDescrStateSpace.cont_discr_kalman_filter(F,L,Qc,H,
 #                                      float(self.Gaussian_noise.variance),P_inf,self.X,self.Y,m_init=None,
-#                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True, 
-#                                      calc_grad_log_likelihood=True, 
-#                                      grad_params_no=grad_params_no, 
+#                                      P_init=P0, p_kalman_filter_type = kalman_filter_type, calc_log_likelihood=True,
+#                                      calc_grad_log_likelihood=True,
+#                                      grad_params_no=grad_params_no,
 #                                      grad_calc_params=grad_calc_params)
-                                      
+
         # Run the Rauch-Tung-Striebel smoother
         if not filteronly:
-            (M, P) = ssm.ContDescrStateSpace.cont_discr_rts_smoother(state_dim, M, P, 
+            (M, P) = ssm.ContDescrStateSpace.cont_discr_rts_smoother(state_dim, M, P,
                                 p_dynamic_callables=SmootherMatrObject, X=X, F=F,L=L,Qc=Qc)
-        
-        # remove initial values        
+
+        # remove initial values
         M = M[1:,:,:]
-        P = P[1:,:,:]        
-        
+        P = P[1:,:,:]
+
         # Put the data back in the original order
         M = M[return_inverse,:,:]
         P = P[return_inverse,:,:]
@@ -257,40 +248,41 @@ class StateSpace(Model):
         if not predict_only_training:
             M = M[self.num_data:,:,:]
             P = P[self.num_data:,:,:]
-        
+
         # Calculate the mean and variance
         # after einsum m has dimension in 3D (sample_num, dim_no,time_series_no)
         m = np.einsum('ijl,kj', M, H)# np.dot(M,H.T)
         m.shape = (m.shape[0], m.shape[1]) # remove the third dimension
-        
+
         V = np.einsum('ij,ajk,kl', H, P, H.T)
-        
+
         V.shape = (V.shape[0], V.shape[1]) # remove the third dimension
 
         # Return the posterior of the state
         return (m, V)
 
-    def predict(self, Xnew=None, filteronly=False):
+    def predict(self, Xnew=None, filteronly=False, include_likelihood=True, **kw):
 
         # Run the Kalman filter to get the state
         (m, V) = self._raw_predict(Xnew,filteronly=filteronly)
 
         # Add the noise variance to the state variance
-        V += float(self.Gaussian_noise.variance)
+        if include_likelihood:
+            V += float(self.likelihood.variance)
 
         # Lower and upper bounds
-        lower = m - 2*np.sqrt(V)
-        upper = m + 2*np.sqrt(V)
+        #lower = m - 2*np.sqrt(V)
+        #upper = m + 2*np.sqrt(V)
 
         # Return mean and variance
-        return (m, V, lower, upper)
-        
-    def predict_quantiles(self, Xnew=None, quantiles=(2.5, 97.5)):
+        return m, V
+
+    def predict_quantiles(self, Xnew=None, quantiles=(2.5, 97.5), **kw):
         mu, var = self._raw_predict(Xnew)
         #import pdb; pdb.set_trace()
         return  [stats.norm.ppf(q/100.)*np.sqrt(var + float(self.Gaussian_noise.variance)) + mu for q in quantiles]
-        
-        
+
+
 #    def plot(self, plot_limits=None, levels=20, samples=0, fignum=None,
 #            ax=None, resolution=None, plot_raw=False, plot_filter=False,
 #            linecol=Tango.colorsHex['darkBlue'],fillcol=Tango.colorsHex['lightBlue']):
@@ -399,8 +391,8 @@ class StateSpace(Model):
 #
 #        # Return trajectory
 #        return Y
-#        
-#        
+#
+#
 #    def simulate(self,F,L,Qc,Pinf,X,size=1):
 #        # Simulate a trajectory using the state space model
 #