SHOGUN  v3.0.0
LaplacianInferenceMethod.cpp
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 3 of the License, or
 * (at your option) any later version.
 *
 * Written (W) 2013 Roman Votyakov
 * Copyright (C) 2012 Jacob Walker
 * Copyright (C) 2013 Roman Votyakov
 *
 * Code adapted from Gaussian Process Machine Learning Toolbox
 * http://www.gaussianprocess.org/gpml/code/matlab/doc/
 * This code specifically adapted from infLaplace.m
 */
#include <shogun/machine/gp/LaplacianInferenceMethod.h>

#ifdef HAVE_EIGEN3

#include <shogun/machine/gp/StudentsTLikelihood.h>
#include <shogun/mathematics/Math.h>
#include <shogun/lib/external/brent.h>
#include <shogun/mathematics/eigen3.h>

using namespace shogun;
using namespace Eigen;

namespace shogun
{
#ifndef DOXYGEN_SHOULD_SKIP_THIS

/** Wrapper class used for the Brent minimizer */
class CPsiLine : public func_base
{
public:
    float64_t scale;
    MatrixXd K;
    VectorXd dalpha;
    VectorXd start_alpha;
    Map<VectorXd>* alpha;
    SGVector<float64_t>* dlp;
    SGVector<float64_t>* W;
    SGVector<float64_t>* f;
    SGVector<float64_t>* m;
    CLikelihoodModel* lik;
    CLabels* lab;

    virtual double operator() (double x)
    {
        Map<VectorXd> eigen_f(f->vector, f->vlen);
        Map<VectorXd> eigen_m(m->vector, m->vlen);

        // compute alpha=alpha+x*dalpha and f=K*alpha+m
        (*alpha)=start_alpha+x*dalpha;
        eigen_f=K*(*alpha)*CMath::sq(scale)+eigen_m;

        // get first and second derivatives of log likelihood
        (*dlp)=lik->get_log_probability_derivative_f(lab, (*f), 1);

        (*W)=lik->get_log_probability_derivative_f(lab, (*f), 2);
        W->scale(-1.0);

        // compute psi=alpha'*(f-m)/2-lp
        float64_t result = (*alpha).dot(eigen_f-eigen_m)/2.0-
            SGVector<float64_t>::sum(lik->get_log_probability_f(lab, *f));

        return result;
    }
};

#endif /* DOXYGEN_SHOULD_SKIP_THIS */
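/* Note: CPsiLine evaluates the objective of the Brent line search used in
 * update_alpha() below. Along the Newton direction dalpha it computes
 *
 *   psi(x) = alpha'*(f-m)/2 - sum(log p(y|f)),
 *
 * with alpha = start_alpha + x*dalpha and f = K*alpha*scale^2 + m, and it
 * refreshes f, dlp and W as side effects for the caller.
 */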
CLaplacianInferenceMethod::CLaplacianInferenceMethod() : CInferenceMethod()
{
    init();
}

CLaplacianInferenceMethod::CLaplacianInferenceMethod(CKernel* kern,
        CFeatures* feat, CMeanFunction* m, CLabels* lab, CLikelihoodModel* mod)
        : CInferenceMethod(kern, feat, m, lab, mod)
{
    init();
}
void CLaplacianInferenceMethod::init()
{
    m_iter=20;             // maximum number of Newton iterations
    m_tolerance=1e-6;      // convergence tolerance of the Newton iteration
    m_opt_tolerance=1e-10; // tolerance of the Brent line search
    m_opt_max=10;          // upper bound of the Brent search interval
}
CLaplacianInferenceMethod::~CLaplacianInferenceMethod()
{
}
void CLaplacianInferenceMethod::update()
{
    CInferenceMethod::update();
    update_alpha();
    update_chol();
    update_approx_cov();
    update_deriv();
}
SGVector<float64_t> CLaplacianInferenceMethod::get_diagonal_vector()
{
    if (update_parameter_hash())
        update();

    // sW holds the square root of W, i.e. of the negated log-likelihood Hessian
    return SGVector<float64_t>(sW);
}
float64_t CLaplacianInferenceMethod::get_negative_marginal_likelihood()
{
    if (update_parameter_hash())
        update();

    // create eigen representations alpha, f, W, L
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    Map<VectorXd> eigen_mu(m_mu.vector, m_mu.vlen);
    Map<VectorXd> eigen_W(W.vector, W.vlen);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

    // get mean vector and create eigen representation of it
    SGVector<float64_t> mean=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean(mean.vector, mean.vlen);

    // get log likelihood
    float64_t lp=SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels,
        m_mu));

    float64_t result;

    if (eigen_W.minCoeff()<0)
    {
        Map<VectorXd> eigen_sW(sW.vector, sW.vlen);
        Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

        FullPivLU<MatrixXd> lu(MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols)+
            eigen_ktrtr*CMath::sq(m_scale)*eigen_sW.asDiagonal());

        result=(eigen_alpha.dot(eigen_mu-eigen_mean))/2.0-
            lp+log(lu.determinant())/2.0;
    }
    else
    {
        result=eigen_alpha.dot(eigen_mu-eigen_mean)/2.0-lp+
            eigen_L.diagonal().array().log().sum();
    }

    return result;
}
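/* For log-concave likelihoods (all entries of W nonnegative) the value
 * computed above is the Laplace approximation of the negative log marginal
 * likelihood (Rasmussen & Williams 2006, eq. 3.32):
 *
 *   -log Z = alpha'*(f-m)/2 - sum(log p(y|f)) + sum(log(diag(L))),
 *
 * where L'*L = B = I + sW*K*sW, so sum(log(diag(L))) = log(det(B))/2. The
 * first branch covers non-log-concave likelihoods, where B may be
 * indefinite, by computing the log determinant through an LU decomposition
 * instead of the Cholesky factor.
 */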
SGVector<float64_t> CLaplacianInferenceMethod::get_alpha()
{
    if (update_parameter_hash())
        update();

    SGVector<float64_t> result(m_alpha);
    return result;
}
SGMatrix<float64_t> CLaplacianInferenceMethod::get_cholesky()
{
    if (update_parameter_hash())
        update();

    return SGMatrix<float64_t>(m_L);
}
SGVector<float64_t> CLaplacianInferenceMethod::get_posterior_mean()
{
    if (update_parameter_hash())
        update();

    return SGVector<float64_t>(m_mu);
}
SGMatrix<float64_t> CLaplacianInferenceMethod::get_posterior_covariance()
{
    if (update_parameter_hash())
        update();

    return SGMatrix<float64_t>(m_Sigma);
}
void CLaplacianInferenceMethod::update_approx_cov()
{
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<VectorXd> eigen_sW(sW.vector, sW.vlen);

    m_Sigma=SGMatrix<float64_t>(m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Sigma(m_Sigma.matrix, m_Sigma.num_rows, m_Sigma.num_cols);

    // compute V = L^(-1) * W^(1/2) * K, using upper triangular factor L^T
    MatrixXd eigen_V=eigen_L.triangularView<Upper>().adjoint().solve(
        eigen_sW.asDiagonal()*eigen_K*CMath::sq(m_scale));

    // compute covariance matrix of the posterior:
    // Sigma = K - K * W^(1/2) * (L * L^T)^(-1) * W^(1/2) * K =
    // K - (K * W^(1/2)) * (L^T)^(-1) * L^(-1) * W^(1/2) * K =
    // K - (W^(1/2) * K)^T * (L^(-1))^T * L^(-1) * W^(1/2) * K = K - V^T * V
    eigen_Sigma=eigen_K*CMath::sq(m_scale)-eigen_V.adjoint()*eigen_V;
}
void CLaplacianInferenceMethod::update_chol()
{
    Map<VectorXd> eigen_W(W.vector, W.vlen);

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    // create shogun and eigen representation of posterior cholesky
    m_L=SGMatrix<float64_t>(m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

    if (eigen_W.minCoeff() < 0)
    {
        // compute inverse of diagonal noise: iW = 1/W
        VectorXd eigen_iW = (VectorXd::Ones(W.vlen)).cwiseQuotient(eigen_W);

        FullPivLU<MatrixXd> lu(
            eigen_ktrtr*CMath::sq(m_scale)+MatrixXd(eigen_iW.asDiagonal()));

        // compute cholesky: L = -(K + iW)^-1
        eigen_L = -lu.inverse();
    }
    else
    {
        Map<VectorXd> eigen_sW(sW.vector, sW.vlen);

        // compute cholesky: L = chol(sW * sW' .* K + I)
        LLT<MatrixXd> L(
            (eigen_sW*eigen_sW.transpose()).cwiseProduct(eigen_ktrtr*CMath::sq(m_scale))+
            MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols));

        eigen_L = L.matrixU();
    }
}
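/* The sign of W selects the factorization, mirroring infLaplace.m: for
 * log-concave likelihoods B = I + sW*K*sW is symmetric positive definite
 * and m_L holds its upper Cholesky factor, while for likelihoods such as
 * Student's t, W may contain negative entries and m_L instead holds
 * -(K + W^-1)^-1 obtained from a full-pivoting LU decomposition.
 */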
void CLaplacianInferenceMethod::update_alpha()
{
    float64_t Psi_Old = CMath::INFTY;
    float64_t Psi_New;
    float64_t Psi_Def;

    // get mean vector and create eigen representation of it
    SGVector<float64_t> mean=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean(mean.vector, mean.vlen);

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    // create shogun and eigen representation of function vector
    m_mu=SGVector<float64_t>(mean.vlen);
    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);

    if (m_alpha.vlen!=m_labels->get_num_labels())
    {
        // set alpha a zero vector
        m_alpha=SGVector<float64_t>(m_labels->get_num_labels());
        m_alpha.zero();

        // f = mean, if length of alpha and length of y doesn't match
        eigen_mu=eigen_mean;

        // compute W = -d2lp
        W=m_model->get_log_probability_derivative_f(m_labels, m_mu, 2);
        W.scale(-1.0);

        Psi_New=-SGVector<float64_t>::sum(m_model->get_log_probability_f(
            m_labels, m_mu));
    }
    else
    {
        Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

        // compute f = K * alpha + m
        eigen_mu=eigen_ktrtr*CMath::sq(m_scale)*eigen_alpha+eigen_mean;

        // compute W = -d2lp
        W=m_model->get_log_probability_derivative_f(m_labels, m_mu, 2);
        W.scale(-1.0);

        Psi_New=eigen_alpha.dot(eigen_mu-eigen_mean)/2.0-
            SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels, m_mu));

        Psi_Def=-SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels, mean));

        // if default is better, then use it
        if (Psi_Def < Psi_New)
        {
            m_alpha.zero();
            eigen_mu=eigen_mean;
            Psi_New=-SGVector<float64_t>::sum(m_model->get_log_probability_f(
                m_labels, m_mu));
        }
    }

    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    // get first derivative of log probability function
    dlp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 1);

    // create shogun and eigen representation of sW
    sW=SGVector<float64_t>(W.vlen);
    Map<VectorXd> eigen_sW(sW.vector, sW.vlen);

    index_t iter=0;

    while (Psi_Old-Psi_New>m_tolerance && iter<m_iter)
    {
        Map<VectorXd> eigen_W(W.vector, W.vlen);
        Map<VectorXd> eigen_dlp(dlp.vector, dlp.vlen);

        Psi_Old = Psi_New;
        iter++;

        if (eigen_W.minCoeff() < 0)
        {
            // Suggested by Vanhatalo et. al.,
            // Gaussian Process Regression with Student's t likelihood, NIPS 2009
            // Quoted from infLaplace.m
            float64_t df;

            if (m_model->get_model_type()==LT_STUDENTST)
            {
                CStudentsTLikelihood* lik=CStudentsTLikelihood::obtain_from_generic(m_model);
                df=lik->get_degrees_freedom();
                SG_UNREF(lik);
            }
            else
                df=1;

            eigen_W+=(2.0/df)*eigen_dlp.cwiseProduct(eigen_dlp);
        }

        // compute sW = sqrt(W)
        eigen_sW=eigen_W.cwiseSqrt();

        LLT<MatrixXd> L((eigen_sW*eigen_sW.transpose()).cwiseProduct(eigen_ktrtr*CMath::sq(m_scale))+
            MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols));

        VectorXd b=eigen_W.cwiseProduct(eigen_mu - eigen_mean)+eigen_dlp;

        VectorXd dalpha=b-eigen_sW.cwiseProduct(
            L.solve(eigen_sW.cwiseProduct(eigen_ktrtr*b*CMath::sq(m_scale))))-eigen_alpha;

        // perform Brent's optimization
        CPsiLine func;

        func.scale=m_scale;
        func.K=eigen_ktrtr;
        func.dalpha=dalpha;
        func.start_alpha=eigen_alpha;
        func.alpha=&eigen_alpha;
        func.dlp=&dlp;
        func.f=&m_mu;
        func.m=&mean;
        func.W=&W;
        func.lik=m_model;
        func.lab=m_labels;

        float64_t x;
        Psi_New=local_min(0, m_opt_max, m_opt_tolerance, func, x);
    }

    // compute f = K * alpha + m
    eigen_mu=eigen_ktrtr*CMath::sq(m_scale)*eigen_alpha+eigen_mean;

    // get log probability derivatives
    dlp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 1);
    d2lp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 2);
    d3lp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 3);

    // W = -d2lp
    W=d2lp.clone();
    W.scale(-1.0);

    // compute sW
    Map<VectorXd> eigen_W(W.vector, W.vlen);

    if (eigen_W.minCoeff()>0)
        eigen_sW=eigen_W.cwiseSqrt();
    else
        eigen_sW.setZero();
}
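/* Each pass of the loop above is one Newton step for finding the mode of
 * the posterior, following Algorithm 3.1 of Rasmussen & Williams (2006):
 * with B = I + sW*K*sW = L'*L and b = W*(f-m) + dlp, the candidate
 *
 *   alpha_new = b - sW*(B^-1*(sW*(K*b)))
 *
 * satisfies K*alpha_new = (K^-1 + W)^-1*b = f_new - m by the matrix
 * inversion lemma, and the Brent line search selects the damping x in
 * alpha + x*(alpha_new - alpha).
 */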
void CLaplacianInferenceMethod::update_deriv()
{
    // create eigen representation of W, sW, dlp, d3lp, K, alpha and L
    Map<VectorXd> eigen_W(W.vector, W.vlen);
    Map<VectorXd> eigen_sW(sW.vector, sW.vlen);
    Map<VectorXd> eigen_dlp(dlp.vector, dlp.vlen);
    Map<VectorXd> eigen_d3lp(d3lp.vector, d3lp.vlen);
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

    // create shogun and eigen representation of matrix Z
    m_Z=SGMatrix<float64_t>(m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);

    // create shogun and eigen representation of the vector g
    m_g=SGVector<float64_t>(m_Z.num_rows);
    Map<VectorXd> eigen_g(m_g.vector, m_g.vlen);

    if (eigen_W.minCoeff()<0)
    {
        eigen_Z=-eigen_L;

        // compute iA = (I + K * diag(W))^-1
        FullPivLU<MatrixXd> lu(MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols)+
            eigen_K*CMath::sq(m_scale)*eigen_W.asDiagonal());
        MatrixXd iA=lu.inverse();

        // compute derivative ln|L'*L| wrt W: g=sum(iA.*K,2)/2
        eigen_g=(iA.cwiseProduct(eigen_K*CMath::sq(m_scale))).rowwise().sum()/2.0;
    }
    else
    {
        // solve L'*L*Z=diag(sW) and compute Z=diag(sW)*Z
        eigen_Z=eigen_L.triangularView<Upper>().adjoint().solve(
            MatrixXd(eigen_sW.asDiagonal()));
        eigen_Z=eigen_L.triangularView<Upper>().solve(eigen_Z);
        eigen_Z=eigen_sW.asDiagonal()*eigen_Z;

        // solve L'*C=diag(sW)*K
        MatrixXd C=eigen_L.triangularView<Upper>().adjoint().solve(
            eigen_sW.asDiagonal()*eigen_K*CMath::sq(m_scale));

        // compute derivative ln|L'*L| wrt W: g=(diag(K)-sum(C.^2,1)')/2
        eigen_g=(eigen_K.diagonal()*CMath::sq(m_scale)-
            (C.cwiseProduct(C)).colwise().sum().adjoint())/2.0;
    }

    // create shogun and eigen representation of the vector dfhat
    m_dfhat=SGVector<float64_t>(m_g.vlen);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);

    // compute derivative of nlZ wrt fhat
    eigen_dfhat=eigen_g.cwiseProduct(eigen_d3lp);
}
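/* The cached quantities implement the chain rule for the hyperparameter
 * gradients computed below: Z holds (K + W^-1)^-1, g(i) is the derivative
 * of log(det(B))/2 with respect to W(i), and dfhat = g.*d3lp is the
 * derivative of the approximate marginal likelihood with respect to the
 * posterior mode. The get_derivative_wrt_* methods combine these implicit
 * terms with the explicit ones for each parameter (see Section 5.5.1 of
 * Rasmussen & Williams 2006).
 */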
SGVector<float64_t> CLaplacianInferenceMethod::get_derivative_wrt_inference_method(
    const TParameter* param)
{
    REQUIRE(!strcmp(param->m_name, "scale"), "Can't compute derivative of "
        "the negative log marginal likelihood wrt %s.%s parameter\n",
        get_name(), param->m_name)

    // create eigen representation of K, Z, dfhat, dlp and alpha
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);
    Map<VectorXd> eigen_dlp(dlp.vector, dlp.vlen);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    SGVector<float64_t> result(1);

    // compute derivative K wrt scale
    MatrixXd dK=eigen_K*m_scale*2.0;

    // compute dnlZ=sum(sum(Z.*dK))/2-alpha'*dK*alpha/2
    result[0]=(eigen_Z.cwiseProduct(dK)).sum()/2.0-
        (eigen_alpha.adjoint()*dK).dot(eigen_alpha)/2.0;

    // compute b=dK*dlp
    VectorXd b=dK*eigen_dlp;

    // compute dnlZ=dnlZ-dfhat'*(b-K*(Z*b))
    result[0]=result[0]-eigen_dfhat.dot(b-eigen_K*CMath::sq(m_scale)*(eigen_Z*b));

    return result;
}
SGVector<float64_t> CLaplacianInferenceMethod::get_derivative_wrt_likelihood_model(
    const TParameter* param)
{
    // create eigen representation of K, Z, g and dfhat
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_g(m_g.vector, m_g.vlen);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);

    // get derivatives wrt likelihood model parameters
    SGVector<float64_t> lp_dhyp=m_model->get_first_derivative(m_labels,
        m_mu, param);
    SGVector<float64_t> dlp_dhyp=m_model->get_second_derivative(m_labels,
        m_mu, param);
    SGVector<float64_t> d2lp_dhyp=m_model->get_third_derivative(m_labels,
        m_mu, param);

    // create eigen representation of the derivatives
    Map<VectorXd> eigen_lp_dhyp(lp_dhyp.vector, lp_dhyp.vlen);
    Map<VectorXd> eigen_dlp_dhyp(dlp_dhyp.vector, dlp_dhyp.vlen);
    Map<VectorXd> eigen_d2lp_dhyp(d2lp_dhyp.vector, d2lp_dhyp.vlen);

    SGVector<float64_t> result(1);

    // compute b vector
    VectorXd b=eigen_K*eigen_dlp_dhyp;

    // compute dnlZ=-g'*d2lp_dhyp-sum(lp_dhyp)-dfhat'*(b-K*(Z*b))
    result[0]=-eigen_g.dot(eigen_d2lp_dhyp)-eigen_lp_dhyp.sum()-
        eigen_dfhat.dot(b-eigen_K*CMath::sq(m_scale)*(eigen_Z*b));

    return result;
}
SGVector<float64_t> CLaplacianInferenceMethod::get_derivative_wrt_kernel(
    const TParameter* param)
{
    // create eigen representation of K, Z, dfhat, dlp and alpha
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);
    Map<VectorXd> eigen_dlp(dlp.vector, dlp.vlen);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    SGVector<float64_t> result;

    if (param->m_datatype.m_ctype==CT_VECTOR ||
        param->m_datatype.m_ctype==CT_SGVECTOR)
    {
        REQUIRE(param->m_datatype.m_length_y,
            "Length of the parameter %s should not be NULL\n", param->m_name)
        result=SGVector<float64_t>(*(param->m_datatype.m_length_y));
    }
    else
    {
        result=SGVector<float64_t>(1);
    }

    for (index_t i=0; i<result.vlen; i++)
    {
        SGMatrix<float64_t> dK;

        if (result.vlen==1)
            dK=m_kernel->get_parameter_gradient(param);
        else
            dK=m_kernel->get_parameter_gradient(param, i);

        Map<MatrixXd> eigen_dK(dK.matrix, dK.num_rows, dK.num_cols);

        // compute dnlZ=sum(sum(Z.*dK))/2-alpha'*dK*alpha/2
        result[i]=(eigen_Z.cwiseProduct(eigen_dK)).sum()/2.0-
            (eigen_alpha.adjoint()*eigen_dK).dot(eigen_alpha)/2.0;

        // compute b=dK*dlp
        VectorXd b=eigen_dK*eigen_dlp;

        // compute dnlZ=dnlZ-dfhat'*(b-K*(Z*b))
        result[i]=result[i]-eigen_dfhat.dot(b-eigen_K*CMath::sq(m_scale)*
            (eigen_Z*b));
    }

    return result;
}
SGVector<float64_t> CLaplacianInferenceMethod::get_derivative_wrt_mean(
    const TParameter* param)
{
    // create eigen representation of K, Z, dfhat and alpha
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    SGVector<float64_t> result;

    if (param->m_datatype.m_ctype==CT_VECTOR ||
        param->m_datatype.m_ctype==CT_SGVECTOR)
    {
        REQUIRE(param->m_datatype.m_length_y,
            "Length of the parameter %s should not be NULL\n", param->m_name)

        result=SGVector<float64_t>(*(param->m_datatype.m_length_y));
    }
    else
    {
        result=SGVector<float64_t>(1);
    }

    for (index_t i=0; i<result.vlen; i++)
    {
        SGVector<float64_t> dmu;

        if (result.vlen==1)
            dmu=m_mean->get_parameter_derivative(m_features, param);
        else
            dmu=m_mean->get_parameter_derivative(m_features, param, i);

        Map<VectorXd> eigen_dmu(dmu.vector, dmu.vlen);

        // compute dnlZ=-alpha'*dm-dfhat'*(dm-K*(Z*dm))
        result[i]=-eigen_alpha.dot(eigen_dmu)-eigen_dfhat.dot(eigen_dmu-
            eigen_K*CMath::sq(m_scale)*(eigen_Z*eigen_dmu));
    }

    return result;
}
}

#endif /* HAVE_EIGEN3 */
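/* A minimal usage sketch under the Shogun 3.0 API, for orientation only.
 * The toy data setup (a feature matrix X and a label vector y) and the
 * particular kernel, mean and likelihood classes chosen here are
 * illustrative assumptions, not part of this file:
 *
 *   #include <shogun/machine/gp/LaplacianInferenceMethod.h>
 *   #include <shogun/kernel/GaussianKernel.h>
 *   #include <shogun/machine/gp/ZeroMean.h>
 *   #include <shogun/machine/gp/LogitLikelihood.h>
 *
 *   CDenseFeatures<float64_t>* feat=new CDenseFeatures<float64_t>(X);
 *   CBinaryLabels* lab=new CBinaryLabels(y);
 *   CGaussianKernel* kernel=new CGaussianKernel(10, 2.0);
 *   CZeroMean* mean=new CZeroMean();
 *   CLogitLikelihood* lik=new CLogitLikelihood();
 *
 *   CLaplacianInferenceMethod* inf=new CLaplacianInferenceMethod(
 *       kernel, feat, mean, lab, lik);
 *   float64_t nlZ=inf->get_negative_marginal_likelihood();
 *   SG_UNREF(inf);
 */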
