#include <shogun/lib/external/brent.h>
using namespace Eigen;
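// This file implements the Laplace approximation for single-output FITC
// inference: the full n-by-n covariance K is replaced by the low-rank-plus-
// diagonal form V'*V + diag(dg) built from m inducing points, so the solves
// below run through matrix-vector products instead of dense factorizations.
//
// A minimal usage sketch (an assumption, not taken from this file: the
// Shogun 6-era C-prefixed API; `features`, `labels` and `inducing_features`
// stand for pre-built objects):
//
//   CGaussianKernel* kernel=new CGaussianKernel(10, 2.0);
//   CZeroMean* mean=new CZeroMean();
//   CStudentsTLikelihood* lik=new CStudentsTLikelihood();
//   CSingleFITCLaplaceInferenceMethod* inf=new CSingleFITCLaplaceInferenceMethod(
//       kernel, features, mean, labels, lik, inducing_features);
//   float64_t nlZ=inf->get_negative_log_marginal_likelihood();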
#ifndef DOXYGEN_SHOULD_SKIP_THIS
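// CFITCPsiLine is the 1-D objective handed to Brent's line search: given a
// step size x it forms alpha=start_alpha+x*dalpha, maps it to the latent mean
// f=K*alpha+m, and returns Psi=alpha'*(f-m)/2-sum(log p(y|f)).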
class CFITCPsiLine : public func_base
virtual double operator() (double x)
eigen_alpha=start_alpha+x*dalpha;
eigen_f=eigen_tmp+eigen_m;
float64_t result = eigen_alpha.dot(eigen_f-eigen_m)/2.0-
virtual ~SingleFITCLaplaceInferenceMethodCostFunction() { clean(); }
REQUIRE(obj, "Obj must be set\n");
REQUIRE(m_obj, "Object not set\n");
return m_obj->get_psi_wrt_alpha();
void unset_target(bool is_unref)
REQUIRE(m_obj, "Object not set\n");
REQUIRE(m_obj, "Object not set\n");
m_obj->get_gradient_wrt_alpha(m_derivatives);
return m_derivatives;
virtual const char* get_name() const { return "SingleFITCLaplaceInferenceMethodCostFunction"; }
SG_ADD(&m_derivatives, "SingleFITCLaplaceInferenceMethodCostFunction__m_derivatives",
"derivatives in SingleFITCLaplaceInferenceMethodCostFunction", MS_NOT_AVAILABLE);
SG_ADD((CSGObject **)&m_obj, "SingleFITCLaplaceInferenceMethodCostFunction__m_obj",
REQUIRE(obj, "Obj must be set\n");
void CSingleFITCLaplaceNewtonOptimizer::init()
m_opt_tolerance=1e-6;
SG_ADD((CSGObject **)&m_obj, "CSingleFITCLaplaceNewtonOptimizer__m_obj",
SG_ADD(&m_iter, "CSingleFITCLaplaceNewtonOptimizer__m_iter",
SG_ADD(&m_tolerance, "CSingleFITCLaplaceNewtonOptimizer__m_tolerance",
SG_ADD(&m_opt_tolerance, "CSingleFITCLaplaceNewtonOptimizer__m_opt_tolerance",
SG_ADD(&m_opt_max, "CSingleFITCLaplaceNewtonOptimizer__m_opt_max",
REQUIRE(m_obj, "Object not set\n");
Map<MatrixXd> eigen_kuu((m_obj->m_kuu).matrix, (m_obj->m_kuu).num_rows, (m_obj->m_kuu).num_cols);
Map<MatrixXd> eigen_V((m_obj->m_V).matrix, (m_obj->m_V).num_rows, (m_obj->m_V).num_cols);
Map<VectorXd> eigen_dg((m_obj->m_dg).vector, (m_obj->m_dg).vlen);
Map<MatrixXd> eigen_R0((m_obj->m_chol_R0).matrix, (m_obj->m_chol_R0).num_rows, (m_obj->m_chol_R0).num_cols);
m_obj->m_W=m_obj->m_model->get_log_probability_derivative_f(m_obj->m_labels, m_obj->m_mu, 2);
m_obj->m_W.scale(-1.0);
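// W=-d^2 log p(y|f)/df^2 is the diagonal negative Hessian of the log
// likelihood at the current estimate of the mode; for log-concave likelihoods
// every entry is non-negative.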
Map<VectorXd> eigen_al((m_obj->m_al).vector, (m_obj->m_al).vlen);
m_obj->m_dlp=m_obj->m_model->get_log_probability_derivative_f(m_obj->m_labels, m_obj->m_mu, 1);
while (Psi_Old-Psi_New>m_tolerance && iter<m_iter)
Map<VectorXd> eigen_W((m_obj->m_W).vector, (m_obj->m_W).vlen);
Map<VectorXd> eigen_dlp((m_obj->m_dlp).vector, (m_obj->m_dlp).vlen);
if (eigen_W.minCoeff() < 0)
eigen_W+=(2.0/(df+1))*eigen_dlp.cwiseProduct(eigen_dlp);
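// For a non-log-concave likelihood W can have negative entries; this branch
// appears to follow the GPML stabilization for Student's t, inflating W by
// 2/(df+1)*dlp.^2 (df = degrees of freedom) so the Newton system stays well
// conditioned.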
VectorXd b=eigen_W.cwiseProduct(eigen_mu-eigen_mean)+eigen_dlp;
VectorXd dd=MatrixXd::Ones(b.rows(),1).cwiseQuotient(eigen_W.cwiseProduct(eigen_dg)+MatrixXd::Ones(b.rows(),1));
VectorXd eigen_t=eigen_W.cwiseProduct(dd);
eigen_tmp=eigen_V*eigen_t.asDiagonal()*eigen_V.transpose()+MatrixXd::Identity(tmp.num_rows,tmp.num_rows);
tmp=m_obj->get_chol_inv(tmp);
MatrixXd eigen_RV=eigen_tmp2*eigen_V;
VectorXd dalpha=dd.cwiseProduct(b)-eigen_t.cwiseProduct(eigen_RV.transpose()*(eigen_RV*(dd.cwiseProduct(b))))-eigen_al;
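// Newton step via the Woodbury identity: with K=V'*V+diag(dg),
// dd=1./(W.*dg+1) and t=W.*dd, solving (I+K*W)*alpha_new=b reduces to
// dalpha = dd.*b - t.*(RV'*(RV*(dd.*b))) - alpha,
// where RV is the inverse Cholesky factor of I+V*diag(t)*V' applied to V, so
// only an m-by-m system is ever factorized.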
func.log_scale=m_obj->m_log_scale;
func.start_alpha=eigen_al;
func.alpha=&(m_obj->m_al);
func.dlp=&(m_obj->m_dlp);
func.f=&(m_obj->m_mu);
func.W=&(m_obj->m_W);
func.lik=m_obj->m_model;
func.lab=m_obj->m_labels;
Psi_New=local_min(0, m_opt_max, m_opt_tolerance, func, x);
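// Brent's local_min (from brent.h) searches the step length x in
// [0, m_opt_max] minimizing Psi along the Newton direction; the damped step
// guards against overshooting when the full Newton step would increase Psi.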
if (Psi_Old-Psi_New>m_tolerance && iter>=m_iter)
SG_SWARNING("Max iterations (%d) reached, but convergence level (%f) is not yet below tolerance (%f)\n", m_iter, Psi_Old-Psi_New, m_tolerance);
void CSingleFITCLaplaceInferenceMethod::init()
eigen_res=eigen_x.cwiseProduct(eigen_t)-eigen_Rvdd.transpose()*(eigen_Rvdd*eigen_x);
eigen_res=eigen_V.transpose()*(eigen_V*eigen_al)+eigen_dg.cwiseProduct(eigen_al);
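// The two helpers above express the FITC structure as matrix-vector products:
// compute_mvmK applies K=V'*V+diag(dg) as V'*(V*al)+dg.*al, and compute_mvmZ
// applies Z=diag(t)-Rvdd'*Rvdd, each in O(n*m) time rather than O(n^2).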
REQUIRE(inference!=NULL, "Inference should not be NULL");
SG_SERROR("Provided inference is not of type CSingleFITCLaplaceInferenceMethod!\n")
LLT<MatrixXd> chol(eigen_mtx.colwise().reverse().rowwise().reverse().matrix());
eigen_res=tmp.colwise().reverse().rowwise().reverse().matrix().triangularView<Upper>(
SG_WARNING("nlZ cannot be computed since W is too negative");
LLT<MatrixXd> chol(A);
float64_t result=eigen_alpha.dot(eigen_mu-eigen_mean)/2.0-lp+
A.diagonal().array().log().sum()+(eigen_W.cwiseProduct(eigen_dg)+MatrixXd::Ones(eigen_dg.rows(),1)).array().log().sum()/2.0;
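// Laplace evidence at the mode: nlZ = alpha'*(mu-mean)/2 - log p(y|mu)
// + log|I+K*W|/2. Under the FITC form of K the determinant splits into
// sum(log(1+W.*dg))/2 plus the log-determinant of A=I+V*diag(t)*V',
// accumulated here from the Cholesky factor computed above.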
eigen_dg=eigen_ktrtr_diag*CMath::exp(m_log_scale*2.0)-(eigen_V.cwiseProduct(eigen_V)).colwise().sum().adjoint();
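// dg is the FITC diagonal correction: the scaled kernel diagonal
// diag(K)*exp(2*log_scale) minus the column norms of V, i.e.
// dg = diag(K) - diag(Q), so K is carried implicitly as Q+diag(dg).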
eigen_mu=eigen_tmp+eigen_mean;
Psi_New=eigen_alpha.dot(eigen_tmp)/2.0-
if (Psi_Def < Psi_New)
REQUIRE(minimizer, "Minimizer must be set\n");
if (!dynamic_cast<CSingleFITCLaplaceNewtonOptimizer*>(minimizer))
REQUIRE(opt, "The provided minimizer is not supported\n")
if (this->ref_count()>1)
REQUIRE(minimizer, "The provided minimizer is not supported\n");
cost_fun->set_target(this);
if (this->ref_count()>1)
cost_fun->unset_target(cleanup);
eigen_mu=eigen_tmp+eigen_mean;
eigen_post_alpha=eigen_R0.transpose()*(eigen_V*eigen_al);
VectorXd Wd0_1=eigen_W.cwiseProduct(eigen_dg)+MatrixXd::Ones(eigen_W.rows(),1);
if (eigen_W.minCoeff()>0)
eigen_sW=eigen_W.cwiseSqrt();
eigen_sW=((eigen_W.array().abs()+eigen_W.array())/2).sqrt()-((eigen_W.array().abs()-eigen_W.array())/2).sqrt();
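// Branch-free signed square root: the expression equals sqrt(W) where W>=0
// and -sqrt(-W) where W<0, i.e. sW = sign(W).*sqrt(|W|), so sW stays usable
// when the likelihood is not log-concave.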
if (!(Wd0_1.array().abs().matrix()==Wd0_1))
VectorXd dd=MatrixXd::Ones(Wd0_1.rows(),1).cwiseQuotient(Wd0_1);
eigen_t=eigen_W.cwiseProduct(dd);
eigen_A=eigen_V*eigen_t.asDiagonal()*eigen_V.transpose()+MatrixXd::Identity(A.num_rows,A.num_rows);
MatrixXd R0tV=eigen_R0.transpose()*eigen_V;
MatrixXd B=R0tV*eigen_t.asDiagonal();
eigen_L=-B*R0tV.transpose();
MatrixXd eigen_RV=eigen_tmp*eigen_V;
eigen_Rvdd=eigen_RV*eigen_t.asDiagonal();
B=B*eigen_RV.transpose();
eigen_L+=B*B.transpose();
B=B*eigen_V.transpose();
FullPivLU<MatrixXd> lu(eigen_A);
eigen_L+=B*lu.inverse()*B.transpose();
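// When W has negative entries A=I+V*diag(t)*V' need not be positive definite,
// so a full-pivot LU factorization replaces the Cholesky-based path used in
// the positive-definite branch above.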
eigen_g=((eigen_dg.cwiseProduct(dd)).array()+
).array().pow(2).colwise().sum().transpose())/2;
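// eigen_g appears to accumulate half the diagonal of the approximate
// posterior covariance, g = diag((K^{-1}+W)^{-1})/2 (one summand of the
// expression is elided from this listing); it later enters dfhat = g.*d3lp
// for the implicit derivative terms.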
eigen_B=eigen_R0.transpose()*eigen_V;
eigen_w=eigen_B*eigen_al;
eigen_dfhat=eigen_g.cwiseProduct(eigen_d3lp);
eigen_dA=2*eigen_dKui-eigen_dKuui*eigen_R0tV;
eigen_v=eigen_ddiagKi-eigen_dA.cwiseProduct(eigen_R0tV).colwise().sum().transpose();
eigen_b=eigen_dA.transpose()*(eigen_R0tV*eigen_dlp)+eigen_v.cwiseProduct(eigen_dlp);
result-=eigen_dfhat.dot(eigen_b-eigen_KZb);
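// The derivative wrt a covariance parameter has an explicit part (already in
// result) plus an implicit part through the mode: because the mode f shifts
// with the hyperparameters, dfhat'*(b-K*Z*b) subtracts the chain-rule
// correction, with dfhat=g.*d3lp prepared in update_deriv.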
REQUIRE(param, "Param not set\n");
&& strcmp(param->m_name, "log_inducing_noise")
&& strcmp(param->m_name, "inducing_features")),
"Can't compute derivative of the negative log marginal likelihood wrt %s.%s parameter\n",
if (!strcmp(param->m_name, "inducing_features"))
if (!strcmp(param->m_name, "log_inducing_noise"))
result[0]=-eigen_g.dot(eigen_d2lp_dhyp)-eigen_lp_dhyp.sum();
REQUIRE(param, "Param not set\n");
int64_t len=const_cast<TParameter *>(param)->m_datatype.get_num_elements();
return eigen_dfhat.dot(eigen_d-eigen_tmp);
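// get_derivative_implicit_term_helper returns dfhat'*(d-eigen_tmp), where
// eigen_tmp appears to hold K*Z*d: the implicit chain-rule term shared by
// the mean- and likelihood-parameter derivatives.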
REQUIRE(param, "Param not set\n");
int64_t len=const_cast<TParameter *>(param)->m_datatype.get_num_elements();
REQUIRE(param, "Param not set\n");
SG_WARNING("Derivative wrt %s cannot be computed since W (the diagonal matrix of the negative Hessian) is too negative\n", param->m_name);
eigen_q=eigen_dfhat-eigen_q;
eigen_neg_v-=2*eigen_dlp.cwiseProduct(eigen_q);
eigen_BdK=eigen_B*eigen_neg_v.asDiagonal()+eigen_w*(eigen_al.transpose())+
(eigen_B*eigen_Rvdd.transpose())*eigen_Rvdd+
(eigen_B*eigen_dlp)*eigen_q.transpose()+(eigen_B*eigen_q)*eigen_dlp.transpose();
VectorXd eigen_t1=eigen_B.cwiseProduct(eigen_B).colwise().sum().adjoint();
eigen_b=(eigen_t1.cwiseProduct(eigen_dlp)-eigen_B.transpose()*(eigen_B*eigen_dlp))*factor;
MatrixXd diagonal_part=eigen_dg.asDiagonal();
MatrixXd prior=eigen_V.transpose()*eigen_V+diagonal_part;
eigen_Sigma=prior-tmp.adjoint()*eigen_L*tmp;
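// update_approx_cov: the Laplace posterior covariance is
// (K^{-1}+W)^{-1} = K - K*(K+W^{-1})^{-1}*K; here the FITC prior
// V'*V+diag(dg) plays the role of K and the subtracted term appears to carry
// the factored correction.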
eigen_f=eigen_tmp+eigen_mean_f;
float64_t psi=eigen_alpha.dot(eigen_tmp) * 0.5;
eigen_f=eigen_tmp+eigen_mean_f;
eigen_tmp2=eigen_alpha-eigen_dlp_f;
eigen_gradient=eigen_tmp3;
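// get_psi_wrt_alpha/get_gradient_wrt_alpha expose the objective in the alpha
// parametrization, Psi(alpha)=alpha'*K*alpha/2-log p(y|f) with f=K*alpha+mean,
// whose gradient is K*(alpha-dlp(f)); this is the pair consumed by the
// first-order cost function defined near the top of this file.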