SHOGUN  4.2.0
SingleLaplaceInferenceMethod.cpp
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 3 of the License, or
 * (at your option) any later version.
 *
 * Written (W) 2016 Wu Lin
 * Written (W) 2013 Roman Votyakov
 * Copyright (C) 2012 Jacob Walker
 * Copyright (C) 2013 Roman Votyakov
 *
 * Code adapted from Gaussian Process Machine Learning Toolbox
 * http://www.gaussianprocess.org/gpml/code/matlab/doc/
 * This code specifically adapted from infLaplace.m
 */

#include <shogun/machine/gp/SingleLaplaceInferenceMethod.h>
#include <shogun/machine/gp/StudentsTLikelihood.h>
#include <shogun/mathematics/Math.h>
#include <shogun/mathematics/eigen3.h>
#include <shogun/lib/external/brent.h>

using namespace shogun;
using namespace Eigen;

namespace shogun
{

#ifndef DOXYGEN_SHOULD_SKIP_THIS

class PsiLine : public func_base
{
public:
    float64_t log_scale;
    MatrixXd K;
    VectorXd dalpha;
    VectorXd start_alpha;
    Map<VectorXd>* alpha;
    SGVector<float64_t>* dlp;
    SGVector<float64_t>* W;
    SGVector<float64_t>* f;
    SGVector<float64_t>* m;
    CLikelihoodModel* lik;
    CLabels* lab;

    virtual double operator() (double x)
    {
        Map<VectorXd> eigen_f(f->vector, f->vlen);
        Map<VectorXd> eigen_m(m->vector, m->vlen);

        // compute alpha=alpha+x*dalpha and f=K*alpha+m
        (*alpha)=start_alpha+x*dalpha;
        eigen_f=K*(*alpha)*CMath::exp(log_scale*2.0)+eigen_m;

        // get first and second derivatives of log likelihood
        (*dlp)=lik->get_log_probability_derivative_f(lab, (*f), 1);

        (*W)=lik->get_log_probability_derivative_f(lab, (*f), 2);
        W->scale(-1.0);

        // compute psi=alpha'*(f-m)/2-lp
        float64_t result = (*alpha).dot(eigen_f-eigen_m)/2.0-
            SGVector<float64_t>::sum(lik->get_log_probability_f(lab, *f));

        return result;
    }
};
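
/* Editorial note, not part of the original source: PsiLine evaluates the
 * line-search objective used by the Newton solver below,
 *     psi(x) = alpha(x)'*(f - m)/2 - sum(log p(y|f)),
 * with alpha(x) = start_alpha + x*dalpha and f = exp(2*log_scale)*K*alpha(x) + m.
 * Brent's method (local_min from brent.h) minimises psi over the step size x. */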

class SingleLaplaceInferenceMethodCostFunction: public FirstOrderCostFunction
{
public:
    SingleLaplaceInferenceMethodCostFunction():FirstOrderCostFunction() { init(); }
    virtual ~SingleLaplaceInferenceMethodCostFunction() { SG_UNREF(m_obj); }
    void set_target(CSingleLaplaceInferenceMethod *obj)
    {
        REQUIRE(obj, "Obj must be set\n");
        if(m_obj != obj)
        {
            SG_REF(obj);
            SG_UNREF(m_obj);
            m_obj=obj;
        }
    }
    virtual float64_t get_cost()
    {
        REQUIRE(m_obj, "Object not set\n");
        return m_obj->get_psi_wrt_alpha();
    }
    void unset_target(bool is_unref)
    {
        if(is_unref)
        {
            SG_UNREF(m_obj);
        }
        m_obj=NULL;
    }
    virtual SGVector<float64_t> obtain_variable_reference()
    {
        REQUIRE(m_obj, "Object not set\n");
        m_derivatives = SGVector<float64_t>((m_obj->m_alpha).vlen);
        return m_obj->m_alpha;
    }
    virtual SGVector<float64_t> get_gradient()
    {
        REQUIRE(m_obj, "Object not set\n");
        m_obj->get_gradient_wrt_alpha(m_derivatives);
        return m_derivatives;
    }
    virtual const char* get_name() const { return "SingleLaplaceInferenceMethodCostFunction"; }
private:
    void init()
    {
        m_obj=NULL;
        m_derivatives = SGVector<float64_t>();
        SG_ADD(&m_derivatives, "SingleLaplaceInferenceMethodCostFunction__m_derivatives",
            "derivatives in SingleLaplaceInferenceMethodCostFunction", MS_NOT_AVAILABLE);
        SG_ADD((CSGObject **)&m_obj, "SingleLaplaceInferenceMethodCostFunction__m_obj",
            "obj in SingleLaplaceInferenceMethodCostFunction", MS_NOT_AVAILABLE);
    }

    SGVector<float64_t> m_derivatives;
    CSingleLaplaceInferenceMethod *m_obj;
};
#endif /* DOXYGEN_SHOULD_SKIP_THIS */

void CSingleLaplaceNewtonOptimizer::set_target(CSingleLaplaceInferenceMethod *obj)
{
    REQUIRE(obj, "Obj must be set\n");
    if(m_obj != obj)
    {
        SG_REF(obj);
        SG_UNREF(m_obj);
        m_obj=obj;
    }
}

void CSingleLaplaceNewtonOptimizer::unset_target(bool is_unref)
{
    if(is_unref)
    {
        SG_UNREF(m_obj);
    }
    m_obj=NULL;
}

void CSingleLaplaceNewtonOptimizer::init()
{
    m_obj=NULL;
    m_iter=20;
    m_tolerance=1e-6;
    m_opt_tolerance=1e-6;
    m_opt_max=10;

    SG_ADD((CSGObject **)&m_obj, "CSingleLaplaceNewtonOptimizer__m_obj",
        "obj in CSingleLaplaceNewtonOptimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_iter, "CSingleLaplaceNewtonOptimizer__m_iter",
        "iter in CSingleLaplaceNewtonOptimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_tolerance, "CSingleLaplaceNewtonOptimizer__m_tolerance",
        "tolerance in CSingleLaplaceNewtonOptimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_opt_tolerance, "CSingleLaplaceNewtonOptimizer__m_opt_tolerance",
        "opt_tolerance in CSingleLaplaceNewtonOptimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_opt_max, "CSingleLaplaceNewtonOptimizer__m_opt_max",
        "opt_max in CSingleLaplaceNewtonOptimizer", MS_NOT_AVAILABLE);
}
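
/* Editorial note, not part of the original source: each Newton step below follows
 * infLaplace.m from the GPML toolbox. With W = -d2 log p(y|f), sW = sqrt(W) and
 * L = chol(I + sW*K*sW'), the step direction is
 *     b      = W.*(f - m) + dlp
 *     dalpha = b - sW.*(L\(L'\(sW.*(K*b)))) - alpha,
 * and the step size along dalpha is then chosen by Brent's method on PsiLine. */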

float64_t CSingleLaplaceNewtonOptimizer::minimize()
{
    REQUIRE(m_obj, "Object not set\n");
    float64_t Psi_Old=CMath::INFTY;
    float64_t Psi_New=m_obj->m_Psi;

    // get mean vector and create eigen representation of it
    Map<VectorXd> eigen_mean( (m_obj->m_mean_f).vector, (m_obj->m_mean_f).vlen);

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr( (m_obj->m_ktrtr).matrix, (m_obj->m_ktrtr).num_rows, (m_obj->m_ktrtr).num_cols);

    Map<VectorXd> eigen_mu(m_obj->m_mu, (m_obj->m_mu).vlen);

    // compute W = -d2lp
    m_obj->m_W=m_obj->m_model->get_log_probability_derivative_f(m_obj->m_labels, m_obj->m_mu, 2);
    m_obj->m_W.scale(-1.0);

    Map<VectorXd> eigen_alpha(m_obj->m_alpha.vector, m_obj->m_alpha.vlen);

    // get first derivative of log probability function
    m_obj->m_dlp=m_obj->m_model->get_log_probability_derivative_f(m_obj->m_labels, m_obj->m_mu, 1);

    // create shogun and eigen representation of sW
    m_obj->m_sW=SGVector<float64_t>((m_obj->m_W).vlen);
    Map<VectorXd> eigen_sW((m_obj->m_sW).vector, (m_obj->m_sW).vlen);

    index_t iter=0;

    while (Psi_Old-Psi_New>m_tolerance && iter<m_iter)
    {
        Map<VectorXd> eigen_W( (m_obj->m_W).vector, (m_obj->m_W).vlen);
        Map<VectorXd> eigen_dlp( (m_obj->m_dlp).vector, (m_obj->m_dlp).vlen);

        Psi_Old = Psi_New;
        iter++;

        if (eigen_W.minCoeff() < 0)
        {
            // Suggested by Vanhatalo et al.,
            // Gaussian Process Regression with Student's t likelihood, NIPS 2009
            // Quoted from infLaplace.m
            float64_t df;

            if (m_obj->m_model->get_model_type()==LT_STUDENTST)
            {
                CStudentsTLikelihood* lik=CStudentsTLikelihood::obtain_from_generic(m_obj->m_model);
                df=lik->get_degrees_freedom();
                SG_UNREF(lik);
            }
            else
                df=1;

            eigen_W+=(2.0/df)*eigen_dlp.cwiseProduct(eigen_dlp);
        }

        // compute sW = sqrt(W)
        eigen_sW=eigen_W.cwiseSqrt();

        LLT<MatrixXd> L((eigen_sW*eigen_sW.transpose()).cwiseProduct(eigen_ktrtr*CMath::exp((m_obj->m_log_scale)*2.0))+
            MatrixXd::Identity( (m_obj->m_ktrtr).num_rows, (m_obj->m_ktrtr).num_cols));

        VectorXd b=eigen_W.cwiseProduct(eigen_mu - eigen_mean)+eigen_dlp;

        VectorXd dalpha=b-eigen_sW.cwiseProduct(
            L.solve(eigen_sW.cwiseProduct(eigen_ktrtr*b*CMath::exp((m_obj->m_log_scale)*2.0))))-eigen_alpha;

        // perform Brent's optimization
        PsiLine func;

        func.log_scale=m_obj->m_log_scale;
        func.K=eigen_ktrtr;
        func.dalpha=dalpha;
        func.start_alpha=eigen_alpha;
        func.alpha=&eigen_alpha;
        func.dlp=&(m_obj->m_dlp);
        func.f=&(m_obj->m_mu);
        func.m=&(m_obj->m_mean_f);
        func.W=&(m_obj->m_W);
        func.lik=m_obj->m_model;
        func.lab=m_obj->m_labels;

        float64_t x;
        Psi_New=local_min(0, m_opt_max, m_opt_tolerance, func, x);
    }

    if (Psi_Old-Psi_New>m_tolerance && iter>=m_iter)
    {
        SG_SWARNING("Max iterations (%d) reached, but convergence level (%f) is not yet below tolerance (%f)\n", m_iter, Psi_Old-Psi_New, m_tolerance);
    }
    return Psi_New;
}

CSingleLaplaceInferenceMethod::CSingleLaplaceInferenceMethod() : CLaplaceInference()
{
    init();
}

CSingleLaplaceInferenceMethod::CSingleLaplaceInferenceMethod(CKernel* kern,
        CFeatures* feat, CMeanFunction* m, CLabels* lab, CLikelihoodModel* mod)
        : CLaplaceInference(kern, feat, m, lab, mod)
{
    init();
}

void CSingleLaplaceInferenceMethod::init()
{
    m_Psi=0;
    SG_ADD(&m_Psi, "Psi", "posterior log likelihood without constant terms", MS_NOT_AVAILABLE);
    SG_ADD(&m_sW, "sW", "square root of W", MS_NOT_AVAILABLE);
    SG_ADD(&m_d2lp, "d2lp", "second derivative of log likelihood with respect to function location", MS_NOT_AVAILABLE);
    SG_ADD(&m_d3lp, "d3lp", "third derivative of log likelihood with respect to function location", MS_NOT_AVAILABLE);
}

SGVector<float64_t> CSingleLaplaceInferenceMethod::get_diagonal_vector()
{
    if (parameter_hash_changed())
        update();

    return SGVector<float64_t>(m_sW);
}

CSingleLaplaceInferenceMethod* CSingleLaplaceInferenceMethod::obtain_from_generic(
        CInference* inference)
{
    if (inference==NULL)
        return NULL;

    if (inference->get_inference_type()!=INF_LAPLACE_SINGLE)
        SG_SERROR("Provided inference is not of type CSingleLaplaceInferenceMethod\n")

    SG_REF(inference);
    return (CSingleLaplaceInferenceMethod*)inference;
}

CSingleLaplaceInferenceMethod::~CSingleLaplaceInferenceMethod()
{
}

float64_t CSingleLaplaceInferenceMethod::get_negative_log_marginal_likelihood()
{
    if (parameter_hash_changed())
        update();

    // create eigen representations alpha, f, W, L
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    Map<VectorXd> eigen_mu(m_mu.vector, m_mu.vlen);
    Map<VectorXd> eigen_W(m_W.vector, m_W.vlen);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

    // get mean vector and create eigen representation of it
    SGVector<float64_t> mean=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean(mean.vector, mean.vlen);

    // get log likelihood
    float64_t lp=SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels,
        m_mu));

    float64_t result;

    if (eigen_W.minCoeff()<0)
    {
        Map<VectorXd> eigen_sW(m_sW.vector, m_sW.vlen);
        Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

        FullPivLU<MatrixXd> lu(MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols)+
            eigen_ktrtr*CMath::exp(m_log_scale*2.0)*eigen_sW.asDiagonal());

        result=(eigen_alpha.dot(eigen_mu-eigen_mean))/2.0-
            lp+log(lu.determinant())/2.0;
    }
    else
    {
        result=eigen_alpha.dot(eigen_mu-eigen_mean)/2.0-lp+
            eigen_L.diagonal().array().log().sum();
    }

    return result;
}
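
/* Editorial note, not part of the original source: this is the Laplace
 * approximation to the negative log marginal likelihood,
 *     -log Z ~= alpha'*(f_hat - m)/2 - log p(y|f_hat) + sum(log(diag(L))),
 * where L = chol(I + sW*K*sW') (see Rasmussen & Williams, "Gaussian Processes
 * for Machine Learning", ch. 3). The LU branch handles likelihoods whose
 * W = -d2lp can go negative, where no Cholesky factor is available. */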

void CSingleLaplaceInferenceMethod::update_approx_cov()
{
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<VectorXd> eigen_sW(m_sW.vector, m_sW.vlen);

    m_Sigma=SGMatrix<float64_t>(m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Sigma(m_Sigma.matrix, m_Sigma.num_rows, m_Sigma.num_cols);

    // compute V = L^(-1) * W^(1/2) * K, using upper triangular factor L^T
    MatrixXd eigen_V=eigen_L.triangularView<Upper>().adjoint().solve(
        eigen_sW.asDiagonal()*eigen_K*CMath::exp(m_log_scale*2.0));

    // compute covariance matrix of the posterior:
    // Sigma = K - K * W^(1/2) * (L * L^T)^(-1) * W^(1/2) * K =
    // K - (K * W^(1/2)) * (L^T)^(-1) * L^(-1) * W^(1/2) * K =
    // K - (W^(1/2) * K)^T * (L^(-1))^T * L^(-1) * W^(1/2) * K = K - V^T * V
    eigen_Sigma=eigen_K*CMath::exp(m_log_scale*2.0)-eigen_V.adjoint()*eigen_V;
}

void CSingleLaplaceInferenceMethod::update_chol()
{
    // get log probability derivatives
    m_dlp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 1);
    m_d2lp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 2);
    m_d3lp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 3);

    // W = -d2lp
    m_W=m_d2lp.clone();
    m_W.scale(-1.0);
    m_sW=SGVector<float64_t>(m_W.vlen);

    // compute sW
    Map<VectorXd> eigen_W(m_W.vector, m_W.vlen);
    Map<VectorXd> eigen_sW(m_sW.vector, m_sW.vlen);

    if (eigen_W.minCoeff()>0)
        eigen_sW=eigen_W.cwiseSqrt();
    else
        //post.sW = sqrt(abs(W)).*sign(W);
        eigen_sW=((eigen_W.array().abs()+eigen_W.array())/2).sqrt()-((eigen_W.array().abs()-eigen_W.array())/2).sqrt();

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    // create shogun and eigen representation of posterior cholesky
    m_L=SGMatrix<float64_t>(m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

    if (eigen_W.minCoeff() < 0)
    {
        //A = eye(n)+K.*repmat(w',n,1);
        FullPivLU<MatrixXd> lu(
            MatrixXd::Identity(m_ktrtr.num_rows,m_ktrtr.num_cols)+
            eigen_ktrtr*CMath::exp(m_log_scale*2.0)*eigen_W.asDiagonal());
        // compute cholesky: L = -(K + 1/W)^-1
        //-iA = -inv(A)
        eigen_L=-lu.inverse();
        // -repmat(w,1,n).*iA == (-iA'.*repmat(w',n,1))'
        eigen_L=eigen_W.asDiagonal()*eigen_L;
    }
    else
    {
        // compute cholesky: L = chol(sW * sW' .* K + I)
        LLT<MatrixXd> L(
            (eigen_sW*eigen_sW.transpose()).cwiseProduct(eigen_ktrtr*CMath::exp(m_log_scale*2.0))+
            MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols));

        eigen_L = L.matrixU();
    }
}
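
/* Editorial note, not part of the original source: for log-concave likelihoods
 * W is positive and m_L holds the upper Cholesky factor of B = I + sW*K*sW'.
 * For non-log-concave likelihoods (e.g. Student's t) W may have negative
 * entries, so the code falls back to an LU-based inverse and stores
 * -diag(W)*inv(I + K*diag(W)) in m_L instead, mirroring the corresponding
 * branch of infLaplace.m. */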

void CSingleLaplaceInferenceMethod::update()
{
    SG_DEBUG("entering\n");

    CInference::update();
    update_init();
    update_alpha();
    update_chol();
    m_gradient_update=false;
    update_parameter_hash();

    SG_DEBUG("leaving\n");
}


void CSingleLaplaceInferenceMethod::update_init()
{
    float64_t Psi_New;
    float64_t Psi_Def;
    // get mean vector and create eigen representation of it
    m_mean_f=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean(m_mean_f.vector, m_mean_f.vlen);

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    // create shogun and eigen representation of function vector
    m_mu=SGVector<float64_t>(m_ktrtr.num_cols);
    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);

    if (m_alpha.vlen!=m_labels->get_num_labels())
    {
        // set alpha a zero vector
        m_alpha=SGVector<float64_t>(m_labels->get_num_labels());
        m_alpha.zero();

        // f = mean, if the lengths of alpha and y don't match
        eigen_mu=eigen_mean;

        Psi_New=-SGVector<float64_t>::sum(m_model->get_log_probability_f(
            m_labels, m_mu));
    }
    else
    {
        Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

        // compute f = K * alpha + m
        eigen_mu=eigen_ktrtr*CMath::exp(m_log_scale*2.0)*eigen_alpha+eigen_mean;

        Psi_New=eigen_alpha.dot(eigen_mu-eigen_mean)/2.0-
            SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels, m_mu));

        Psi_Def=-SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels, m_mean_f));

        // if default is better, then use it
        if (Psi_Def < Psi_New)
        {
            m_alpha.zero();
            eigen_mu=eigen_mean;
            Psi_New=Psi_Def;
        }
    }
    m_Psi=Psi_New;
}
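
/* Editorial note, not part of the original source: update_init() warm-starts the
 * mode search from the previous alpha whenever its length still matches the
 * labels, and compares the resulting psi against the default start alpha=0
 * (i.e. f=m), keeping whichever objective value is lower before the Newton
 * iterations begin. */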


void CSingleLaplaceInferenceMethod::register_minimizer(Minimizer* minimizer)
{
    REQUIRE(minimizer, "Minimizer must be set\n");
    if (!dynamic_cast<CSingleLaplaceNewtonOptimizer*>(minimizer))
    {
        FirstOrderMinimizer* opt= dynamic_cast<FirstOrderMinimizer*>(minimizer);
        REQUIRE(opt, "The provided minimizer is not supported\n")
    }
    CInference::register_minimizer(minimizer);
}

void CSingleLaplaceInferenceMethod::update_alpha()
{
    CSingleLaplaceNewtonOptimizer *opt=dynamic_cast<CSingleLaplaceNewtonOptimizer*>(m_minimizer);
    bool cleanup=false;
    if (opt)
    {
        opt->set_target(this);
        if(this->ref_count()>1)
            cleanup=true;
        opt->minimize();
        opt->unset_target(cleanup);
    }
    else
    {
        FirstOrderMinimizer* minimizer= dynamic_cast<FirstOrderMinimizer*>(m_minimizer);
        REQUIRE(minimizer, "The provided minimizer is not supported\n");

        SingleLaplaceInferenceMethodCostFunction *cost_fun=new SingleLaplaceInferenceMethodCostFunction();
        cost_fun->set_target(this);
        if(this->ref_count()>1)
            cleanup=true;
        minimizer->set_cost_function(cost_fun);
        minimizer->minimize();
        minimizer->unset_cost_function(false);
        cost_fun->unset_target(cleanup);
        SG_UNREF(cost_fun);
    }
    // get mean vector and create eigen representation of it
    Map<VectorXd> eigen_mean(m_mean_f.vector, m_mean_f.vlen);

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);

    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    // compute f = K * alpha + m
    eigen_mu=eigen_ktrtr*CMath::exp(m_log_scale*2.0)*eigen_alpha+eigen_mean;
}

void CSingleLaplaceInferenceMethod::update_deriv()
{
    // create eigen representation of W, sW, dlp, d3lp, K, alpha and L
    Map<VectorXd> eigen_W(m_W.vector, m_W.vlen);
    Map<VectorXd> eigen_sW(m_sW.vector, m_sW.vlen);
    Map<VectorXd> eigen_dlp(m_dlp.vector, m_dlp.vlen);
    Map<VectorXd> eigen_d3lp(m_d3lp.vector, m_d3lp.vlen);
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

    // create shogun and eigen representation of matrix Z
    m_Z=SGMatrix<float64_t>(m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);

    // create shogun and eigen representation of the vector g
    m_g=SGVector<float64_t>(m_Z.num_rows);
    Map<VectorXd> eigen_g(m_g.vector, m_g.vlen);

    if (eigen_W.minCoeff()<0)
    {
        eigen_Z=-eigen_L;

        // compute iA = (I + K * diag(W))^-1
        FullPivLU<MatrixXd> lu(MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols)+
            eigen_K*CMath::exp(m_log_scale*2.0)*eigen_W.asDiagonal());
        MatrixXd iA=lu.inverse();

        // compute derivative ln|L'*L| wrt W: g=sum(iA.*K,2)/2
        eigen_g=(iA.cwiseProduct(eigen_K*CMath::exp(m_log_scale*2.0))).rowwise().sum()/2.0;
    }
    else
    {
        // solve L'*L*Z=diag(sW) and compute Z=diag(sW)*Z
        eigen_Z=eigen_L.triangularView<Upper>().adjoint().solve(
            MatrixXd(eigen_sW.asDiagonal()));
        eigen_Z=eigen_L.triangularView<Upper>().solve(eigen_Z);
        eigen_Z=eigen_sW.asDiagonal()*eigen_Z;

        // solve L'*C=diag(sW)*K
        MatrixXd C=eigen_L.triangularView<Upper>().adjoint().solve(
            eigen_sW.asDiagonal()*eigen_K*CMath::exp(m_log_scale*2.0));

        // compute derivative ln|L'*L| wrt W: g=(diag(K)-sum(C.^2,1)')/2
        eigen_g=(eigen_K.diagonal()*CMath::exp(m_log_scale*2.0)-
            (C.cwiseProduct(C)).colwise().sum().adjoint())/2.0;
    }

    // create shogun and eigen representation of the vector dfhat
    m_dfhat=SGVector<float64_t>(m_g.vlen);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);

    // compute derivative of nlZ wrt fhat
    eigen_dfhat=eigen_g.cwiseProduct(eigen_d3lp);
}
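
/* Editorial note, not part of the original source: Z, g and dfhat computed here
 * are the reusable pieces of the hyperparameter gradients below. Z plays the
 * role of diag(sW)*inv(B)*diag(sW) (or -diag(W)*inv(I+K*diag(W)) in the
 * non-log-concave case), g is the derivative of log|B|/2 with respect to W, and
 * dfhat = g.*d3lp is the derivative of the approximate -log Z with respect to
 * the mode f_hat, which supplies the "implicit" term of each derivative. */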

SGVector<float64_t> CSingleLaplaceInferenceMethod::get_derivative_wrt_inference_method(
        const TParameter* param)
{
    REQUIRE(!strcmp(param->m_name, "log_scale"), "Can't compute derivative of "
        "the negative log marginal likelihood wrt %s.%s parameter\n",
        get_name(), param->m_name)

    // create eigen representation of K, Z, dfhat, dlp and alpha
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);
    Map<VectorXd> eigen_dlp(m_dlp.vector, m_dlp.vlen);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    SGVector<float64_t> result(1);

    // compute derivative K wrt scale
    // compute dnlZ=sum(sum(Z.*dK))/2-alpha'*dK*alpha/2
    result[0]=(eigen_Z.cwiseProduct(eigen_K)).sum()/2.0-
        (eigen_alpha.adjoint()*eigen_K).dot(eigen_alpha)/2.0;

    // compute b=dK*dlp
    VectorXd b=eigen_K*eigen_dlp;

    // compute dnlZ=dnlZ-dfhat'*(b-K*(Z*b))
    result[0]=result[0]-eigen_dfhat.dot(b-eigen_K*CMath::exp(m_log_scale*2.0)*(eigen_Z*b));
    result[0]*=CMath::exp(m_log_scale*2.0)*2.0;

    return result;
}

SGVector<float64_t> CSingleLaplaceInferenceMethod::get_derivative_wrt_likelihood_model(
        const TParameter* param)
{
    // create eigen representation of K, Z, g and dfhat
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_g(m_g.vector, m_g.vlen);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);

    // get derivatives wrt likelihood model parameters
    SGVector<float64_t> lp_dhyp=m_model->get_first_derivative(m_labels,
        m_mu, param);
    SGVector<float64_t> dlp_dhyp=m_model->get_second_derivative(m_labels,
        m_mu, param);
    SGVector<float64_t> d2lp_dhyp=m_model->get_third_derivative(m_labels,
        m_mu, param);

    // create eigen representation of the derivatives
    Map<VectorXd> eigen_lp_dhyp(lp_dhyp.vector, lp_dhyp.vlen);
    Map<VectorXd> eigen_dlp_dhyp(dlp_dhyp.vector, dlp_dhyp.vlen);
    Map<VectorXd> eigen_d2lp_dhyp(d2lp_dhyp.vector, d2lp_dhyp.vlen);

    SGVector<float64_t> result(1);

    // compute b vector
    VectorXd b=eigen_K*eigen_dlp_dhyp;

    // compute dnlZ=-g'*d2lp_dhyp-sum(lp_dhyp)-dfhat'*(b-K*(Z*b))
    result[0]=-eigen_g.dot(eigen_d2lp_dhyp)-eigen_lp_dhyp.sum()-
        eigen_dfhat.dot(b-eigen_K*CMath::exp(m_log_scale*2.0)*(eigen_Z*b));

    return result;
}

SGVector<float64_t> CSingleLaplaceInferenceMethod::get_derivative_wrt_kernel(
        const TParameter* param)
{
    // create eigen representation of K, Z, dfhat, dlp and alpha
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);
    Map<VectorXd> eigen_dlp(m_dlp.vector, m_dlp.vlen);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    REQUIRE(param, "Param not set\n");
    SGVector<float64_t> result;
    int64_t len=const_cast<TParameter *>(param)->m_datatype.get_num_elements();
    result=SGVector<float64_t>(len);

    for (index_t i=0; i<result.vlen; i++)
    {
        SGMatrix<float64_t> dK;

        if (result.vlen==1)
            dK=m_kernel->get_parameter_gradient(param);
        else
            dK=m_kernel->get_parameter_gradient(param, i);

        Map<MatrixXd> eigen_dK(dK.matrix, dK.num_rows, dK.num_cols);

        // compute dnlZ=sum(sum(Z.*dK))/2-alpha'*dK*alpha/2
        result[i]=(eigen_Z.cwiseProduct(eigen_dK)).sum()/2.0-
            (eigen_alpha.adjoint()*eigen_dK).dot(eigen_alpha)/2.0;

        // compute b=dK*dlp
        VectorXd b=eigen_dK*eigen_dlp;

        // compute dnlZ=dnlZ-dfhat'*(b-K*(Z*b))
        result[i]=result[i]-eigen_dfhat.dot(b-eigen_K*CMath::exp(m_log_scale*2.0)*
            (eigen_Z*b));
        result[i]*=CMath::exp(m_log_scale*2.0);
    }

    return result;
}

SGVector<float64_t> CSingleLaplaceInferenceMethod::get_derivative_wrt_mean(
        const TParameter* param)
{
    // create eigen representation of K, Z, dfhat and alpha
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);
    Map<MatrixXd> eigen_Z(m_Z.matrix, m_Z.num_rows, m_Z.num_cols);
    Map<VectorXd> eigen_dfhat(m_dfhat.vector, m_dfhat.vlen);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);

    REQUIRE(param, "Param not set\n");
    SGVector<float64_t> result;
    int64_t len=const_cast<TParameter *>(param)->m_datatype.get_num_elements();
    result=SGVector<float64_t>(len);

    for (index_t i=0; i<result.vlen; i++)
    {
        SGVector<float64_t> dmu;

        if (result.vlen==1)
            dmu=m_mean->get_parameter_derivative(m_features, param);
        else
            dmu=m_mean->get_parameter_derivative(m_features, param, i);

        Map<VectorXd> eigen_dmu(dmu.vector, dmu.vlen);

        // compute dnlZ=-alpha'*dm-dfhat'*(dm-K*(Z*dm))
        result[i]=-eigen_alpha.dot(eigen_dmu)-eigen_dfhat.dot(eigen_dmu-
            eigen_K*CMath::exp(m_log_scale*2.0)*(eigen_Z*eigen_dmu));
    }

    return result;
}

SGVector<float64_t> CSingleLaplaceInferenceMethod::get_posterior_mean()
{
    compute_gradient();

    SGVector<float64_t> res(m_mu.vlen);
    Map<VectorXd> eigen_res(res.vector, res.vlen);

    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);
    SGVector<float64_t> mean=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean(mean.vector, mean.vlen);
    eigen_res=eigen_mu-eigen_mean;

    return res;
}


float64_t CSingleLaplaceInferenceMethod::get_psi_wrt_alpha()
{
    Eigen::Map<Eigen::VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    SGVector<float64_t> f(m_alpha.vlen);
    Eigen::Map<Eigen::VectorXd> eigen_f(f.vector, f.vlen);
    Eigen::Map<Eigen::MatrixXd> kernel(m_ktrtr.matrix,
        m_ktrtr.num_rows,
        m_ktrtr.num_cols);
    Eigen::Map<Eigen::VectorXd> eigen_mean_f(m_mean_f.vector,
        m_mean_f.vlen);
    /* f = K * alpha + mean_f given alpha*/
    eigen_f
        = kernel * ((eigen_alpha) * CMath::exp(m_log_scale*2.0)) + eigen_mean_f;

    /* psi = 0.5 * alpha .* (f - m) - sum(lp)*/
    float64_t psi = eigen_alpha.dot(eigen_f - eigen_mean_f) * 0.5;
    psi -= SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels, f));
    return psi;
}

void CSingleLaplaceInferenceMethod::get_gradient_wrt_alpha(SGVector<float64_t> gradient)
{
    REQUIRE(gradient.vlen==m_alpha.vlen,
        "The length of gradients (%d) should be the same as the length of parameters (%d)\n",
        gradient.vlen, m_alpha.vlen);

    Eigen::Map<Eigen::VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    Eigen::Map<Eigen::VectorXd> eigen_gradient(gradient.vector, gradient.vlen);
    SGVector<float64_t> f(m_alpha.vlen);
    Eigen::Map<Eigen::VectorXd> eigen_f(f.vector, f.vlen);
    Eigen::Map<Eigen::MatrixXd> kernel(m_ktrtr.matrix,
        m_ktrtr.num_rows,
        m_ktrtr.num_cols);
    Eigen::Map<Eigen::VectorXd> eigen_mean_f(m_mean_f.vector,
        m_mean_f.vlen);

    /* f = K * alpha + mean_f given alpha*/
    eigen_f = kernel * ((eigen_alpha) * CMath::exp(m_log_scale*2.0)) + eigen_mean_f;

    SGVector<float64_t> dlp_f =
        m_model->get_log_probability_derivative_f(m_labels, f, 1);

    Eigen::Map<Eigen::VectorXd> eigen_dlp_f(dlp_f.vector, dlp_f.vlen);

    /* g_alpha = K * (alpha - dlp_f)*/
    eigen_gradient = kernel * ((eigen_alpha - eigen_dlp_f) * CMath::exp(m_log_scale*2.0));
}
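
/* Editorial note, not part of the original source: get_psi_wrt_alpha() and
 * get_gradient_wrt_alpha() expose the Newton objective psi(alpha) and its
 * gradient K*(alpha - dlp), so that any FirstOrderMinimizer registered through
 * register_minimizer() can be used in place of the built-in
 * CSingleLaplaceNewtonOptimizer (see SingleLaplaceInferenceMethodCostFunction). */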


}

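The following is a minimal usage sketch added by the editor; it is not part of this file. It assumes the standard Shogun 4.2 C++ API, so class names such as CGaussianKernel, CZeroMean, CLogitLikelihood, CBinaryLabels and CDenseFeatures (and their header paths) come from the rest of the toolbox and may need adjusting for your installation.

    // Editorial usage sketch (assumed Shogun 4.2 API, not part of the original file)
    #include <shogun/base/init.h>
    #include <shogun/io/SGIO.h>
    #include <shogun/features/DenseFeatures.h>
    #include <shogun/labels/BinaryLabels.h>
    #include <shogun/kernel/GaussianKernel.h>
    #include <shogun/machine/gp/ZeroMean.h>
    #include <shogun/machine/gp/LogitLikelihood.h>
    #include <shogun/machine/gp/SingleLaplaceInferenceMethod.h>

    using namespace shogun;

    int main()
    {
        init_shogun_with_defaults();

        // toy binary classification data: 2 features x 4 examples
        SGMatrix<float64_t> X(2, 4);
        SGVector<float64_t> y(4);
        X(0,0)=-1; X(1,0)=-1; y[0]=-1;
        X(0,1)=-2; X(1,1)=-1; y[1]=-1;
        X(0,2)=1;  X(1,2)=1;  y[2]=1;
        X(0,3)=2;  X(1,3)=1;  y[3]=1;

        CDenseFeatures<float64_t>* feats=new CDenseFeatures<float64_t>(X);
        CBinaryLabels* labels=new CBinaryLabels(y);
        CGaussianKernel* kernel=new CGaussianKernel(10, 2.0);
        CZeroMean* mean=new CZeroMean();
        CLogitLikelihood* lik=new CLogitLikelihood();

        // Laplace approximation of the GP posterior and its marginal likelihood
        CSingleLaplaceInferenceMethod* inf=new CSingleLaplaceInferenceMethod(
            kernel, feats, mean, labels, lik);
        SG_REF(inf);

        float64_t nlZ=inf->get_negative_log_marginal_likelihood();
        SG_SPRINT("negative log marginal likelihood: %f\n", nlZ);

        SG_UNREF(inf);
        exit_shogun();
        return 0;
    }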