MultiLaplaceInferenceMethod.cpp
/*
 * Copyright (c) The Shogun Machine Learning Toolbox
 * Written (w) 2014 Wu Lin
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 * list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * The views and conclusions contained in the software and documentation are those
 * of the authors and should not be interpreted as representing official policies,
 * either expressed or implied, of the Shogun Development Team.
 *
 *
 * Code adapted from
 * https://gist.github.com/yorkerlin/14ace49f2278f3859614
 * Gaussian Process Machine Learning Toolbox
 * http://www.gaussianprocess.org/gpml/code/matlab/doc/
 * and
 * GPstuff - Gaussian process models for Bayesian analysis
 * http://becs.aalto.fi/en/research/bayes/gpstuff/
 *
 * The reference pseudo code is Algorithm 3.3 of the GPML textbook
 */

#include <shogun/machine/gp/MultiLaplaceInferenceMethod.h>

#include <shogun/machine/gp/SoftMaxLikelihood.h>
#include <shogun/mathematics/Math.h>
#include <shogun/labels/MulticlassLabels.h>
#include <shogun/lib/external/brent.h>

using namespace shogun;
using namespace Eigen;

namespace shogun
{

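// CMultiPsiLine evaluates the objective Psi(alpha + x*dalpha) as a function
// of the step size x, so that Brent's minimizer (local_min() from
// lib/external/brent.h) can run the line search inside update_alpha(); a
// sketch of the call it serves:
//
//   CMultiPsiLine func;            // K, dalpha, start_alpha, ... filled in
//   float64_t x;
//   float64_t psi=local_min(0, m_opt_max, m_opt_tolerance, func, x);
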
#ifndef DOXYGEN_SHOULD_SKIP_THIS

/** Wrapper class used for the Brent minimizer */
class CMultiPsiLine : public func_base
{
public:
    float64_t log_scale;
    MatrixXd K;
    VectorXd dalpha;
    VectorXd start_alpha;
    Map<VectorXd>* alpha;
    SGVector<float64_t>* dlp;
    SGVector<float64_t>* f;
    SGVector<float64_t>* m;
    CLikelihoodModel* lik;
    CLabels* lab;

    virtual double operator() (double x)
    {
        const index_t C=((CMulticlassLabels*)lab)->get_num_classes();
        const index_t n=((CMulticlassLabels*)lab)->get_num_labels();
        Map<VectorXd> eigen_f(f->vector, f->vlen);
        Map<VectorXd> eigen_m(m->vector, m->vlen);

        // compute alpha=alpha+x*dalpha and f=K*alpha+m
        (*alpha)=start_alpha+x*dalpha;

        float64_t result=0;
        for(index_t bl=0; bl<C; bl++)
        {
            eigen_f.block(bl*n,0,n,1)=K*alpha->block(bl*n,0,n,1)*CMath::exp(log_scale*2.0);
            result+=alpha->block(bl*n,0,n,1).dot(eigen_f.block(bl*n,0,n,1))/2.0;
            eigen_f.block(bl*n,0,n,1)+=eigen_m;
        }

        // get first derivative of log likelihood
        (*dlp)=lik->get_log_probability_derivative_f(lab, (*f), 1);

        result-=SGVector<float64_t>::sum(lik->get_log_probability_f(lab, *f));

        return result;
    }
};

#endif /* DOXYGEN_SHOULD_SKIP_THIS */

CMultiLaplaceInferenceMethod::CMultiLaplaceInferenceMethod() : CLaplaceInference()
{
    init();
}

CMultiLaplaceInferenceMethod::CMultiLaplaceInferenceMethod(CKernel* kern,
        CFeatures* feat, CMeanFunction* m, CLabels* lab, CLikelihoodModel* mod)
        : CLaplaceInference(kern, feat, m, lab, mod)
{
    init();
}
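
// A minimal usage sketch (the companion classes here are assumptions:
// CGaussianKernel, CZeroMean, CSoftMaxLikelihood and
// CGaussianProcessClassification from the surrounding toolbox):
//
//   CZeroMean* mean=new CZeroMean();
//   CSoftMaxLikelihood* lik=new CSoftMaxLikelihood();
//   CMultiLaplaceInferenceMethod* inf=new CMultiLaplaceInferenceMethod(
//       new CGaussianKernel(10, 2.0), feats, mean, labels, lik);
//   CGaussianProcessClassification* gpc=new CGaussianProcessClassification(inf);
//   gpc->train();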

void CMultiLaplaceInferenceMethod::init()
{
    m_iter=20;
    m_tolerance=1e-6;
    m_opt_tolerance=1e-10;
    m_opt_max=10;

    m_nlz=0;
    SG_ADD(&m_nlz, "nlz", "negative log marginal likelihood", MS_NOT_AVAILABLE);
    SG_ADD(&m_U, "U", "the matrix used to compute gradient wrt hyperparameters", MS_NOT_AVAILABLE);

    SG_ADD(&m_tolerance, "tolerance", "amount of tolerance for Newton's iterations", MS_NOT_AVAILABLE);
    SG_ADD(&m_iter, "iter", "max Newton's iterations", MS_NOT_AVAILABLE);
    SG_ADD(&m_opt_tolerance, "opt_tolerance", "amount of tolerance for Brent's minimization method", MS_NOT_AVAILABLE);
    SG_ADD(&m_opt_max, "opt_max", "max iterations for Brent's minimization method", MS_NOT_AVAILABLE);
}

CMultiLaplaceInferenceMethod::~CMultiLaplaceInferenceMethod()
{
}

void CMultiLaplaceInferenceMethod::check_members() const
{
    CInference::check_members();

    REQUIRE(m_labels->get_label_type()==LT_MULTICLASS,
        "Labels must be type of CMulticlassLabels\n");
    REQUIRE(m_model->supports_multiclass(),
        "likelihood model should support multi-classification\n");
}

SGVector<float64_t> CMultiLaplaceInferenceMethod::get_diagonal_vector()
{
    if (parameter_hash_changed())
        update();

    get_dpi_helper();

    return SGVector<float64_t>(m_W);
}

float64_t CMultiLaplaceInferenceMethod::get_negative_log_marginal_likelihood()
{
    if (parameter_hash_changed())
        update();

    return m_nlz;
}

SGVector<float64_t> CMultiLaplaceInferenceMethod::get_derivative_wrt_likelihood_model(
    const TParameter* param)
{
    //SoftMax likelihood does not have this kind of derivative
    SG_ERROR("Not Implemented!\n");
    return SGVector<float64_t> ();
}

CMultiLaplaceInferenceMethod* CMultiLaplaceInferenceMethod::obtain_from_generic(
    CInference* inference)
{
    if (inference==NULL)
        return NULL;

    if (inference->get_inference_type()!=INF_LAPLACE_MULTIPLE)
        SG_SERROR("Provided inference is not of type CMultiLaplaceInferenceMethod!\n")

    SG_REF(inference);
    return (CMultiLaplaceInferenceMethod*)inference;
}
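// Sketch of the algebra behind update_approx_cov(), expanding the comment
// inside it: with the per-class factors E_c and the Cholesky factor M
// (M'*M = sum_c E_c) left behind by update_alpha(), and K_s = exp(2*log_scale)*K,
//
//   Sigma = K_s - K_s*(E - E*R*(M'*M)^{-1}*R'*E)*K_s,
//
// where R stacks C identity blocks. The loop accumulates the block-diagonal
// terms (I - K_s*E_c)*K_s, and the final triangular solve adds the low-rank
// correction V'*V with V = M^{-T}*U', U_c = K_s*E_c.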
void CMultiLaplaceInferenceMethod::update_approx_cov()
{
    //Sigma=K-K*(E-E*R(M*M')^{-1}*R'*E)*K
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();
    const index_t n=m_labels->get_num_labels();
    Map<MatrixXd> eigen_M(m_L.matrix, m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_E(m_E.matrix, m_E.num_rows, m_E.num_cols);
    Map<MatrixXd> eigen_K(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    m_Sigma=SGMatrix<float64_t>(C*n, C*n);
    Map<MatrixXd> eigen_Sigma(m_Sigma.matrix, m_Sigma.num_rows, m_Sigma.num_cols);
    eigen_Sigma.fill(0);

    MatrixXd eigen_U(C*n,n);
    for(index_t bl=0; bl<C; bl++)
    {
        eigen_U.block(bl*n,0,n,n)=eigen_K*CMath::exp(m_log_scale*2.0)*eigen_E.block(0,bl*n,n,n);
        eigen_Sigma.block(bl*n,bl*n,n,n)=(MatrixXd::Identity(n,n)-eigen_U.block(bl*n,0,n,n))*(eigen_K*CMath::exp(m_log_scale*2.0));
    }
    MatrixXd eigen_V=eigen_M.triangularView<Upper>().adjoint().solve(eigen_U.transpose());
    eigen_Sigma+=eigen_V.transpose()*eigen_V;
}

void CMultiLaplaceInferenceMethod::update_chol()
{
}

void CMultiLaplaceInferenceMethod::get_dpi_helper()
{
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();
    const index_t n=m_labels->get_num_labels();
    Map<VectorXd> eigen_dpi(m_W.vector, m_W.vlen);
    Map<MatrixXd> eigen_dpi_matrix(eigen_dpi.data(),n,C);

    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);
    Map<MatrixXd> eigen_mu_matrix(eigen_mu.data(),n,C);
    // with log_sum_exp trick
    VectorXd max_coeff=eigen_mu_matrix.rowwise().maxCoeff();
    eigen_dpi_matrix=eigen_mu_matrix.array().colwise()-max_coeff.array();
    VectorXd log_sum_exp=((eigen_dpi_matrix.array().exp()).rowwise().sum()).array().log();
    eigen_dpi_matrix=(eigen_dpi_matrix.array().colwise()-log_sum_exp.array()).exp();

    // without log_sum_exp trick
    //eigen_dpi_matrix=eigen_mu_matrix.array().exp();
    //VectorXd tmp_for_dpi=eigen_dpi_matrix.rowwise().sum();
    //eigen_dpi_matrix=eigen_dpi_matrix.array().colwise()/tmp_for_dpi.array();
}
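
// Worked example of the log_sum_exp trick above (illustrative numbers, not
// from the code): for one sample with latent row f = (1000, 1001),
// exp(1000) overflows a double, but with max_coeff = 1001,
//
//   pi_c = exp(f_c - 1001 - log(exp(-1) + exp(0)))
//
// yields pi = (0.269, 0.731) with every exponent kept in a safe range.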
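// update_alpha() is the Newton loop of Algorithm 3.3 in the GPML textbook.
// A sketch of the mapping, in that notation: pi is the softmax output,
// W = diag(pi) - Pi*Pi' the likelihood Hessian, and per class block
//
//   B_c = I + sD_c*K_s*sD_c,  sD_c = diag(sqrt(pi_c)),
//   E_c = sD_c*B_c^{-1}*sD_c,  M'*M = sum_c E_c  (M upper triangular),
//
// so the Newton direction follows the matrix inversion lemma:
//
//   b = W*(f - m) + dlp,  c = E*K_s*b,
//   dalpha = b - c + E'*(M'*M)^{-1}*(R'*c) - alpha,
//
// with the step size then chosen by Brent's method on Psi (CMultiPsiLine).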
void CMultiLaplaceInferenceMethod::update_alpha()
{
    float64_t Psi_Old = CMath::INFTY;
    float64_t Psi_New;
    float64_t Psi_Def;
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();
    const index_t n=m_labels->get_num_labels();

    // get mean vector and create eigen representation of it
    SGVector<float64_t> mean=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean_bl(mean.vector, mean.vlen);
    VectorXd eigen_mean=eigen_mean_bl.replicate(C,1);

    // create eigen representation of kernel matrix
    Map<MatrixXd> eigen_ktrtr(m_ktrtr.matrix, m_ktrtr.num_rows, m_ktrtr.num_cols);

    // create shogun and eigen representation of function vector
    m_mu=SGVector<float64_t>(mean.vlen*C);
    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);

    // f = mean as default value
    eigen_mu=eigen_mean;

    Psi_Def=-SGVector<float64_t>::sum(m_model->get_log_probability_f(
        m_labels, m_mu));

    if (m_alpha.vlen!=C*n)
    {
        // set alpha to a zero vector
        m_alpha=SGVector<float64_t>(C*n);
        m_alpha.zero();
        Psi_New=Psi_Def;
        m_E=SGMatrix<float64_t>(n,C*n);
        m_L=SGMatrix<float64_t>(n,n);
        m_W=SGVector<float64_t>(C*n);
    }
    else
    {
        Map<VectorXd> alpha(m_alpha.vector, m_alpha.vlen);
        for(index_t bl=0; bl<C; bl++)
            eigen_mu.block(bl*n,0,n,1)=eigen_ktrtr*CMath::exp(m_log_scale*2.0)*alpha.block(bl*n,0,n,1);

        //alpha'*(f-m)/2.0
        Psi_New=alpha.dot(eigen_mu)/2.0;
        // compute f = K * alpha + m
        eigen_mu+=eigen_mean;

        Psi_New-=SGVector<float64_t>::sum(m_model->get_log_probability_f(m_labels, m_mu));

        // if default is better, then use it
        if (Psi_Def < Psi_New)
        {
            m_alpha.zero();
            eigen_mu=eigen_mean;
            Psi_New=Psi_Def;
        }
    }

    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    Map<VectorXd> eigen_W(m_W.vector, m_W.vlen);
    Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_E(m_E.matrix, m_E.num_rows, m_E.num_cols);

    // get first derivative of log probability function
    m_dlp=m_model->get_log_probability_derivative_f(m_labels, m_mu, 1);

    index_t iter=0;
    Map<MatrixXd> & eigen_M=eigen_L;

    while (Psi_Old-Psi_New>m_tolerance && iter<m_iter)
    {
        Map<VectorXd> eigen_dlp(m_dlp.vector, m_dlp.vlen);

        get_dpi_helper();
        Map<VectorXd> eigen_dpi(m_W.vector, m_W.vlen);

        Psi_Old = Psi_New;
        iter++;

        m_nlz=0;

        for(index_t bl=0; bl<C; bl++)
        {
            VectorXd eigen_sD=eigen_dpi.block(bl*n,0,n,1).cwiseSqrt();
            LLT<MatrixXd> chol_tmp((eigen_sD*eigen_sD.transpose()).cwiseProduct(eigen_ktrtr*CMath::exp(m_log_scale*2.0))+
                MatrixXd::Identity(m_ktrtr.num_rows, m_ktrtr.num_cols));
            MatrixXd eigen_L_tmp=chol_tmp.matrixU();
            MatrixXd eigen_E_bl=eigen_L_tmp.triangularView<Upper>().adjoint().solve(MatrixXd(eigen_sD.asDiagonal()));
            eigen_E_bl=eigen_E_bl.transpose()*eigen_E_bl;
            eigen_E.block(0,bl*n,n,n)=eigen_E_bl;
            if (bl==0)
                eigen_M=eigen_E_bl;
            else
                eigen_M+=eigen_E_bl;
            m_nlz+=eigen_L_tmp.diagonal().array().log().sum();
        }

        LLT<MatrixXd> chol_tmp(eigen_M);
        eigen_M = chol_tmp.matrixU();
        m_nlz+=eigen_M.diagonal().array().log().sum();

        VectorXd eigen_b=eigen_dlp;
        Map<VectorXd> & tmp1=eigen_dlp;
        tmp1=eigen_dpi.array()*(eigen_mu-eigen_mean).array();
        Map<MatrixXd> m_tmp(tmp1.data(),n,C);
        VectorXd tmp2=m_tmp.array().rowwise().sum();

        for(index_t bl=0; bl<C; bl++)
            eigen_b.block(bl*n,0,n,1)+=eigen_dpi.block(bl*n,0,n,1).cwiseProduct(eigen_mu.block(bl*n,0,n,1)-eigen_mean_bl-tmp2);

        Map<VectorXd> &eigen_c=eigen_W;
        for(index_t bl=0; bl<C; bl++)
            eigen_c.block(bl*n,0,n,1)=eigen_E.block(0,bl*n,n,n)*(eigen_ktrtr*CMath::exp(m_log_scale*2.0)*eigen_b.block(bl*n,0,n,1));

        Map<MatrixXd> c_tmp(eigen_c.data(),n,C);

        VectorXd tmp3=c_tmp.array().rowwise().sum();
        VectorXd tmp4=eigen_M.triangularView<Upper>().adjoint().solve(tmp3);

        VectorXd &eigen_dalpha=eigen_b;
        eigen_dalpha+=eigen_E.transpose()*(eigen_M.triangularView<Upper>().solve(tmp4))-eigen_c-eigen_alpha;

        // perform Brent's optimization
        CMultiPsiLine func;

        func.log_scale=m_log_scale;
        func.K=eigen_ktrtr;
        func.dalpha=eigen_dalpha;
        func.start_alpha=eigen_alpha;
        func.alpha=&eigen_alpha;
        func.dlp=&m_dlp;
        func.f=&m_mu;
        func.m=&mean;
        func.lik=m_model;
        func.lab=m_labels;

        float64_t x;
        Psi_New=local_min(0, m_opt_max, m_opt_tolerance, func, x);
        m_nlz+=Psi_New;
    }

    if (Psi_Old-Psi_New>m_tolerance && iter>=m_iter)
    {
        SG_WARNING("Max iterations (%d) reached, but convergence level (%f) is not yet below tolerance (%f)\n", m_iter, Psi_Old-Psi_New, m_tolerance);
    }
}

void CMultiLaplaceInferenceMethod::update_deriv()
{
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();
    const index_t n=m_labels->get_num_labels();
    m_U=SGMatrix<float64_t>(n, n*C);
    Map<MatrixXd> eigen_U(m_U.matrix, m_U.num_rows, m_U.num_cols);
    Map<MatrixXd> eigen_M(m_L.matrix, m_L.num_rows, m_L.num_cols);
    Map<MatrixXd> eigen_E(m_E.matrix, m_E.num_rows, m_E.num_cols);
    eigen_U=eigen_M.triangularView<Upper>().adjoint().solve(eigen_E);
}

float64_t CMultiLaplaceInferenceMethod::get_derivative_helper(SGMatrix<float64_t> dK)
{
    Map<MatrixXd> eigen_dK(dK.matrix, dK.num_rows, dK.num_cols);
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();
    const index_t n=m_labels->get_num_labels();
    Map<MatrixXd> eigen_U(m_U.matrix, m_U.num_rows, m_U.num_cols);
    Map<MatrixXd> eigen_E(m_E.matrix, m_E.num_rows, m_E.num_cols);
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    float64_t result=0;
    //currently only the explicit term is computed
    for(index_t bl=0; bl<C; bl++)
    {
        result+=((eigen_E.block(0,bl*n,n,n)-eigen_U.block(0,bl*n,n,n).transpose()*eigen_U.block(0,bl*n,n,n)).array()
            *eigen_dK.array()).sum();
        result-=(eigen_dK*eigen_alpha.block(bl*n,0,n,1)).dot(eigen_alpha.block(bl*n,0,n,1));
    }

    return result/2.0;
}
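
// Sketch of the identity used above (the explicit term of the marginal
// likelihood gradient, cf. GPML eq. 5.9): for a kernel direction dK,
//
//   dnlZ = sum_c [ sum((E_c - U_c'*U_c) .* dK) - alpha_c'*dK*alpha_c ] / 2,
//
// where U = M^{-T}*E comes from update_deriv(), so E_c - U_c'*U_c plays the
// role that W^{1/2}*B^{-1}*W^{1/2} plays in the single-class Laplace case.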

SGVector<float64_t> CMultiLaplaceInferenceMethod::get_derivative_wrt_inference_method(
    const TParameter* param)
{
    REQUIRE(!strcmp(param->m_name, "log_scale"), "Can't compute derivative of "
        "the negative log marginal likelihood wrt %s.%s parameter\n",
        get_name(), param->m_name)

    SGVector<float64_t> result(1);

    // compute derivative K wrt scale

    result[0]=get_derivative_helper(m_ktrtr);
    result[0]*=CMath::exp(m_log_scale*2.0)*2.0;

    return result;
}
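
// The factor exp(m_log_scale*2.0)*2.0 applied above is the chain rule for
// the scale parameter: the kernel always enters as K_s = exp(2*log_scale)*K,
// hence dK_s/d(log_scale) = 2*exp(2*log_scale)*K, while
// get_derivative_helper() is called with the unscaled m_ktrtr.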

SGVector<float64_t> CMultiLaplaceInferenceMethod::get_derivative_wrt_kernel(
    const TParameter* param)
{
    // compute derivative of K wrt each element of the kernel parameter
    REQUIRE(param, "Param not set\n");
    SGVector<float64_t> result;
    int64_t len=const_cast<TParameter *>(param)->m_datatype.get_num_elements();
    result=SGVector<float64_t>(len);

    for (index_t i=0; i<result.vlen; i++)
    {
        SGMatrix<float64_t> dK;

        if (result.vlen==1)
            dK=m_kernel->get_parameter_gradient(param);
        else
            dK=m_kernel->get_parameter_gradient(param, i);

        result[i]=get_derivative_helper(dK);
        result[i]*=CMath::exp(m_log_scale*2.0);
    }

    return result;
}

SGVector<float64_t> CMultiLaplaceInferenceMethod::get_derivative_wrt_mean(
    const TParameter* param)
{
    // create eigen representation of alpha
    Map<VectorXd> eigen_alpha(m_alpha.vector, m_alpha.vlen);
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();
    const index_t n=m_labels->get_num_labels();

    REQUIRE(param, "Param not set\n");
    SGVector<float64_t> result;
    int64_t len=const_cast<TParameter *>(param)->m_datatype.get_num_elements();
    result=SGVector<float64_t>(len);

    for (index_t i=0; i<result.vlen; i++)
    {
        SGVector<float64_t> dmu;

        if (result.vlen==1)
            dmu=m_mean->get_parameter_derivative(m_features, param);
        else
            dmu=m_mean->get_parameter_derivative(m_features, param, i);

        Map<VectorXd> eigen_dmu(dmu.vector, dmu.vlen);

        result[i]=0;
        //currently only compute the explicit term
        for(index_t bl=0; bl<C; bl++)
            result[i]-=eigen_alpha.block(bl*n,0,n,1).dot(eigen_dmu);
    }

    return result;
}
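
// The loop above is the explicit term of the mean gradient: at the mode,
// dnlZ/dm = -K_s^{-1}*(f_hat - m) = -alpha, so for a mean shared across the
// C latent functions dnlZ/dtheta = -sum_c alpha_c'*(dm/dtheta).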

SGVector<float64_t> CMultiLaplaceInferenceMethod::get_posterior_mean()
{
    compute_gradient();

    SGVector<float64_t> res(m_mu.vlen);
    Map<VectorXd> eigen_res(res.vector, res.vlen);
    const index_t C=((CMulticlassLabels*)m_labels)->get_num_classes();

    SGVector<float64_t> mean=m_mean->get_mean_vector(m_features);
    Map<VectorXd> eigen_mean_bl(mean.vector, mean.vlen);
    VectorXd eigen_mean=eigen_mean_bl.replicate(C,1);

    Map<VectorXd> eigen_mu(m_mu, m_mu.vlen);
    eigen_res=eigen_mu-eigen_mean;

    return res;
}
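
// Note: at convergence f_hat = K_s*alpha + m, so the centered vector
// returned here equals K_s*alpha; together with the covariance from
// update_approx_cov() it defines the approximate Gaussian posterior used
// for prediction.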

}