en/latest/KLLowerTriangularInference_8cpp_source.html

  /*

  * Copyright (c) The Shogun Machine Learning Toolbox

  * Written (w) 2014 Wu Lin

  * All rights reserved.

  *

  * Redistribution and use in source and binary forms, with or without

  * modification, are permitted provided that the following conditions are met:

  *

  * 1. Redistributions of source code must retain the above copyright notice, this

  *    list of conditions and the following disclaimer.

  * 2. Redistributions in binary form must reproduce the above copyright notice,

  *    this list of conditions and the following disclaimer in the documentation

  *    and/or other materials provided with the distribution.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR

  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  *

  * The views and conclusions contained in the software and documentation are those

  * of the authors and should not be interpreted as representing official policies,

  * either expressed or implied, of the Shogun Development Team.

  *

  * Code adapted from

  * http://hannes.nickisch.org/code/approxXX.tar.gz

  * and Gaussian Process Machine Learning Toolbox

  * http://www.gaussianprocess.org/gpml/code/matlab/doc/

  * and the reference paper is

  * Challis, Edward, and David Barber.

  * "Concave Gaussian variational approximations for inference in large-scale Bayesian linear models."

  * International conference on Artificial Intelligence and Statistics. 2011.

  *

  * This code is specifically adapted from functions in approxKL.m and infKL.m

  */


 #include <shogun/machine/gp/KLLowerTriangularInference.h>


 #include <shogun/mathematics/eigen3.h>

 #include <shogun/mathematics/Math.h>

 #include <shogun/mathematics/Statistics.h>


 using namespace Eigen;


 namespace shogun

 {


 /** Default constructor.
  *
  * Default-constructs the CKLInference base and then calls init().
  */
 CKLLowerTriangularInference::CKLLowerTriangularInference()
     : CKLInference()
 {
     init();
 }


 /** Constructor taking the model components.
  *
  * All five arguments are forwarded unchanged to the CKLInference
  * constructor; afterwards init() is called.
  *
  * @param kern kernel object handed to the base class
  * @param feat features object handed to the base class
  * @param m mean function handed to the base class
  * @param lab labels object handed to the base class
  * @param mod likelihood model handed to the base class
  */
 CKLLowerTriangularInference::CKLLowerTriangularInference(
         CKernel* kern, CFeatures* feat, CMeanFunction* m,
         CLabels* lab, CLikelihoodModel* mod)
     : CKLInference(kern, feat, m, lab, mod)
 {
     init();
 }


 /** Shared initialisation used by both constructors.
  *
  * Registers the members of this class through SG_ADD (every registration
  * passes MS_NOT_AVAILABLE) and sets m_log_det_Kernel to zero.
  */
 void CKLLowerTriangularInference::init()
 {
     SG_ADD(&m_InvK_Sigma, "invk_Sigma", "K^{-1}Sigma'", MS_NOT_AVAILABLE);
     SG_ADD(&m_mean_vec, "mean_vec",
         "The mean vector generated from mean function", MS_NOT_AVAILABLE);
     SG_ADD(&m_log_det_Kernel, "log_det_kernel",
         "The Log-determinant of Kernel", MS_NOT_AVAILABLE);

     // quantities cached from the LDLT factorization
     SG_ADD(&m_Kernel_LsD, "L_sqrt_D",
         "The L*sqrt(D) matrix, where L and D are defined in LDLT factorization on Kernel*sq(m_scale)",
         MS_NOT_AVAILABLE);
     SG_ADD(&m_Kernel_P, "Permutation_P",
         "The permutation sequence of P, where P are defined in LDLT factorization on Kernel*sq(m_scale)",
         MS_NOT_AVAILABLE);

     m_log_det_Kernel=0;
 }


 /** Destructor. The body is empty; no explicit cleanup is performed here. */
 CKLLowerTriangularInference::~CKLLowerTriangularInference()
 {
     // nothing to release explicitly
 }


 /** Returns a default-constructed vector; this implementation computes
  * nothing.
  *
  * @return a default-constructed SGVector<float64_t>
  */
 SGVector<float64_t> CKLLowerTriangularInference::get_diagonal_vector()
 {
     SGVector<float64_t> empty_diagonal;
     return empty_diagonal;
 }


 /** Derivative update hook. This implementation does nothing. */
 void CKLLowerTriangularInference::update_deriv()
 {
     // no work is done in this class
 }


 void CKLLowerTriangularInference::update_init()

 {

     Eigen::LDLT<Eigen::MatrixXd> ldlt=update_init_helper();

     MatrixXd Kernel_D=ldlt.vectorD();

     MatrixXd Kernel_L=ldlt.matrixL();

     m_Kernel_LsD=SGMatrix<float64_t>(m_ktrtr.num_rows, m_ktrtr.num_cols);

     m_Kernel_LsD.zero();

     Map<MatrixXd> eigen_Kernel_LsD(m_Kernel_LsD.matrix, m_Kernel_LsD.num_rows, m_Kernel_LsD.num_cols);

     eigen_Kernel_LsD.triangularView<Lower>()=Kernel_L*Kernel_D.array().sqrt().matrix().asDiagonal();

     m_log_det_Kernel=2.0*eigen_Kernel_LsD.diagonal().array().abs().log().sum();


     m_Kernel_P=SGVector<index_t>(m_ktrtr.num_rows);

     for (index_t i=0; i<m_Kernel_P.vlen; i++)

         m_Kernel_P[i]=i;

     Map<VectorXi> eigen_Kernel_P(m_Kernel_P.vector, m_Kernel_P.vlen);

     eigen_Kernel_P=ldlt.transpositionsP()*eigen_Kernel_P;


     m_mean_vec=m_mean->get_mean_vector(m_features);

 }


 /** Solves (P'LDL'P) \ eigen_A using the cached factor m_Kernel_LsD
  * (L*sqrt(D)) and the cached permutation sequence m_Kernel_P.
  *
  * The permutation matrix P is rebuilt from m_Kernel_P, then the system is
  * solved with one lower-triangular solve and one solve against the
  * transposed factor:
  *   result = P' * (LsD' \ (LsD \ (P * eigen_A)))
  *
  * @param eigen_A right-hand side matrix
  * @return the solution matrix described above
  */
 MatrixXd CKLLowerTriangularInference::solve_inverse(MatrixXd eigen_A)
 {
     Map<MatrixXd> eigen_Kernel_LsD(m_Kernel_LsD.matrix, m_Kernel_LsD.num_rows, m_Kernel_LsD.num_cols);

     //re-construct the Permutation Matrix
     PermutationMatrix<Dynamic> P(m_Kernel_P.vlen);
     P.setIdentity();

     // the loop below overwrites its input, so work on a copy and leave
     // the stored sequence untouched
     SGVector<index_t> tmp=m_Kernel_P.clone();
     for (index_t i=0; i<tmp.vlen; i++)
     {
         // follow the cycle through position i: each pass records the
         // transposition (i, tmp[i]) in P and moves the value tmp[i] to
         // its own index, until tmp[i] is no longer greater than i
         while(tmp[i]>i)
         {
             P.applyTranspositionOnTheLeft(i,tmp[i]);
             index_t idx=tmp[i];
             tmp[i]=tmp[idx];
             tmp[idx]=idx;
         }
     }
     P=P.transpose();

     //(P'LDL'P)\eigen_A
     MatrixXd tmp1=P*eigen_A;
     MatrixXd tmp2=eigen_Kernel_LsD.triangularView<Lower>().solve(tmp1);
     MatrixXd tmp3=eigen_Kernel_LsD.triangularView<Lower>().transpose().solve(tmp2);
     return P.transpose()*tmp3;
 }


 /** Evaluates
  *   0.5*sum(sum(dK.*(K\((eye(n)-(invK_V+alpha*m'))')),2),1)
  * where invK_V is m_InvK_Sigma, alpha is m_alpha, m is m_mu and the solve
  * against K is delegated to solve_inverse().
  *
  * @param dK matrix multiplied element-wise with the solved term
  * @return half the sum of all entries of that element-wise product
  */
 float64_t CKLLowerTriangularInference::get_derivative_related_cov(SGMatrix<float64_t> dK)
 {
     const index_t len=m_mu.vlen;
     Map<VectorXd> eigen_mu(m_mu.vector, len);
     // m_alpha is mapped with the length of m_mu, i.e. only its first
     // m_mu.vlen entries are used here
     // NOTE(review): presumably m_alpha may hold extra entries -- confirm
     Map<VectorXd> eigen_alpha(m_alpha.vector, len);
     Map<MatrixXd> eigen_InvK_Sigma(m_InvK_Sigma.matrix, m_InvK_Sigma.num_rows, m_InvK_Sigma.num_cols);
     Map<MatrixXd> eigen_dK(dK.matrix, dK.num_rows, dK.num_cols);

     //dnlZ(j)=0.5*sum(sum(dK.*(K\((eye(n)- (invK_V+alpha*m'))')),2),1);
     MatrixXd invK_V_plus_outer=eigen_InvK_Sigma+eigen_alpha*(eigen_mu.transpose());
     MatrixXd rhs=(MatrixXd::Identity(m_ktrtr.num_rows,m_ktrtr.num_cols)-invK_V_plus_outer).transpose();
     MatrixXd solved=solve_inverse(rhs);

     return 0.5*(solved.array()*eigen_dK.array()).sum();
 }


 /** Approximate-covariance update hook. This implementation does nothing. */
 void CKLLowerTriangularInference::update_approx_cov()
 {
     // no work is done in this class
 }


 void CKLLowerTriangularInference::update_chol()

 {

     update_Sigma();

     update_InvK_Sigma();


     m_L=SGMatrix<float64_t>(m_ktrtr.num_rows, m_ktrtr.num_cols);

     Map<MatrixXd> eigen_L(m_L.matrix, m_L.num_rows, m_L.num_cols);

     Map<MatrixXd> eigen_InvK_Sigma(m_InvK_Sigma.matrix, m_InvK_Sigma.num_rows, m_InvK_Sigma.num_cols);

     MatrixXd tmp2=(eigen_InvK_Sigma-MatrixXd::Identity(m_ktrtr.num_rows,m_ktrtr.num_cols)).transpose();


     eigen_L=solve_inverse(tmp2);

 }


 } /* namespace shogun */


shogun::CKLLowerTriangularInference::m_Kernel_LsD
SGMatrix< float64_t > m_Kernel_LsD
Definition: KLLowerTriangularInference.h:136

shogun::CKLLowerTriangularInference::~CKLLowerTriangularInference
virtual ~CKLLowerTriangularInference()
Definition: KLLowerTriangularInference.cpp:86

Math.h

shogun::CKLLowerTriangularInference::update_deriv
virtual void update_deriv()
Definition: KLLowerTriangularInference.cpp:98

shogun::CKLLowerTriangularInference::m_mean_vec
SGVector< float64_t > m_mean_vec
Definition: KLLowerTriangularInference.h:130

shogun::SGMatrix::matrix
T * matrix
Definition: SGMatrix.h:372

index_t
int32_t index_t
Definition: common.h:62

shogun::CLabels
The class Labels models labels, i.e. class assignments of objects.
Definition: Labels.h:43

eigen3.h

Eigen::Map
Definition: SGMatrix.h:24

Eigen
Definition: SGMatrix.h:20

Statistics.h

shogun::SGMatrix::num_cols
index_t num_cols
Definition: SGMatrix.h:376

shogun::CMeanFunction::get_mean_vector
virtual SGVector< float64_t > get_mean_vector(const CFeatures *features) const =0

shogun::CMeanFunction
An abstract class of the mean function.
Definition: MeanFunction.h:49

shogun::CKLLowerTriangularInference::update_InvK_Sigma
virtual void update_InvK_Sigma()=0

shogun::SGMatrix::zero
void zero()
Definition: SGMatrix.cpp:136

shogun::SGMatrix::num_rows
index_t num_rows
Definition: SGMatrix.h:374

shogun::CKLInference::update_init_helper
virtual Eigen::LDLT< Eigen::MatrixXd, 0x1 > update_init_helper()
Definition: KLInference.cpp:229

shogun::SGMatrix< float64_t >

shogun::CInference::m_features
CFeatures * m_features
Definition: Inference.h:478

shogun::MS_NOT_AVAILABLE
Definition: SGObject.h:92

shogun::CInference::m_ktrtr
SGMatrix< float64_t > m_ktrtr
Definition: Inference.h:493

shogun::CKLLowerTriangularInference::get_derivative_related_cov
virtual float64_t get_derivative_related_cov(SGMatrix< float64_t > dK)
Definition: KLLowerTriangularInference.cpp:152

shogun::CInference::m_mean
CMeanFunction * m_mean
Definition: Inference.h:472

shogun::SGVector::vlen
index_t vlen
Definition: SGVector.h:494

shogun::SGVector::vector
T * vector
Definition: SGVector.h:492

shogun::CKLInference
The KL approximation inference method class.
Definition: KLInference.h:75

KLLowerTriangularInference.h

shogun::SGVector< float64_t >

shogun::CKLLowerTriangularInference::update_init
virtual void update_init()
Definition: KLLowerTriangularInference.cpp:105

float64_t
double float64_t
Definition: common.h:50

shogun::CKLLowerTriangularInference::CKLLowerTriangularInference
CKLLowerTriangularInference()
Definition: KLLowerTriangularInference.cpp:53

shogun::CKLInference::m_mu
SGVector< float64_t > m_mu
Definition: KLInference.h:367

shogun::CInference::m_L
SGMatrix< float64_t > m_L
Definition: Inference.h:487

shogun::CKLLowerTriangularInference::solve_inverse
Eigen::MatrixXd solve_inverse(Eigen::MatrixXd A)
Definition: KLLowerTriangularInference.cpp:125

shogun::CKLLowerTriangularInference::update_approx_cov
virtual void update_approx_cov()
Definition: KLLowerTriangularInference.cpp:166

shogun
All classes and functions are contained in the shogun namespace
Definition: class_list.h:18

shogun::CFeatures
The class Features is the base class of all feature objects.
Definition: Features.h:68

Eigen::LDLT
Definition: KLInference.h:52

Eigen::Matrix
Definition: SGMatrix.h:22

shogun::SGVector::clone
SGVector< T > clone() const
Definition: SGVector.cpp:207

shogun::CKLLowerTriangularInference::update_chol
virtual void update_chol()
Definition: KLLowerTriangularInference.cpp:173

shogun::CKernel
The Kernel base class.
Definition: Kernel.h:159

shogun::CKLLowerTriangularInference::get_diagonal_vector
virtual SGVector< float64_t > get_diagonal_vector()
Definition: KLLowerTriangularInference.cpp:90

shogun::CKLLowerTriangularInference::m_Kernel_P
SGVector< index_t > m_Kernel_P
Definition: KLLowerTriangularInference.h:139

shogun::CKLLowerTriangularInference::m_InvK_Sigma
SGMatrix< float64_t > m_InvK_Sigma
Definition: KLLowerTriangularInference.h:127

SG_ADD
#define SG_ADD(...)
Definition: SGObject.h:84

shogun::CKLLowerTriangularInference::m_log_det_Kernel
float64_t m_log_det_Kernel
Definition: KLLowerTriangularInference.h:133

shogun::CKLLowerTriangularInference::update_Sigma
virtual void update_Sigma()=0

shogun::CLikelihoodModel
The Likelihood model base class.
Definition: LikelihoodModel.h:62

shogun::CInference::m_alpha
SGVector< float64_t > m_alpha
Definition: Inference.h:484