cn/current/KLInferenceMethod_8h_source.html

 /*

  * Copyright (c) The Shogun Machine Learning Toolbox

  * Written (w) 2014 Wu Lin

  * All rights reserved.

  *

  * Redistribution and use in source and binary forms, with or without

  * modification, are permitted provided that the following conditions are met:

  *

  * 1. Redistributions of source code must retain the above copyright notice, this

  *    list of conditions and the following disclaimer.

  * 2. Redistributions in binary form must reproduce the above copyright notice,

  *    this list of conditions and the following disclaimer in the documentation

  *    and/or other materials provided with the distribution.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR

  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  *

  * The views and conclusions contained in the software and documentation are those

  * of the authors and should not be interpreted as representing official policies,

  * either expressed or implied, of the Shogun Development Team.

  *

  * Code adapted from

  * http://hannes.nickisch.org/code/approxXX.tar.gz

  * and Gaussian Process Machine Learning Toolbox

  * http://www.gaussianprocess.org/gpml/code/matlab/doc/

  * and the reference paper is

  * Nickisch, Hannes, and Carl Edward Rasmussen.

  * "Approximations for Binary Gaussian Process Classification."

  * Journal of Machine Learning Research 9.10 (2008).

  *

  */


 #ifndef _KLINFERENCEMETHOD_H_

 #define _KLINFERENCEMETHOD_H_


 #include <shogun/lib/config.h>


 #ifdef HAVE_EIGEN3

 #include <shogun/machine/gp/InferenceMethod.h>

 #include <shogun/optimization/lbfgs/lbfgs.h>

 #include <shogun/machine/gp/VariationalGaussianLikelihood.h>


 namespace Eigen

 {

     template <class, int, int, int, int, int> class Matrix;

     template <class, int> class LDLT;


     typedef Matrix<float64_t,-1,-1,0,-1,-1> MatrixXd;

 }


 namespace shogun

 {


 class CKLInferenceMethod: public CInferenceMethod

 {

 public:

     CKLInferenceMethod();


     CKLInferenceMethod(CKernel* kernel, CFeatures* features,

             CMeanFunction* mean, CLabels* labels, CLikelihoodModel* model);


     virtual ~CKLInferenceMethod();


     virtual EInferenceType get_inference_type() const { return INF_KL; }


     virtual const char* get_name() const { return "KLInferenceMethod"; }


     virtual float64_t get_negative_log_marginal_likelihood();


     virtual SGVector<float64_t> get_posterior_mean();


     virtual SGMatrix<float64_t> get_posterior_covariance();


     virtual bool supports_regression() const

     {

         check_members();

         return m_model->supports_regression();

     }


     virtual bool supports_binary() const

     {

         check_members();

         return m_model->supports_binary();

     }


     virtual void set_model(CLikelihoodModel* mod);


     virtual void update();


     /* set L-BFGS parameters

      * For details please see shogun/optimization/lbfgs/lbfgs.h

      * @param m The number of corrections to approximate the inverse hessian matrix.

      * Default value is 100.

      * @param max_linesearch The maximum number of trials to do line search for each L-BFGS update.

      * Default value is 1000.

      * @param linesearch The line search algorithm.

      * Default value is using the backtracking with the strong Wolfe condition line search

      * @param max_iterations The maximum number of iterations for L-BFGS update.

      * Default value is 1000.

      * @param delta Delta for convergence test based on the change of function value.

      * Default value is 0.

      * @param past Distance for delta-based convergence test.

      * Default value is 0.

      * @param epsilon Epsilon for convergence test based on the change of gradient.

      * Default value is 1e-5

      * @param min_step The minimum step of the line search.

      * The default value is 1e-20

      * @param max_step The maximum step of the line search.

      * The default value is 1e+20

      * @param ftol A parameter used in Armijo condition.

      * Default value is 1e-4

      * @param wolfe A parameter used in curvature condition.

      * Default value is 0.9

      * @param gtol A parameter used in Morethuente linesearch to control the accuracy.

      * Default value is 0.9

      * @param xtol The machine precision for floating-point values.

      * Default value is 1e-16.

      * @param orthantwise_c Coeefficient for the L1 norm of variables.

      * This parameter should be set to zero for standard minimization problems.

      * Setting this parameter to a positive value activates

      * Orthant-Wise Limited-memory Quasi-Newton (OWL-QN) method. Default value is 0.

      * @param orthantwise_start Start index for computing L1 norm of the variables.

      * This parameter is valid only for OWL-QN method. Default value is 0.

      * @param orthantwise_end End index for computing L1 norm of the variables.

      * Default value is 1.

      */

     virtual void set_lbfgs_parameters(int m = 100,

             int max_linesearch = 1000,

             int linesearch = LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE,

             int max_iterations = 1000,

             float64_t delta = 0.0,

             int past = 0,

             float64_t epsilon = 1e-5,

             float64_t min_step = 1e-20,

             float64_t max_step = 1e+20,

             float64_t ftol = 1e-4,

             float64_t wolfe = 0.9,

             float64_t gtol = 0.9,

             float64_t xtol = 1e-16,

             float64_t orthantwise_c = 0.0,

             int orthantwise_start = 0,

             int orthantwise_end = 1);


     virtual SGMatrix<float64_t> get_cholesky();


     virtual void set_noise_factor(float64_t noise_factor);


     virtual void set_max_attempt(index_t max_attempt);


     virtual void set_exp_factor(float64_t exp_factor);


     virtual void set_min_coeff_kernel(float64_t min_coeff_kernel);

 protected:


     virtual void compute_gradient();


     float64_t m_min_coeff_kernel;


     float64_t m_noise_factor;


     float64_t m_exp_factor;


     index_t m_max_attempt;


     virtual void update_init();


     virtual Eigen::LDLT<Eigen::MatrixXd,0x1> update_init_helper();


     virtual CVariationalGaussianLikelihood* get_variational_likelihood() const;


     virtual void check_variational_likelihood(CLikelihoodModel* mod) const;


     virtual void update_approx_cov()=0;


     virtual float64_t get_derivative_related_cov(SGMatrix<float64_t> dK)=0;


     virtual float64_t lbfgs_optimization();


     virtual SGVector<float64_t> get_derivative_wrt_inference_method(

             const TParameter* param);


     virtual SGVector<float64_t> get_derivative_wrt_likelihood_model(

             const TParameter* param);


     virtual SGVector<float64_t> get_derivative_wrt_kernel(

             const TParameter* param);


     virtual SGVector<float64_t> get_derivative_wrt_mean(

             const TParameter* param);


     virtual float64_t get_negative_log_marginal_likelihood_helper()=0;


     virtual float64_t get_nlml_wrt_parameters();


     virtual void get_gradient_of_nlml_wrt_parameters(SGVector<float64_t> gradient)=0;


     virtual bool lbfgs_precompute()=0;


     SGVector<float64_t> m_mu;


     SGMatrix<float64_t> m_Sigma;


     SGVector<float64_t> m_s2;


     /* The number of corrections to approximate the inverse hessian matrix.*/

     int m_m;


     /* The maximum number of trials to do line search for each L-BFGS update.*/

     int m_max_linesearch;


     /* The line search algorithm.*/

     int m_linesearch;


     /* The maximum number of iterations for L-BFGS update.*/

     int m_max_iterations;


     /* Delta for convergence test based on the change of function value.*/

     float64_t m_delta;


     /* Distance for delta-based convergence test.*/

     int m_past;


     /* Epsilon for convergence test based on the change of gradient.*/

     float64_t m_epsilon;


     /* The minimum step of the line search.*/

     float64_t m_min_step;


     /* The maximum step of the line search.*/

     float64_t m_max_step;


     /* A parameter used in Armijo condition.*/

     float64_t m_ftol;


     /* A parameter used in curvature condition.*/

     float64_t m_wolfe;


     /* A parameter used in Morethuente linesearch to control the accuracy.*/

     float64_t m_gtol;


     /* The machine precision for floating-point values.*/

     float64_t m_xtol;


     /* Coeefficient for the L1 norm of variables.*/

     float64_t m_orthantwise_c;


     /* Start index for computing L1 norm of the variables.*/

     int m_orthantwise_start;


     /* End index for computing L1 norm of the variables.*/

     int m_orthantwise_end;


 private:

     void init();


     static float64_t evaluate(void *obj,

             const float64_t *parameters,

             float64_t *gradient,

             const int dim,

             const float64_t step);


 };

 }

 #endif /* HAVE_EIGEN3 */

 #endif /* _KLINFERENCEMETHOD_H_ */

shogun::CKLInferenceMethod::set_lbfgs_parameters
virtual void set_lbfgs_parameters(int m=100, int max_linesearch=1000, int linesearch=LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE, int max_iterations=1000, float64_t delta=0.0, int past=0, float64_t epsilon=1e-5, float64_t min_step=1e-20, float64_t max_step=1e+20, float64_t ftol=1e-4, float64_t wolfe=0.9, float64_t gtol=0.9, float64_t xtol=1e-16, float64_t orthantwise_c=0.0, int orthantwise_start=0, int orthantwise_end=1)
Definition: KLInferenceMethod.cpp:293

shogun::CKLInferenceMethod::m_min_step
float64_t m_min_step
Definition: KLInferenceMethod.h:449

shogun::CKLInferenceMethod::m_orthantwise_c
float64_t m_orthantwise_c
Definition: KLInferenceMethod.h:467

shogun::CKLInferenceMethod::supports_regression
virtual bool supports_regression() const
Definition: KLInferenceMethod.h:157

shogun::CKLInferenceMethod::m_xtol
float64_t m_xtol
Definition: KLInferenceMethod.h:464

shogun::CKLInferenceMethod::get_derivative_wrt_likelihood_model
virtual SGVector< float64_t > get_derivative_wrt_likelihood_model(const TParameter *param)
Definition: KLInferenceMethod.cpp:337

shogun::CKLInferenceMethod::get_cholesky
virtual SGMatrix< float64_t > get_cholesky()
Definition: KLInferenceMethod.cpp:451

shogun::CInferenceMethod
The Inference Method base class.
Definition: InferenceMethod.h:81

shogun::CKLInferenceMethod::m_epsilon
float64_t m_epsilon
Definition: KLInferenceMethod.h:446

shogun::CKLInferenceMethod::m_ftol
float64_t m_ftol
Definition: KLInferenceMethod.h:455

shogun::CKLInferenceMethod::set_exp_factor
virtual void set_exp_factor(float64_t exp_factor)
Definition: KLInferenceMethod.cpp:201

index_t
int32_t index_t
Definition: common.h:62

shogun::CLabels
The class Labels models labels, i.e. class assignments of objects.
Definition: Labels.h:43

shogun::LBFGS_LINESEARCH_BACKTRACKING_STRONG_WOLFE
Definition: lbfgs.h:167

shogun::CVariationalGaussianLikelihood
The variational Gaussian Likelihood base class. The variational distribution is Gaussian.
Definition: VariationalGaussianLikelihood.h:49

shogun::CKLInferenceMethod::m_m
int m_m
Definition: KLInferenceMethod.h:428

Eigen
Definition: SGMatrix.h:20

shogun::TParameter
parameter struct
Definition: base/Parameter.h:32

config.h

shogun::CKLInferenceMethod::update_init
virtual void update_init()
Definition: KLInferenceMethod.cpp:207

shogun::CKLInferenceMethod::update_approx_cov
virtual void update_approx_cov()=0

shogun::CKLInferenceMethod::m_past
int m_past
Definition: KLInferenceMethod.h:443

shogun::CKLInferenceMethod::get_derivative_wrt_mean
virtual SGVector< float64_t > get_derivative_wrt_mean(const TParameter *param)
Definition: KLInferenceMethod.cpp:353

shogun::CKLInferenceMethod::lbfgs_precompute
virtual bool lbfgs_precompute()=0

shogun::CMeanFunction
An abstract class of the mean function.
Definition: MeanFunction.h:49

shogun::CKLInferenceMethod::get_name
virtual const char * get_name() const
Definition: KLInferenceMethod.h:105

shogun::SGMatrix< float64_t >

shogun::CKLInferenceMethod::m_max_iterations
int m_max_iterations
Definition: KLInferenceMethod.h:437

shogun::epsilon
static const float64_t epsilon
Definition: libbmrm.cpp:25

shogun::CKLInferenceMethod::m_Sigma
SGMatrix< float64_t > m_Sigma
Definition: KLInferenceMethod.h:420

shogun::CKLInferenceMethod::m_min_coeff_kernel
float64_t m_min_coeff_kernel
Definition: KLInferenceMethod.h:291

shogun::SGVector< float64_t >

shogun::CKLInferenceMethod::get_negative_log_marginal_likelihood
virtual float64_t get_negative_log_marginal_likelihood()
Definition: KLInferenceMethod.cpp:329

shogun::CKLInferenceMethod::set_min_coeff_kernel
virtual void set_min_coeff_kernel(float64_t min_coeff_kernel)
Definition: KLInferenceMethod.cpp:189

shogun::CKLInferenceMethod::check_variational_likelihood
virtual void check_variational_likelihood(CLikelihoodModel *mod) const
Definition: KLInferenceMethod.cpp:57

shogun::INF_KL
Definition: InferenceMethod.h:64

shogun::CKLInferenceMethod::lbfgs_optimization
virtual float64_t lbfgs_optimization()
Definition: KLInferenceMethod.cpp:382

float64_t
double float64_t
Definition: common.h:50

shogun::CKLInferenceMethod::m_linesearch
int m_linesearch
Definition: KLInferenceMethod.h:434

shogun::CKLInferenceMethod::get_derivative_wrt_inference_method
virtual SGVector< float64_t > get_derivative_wrt_inference_method(const TParameter *param)
Definition: KLInferenceMethod.cpp:411

shogun::CLikelihoodModel::supports_regression
virtual bool supports_regression() const
Definition: LikelihoodModel.h:323

shogun::EInferenceType
EInferenceType
Definition: InferenceMethod.h:53

shogun::CKLInferenceMethod::set_max_attempt
virtual void set_max_attempt(index_t max_attempt)
Definition: KLInferenceMethod.cpp:195

shogun::CKLInferenceMethod::get_posterior_mean
virtual SGVector< float64_t > get_posterior_mean()
Definition: KLInferenceMethod.cpp:244

shogun::CLikelihoodModel::supports_binary
virtual bool supports_binary() const
Definition: LikelihoodModel.h:329

shogun::CKLInferenceMethod::get_derivative_related_cov
virtual float64_t get_derivative_related_cov(SGMatrix< float64_t > dK)=0

shogun::CKLInferenceMethod::get_posterior_covariance
virtual SGMatrix< float64_t > get_posterior_covariance()
Definition: KLInferenceMethod.cpp:251

shogun::CKLInferenceMethod::m_orthantwise_end
int m_orthantwise_end
Definition: KLInferenceMethod.h:473

Eigen::MatrixXd
Matrix< float64_t,-1,-1, 0,-1,-1 > MatrixXd
Definition: KLInferenceMethod.h:54

shogun::CKLInferenceMethod::update_init_helper
virtual Eigen::LDLT< Eigen::MatrixXd, 0x1 > update_init_helper()
Definition: KLInferenceMethod.cpp:212

shogun::CKLInferenceMethod
The KL approximation inference method class.
Definition: KLInferenceMethod.h:78

shogun::CKLInferenceMethod::CKLInferenceMethod
CKLInferenceMethod()
Definition: KLInferenceMethod.cpp:44

shogun::CKLInferenceMethod::get_nlml_wrt_parameters
virtual float64_t get_nlml_wrt_parameters()
Definition: KLInferenceMethod.cpp:286

shogun::CKLInferenceMethod::m_wolfe
float64_t m_wolfe
Definition: KLInferenceMethod.h:458

shogun
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18

shogun::CKLInferenceMethod::set_noise_factor
virtual void set_noise_factor(float64_t noise_factor)
Definition: KLInferenceMethod.cpp:183

shogun::CKLInferenceMethod::m_exp_factor
float64_t m_exp_factor
Definition: KLInferenceMethod.h:297

lbfgs.h

shogun::CKLInferenceMethod::get_derivative_wrt_kernel
virtual SGVector< float64_t > get_derivative_wrt_kernel(const TParameter *param)
Definition: KLInferenceMethod.cpp:427

shogun::CKLInferenceMethod::supports_binary
virtual bool supports_binary() const
Definition: KLInferenceMethod.h:167

shogun::CKLInferenceMethod::m_orthantwise_start
int m_orthantwise_start
Definition: KLInferenceMethod.h:470

shogun::CFeatures
The class Features is the base class of all feature objects.
Definition: Features.h:68

Eigen::LDLT
Definition: KLInferenceMethod.h:54

Eigen::Matrix
Definition: SGMatrix.h:22

shogun::CKLInferenceMethod::m_mu
SGVector< float64_t > m_mu
Definition: KLInferenceMethod.h:417

shogun::CKLInferenceMethod::m_s2
SGVector< float64_t > m_s2
Definition: KLInferenceMethod.h:425

shogun::CInferenceMethod::check_members
virtual void check_members() const
Definition: InferenceMethod.cpp:309

shogun::CKernel
The Kernel base class.
Definition: Kernel.h:158

shogun::CKLInferenceMethod::get_gradient_of_nlml_wrt_parameters
virtual void get_gradient_of_nlml_wrt_parameters(SGVector< float64_t > gradient)=0

shogun::CKLInferenceMethod::get_variational_likelihood
virtual CVariationalGaussianLikelihood * get_variational_likelihood() const
Definition: KLInferenceMethod.cpp:279

VariationalGaussianLikelihood.h

shogun::CKLInferenceMethod::m_delta
float64_t m_delta
Definition: KLInferenceMethod.h:440

shogun::CKLInferenceMethod::m_max_attempt
index_t m_max_attempt
Definition: KLInferenceMethod.h:300

shogun::CKLInferenceMethod::m_max_linesearch
int m_max_linesearch
Definition: KLInferenceMethod.h:431

shogun::CKLInferenceMethod::m_gtol
float64_t m_gtol
Definition: KLInferenceMethod.h:461

shogun::CKLInferenceMethod::~CKLInferenceMethod
virtual ~CKLInferenceMethod()
Definition: KLInferenceMethod.cpp:152

shogun::CKLInferenceMethod::set_model
virtual void set_model(CLikelihoodModel *mod)
Definition: KLInferenceMethod.cpp:67

delta
#define delta
Definition: sfa.cpp:23

shogun::CLikelihoodModel
The Likelihood model base class.
Definition: LikelihoodModel.h:62

shogun::CKLInferenceMethod::get_negative_log_marginal_likelihood_helper
virtual float64_t get_negative_log_marginal_likelihood_helper()=0

shogun::CKLInferenceMethod::m_max_step
float64_t m_max_step
Definition: KLInferenceMethod.h:452

shogun::CKLInferenceMethod::compute_gradient
virtual void compute_gradient()
Definition: KLInferenceMethod.cpp:156

shogun::CInferenceMethod::m_model
CLikelihoodModel * m_model
Definition: InferenceMethod.h:466

shogun::CKLInferenceMethod::get_inference_type
virtual EInferenceType get_inference_type() const
Definition: KLInferenceMethod.h:99

shogun::CKLInferenceMethod::update
virtual void update()
Definition: KLInferenceMethod.cpp:169

InferenceMethod.h

shogun::CKLInferenceMethod::m_noise_factor
float64_t m_noise_factor
Definition: KLInferenceMethod.h:294