en/latest/ProbitLikelihood_8cpp_source.html

 /*

  * Copyright (c) The Shogun Machine Learning Toolbox

  * Written (W) 2013 Roman Votyakov

  * All rights reserved.

  *

  * Redistribution and use in source and binary forms, with or without

  * modification, are permitted provided that the following conditions are met:

  *

  * 1. Redistributions of source code must retain the above copyright notice, this

  *    list of conditions and the following disclaimer.

  * 2. Redistributions in binary form must reproduce the above copyright notice,

  *    this list of conditions and the following disclaimer in the documentation

  *    and/or other materials provided with the distribution.

  *

  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR

  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND

  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

  *

  * The views and conclusions contained in the software and documentation are those

  * of the authors and should not be interpreted as representing official policies,

  * either expressed or implied, of the Shogun Development Team.

  *

  */

 #include <shogun/machine/gp/ProbitLikelihood.h>


 #include <shogun/labels/BinaryLabels.h>

 #include <shogun/mathematics/eigen3.h>

 #include <shogun/mathematics/Statistics.h>


 using namespace shogun;

 using namespace Eigen;


 /** Default constructor; performs no initialization of its own. */
 CProbitLikelihood::CProbitLikelihood()
 {
     // intentionally empty
 }


 /** Destructor; there is nothing to release in this class. */
 CProbitLikelihood::~CProbitLikelihood()
 {
     // intentionally empty
 }


 /** Evaluates the predictive means ymu=2*p-1, where log(p) is the value
  * returned by get_log_zeroth_moments() for the same arguments.
  *
  * @param mu vector of means, forwarded to get_log_zeroth_moments()
  * @param s2 vector of variances, forwarded to get_log_zeroth_moments()
  * @param lab labels, forwarded to get_log_zeroth_moments()
  *
  * @return vector with one predictive mean per entry of the log zeroth
  * moments
  */
 SGVector<float64_t> CProbitLikelihood::get_predictive_means(
         SGVector<float64_t> mu, SGVector<float64_t> s2, const CLabels* lab) const
 {
     // log(p) for every point
     SGVector<float64_t> log_p=get_log_zeroth_moments(mu, s2, lab);
     SGVector<float64_t> means(log_p.vlen);

     // Eigen views over the SGVector buffers (no copies are made)
     Map<VectorXd> eigen_log_p(log_p.vector, log_p.vlen);
     Map<VectorXd> eigen_means(means.vector, means.vlen);

     // ymu=2*exp(log(p))-1
     eigen_means=2.0*eigen_log_p.array().exp()-1.0;

     return means;
 }


 /** Evaluates the predictive variances ys2=1-(2*p-1).^2, where log(p) is the
  * value returned by get_log_zeroth_moments() for the same arguments.
  *
  * @param mu vector of means, forwarded to get_log_zeroth_moments()
  * @param s2 vector of variances, forwarded to get_log_zeroth_moments()
  * @param lab labels, forwarded to get_log_zeroth_moments()
  *
  * @return vector with one predictive variance per entry of the log zeroth
  * moments
  */
 SGVector<float64_t> CProbitLikelihood::get_predictive_variances(
         SGVector<float64_t> mu, SGVector<float64_t> s2, const CLabels* lab) const
 {
     // log(p) for every point
     SGVector<float64_t> log_p=get_log_zeroth_moments(mu, s2, lab);
     SGVector<float64_t> variances(log_p.vlen);

     // Eigen views over the SGVector buffers (no copies are made)
     Map<VectorXd> eigen_log_p(log_p.vector, log_p.vlen);
     Map<VectorXd> eigen_variances(variances.vector, variances.vlen);

     // ys2=1-(2*exp(log(p))-1)^2, element-wise
     eigen_variances=1-(2.0*eigen_log_p.array().exp()-1.0).square();

     return variances;
 }


 /** Computes the log probability log(normal_cdf(f.*y)) for every element of
  * the function vector.
  *
  * @param lab binary labels (must not be NULL, must be of type LT_BINARY and
  * must have as many labels as func has elements)
  * @param func vector of function values f
  *
  * @return vector of the same length as func holding
  * CStatistics::lnormal_cdf(y[k]*f[k]) at position k
  */
 SGVector<float64_t> CProbitLikelihood::get_log_probability_f(const CLabels* lab,
         SGVector<float64_t> func) const
 {
     // validate the arguments
     REQUIRE(lab, "Labels are required (lab should not be NULL)\n")
     REQUIRE(lab->get_label_type()==LT_BINARY,
             "Labels must be type of CBinaryLabels\n")
     REQUIRE(lab->get_num_labels()==func.vlen, "Number of labels must match "
             "length of the function vector\n")

     SGVector<float64_t> y=((CBinaryLabels*)lab)->get_labels();
     SGVector<float64_t> log_prob(func.vlen);

     // compute log probability: log(normal_cdf(f.*y)), one element at a time
     for (index_t k=0; k<func.vlen; k++)
     {
         const float64_t yf=y.vector[k]*func.vector[k];
         log_prob.vector[k]=CStatistics::lnormal_cdf(yf);
     }

     return log_prob;
 }


 /** Computes the first, second or third derivative of the log probability
  * log(normal_cdf(f.*y)) with respect to f.
  *
  * With z=y.*f and dlp the element-wise first derivative factor, the result is
  *  - i==1: y.*dlp
  *  - i==2: -dlp.*abs(z+dlp)
  *  - i==3: y.*(-d2lp.*abs(z+2*dlp)-dlp), where d2lp is the i==2 result
  *
  * @param lab binary labels (must not be NULL, must be of type LT_BINARY and
  * must have as many labels as func has elements)
  * @param func vector of function values f
  * @param i order of the derivative, must be 1, 2 or 3
  *
  * @return vector of the same length as func holding the requested derivative
  */
 SGVector<float64_t> CProbitLikelihood::get_log_probability_derivative_f(
         const CLabels* lab, SGVector<float64_t> func, index_t i) const
 {
     // validate the arguments
     REQUIRE(lab, "Labels are required (lab should not be NULL)\n")
     REQUIRE(lab->get_label_type()==LT_BINARY,
             "Labels must be type of CBinaryLabels\n")
     REQUIRE(lab->get_num_labels()==func.vlen, "Number of labels must match "
             "length of the function vector\n")
     REQUIRE(i>=1 && i<=3, "Index for derivative should be 1, 2 or 3\n")

     SGVector<float64_t> y=((CBinaryLabels*)lab)->get_labels();
     SGVector<float64_t> dlp(func.vlen);
     SGVector<float64_t> result(func.vlen);

     // Eigen views over the SGVector buffers (no copies are made)
     Map<VectorXd> eigen_y(y.vector, y.vlen);
     Map<VectorXd> eigen_f(func.vector, func.vlen);
     Map<VectorXd> eigen_dlp(dlp.vector, dlp.vlen);
     Map<VectorXd> eigen_result(result.vector, result.vlen);

     // z=y.*f
     VectorXd eigen_z=eigen_y.cwiseProduct(eigen_f);

     // element-wise first derivative factor dlp; two formulas are used
     // depending on which side of CStatistics::ERFC_CASE2 the argument lies
     for (index_t k=0; k<eigen_z.size(); k++)
     {
         const float64_t z_k=eigen_z[k];

         if (z_k<CStatistics::ERFC_CASE2)
         {
             // dlp(id2) = abs(den./num) * sqrt(2/pi);
             // strictly positive first derivative
             eigen_dlp[k]=CMath::sqrt(2.0/CMath::PI)
                 /CMath::abs(CStatistics::erfc8_weighted_sum(z_k));
         }
         else
         {
             // dlp(~id2) = exp(-z.*z/2-lp)/sqrt(2*pi); safe computation
             eigen_dlp[k]=CMath::exp(-z_k*z_k/2.0-CStatistics::lnormal_cdf(z_k))
                 /CMath::sqrt(2.0*CMath::PI);
         }
     }

     // select the requested derivative of the log probability wrt f
     if (i==1)
     {
         eigen_result=eigen_dlp;
     }
     else
     {
         // d2lp = -dlp.*abs(z+dlp); strictly negative second derivative
         eigen_result=(-eigen_dlp.array()*((eigen_z.array()+eigen_dlp.array()).abs().array())).matrix();

         if (i==3)
         {
             // d3lp = -d2lp.*abs(z+2*dlp)-dlp; strictly positive third
             // derivative (eigen_result holds d2lp on the right-hand side)
             eigen_result=(-eigen_result.array()*((eigen_z.array()+2.0*eigen_dlp.array()).abs().array())
                 -eigen_dlp.array()).matrix();
         }
     }

     // odd-order derivatives are additionally multiplied by the labels y
     if (i==1 || i==3)
         eigen_result=(eigen_result.array()*eigen_y.array()).matrix();

     return result;
 }


 /** Computes lp=log(normal_cdf((mu.*y)./sqrt(1+s2))) element-wise.
  *
  * @param mu vector of means
  * @param s2 vector of variances (must have the same length as mu)
  * @param lab binary labels providing y; if NULL, y is taken to be 1.0 for
  * every element. When given, the labels must be of type LT_BINARY and their
  * number must match the length of mu
  *
  * @return vector of log zeroth moments, one per element of mu
  */
 SGVector<float64_t> CProbitLikelihood::get_log_zeroth_moments(
         SGVector<float64_t> mu, SGVector<float64_t> s2, const CLabels* lab) const
 {
     SGVector<float64_t> y;

     if (!lab)
     {
         REQUIRE(mu.vlen==s2.vlen, "Length of the vector of means (%d) and "
                 "length of the vector of variances (%d) should be the same\n",
                 mu.vlen, s2.vlen)

         // no labels supplied: use y=1 for every point
         y=SGVector<float64_t>(mu.vlen);
         y.set_const(1.0);
     }
     else
     {
         REQUIRE((mu.vlen==s2.vlen) && (mu.vlen==lab->get_num_labels()),
                 "Length of the vector of means (%d), length of the vector of "
                 "variances (%d) and number of labels (%d) should be the same\n",
                 mu.vlen, s2.vlen, lab->get_num_labels())
         REQUIRE(lab->get_label_type()==LT_BINARY,
                 "Labels must be type of CBinaryLabels\n")

         y=((CBinaryLabels*)lab)->get_labels();
     }

     SGVector<float64_t> log_moments(y.vlen);

     // Eigen views over the SGVector buffers (no copies are made)
     Map<VectorXd> eigen_y(y.vector, y.vlen);
     Map<VectorXd> eigen_mu(mu.vector, mu.vlen);
     Map<VectorXd> eigen_s2(s2.vector, s2.vlen);
     Map<VectorXd> eigen_log_moments(log_moments.vector, log_moments.vlen);

     // argument of the cdf: (mu.*y)./sqrt(1+s2)
     eigen_log_moments=eigen_mu.array()*eigen_y.array()/((1.0+eigen_s2.array()).sqrt());

     // lp=log(normal_cdf(argument))
     for (index_t k=0; k<eigen_log_moments.size(); k++)
         eigen_log_moments[k]=CStatistics::lnormal_cdf(eigen_log_moments[k]);

     return log_moments;
 }


 /** Computes the first moment for the point with index i:
  *
  * E[x] = mu + (y*s2*N(z))/(Phi(z)*sqrt(1+s2)), with z=y*mu/sqrt(1+s2),
  *
  * where N is the standard normal pdf and Phi the standard normal cdf.
  *
  * @param mu vector of means
  * @param s2 vector of variances (must have the same length as mu)
  * @param lab binary labels (must not be NULL, must be of type LT_BINARY and
  * must have as many labels as mu has elements)
  * @param i index of the point, must satisfy 0 <= i < mu.vlen
  *
  * @return the first moment for element i
  */
 float64_t CProbitLikelihood::get_first_moment(SGVector<float64_t> mu,
         SGVector<float64_t> s2, const CLabels *lab, index_t i) const
 {
     // check the parameters
     REQUIRE(lab, "Labels are required (lab should not be NULL)\n")
     REQUIRE((mu.vlen==s2.vlen) && (mu.vlen==lab->get_num_labels()),
             "Length of the vector of means (%d), length of the vector of "
             "variances (%d) and number of labels (%d) should be the same\n",
             mu.vlen, s2.vlen, lab->get_num_labels())
     // valid indices are 0..vlen-1; i==vlen would read past the end of
     // y, mu and s2 below
     REQUIRE(i>=0 && i<mu.vlen, "Index (%d) out of bounds!\n", i)
     REQUIRE(lab->get_label_type()==LT_BINARY,
             "Labels must be type of CBinaryLabels\n")

     SGVector<float64_t> y=((CBinaryLabels*)lab)->get_labels();

     // sqrt(1+s2) appears both in z and in the moment itself
     const float64_t scale=CMath::sqrt(1.0+s2[i]);

     float64_t z=y[i]*mu[i]/scale;

     // compute ncdf=normal_cdf(z)
     float64_t ncdf=CStatistics::normal_cdf(z);

     // compute npdf=normal_pdf(z)=(1/sqrt(2*pi))*exp(-z.^2/2)
     float64_t npdf=(1.0/CMath::sqrt(2.0*CMath::PI))*CMath::exp(-0.5*CMath::sq(z));

     // compute the 1st moment: E[x] = mu + (y*s2*N(z))/(Phi(z)*sqrt(1+s2))
     // NOTE(review): npdf/ncdf is not guarded against ncdf==0 - confirm
     // whether very negative z can occur here
     float64_t Ex=mu[i]+(npdf/ncdf)*(y[i]*s2[i])/scale;

     return Ex;
 }


 /** Computes, for the point with index i, the quantity
  *
  * Var[x] = s2 - (s2^2*N(z))/((1+s2)*Phi(z))*(z+N(z)/Phi(z)),
  * with z=y*mu/sqrt(1+s2),
  *
  * where N is the standard normal pdf and Phi the standard normal cdf.
  *
  * @param mu vector of means
  * @param s2 vector of variances (must have the same length as mu)
  * @param lab binary labels (must not be NULL, must be of type LT_BINARY and
  * must have as many labels as mu has elements)
  * @param i index of the point, must satisfy 0 <= i < mu.vlen
  *
  * @return the value Var[x] defined above for element i
  */
 float64_t CProbitLikelihood::get_second_moment(SGVector<float64_t> mu,
         SGVector<float64_t> s2, const CLabels *lab, index_t i) const
 {
     // check the parameters
     REQUIRE(lab, "Labels are required (lab should not be NULL)\n")
     REQUIRE((mu.vlen==s2.vlen) && (mu.vlen==lab->get_num_labels()),
             "Length of the vector of means (%d), length of the vector of "
             "variances (%d) and number of labels (%d) should be the same\n",
             mu.vlen, s2.vlen, lab->get_num_labels())
     // valid indices are 0..vlen-1; i==vlen would read past the end of
     // y, mu and s2 below
     REQUIRE(i>=0 && i<mu.vlen, "Index (%d) out of bounds!\n", i)
     REQUIRE(lab->get_label_type()==LT_BINARY,
             "Labels must be type of CBinaryLabels\n")

     SGVector<float64_t> y=((CBinaryLabels*)lab)->get_labels();

     float64_t z=y[i]*mu[i]/CMath::sqrt(1.0+s2[i]);

     // compute ncdf=normal_cdf(z)
     float64_t ncdf=CStatistics::normal_cdf(z);

     // compute npdf=normal_pdf(z)=(1/sqrt(2*pi))*exp(-z.^2/2)
     float64_t npdf=(1.0/CMath::sqrt(2.0*CMath::PI))*CMath::exp(-0.5*CMath::sq(z));

     // N(z)/Phi(z) is used twice in the formula below
     // NOTE(review): not guarded against ncdf==0 - confirm whether very
     // negative z can occur here
     const float64_t ratio=npdf/ncdf;

     // compute the 2nd moment:
     // Var[x] = s2 - (s2^2*N(z))/((1+s2)*Phi(z))*(z+N(z)/Phi(z))
     float64_t Var=s2[i]-(CMath::sq(s2[i])/(1.0+s2[i]))*ratio*(z+ratio);

     return Var;
 }


shogun::CLabels::get_label_type
virtual ELabelType get_label_type() const =0

LT_BINARY
binary labels +1/-1
Definition: LabelTypes.h:18

index_t
int32_t index_t
Definition: common.h:62

shogun::CLabels
The class Labels models labels, i.e. class assignments of objects.
Definition: Labels.h:43

shogun::CLabels::get_num_labels
virtual int32_t get_num_labels() const =0

eigen3.h

Eigen::Map
Definition: SGMatrix.h:24

shogun::CMath::sq
static T sq(T x)
Definition: Math.h:450

Eigen
Definition: SGMatrix.h:20

Statistics.h

REQUIRE
#define REQUIRE(x,...)
Definition: SGIO.h:206

shogun::CStatistics::ERFC_CASE2
static const float64_t ERFC_CASE2
Definition: Statistics.h:407

shogun::CProbitLikelihood::get_predictive_variances
virtual SGVector< float64_t > get_predictive_variances(SGVector< float64_t > mu, SGVector< float64_t > s2, const CLabels *lab=NULL) const
Definition: ProbitLikelihood.cpp:64

BinaryLabels.h

shogun::CStatistics::lnormal_cdf
static float64_t lnormal_cdf(float64_t x)
Definition: Statistics.cpp:418

shogun::SGVector::vlen
index_t vlen
Definition: SGVector.h:494

shogun::SGVector::vector
T * vector
Definition: SGVector.h:492

shogun::CProbitLikelihood::get_log_probability_f
virtual SGVector< float64_t > get_log_probability_f(const CLabels *lab, SGVector< float64_t > func) const
Definition: ProbitLikelihood.cpp:79

shogun::SGVector< float64_t >

shogun::CProbitLikelihood::CProbitLikelihood
CProbitLikelihood()
Definition: ProbitLikelihood.cpp:41

float64_t
double float64_t
Definition: common.h:50

shogun::CProbitLikelihood::get_log_zeroth_moments
virtual SGVector< float64_t > get_log_zeroth_moments(SGVector< float64_t > mu, SGVector< float64_t > s2, const CLabels *lab) const
Definition: ProbitLikelihood.cpp:170

shogun::CProbitLikelihood::get_predictive_means
virtual SGVector< float64_t > get_predictive_means(SGVector< float64_t > mu, SGVector< float64_t > s2, const CLabels *lab=NULL) const
Definition: ProbitLikelihood.cpp:49

shogun::CProbitLikelihood::~CProbitLikelihood
virtual ~CProbitLikelihood()
Definition: ProbitLikelihood.cpp:45

shogun
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18

shogun::CStatistics::erfc8_weighted_sum
static float64_t erfc8_weighted_sum(float64_t x)
Definition: Statistics.cpp:464

shogun::CMath::exp
static float64_t exp(float64_t x)
Definition: Math.h:621

shogun::CProbitLikelihood::get_first_moment
virtual float64_t get_first_moment(SGVector< float64_t > mu, SGVector< float64_t > s2, const CLabels *lab, index_t i) const
Definition: ProbitLikelihood.cpp:212

shogun::CStatistics::normal_cdf
static float64_t normal_cdf(float64_t x, float64_t std_dev=1)
Definition: Statistics.cpp:508

shogun::CBinaryLabels
Binary Labels for binary classification.
Definition: BinaryLabels.h:37

ProbitLikelihood.h

shogun::CMath::sqrt
static float32_t sqrt(float32_t x)
Definition: Math.h:459

shogun::CProbitLikelihood::get_log_probability_derivative_f
virtual SGVector< float64_t > get_log_probability_derivative_f(const CLabels *lab, SGVector< float64_t > func, index_t i) const
Definition: ProbitLikelihood.cpp:106

shogun::CProbitLikelihood::get_second_moment
virtual float64_t get_second_moment(SGVector< float64_t > mu, SGVector< float64_t > s2, const CLabels *lab, index_t i) const
Definition: ProbitLikelihood.cpp:241

shogun::SGVector::set_const
void set_const(T const_elem)
Definition: SGVector.cpp:150

shogun::CMath::abs
static T abs(T a)
Definition: Math.h:179

shogun::CMath::PI
static const float64_t PI
Definition: Math.h:2055