SHOGUN  3.2.1
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Groups Pages
MCLDA.cpp
Go to the documentation of this file.
1 /*
2  * This program is free software; you can redistribute it and/or modify
3  * it under the terms of the GNU General Public License as published by
4  * the Free Software Foundation; either version 3 of the License, or
5  * (at your option) any later version.
6  *
7  * Written (W) 2013 Kevin Hughes
8  * Copyright (C) 2013 Kevin Hughes
9  *
10  * Thanks to Fernando Jose Iglesias Garcia (shogun)
11  * and Matthieu Perrot (scikit-learn)
12  */
13 
14 #include <shogun/lib/common.h>
15 
16 #ifdef HAVE_EIGEN3
17 
21 #include <shogun/labels/Labels.h>
24 
26 
27 using namespace shogun;
28 using namespace Eigen;
29 
/* Default constructor.
 *
 * @param tolerance  singular values at or below this threshold are treated
 *                   as zero when estimating ranks during training
 * @param store_cov  when true, training additionally keeps the pooled
 *                   within-class covariance matrix in m_cov
 *
 * NOTE(review): the base-class initializer list (doc line 31) was stripped
 * from this extracted listing and is not visible here.
 */
30 CMCLDA::CMCLDA(float64_t tolerance, bool store_cov)
32 {
33  init();  // register parameters and set member defaults before overriding below
34  m_tolerance=tolerance;
35  m_store_cov=store_cov;
36 
37 }
38 
/* Convenience constructor that also attaches training data.
 *
 * @param traindat   dense training features (not trained yet; call train())
 * @param trainlab   multiclass labels matching traindat
 * @param tolerance  singular-value cutoff used during training
 * @param store_cov  when true, training also stores the pooled covariance
 *
 * NOTE(review): the base-class initializer list (doc line 40) was stripped
 * from this extracted listing and is not visible here.
 */
39 CMCLDA::CMCLDA(CDenseFeatures<float64_t>* traindat, CLabels* trainlab, float64_t tolerance, bool store_cov)
41 {
42  init();  // register parameters and set member defaults first
43 
44  m_tolerance=tolerance;
45  m_store_cov=store_cov;
46 
47  set_features(traindat);
48  set_labels(trainlab);
49 }
50 
/* Destructor (signature on doc line 51 was stripped from this listing;
 * presumably CMCLDA::~CMCLDA()). Releases the reference held on the
 * feature object and resets trained state.
 */
52 {
53  SG_UNREF(m_features);  // drop the refcount taken by set_features()
54 
55  cleanup();  // mark the model as untrained
56 }
57 
/* Register all model parameters with the parameter framework (for
 * serialization / model selection) and initialize members to safe defaults.
 * Called from every constructor before user-supplied values are assigned.
 */
58 void CMCLDA::init()
59 {
60  SG_ADD(&m_tolerance, "m_tolerance", "Tolerance member.", MS_AVAILABLE);
61  SG_ADD(&m_store_cov, "m_store_cov", "Store covariance member", MS_NOT_AVAILABLE);
62  SG_ADD((CSGObject**) &m_features, "m_features", "Feature object.", MS_NOT_AVAILABLE);
63  SG_ADD(&m_means, "m_means", "Mean vectors list", MS_NOT_AVAILABLE);
64  SG_ADD(&m_cov, "m_cov", "covariance matrix", MS_NOT_AVAILABLE);
65  SG_ADD(&m_xbar, "m_xbar", "total mean", MS_NOT_AVAILABLE);
66  SG_ADD(&m_scalings, "m_scalings", "scalings", MS_NOT_AVAILABLE);
67  SG_ADD(&m_rank, "m_rank", "rank", MS_NOT_AVAILABLE);
68  SG_ADD(&m_coef, "m_coef", "weight vector", MS_NOT_AVAILABLE);
69  SG_ADD(&m_intercept, "m_intercept", "intercept", MS_NOT_AVAILABLE);
70 
    // Defaults: no features attached, nothing trained yet.
71  m_features = NULL;
72  m_num_classes=0;
73  m_dim=0;
74  m_rank=0;
75 }
76 
/* Reset trained state. A zero class count is what train_machine() relies on
 * as "untrained"; the SG* member containers are reference-managed and are
 * simply overwritten on the next training run.
 */
77 void CMCLDA::cleanup()
78 {
79  m_num_classes = 0;
80 }
81 
/* Classify test vectors with the trained LDA model.
 *
 * Signature (doc line 82) was stripped from this listing — presumably
 * CMulticlassLabels* CMCLDA::apply_multiclass(CFeatures* data).
 *
 * Pipeline: center each test vector by m_xbar, project through m_scalings,
 * evaluate the linear decision function d = Xs * coef^T + intercept, and
 * label each vector with the argmax class.
 *
 * @param data optional features to replace the stored ones (must have FP_DOT)
 * @return new CMulticlassLabels with one label per test vector, or NULL if
 *         no features are available
 */
83 {
84  if (data)
85  {
86  if (!data->has_property(FP_DOT))
87  SG_ERROR("Specified features are not of type CDotFeatures\n")
88 
89  set_features((CDotFeatures*) data);
90  }
91 
92  if (!m_features)
93  return NULL;
94 
95  int32_t num_vecs = m_features->get_num_vectors();
96  ASSERT(num_vecs > 0)
97  ASSERT( m_dim == m_features->get_dim_feature_space() );
98 
99  // collect features into a matrix
    // NOTE(review): doc line 100 was stripped here — it presumably declared
    // rf, a CDenseFeatures<float64_t>* view of m_features, which the loop
    // below uses for get_feature_vector()/free_feature_vector(). Verify
    // against the repository source.
101 
102  MatrixXd X(num_vecs, m_dim);
103 
104  int32_t vlen;
105  bool vfree;
106  float64_t* vec;
     // m_xbar converts implicitly to float64_t* for the Eigen Map.
107  Map< VectorXd > Em_xbar(m_xbar, m_dim);
     // Center every test vector by the stored total mean.
108  for (int i = 0; i < num_vecs; i++)
109  {
110  vec = rf->get_feature_vector(i, vlen, vfree);
111  ASSERT(vec)
112 
113  Map< VectorXd > Evec(vec, vlen);
114 
115  X.row(i) = Evec - Em_xbar;
116 
117  rf->free_feature_vector(vec, i, vfree);
118  }
119 
120 #ifdef DEBUG_MCLDA
121  SG_PRINT("\n>>> Displaying X ...\n")
122  SGMatrix< float64_t >::display_matrix(X.data(), num_vecs, m_dim);
123 #endif
124 
125  // center and scale data
    // NOTE(review): m_scalings is mapped here as m_dim x m_rank, while
    // training allocates it as rank x m_rank. This only agrees because
    // training errors out when rank < m_dim ("Variables are collinear"),
    // so rank == m_dim whenever training succeeded — confirm.
126  MatrixXd Xs(num_vecs, m_rank);
127  Map< MatrixXd > Em_scalings(m_scalings.matrix, m_dim, m_rank);
128  Xs = X*Em_scalings;
129 
130 #ifdef DEBUG_MCLDA
131  SG_PRINT("\n>>> Displaying Xs ...\n")
132  SGMatrix< float64_t >::display_matrix(Xs.data(), num_vecs, m_rank);
133 #endif
134 
135  // decision function
    // d(i,c) = <Xs row i, coef row c> + intercept[c]
136  MatrixXd d(num_vecs, m_num_classes);
137  Map< MatrixXd > Em_coef(m_coef.matrix, m_num_classes, m_rank);
138  Map< VectorXd > Em_intercept(m_intercept.vector, m_num_classes);
139  d = (Xs*Em_coef.transpose()).rowwise() + Em_intercept.transpose();
140 
141 #ifdef DEBUG_MCLDA
142  SG_PRINT("\n>>> Displaying d ...\n")
143  SGMatrix< float64_t >::display_matrix(d.data(), num_vecs, m_num_classes);
144 #endif
145 
146  // argmax to apply labels
    // d is column-major, so row i lives at d.data()+i with stride num_vecs;
    // arg_max(ptr, stride, count) scans the m_num_classes class scores.
147  CMulticlassLabels* out = new CMulticlassLabels(num_vecs);
148  for (int i = 0; i < num_vecs; i++)
149  out->set_label(i, CMath::arg_max(d.data()+i, num_vecs, m_num_classes));
150 
151  return out;
152 }
153 
/* Train the multiclass LDA model (following scikit-learn's SVD-based LDA
 * and shogun's QDA).
 *
 * Signature (doc line 154) was stripped from this listing — presumably
 * bool CMCLDA::train_machine(CFeatures* data).
 *
 * Steps: group samples by class and compute class means; (optionally)
 * accumulate per-class covariances; scale the class-centered data by the
 * per-feature spread; SVD to remove collinear directions (within-class
 * whitening); second SVD on the projected, weighted class means (between-
 * class step); compose m_scalings, m_coef and m_intercept for apply().
 *
 * @param data optional features to replace the stored ones (must have FP_DOT)
 * @return true on success, false on bad labels / empty classes
 */
155 {
156  if (!m_labels)
157  SG_ERROR("No labels allocated in MCLDA training\n")
158 
159  if (data)
160  {
161  if (!data->has_property(FP_DOT))
     // NOTE(review): typo "Speficied" in this runtime error message —
     // should read "Specified" (cannot be fixed in a doc-only pass).
162  SG_ERROR("Speficied features are not of type CDotFeatures\n")
163 
164  set_features((CDotFeatures*) data);
165  }
166 
167  if (!m_features)
168  SG_ERROR("No features allocated in MCLDA training\n")
169 
170  SGVector< int32_t > train_labels = ((CMulticlassLabels*) m_labels)->get_int_labels();
171 
172  if (!train_labels.vector)
173  SG_ERROR("No train_labels allocated in MCLDA training\n")
174 
175  cleanup();
176 
177  m_num_classes = ((CMulticlassLabels*) m_labels)->get_num_classes();
178  m_dim = m_features->get_dim_feature_space();
179  int32_t num_vec = m_features->get_num_vectors();
180 
181  if (num_vec != train_labels.vlen)
182  SG_ERROR("Dimension mismatch between features and labels in MCLDA training")
183 
     // class_idxs is laid out as m_num_classes columns of length num_vec:
     // column k holds the sample indices of class k (class_nums[k] valid entries).
184  int32_t* class_idxs = SG_MALLOC(int32_t, num_vec*m_num_classes);
185  int32_t* class_nums = SG_MALLOC(int32_t, m_num_classes); // number of examples of each class
186  memset(class_nums, 0, m_num_classes*sizeof(int32_t));
187 
188  for (int i = 0; i < train_labels.vlen; i++)
189  {
190  int32_t class_idx = train_labels.vector[i];
191 
192  if (class_idx < 0 || class_idx >= m_num_classes)
193  {
     // NOTE(review): SG_ERROR normally aborts/throws, making the
     // following return false unreachable — verify intent.
194  SG_ERROR("found label out of {0, 1, 2, ..., num_classes-1}...")
195  return false;
196  }
197  else
198  {
199  class_idxs[ class_idx*num_vec + class_nums[class_idx]++ ] = i;
200  }
201  }
202 
203  for (int i = 0; i < m_num_classes; i++)
204  {
205  if (class_nums[i] <= 0)
206  {
207  SG_ERROR("What? One class with no elements\n")
208  return false;
209  }
210  }
211 
    // NOTE(review): doc line 212 was stripped here — it presumably declared
    // rf, a CDenseFeatures<float64_t>* view of m_features, used by the
    // get_feature_vector() calls below. Verify against the repository source.
213 
     // NOTE(review): the commented-out guard below suggests covs was meant to
     // be allocated only when m_store_cov is set; as written the m_dim x m_dim
     // x m_num_classes array is always allocated.
214  // if ( m_store_cov )
215  index_t * cov_dims = SG_MALLOC(index_t, 3);
216  cov_dims[0] = m_dim;
217  cov_dims[1] = m_dim;
218  cov_dims[2] = m_num_classes;
219  SGNDArray< float64_t > covs(cov_dims, 3);
220 
221  m_means = SGMatrix< float64_t >(m_dim, m_num_classes, true);
222 
223  // matrix of all samples
224  MatrixXd X = MatrixXd::Zero(num_vec, m_dim);
225  int32_t iX = 0;
226 
227  m_means.zero();
228  m_cov.zero();
229 
230  int32_t vlen;
231  bool vfree;
232  float64_t* vec;
233  for (int k = 0; k < m_num_classes; k++)
234  {
235  // gather all the samples for class k into buffer and calculate the mean of class k
236  MatrixXd buffer(class_nums[k], m_dim);
     // Em_mean aliases column k of m_means, so the class mean is written
     // directly into the model.
237  Map< VectorXd > Em_mean(m_means.get_column_vector(k), m_dim);
238  for (int i = 0; i < class_nums[k]; i++)
239  {
240  vec = rf->get_feature_vector(class_idxs[k*num_vec + i], vlen, vfree);
241  ASSERT(vec)
242 
243  Map< VectorXd > Evec(vec, vlen);
244  Em_mean += Evec;
245  buffer.row(i) = Evec;
246 
247  rf->free_feature_vector(vec, class_idxs[k*num_vec + i], vfree);
248  }
249 
250  Em_mean /= class_nums[k];
251 
252  // subtract the mean of class k from each sample of class k and store the centered data in Xc
253  for (int i = 0; i < class_nums[k]; i++)
254  {
255  buffer.row(i) -= Em_mean;
256  X.row(iX) += buffer.row(i);
257  iX++;
258  }
259 
260  if (m_store_cov)
261  {
262  // calc cov = buffer.T * buffer
263  Map< MatrixXd > Em_cov_k(covs.get_matrix(k), m_dim, m_dim);
264  Em_cov_k = buffer.transpose() * buffer;
265  }
266  }
267 
268 #ifdef DEBUG_MCLDA
269  SG_PRINT("\n>>> Displaying means ...\n")
270  SGMatrix< float64_t >::display_matrix(m_means.matrix, m_dim, m_num_classes);
271 #endif
272 
273  if (m_store_cov)
274  {
     // Pooled covariance: unweighted average of the per-class scatter matrices.
275  m_cov = SGMatrix< float64_t >(m_dim, m_dim, true);
276  m_cov.zero();
277  Map< MatrixXd > Em_cov(m_cov.matrix, m_dim, m_dim);
278 
279  for (int k = 0; k < m_num_classes; k++)
280  {
281  Map< MatrixXd > Em_cov_k(covs.get_matrix(k), m_dim, m_dim);
282  Em_cov += Em_cov_k;
283  }
284 
285  Em_cov /= m_num_classes;
286  }
287 
288 #ifdef DEBUG_MCLDA
289  if (m_store_cov)
290  {
291  SG_PRINT("\n>>> Displaying cov ...\n")
292  SGMatrix< float64_t >::display_matrix(m_cov.matrix, m_dim, m_dim);
293  }
294 #endif
295 
297  // 1) within (univariate) scaling by with classes std-dev
298 
299  // std-dev of X
     // NOTE(review): X here holds CLASS-centered rows, so this column mean is
     // ~zero by construction. scikit-learn's reference sets xbar to the
     // prior-weighted mean of the class means (the overall mean), which is
     // what apply_multiclass() subtracts from raw test vectors — verify
     // whether this should be computed from the raw samples instead.
300  m_xbar = SGVector< float64_t >(m_dim);
301  m_xbar.zero();
302  Map< VectorXd > Em_xbar(m_xbar.vector, m_dim);
303  Em_xbar = X.colwise().sum();
304  Em_xbar /= num_vec;
305 
     // NOTE(review): despite the name, this holds the per-feature VARIANCE
     // (sum of squares / num_vec, no sqrt); scikit-learn divides by the
     // standard deviation here — confirm whether a sqrt is missing.
306  VectorXd std = VectorXd::Zero(m_dim);
307  std = (X.rowwise() - Em_xbar.transpose()).array().pow(2).colwise().sum();
308  std = std.array() / num_vec;
309 
     // Guard against zero spread so the division below is safe.
310  for (int j = 0; j < m_dim; j++)
311  if(std[j] == 0)
312  std[j] = 1;
313 
     // 1/(n - K): the within-class degrees-of-freedom normalizer.
314  float64_t fac = 1.0 / (num_vec - m_num_classes);
315 
316 #ifdef DEBUG_MCLDA
317  SG_PRINT("\n>>> Displaying m_xbar ...\n")
     // (doc line 318, presumably the display_vector call for m_xbar, was
     // stripped from this listing)
319 
320  SG_PRINT("\n>>> Displaying std ...\n")
321  SGVector< float64_t >::display_vector(std.data(), m_dim);
322 #endif
323 
325  // 2) Within variance scaling
326  for (int i = 0; i < num_vec; i++)
327  X.row(i) = sqrt(fac) * X.row(i).array() / std.transpose().array();
328 
329 
330  // SVD of centered (within)scaled data
331  VectorXd S(m_dim);
332  MatrixXd V(m_dim, m_dim);
333 
     // Only the right singular vectors are needed; after transposeInPlace,
     // row j of V is the j-th right singular vector.
334  Eigen::JacobiSVD<MatrixXd> eSvd;
335  eSvd.compute(X,Eigen::ComputeFullV);
336  memcpy(S.data(), eSvd.singularValues().data(), m_dim*sizeof(float64_t));
337  memcpy(V.data(), eSvd.matrixV().data(), m_dim*m_dim*sizeof(float64_t));
338  V.transposeInPlace();
339 
     // Singular values are sorted descending, so this counts those above
     // the tolerance.
340  int rank = 0;
341  while (rank < m_dim && S[rank] > m_tolerance)
342  {
343  rank++;
344  }
345 
     // NOTE(review): the message says "Warning" but SG_ERROR aborts training;
     // SG_WARNING was likely intended (apply_multiclass() relies on
     // rank == m_dim, so demoting this needs care).
346  if (rank < m_dim)
347  SG_ERROR("Warning: Variables are collinear\n")
348 
     // NOTE(review): scikit-learn's reference computes
     // scalings[i][j] = Vt[j][i] / std[i] / S[j] — i.e. the spread index
     // follows the FEATURE i, not the component j. std[j] here looks like an
     // index bug (it only coincides when i == j); verify against sklearn.
349  MatrixXd scalings(m_dim, rank);
350  for (int i = 0; i < m_dim; i++)
351  for (int j = 0; j < rank; j++)
352  scalings(i,j) = V(j,i) / std[j] / S[j];
353 
354 #ifdef DEBUG_MCLDA
355  SG_PRINT("\n>>> Displaying scalings ...\n")
356  SGMatrix< float64_t >::display_matrix(scalings.data(), m_dim, rank);
357 #endif
358 
360  // 3) Between variance scaling
361 
362  // Xc = m_means dot scalings
363  MatrixXd Xc(m_num_classes, rank);
364  Map< MatrixXd > Em_means(m_means.matrix, m_dim, m_num_classes);
365  Xc = (Em_means.transpose()*scalings);
366 
     // Weight each projected class mean by sqrt(n_k / (n - K)).
367  for (int i = 0; i < m_num_classes; i++)
368  Xc.row(i) *= sqrt(class_nums[i] * fac);
369 
370  // Centers are living in a space with n_classes-1 dim (maximum)
371  // Use svd to find projection in the space spanned by the
372  // (n_classes) centers
373  S = VectorXd(rank);
374  V = MatrixXd(rank, rank);
375 
     // Eigen's matrixV has the right singular vectors as COLUMNS (matching
     // numpy's V.T), so no transpose is needed before leftCols() below.
376  eSvd.compute(Xc,Eigen::ComputeFullV);
377  memcpy(S.data(), eSvd.singularValues().data(), rank*sizeof(float64_t));
378  memcpy(V.data(), eSvd.matrixV().data(), rank*rank*sizeof(float64_t));
379 
     // Final rank: components whose singular value exceeds tolerance
     // RELATIVE to the largest one.
380  m_rank = 0;
381  while (m_rank < rank && S[m_rank] > m_tolerance*S[0])
382  {
383  m_rank++;
384  }
385 
386  // compose the scalings
387  m_scalings = SGMatrix< float64_t >(rank, m_rank);
388  Map< MatrixXd > Em_scalings(m_scalings.matrix, rank, m_rank);
389  Em_scalings = scalings * V.leftCols(m_rank);
390 
391 #ifdef DEBUG_MCLDA
392  SG_PRINT("\n>>> Displaying m_scalings ...\n")
393  SGMatrix< float64_t >::display_matrix(m_scalings.matrix, rank, m_rank);
394 #endif
395 
396  // weight vectors / centroids
397  MatrixXd meansc(m_dim, m_num_classes);
398  meansc = Em_means.colwise() - Em_xbar;
399 
400  m_coef = SGMatrix< float64_t >(m_num_classes, m_rank);
401  Map< MatrixXd > Em_coef(m_coef.matrix, m_num_classes, m_rank);
402  Em_coef = meansc.transpose() * Em_scalings;
403 
404 #ifdef DEBUG_MCLDA
405  SG_PRINT("\n>>> Displaying m_coefs ...\n")
406  SGMatrix< float64_t >::display_matrix(m_coef.matrix, m_num_classes, m_rank);
407 #endif
408 
409  // intercept
     // NOTE(review): scikit-learn uses -0.5 * sum(coef[j,:]^2) + log(prior_j).
     // m_coef[j] is a single flat (column-major) element, i.e. only column 0
     // of row j when j < m_num_classes — the row-wise sum of squares appears
     // to be missing; verify.
410  m_intercept = SGVector< float64_t >(m_num_classes);
411  m_intercept.zero();
412  for (int j = 0; j < m_num_classes; j++)
413  m_intercept[j] = -0.5*m_coef[j]*m_coef[j] + log(class_nums[j]/float(num_vec));
414 
415 #ifdef DEBUG_MCLDA
416  SG_PRINT("\n>>> Displaying m_intercept ...\n")
417  SGVector< float64_t >::display_vector(m_intercept.vector, m_num_classes);
418 #endif
419 
420  SG_FREE(class_idxs);
421  SG_FREE(class_nums);
422 
423  return true;
424 }
425 
426 #endif /* HAVE_EIGEN3 */

SHOGUN Machine Learning Toolbox - Documentation