FisherLDA.cpp
/*
 * Copyright (c) 2014, Shogun Toolbox Foundation
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice,
 * this list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * 3. Neither the name of the copyright holder nor the names of its
 * contributors may be used to endorse or promote products derived from this
 * software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 *
 * Written (W) 2014 Abhijeet Kislay
 */
#include <shogun/lib/config.h>

#include <shogun/lib/common.h>
#include <shogun/io/SGIO.h>
#include <shogun/mathematics/eigen3.h>
#include <shogun/features/DenseFeatures.h>
#include <shogun/labels/MulticlassLabels.h>
#include <shogun/preprocessor/DimensionReductionPreprocessor.h>
#include <shogun/preprocessor/FisherLDA.h>
#include <vector>

using namespace std;
using namespace Eigen;
using namespace shogun;

CFisherLDA::CFisherLDA(EFLDAMethod method, float64_t thresh):
    CDimensionReductionPreprocessor()
{
    initialize_parameters();
    m_method=method;
    m_threshold=thresh;
}

void CFisherLDA::initialize_parameters()
{
    m_method=AUTO_FLDA;
    m_threshold=0.01;
    m_num_dim=0;
    SG_ADD(&m_method, "FLDA_method", "method for performing FLDA",
        MS_NOT_AVAILABLE);
    SG_ADD(&m_num_dim, "final_dimensions", "dimensions to be retained",
        MS_NOT_AVAILABLE);
    SG_ADD(&m_transformation_matrix, "transformation_matrix", "Transformation"
        " matrix (Eigenvectors of covariance matrix).", MS_NOT_AVAILABLE);
    SG_ADD(&m_mean_vector, "mean_vector", "Mean Vector.", MS_NOT_AVAILABLE);
    SG_ADD(&m_eigenvalues_vector, "eigenvalues_vector",
        "Vector with Eigenvalues.", MS_NOT_AVAILABLE);
}

CFisherLDA::~CFisherLDA()
{
}

bool CFisherLDA::fit(CFeatures *features, CLabels *labels, int32_t num_dimensions)
{
    REQUIRE(features, "Features are not provided!\n")

    REQUIRE(features->get_feature_class()==C_DENSE,
        "LDA only works with dense features. You provided %s\n",
        features->get_name());

    REQUIRE(features->get_feature_type()==F_DREAL,
        "LDA only works with real features.\n");

    REQUIRE(labels, "Labels for the given features are not specified!\n")

    REQUIRE(labels->get_label_type()==LT_MULTICLASS, "The labels should be of "
        "the type MulticlassLabels! You provided %s\n", labels->get_name());

    SGMatrix<float64_t> feature_matrix=((CDenseFeatures<float64_t>*)features)
        ->get_feature_matrix();

    SGVector<float64_t> labels_vector=((CMulticlassLabels*)labels)->get_labels();

    int32_t num_vectors=feature_matrix.num_cols;
    int32_t num_features=feature_matrix.num_rows;

    REQUIRE(labels_vector.vlen==num_vectors, "The number of samples provided (%d)"
        " must be equal to the number of labels provided (%d)\n", num_vectors,
        labels_vector.vlen);

    // C holds the number of unique classes.
    int32_t C=((CMulticlassLabels*)labels)->get_num_classes();

    REQUIRE(C>1, "At least two classes are needed to perform LDA.\n")

    int32_t i=0;
    int32_t j=0;

    m_num_dim=num_dimensions;

    // Clip the number of target dimensions to a valid range:
    // at most C-1 dimensions can be retained.
    if ((m_num_dim<=0) || (m_num_dim>(C-1)))
        m_num_dim=(C-1);

    MatrixXd fmatrix=Map<MatrixXd>(feature_matrix.matrix, num_features,
        num_vectors);
    Map<VectorXd> lvector(labels_vector.vector, num_vectors);

    // holds the total mean
    m_mean_vector=SGVector<float64_t>(num_features);
    Map<VectorXd> mean_total(m_mean_vector.vector, num_features);
    mean_total=VectorXd::Zero(num_features);
    // holds the mean for each class
    vector<VectorXd> mean_class(C);

    // holds the frequency of each class, i.e. the i'th element holds
    // the number of samples observed for class i.
    VectorXd num_class=VectorXd::Zero(C);

    // calculate the class means and the total mean.
    for (i=0; i<C; i++)
    {
        mean_class[i]=VectorXd::Zero(num_features);
        for (j=0; j<num_vectors; j++)
        {
            if (i==lvector[j])
            {
                num_class[i]++;
                mean_class[i]+=fmatrix.col(j);
            }
        }
        mean_class[i]/=(float64_t)num_class[i];
        mean_total+=mean_class[i];
    }
    mean_total/=(float64_t)C;
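    // NOTE: mean_total is the unweighted average of the class means, which
    // equals the global sample mean only when all classes contain the same
    // number of samples.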

    // Subtract the class means from the respective data, e.g. all data
    // belonging to class 0 has the mean of class 0 subtracted from it.
    for (i=0; i<C; i++)
        for (j=0; j<num_vectors; j++)
            if (i==lvector[j])
                fmatrix.col(j)-=mean_class[i];

    if ((m_method==CANVAR_FLDA) ||
        (m_method==AUTO_FLDA && num_vectors<num_features))
    {
        // holds the centered data for each class
        vector<MatrixXd> centered_class_i(C);
        VectorXd temp=num_class;
        MatrixXd Sw=MatrixXd::Zero(num_features, num_features);
        for (i=0; i<C; i++)
        {
            centered_class_i[i]=MatrixXd::Zero(num_features, num_class[i]);
            for (j=0; j<num_vectors; j++)
                if (i==lvector[j])
                    centered_class_i[i].col(num_class[i]-(temp[i]--))
                        =fmatrix.col(j);
            Sw+=(centered_class_i[i]*centered_class_i[i].transpose())
                *num_class[i]/(float64_t)(num_class[i]-1);
        }

        // between-class matrix for the canonical variates implementation
        MatrixXd Sb(num_features, C);
        for (i=0; i<C; i++)
            Sb.col(i)=sqrt(num_class[i])*(mean_class[i]-mean_total);

        MatrixXd fmatrix1=Map<MatrixXd>(feature_matrix.matrix, num_features,
            num_vectors);

        JacobiSVD<MatrixXd> svd(fmatrix1, ComputeThinU | ComputeThinV);
        // basis to represent the solution
        MatrixXd Q;

        if (num_features>num_vectors)
        {
            // keep only the leading singular vectors above the threshold
            j=0;
            for (i=0; i<num_vectors; i++)
                if (svd.singularValues()(i)>m_threshold)
                    j++;
                else
                    break;
            Q=svd.matrixU().leftCols(j);
        }
        else
            Q=svd.matrixU();

        // Sb is the modified between-class scatter
        Sb=(Q.transpose())*Sb*(Sb.transpose())*Q;
        // Sw is the modified within-class scatter
        Sw=Q.transpose()*Sw*Q;

        // to find SVD((inverse(Chol(Sw)))' * Sb * (inverse(Chol(Sw)))):
        // 1. get Cw=Chol(Sw) and take the QR decomposition of Cw'
        HouseholderQR<MatrixXd> decomposition(Sw.llt().matrixU().transpose());
        // 2. get P=inv(Cw')*Sb
        //    MatrixXd P=decomposition.solve(Sb);
        // 3. the final matrix handed to the SVD is therefore:
        //    final_output=(inv(Cw')*(P'))';
        //    MatrixXd X_final_chol=(decomposition.solve(P.transpose())).transpose();
        JacobiSVD<MatrixXd> svd2(decomposition.solve
            (decomposition.solve(Sb).transpose()).transpose(), ComputeThinU);
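        // With Sw=Cw'*Cw, svd2 decomposes the symmetric matrix
        // inv(Cw')*Sb*inv(Cw); its singular values equal the eigenvalues of
        // inv(Sw)*Sb in the reduced basis Q, i.e. the same quantity the
        // classic branch below obtains from EigenSolver directly.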

        m_transformation_matrix=SGMatrix<float64_t>(num_features, m_num_dim);
        Map<MatrixXd> eigenVectors(m_transformation_matrix.matrix, num_features,
            m_num_dim);

        eigenVectors=Q*(svd2.matrixU()).leftCols(m_num_dim);

        m_eigenvalues_vector=SGVector<float64_t>(m_num_dim);
        Map<VectorXd> eigenValues(m_eigenvalues_vector.vector, m_num_dim);
        eigenValues=svd2.singularValues().topRows(m_num_dim);
    }
    else
    {
        // For holding the within-class scatter.
        MatrixXd Sw=fmatrix*fmatrix.transpose();

        // For holding the between-class scatter.
        MatrixXd Sb(num_features, C);

        for (i=0; i<C; i++)
            Sb.col(i)=mean_class[i];

        Sb=Sb-mean_total.rowwise().replicate(C);
        Sb=Sb*Sb.transpose();

        // Solve the linear system A*x=b with A=Sw, b=Sb and x=M,
        // i.e. M=inv(Sw)*Sb, then compute the eigenvalues and
        // eigenvectors of M.
        EigenSolver<MatrixXd> es(Sw.householderQr().solve(Sb));
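        // The eigenvectors of inv(Sw)*Sb are the directions that maximize
        // the Fisher criterion (w'*Sb*w)/(w'*Sw*w); the largest eigenvalues
        // correspond to the most discriminative directions.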

        MatrixXd all_eigenvectors=es.eigenvectors().real();
        VectorXd all_eigenvalues=es.eigenvalues().real();

        std::vector<pair<float64_t, int32_t> > data(num_features);
        for (i=0; i<num_features; i++)
        {
            data[i].first=all_eigenvalues[i];
            data[i].second=i;
        }
        // sort the eigenvalues in ascending order.
        std::sort(data.begin(), data.end());

        // keep the top 'm_num_dim' eigenvalues
        m_eigenvalues_vector=SGVector<float64_t>(m_num_dim);
        Map<VectorXd> eigenValues(m_eigenvalues_vector.vector, m_num_dim);

        // keep the 'm_num_dim' eigenvectors corresponding to those eigenvalues
        m_transformation_matrix=SGMatrix<float64_t>(num_features, m_num_dim);
        Map<MatrixXd> eigenVectors(m_transformation_matrix.matrix, num_features,
            m_num_dim);

        for (i=0; i<m_num_dim; i++)
        {
            eigenValues[i]=data[num_features-i-1].first;
            eigenVectors.col(i)=all_eigenvectors.col(data[num_features-i-1].second);
        }
    }
    return true;
}

void CFisherLDA::cleanup()
{
    // reset the state learned by fit()
    m_transformation_matrix=SGMatrix<float64_t>();
    m_mean_vector=SGVector<float64_t>();
    m_eigenvalues_vector=SGVector<float64_t>();
}

SGMatrix<float64_t> CFisherLDA::apply_to_feature_matrix(CFeatures *features)
{
    REQUIRE(features->get_feature_class()==C_DENSE,
        "LDA only works with dense features\n");

    REQUIRE(features->get_feature_type()==F_DREAL,
        "LDA only works with real features\n");

    SGMatrix<float64_t> m=((CDenseFeatures<float64_t>*)
        features)->get_feature_matrix();

    int32_t num_vectors=m.num_cols;
    int32_t num_features=m.num_rows;

    SG_INFO("Transforming feature matrix\n")
    Map<MatrixXd> transform_matrix(m_transformation_matrix.matrix,
        m_transformation_matrix.num_rows, m_transformation_matrix.num_cols);

    SG_INFO("get Feature matrix: %ix%i\n", num_vectors, num_features)

    Map<MatrixXd> feature_matrix(m.matrix, num_features, num_vectors);

    feature_matrix.block(0, 0, m_num_dim, num_vectors)=
        transform_matrix.transpose()*feature_matrix;
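    // The projected data now occupies the top m_num_dim rows of the same
    // buffer; below it is compacted column by column and the matrix header
    // is shrunk to m_num_dim x num_vectors.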

    SG_INFO("Form matrix of target dimension\n")
    for (int32_t col=0; col<num_vectors; col++)
    {
        for (int32_t row=0; row<m_num_dim; row++)
            m[col*m_num_dim+row]=feature_matrix(row, col);
    }
    m.num_rows=m_num_dim;
    m.num_cols=num_vectors;
    ((CDenseFeatures<float64_t>*)features)->set_feature_matrix(m);
    return m;
}

SGVector<float64_t> CFisherLDA::apply_to_feature_vector(SGVector<float64_t> vector)
{
    SGVector<float64_t> result=SGVector<float64_t>(m_num_dim);
    Map<VectorXd> resultVec(result.vector, m_num_dim);
    Map<VectorXd> inputVec(vector.vector, vector.vlen);

    Map<MatrixXd> transformMat(m_transformation_matrix.matrix,
        m_transformation_matrix.num_rows, m_transformation_matrix.num_cols);

    resultVec=transformMat.transpose()*inputVec;
    return result;
}

SGMatrix<float64_t> CFisherLDA::get_transformation_matrix()
{
    return m_transformation_matrix;
}

SGVector<float64_t> CFisherLDA::get_eigenvalues()
{
    return m_eigenvalues_vector;
}

SGVector<float64_t> CFisherLDA::get_mean()
{
    return m_mean_vector;
}
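
Example usage. The following is a minimal sketch, not part of the generated listing, showing how this preprocessor is typically driven from C++. It assumes the standard Shogun 4.x entry points init_shogun_with_defaults()/exit_shogun() from shogun/base/init.h, CDenseFeatures, CMulticlassLabels, and SG_UNREF, together with hand-made toy data.

#include <shogun/base/init.h>
#include <shogun/features/DenseFeatures.h>
#include <shogun/labels/MulticlassLabels.h>
#include <shogun/preprocessor/FisherLDA.h>

using namespace shogun;

int main()
{
    init_shogun_with_defaults();

    // toy data: 2-dimensional samples, 6 vectors, 2 classes (column-major)
    SGMatrix<float64_t> data(2, 6);
    float64_t values[]={1.0, 2.0,  2.0, 1.0,  1.5, 2.5,
                        5.0, 6.0,  6.0, 5.0,  5.5, 6.5};
    for (int32_t i=0; i<12; i++)
        data.matrix[i]=values[i];

    SGVector<float64_t> lab(6);
    for (int32_t i=0; i<6; i++)
        lab[i]=(i<3) ? 0 : 1;

    CDenseFeatures<float64_t>* features=new CDenseFeatures<float64_t>(data);
    CMulticlassLabels* labels=new CMulticlassLabels(lab);

    // let the preprocessor pick the solver; keep at most C-1=1 dimension
    CFisherLDA* lda=new CFisherLDA(AUTO_FLDA, 0.01);
    lda->fit(features, labels, 1);

    // features are projected in place; 'projected' is 1 x 6 afterwards
    SGMatrix<float64_t> projected=lda->apply_to_feature_matrix(features);

    SG_UNREF(lda);
    SG_UNREF(features);
    SG_UNREF(labels);
    exit_shogun();
    return 0;
}

After fit(), the learned projection and its eigenvalues can also be queried with get_transformation_matrix() and get_eigenvalues().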