SHOGUN 4.2.0
LMNNImpl.cpp
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 3 of the License, or
 * (at your option) any later version.
 *
 * Written (W) 2013 Fernando J. Iglesias Garcia
 * Copyright (C) 2013 Fernando J. Iglesias Garcia
 */

#include <shogun/metric/LMNNImpl.h>

#include <shogun/multiclass/KNN.h>
#include <shogun/preprocessor/PCA.h>
#include <shogun/preprocessor/PruneVarSubMean.h>
#include <shogun/distance/EuclideanDistance.h>

#include <iterator>

#include <shogun/mathematics/eigen3.h>

// column-wise sum of the squared elements of a matrix
#define SUMSQCOLS(A) ((A).array().square().colwise().sum())
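// e.g. for a 2x2 matrix A = [a b; c d], SUMSQCOLS(A) yields the 1x2 row vector
// [a^2+c^2  b^2+d^2]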

using namespace shogun;
using namespace Eigen;

CImpostorNode::CImpostorNode(index_t ex, index_t tar, index_t imp)
: example(ex), target(tar), impostor(imp)
{
}

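// Note: the lexicographic comparison below gives impostor triplets a strict weak
// ordering, which is what allows them to be kept without duplicates in the ordered
// ImpostorsSetType used throughout this file.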
bool CImpostorNode::operator<(const CImpostorNode& rhs) const
{
    if (example == rhs.example)
    {
        if (target == rhs.target)
            return impostor < rhs.impostor;
        else
            return target < rhs.target;
    }
    else
        return example < rhs.example;
}

void CLMNNImpl::check_training_setup(CFeatures* features, const CLabels* labels,
        SGMatrix<float64_t>& init_transform)
{
    REQUIRE(features->has_property(FP_DOT),
            "LMNN can only be applied to features that support dot products\n")
    REQUIRE(labels->get_label_type()==LT_MULTICLASS,
            "LMNN supports only MulticlassLabels\n")
    REQUIRE(labels->get_num_labels()==features->get_num_vectors(),
            "The number of feature vectors must be equal to the number of labels\n")
    //FIXME this requirement should be dropped in the future
    REQUIRE(features->get_feature_class()==C_DENSE,
            "Currently, LMNN supports only DenseFeatures\n")

    // cast is safe, we ensure above that features are dense
    CDenseFeatures<float64_t>* x = static_cast<CDenseFeatures<float64_t>*>(features);

    // if no initial transform has been provided, initialize it using PCA
    if (init_transform.num_rows==0)
        init_transform = CLMNNImpl::compute_pca_transform(x);

    REQUIRE(init_transform.num_rows==x->get_num_features() &&
            init_transform.num_rows==init_transform.num_cols,
            "The initial transform must be a square matrix of size equal to the "
            "number of features\n")
}

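// Note: in LMNN (Weinberger and Saul), the target neighbors of an example are its k
// nearest neighbors with the same label. They are computed once here, before the
// optimization of the metric starts, and stay fixed afterwards.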
SGMatrix<index_t> CLMNNImpl::find_target_nn(CDenseFeatures<float64_t>* x,
        CMulticlassLabels* y, int32_t k)
{
    SG_SDEBUG("Entering CLMNNImpl::find_target_nn().\n")

    // get the number of features
    int32_t d = x->get_num_features();
    SGMatrix<index_t> target_neighbors(k, x->get_num_vectors());
    SGVector<float64_t> unique_labels = y->get_unique_labels();
    CDenseFeatures<float64_t>* features_slice = new CDenseFeatures<float64_t>();
    CMulticlassLabels* labels_slice = new CMulticlassLabels();
    SGVector<index_t> idxsmap(x->get_num_vectors());

    // increase ref count because a KNN instance will be created for each slice, and it
    // decreases the ref count of its labels and features when destroyed
    SG_REF(features_slice)
    SG_REF(labels_slice)

    for (index_t i = 0; i < unique_labels.vlen; ++i)
    {
        int32_t slice_size = 0;
        for (int32_t j = 0; j < y->get_num_labels(); ++j)
        {
            if (y->get_label(j)==unique_labels[i])
            {
                idxsmap[slice_size] = j;
                ++slice_size;
            }
        }

        MatrixXd slice_mat(d, slice_size);
        for (int32_t j = 0; j < slice_size; ++j)
            slice_mat.col(j) = Map<const VectorXd>(x->get_feature_vector(idxsmap[j]).vector, d);

        features_slice->set_feature_matrix(SGMatrix<float64_t>(slice_mat.data(), d, slice_size, false));

        //FIXME the labels are not actually necessary to get the nearest neighbors, the
        //features suffice. The labels are needed when we want to classify.
        SGVector<float64_t> labels_vec(slice_size);
        labels_vec.set_const(unique_labels[i]);
        labels_slice->set_labels(labels_vec);

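        // k+1 neighbors are requested from KNN because each example within its own
        // class slice is returned as its own nearest neighbor (at distance zero)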
        CKNN* knn = new CKNN(k+1, new CEuclideanDistance(features_slice, features_slice), labels_slice);
        SGMatrix<int32_t> target_slice = knn->nearest_neighbors();
        // sanity check
        ASSERT(target_slice.num_rows==k+1 && target_slice.num_cols==slice_size)

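        // copy the slice results into the output matrix, skipping row 0 (the example
        // itself) and mapping slice-local indices back to global indices via idxsmap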
        for (index_t j = 0; j < target_slice.num_cols; ++j)
        {
            for (index_t l = 1; l < target_slice.num_rows; ++l)
                target_neighbors(l-1, idxsmap[j]) = idxsmap[ target_slice(l,j) ];
        }

        // clean up knn
        SG_UNREF(knn)
    }

    // clean up features and labels
    SG_UNREF(features_slice)
    SG_UNREF(labels_slice)

    SG_SDEBUG("Leaving CLMNNImpl::find_target_nn().\n")

    return target_neighbors;
}

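// Note: this accumulates sum_{i, j~>i} (x_i - x_j)(x_i - x_j)^T over all examples i and
// their target neighbors j. Since the target neighbors are fixed, this matrix does not
// change during training; it gives the "pull" component of the LMNN gradient.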
MatrixXd CLMNNImpl::sum_outer_products(CDenseFeatures<float64_t>* x, const SGMatrix<index_t> target_nn)
{
    // get the number of features
    int32_t d = x->get_num_features();
    // initialize the sum of outer products (sop)
    MatrixXd sop(d,d);
    sop.setZero();
    // map the feature matrix (each column is a feature vector) to an Eigen matrix
    Map<const MatrixXd> X(x->get_feature_matrix().matrix, d, x->get_num_vectors());

    // sum the outer products in sop using the indices specified in target_nn
    for (index_t i = 0; i < target_nn.num_cols; ++i)
    {
        for (index_t j = 0; j < target_nn.num_rows; ++j)
        {
            VectorXd dx = X.col(i) - X.col(target_nn(j,i));
            sop += dx*dx.transpose();
        }
    }

    return sop;
}

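// Note: a triplet (example, target, impostor) is an impostor triplet when the impostor,
// a differently labeled example, lies within a unit margin of the distance from the
// example to its target neighbor, measured under the current transform L. An exact
// search is performed every `correction` iterations; in between, only the triplets
// found by the last exact search are re-checked.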
ImpostorsSetType CLMNNImpl::find_impostors(CDenseFeatures<float64_t>* x,
        CMulticlassLabels* y, const MatrixXd& L, const SGMatrix<index_t> target_nn,
        const uint32_t iter, const uint32_t correction)
{
    SG_SDEBUG("Entering CLMNNImpl::find_impostors().\n")

    // get the number of examples from data
    int32_t n = x->get_num_vectors();
    // get the number of features
    int32_t d = x->get_num_features();
    // get the number of neighbors
    int32_t k = target_nn.num_rows;

    // map the feature matrix (each column is a feature vector) to an Eigen matrix
    Map<const MatrixXd> X(x->get_feature_matrix().matrix, d, n);
    // transform the feature vectors
    MatrixXd LX = L*X;

    // compute square distances plus margin from examples to target neighbors
    MatrixXd sqdists = CLMNNImpl::compute_sqdists(LX,target_nn);

    // initialize impostors set
    ImpostorsSetType N;
    // exact impostors set shared between calls to this method
    static ImpostorsSetType Nexact;

    // impostors search
    REQUIRE(correction>0, "The number of iterations between exact updates of the "
            "impostors set must be greater than 0\n")
    if ((iter % correction)==0)
    {
        Nexact = CLMNNImpl::find_impostors_exact(LX, sqdists, y, target_nn, k);
        N = Nexact;
    }
    else
    {
        N = CLMNNImpl::find_impostors_approx(LX, sqdists, Nexact, target_nn);
    }

    SG_SDEBUG("Leaving CLMNNImpl::find_impostors().\n")

    return N;
}

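// Note: the gradient G is maintained incrementally. Instead of recomputing the "push"
// term from scratch, only the contributions of the triplets that left (Np \ Nc) or
// entered (Nc \ Np) the impostors set since the previous iteration are applied.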
void CLMNNImpl::update_gradient(CDenseFeatures<float64_t>* x, MatrixXd& G,
        const ImpostorsSetType& Nc, const ImpostorsSetType& Np, float64_t regularization)
{
    // compute the difference sets
    ImpostorsSetType Np_Nc, Nc_Np;
    set_difference(Np.begin(), Np.end(), Nc.begin(), Nc.end(), inserter(Np_Nc, Np_Nc.begin()));
    set_difference(Nc.begin(), Nc.end(), Np.begin(), Np.end(), inserter(Nc_Np, Nc_Np.begin()));

    // map the feature matrix (each column is a feature vector) to an Eigen matrix
    Map<const MatrixXd> X(x->get_feature_matrix().matrix, x->get_num_features(), x->get_num_vectors());

    // remove the gradient contributions of the impostors that were in the previous
    // set but disappeared from the current one
    for (ImpostorsSetType::iterator it = Np_Nc.begin(); it != Np_Nc.end(); ++it)
    {
        VectorXd dx1 = X.col(it->example) - X.col(it->target);
        VectorXd dx2 = X.col(it->example) - X.col(it->impostor);
        G -= regularization*(dx1*dx1.transpose() - dx2*dx2.transpose());
    }

    // add the gradient contributions of the new impostors
    for (ImpostorsSetType::iterator it = Nc_Np.begin(); it != Nc_Np.end(); ++it)
    {
        VectorXd dx1 = X.col(it->example) - X.col(it->target);
        VectorXd dx2 = X.col(it->example) - X.col(it->impostor);
        G += regularization*(dx1*dx1.transpose() - dx2*dx2.transpose());
    }
}

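// Note: in the general case the descent step is taken directly on L using the chain
// rule, dF/dL = 2*L*G, where G is the gradient with respect to M = L^T*L. In the
// diagonal case the step is taken on M instead, and M is projected back onto the
// nonnegative diagonal matrices before recovering L as the elementwise square root.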
void CLMNNImpl::gradient_step(MatrixXd& L, const MatrixXd& G, float64_t stepsize, bool diagonal)
{
    if (diagonal)
    {
        // compute M as the square of L
        MatrixXd M = L.transpose()*L;
        // do step in M along the gradient direction
        M -= stepsize*G;
        // keep only the elements in the diagonal of M
        VectorXd m = M.diagonal();

        VectorXd zero;
        zero.resize(m.size());
        zero.setZero();

        // return to representation in L
        VectorXd l = m.array().max(zero.array()).array().sqrt();
        L = l.asDiagonal();
    }
    else
    {
        // do step in L along the gradient direction (no need to project M then)
        L -= stepsize*(2*L*G);
    }
}

void CLMNNImpl::correct_stepsize(float64_t& stepsize, const SGVector<float64_t> obj, const uint32_t iter)
{
    if (iter > 0)
    {
        // difference between the current and the previous objective
        float64_t delta = obj[iter] - obj[iter-1];

        if (delta > 0)
        {
            // the objective has increased: we have probably jumped over the optimum,
            // so decrease the step size
            stepsize *= 0.5;
        }
        else
        {
            // the objective has decreased: we are moving in the right direction,
            // so increase the step size
            stepsize *= 1.01;
        }
    }
}

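// Note: training stops when the maximum number of iterations is reached, when the step
// size falls below its threshold, or when the objective has changed by less than the
// objective threshold in each of the last three iterations; the objective check is
// only applied after the first ten iterations.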
bool CLMNNImpl::check_termination(float64_t stepsize, const SGVector<float64_t> obj, uint32_t iter, uint32_t maxiter, float64_t stepsize_threshold, float64_t obj_threshold)
{
    if (iter >= maxiter-1)
    {
        SG_SWARNING("Maximum number of iterations reached before convergence.");
        return true;
    }

    if (stepsize < stepsize_threshold)
    {
        SG_SDEBUG("Step size too small to make more progress. Convergence reached.\n");
        return true;
    }

    if (iter >= 10)
    {
        for (int32_t i = 0; i < 3; ++i)
        {
            if (CMath::abs(obj[iter-i]-obj[iter-i-1]) >= obj_threshold)
                return false;
        }

        SG_SDEBUG("No more progress in the objective. Convergence reached.\n");
        return true;
    }

    // for the rest of the cases, do not stop LMNN
    return false;
}

SGMatrix<float64_t> CLMNNImpl::compute_pca_transform(CDenseFeatures<float64_t>* features)
{
    SG_SDEBUG("Initializing LMNN transform using PCA.\n");

    // Subtract the mean of the features
    // Create a clone of the features to keep the input features unmodified
    CDenseFeatures<float64_t>* cloned_features =
            new CDenseFeatures<float64_t>(features->get_feature_matrix().clone());
    CPruneVarSubMean* mean_substractor =
            new CPruneVarSubMean(false); // false to avoid variance normalization
    mean_substractor->init(cloned_features);
    mean_substractor->apply_to_feature_matrix(cloned_features);

    // Obtain the linear transform applying PCA
    CPCA* pca = new CPCA();
    pca->set_target_dim(cloned_features->get_num_features());
    pca->init(cloned_features);
    SGMatrix<float64_t> pca_transform = pca->get_transformation_matrix();

    SG_UNREF(pca);
    SG_UNREF(mean_substractor);
    SG_UNREF(cloned_features);

    return pca_transform;
}

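// Note: the "+ 1" below adds the unit margin used by LMNN, so entry (j,i) of the
// returned k x n matrix equals ||L*(x_i - x_{target_nn(j,i)})||^2 + 1.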
MatrixXd CLMNNImpl::compute_sqdists(MatrixXd& LX, const SGMatrix<index_t> target_nn)
{
    // get the number of examples
    ASSERT(LX.cols()==target_nn.num_cols)
    int32_t n = LX.cols();
    // get the number of features
    int32_t d = LX.rows();
    // get the number of neighbors
    int32_t k = target_nn.num_rows;

    // create Shogun features from LX to later apply subset
    SGMatrix<float64_t> lx_mat(LX.data(), d, n, false);
    CDenseFeatures<float64_t>* lx = new CDenseFeatures<float64_t>(lx_mat);

    // initialize distances
    MatrixXd sqdists(k,n);
    sqdists.setZero();
    for (int32_t i = 0; i < k; ++i)
    {
        //FIXME avoid copying the rows of target_nn and access them directly. Maybe
        //find_target_nn should be changed to return the output transposed wrt how it is
        //done at the moment.
        SGVector<index_t> subset_vec = target_nn.get_row_vector(i);
        lx->add_subset(subset_vec);
        // after the subset, there are still n columns, i.e. the subset is used to
        // modify the order of the columns in x according to the target neighbors
        sqdists.row(i) = SUMSQCOLS(LX - Map<const MatrixXd>(lx->get_feature_matrix().matrix, d, n)) + 1;
        lx->remove_subset();
    }

    // clean up features used to apply subset
    SG_UNREF(lx);

    return sqdists;
}

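// Note: set_disable_sqrt(true) below makes euclidean->distance() return squared
// distances, so the values are directly comparable with the entries of sqdists, which
// hold the squared target-neighbor distances plus the margin.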
ImpostorsSetType CLMNNImpl::find_impostors_exact(MatrixXd& LX, const MatrixXd& sqdists,
        CMulticlassLabels* y, const SGMatrix<index_t> target_nn, int32_t k)
{
    SG_SDEBUG("Entering CLMNNImpl::find_impostors_exact().\n")

    // initialize empty impostors set
    ImpostorsSetType N = ImpostorsSetType();

    // get the number of examples from data
    int32_t n = LX.cols();
    // get the number of features
    int32_t d = LX.rows();
    // create Shogun features from LX to later apply subset
    SGMatrix<float64_t> lx_mat(LX.data(), d, n, false);
    CDenseFeatures<float64_t>* lx = new CDenseFeatures<float64_t>(lx_mat);

    // get a vector with unique label values
    SGVector<float64_t> unique = y->get_unique_labels();

    // for each label except the largest one
    for (index_t i = 0; i < unique.vlen-1; ++i)
    {
        // get the indices of the examples labelled as unique[i]
        std::vector<index_t> iidxs = CLMNNImpl::get_examples_label(y,unique[i]);
        // get the indices of the examples that have a larger label value, so that
        // pairwise distances are computed only once
        std::vector<index_t> gtidxs = CLMNNImpl::get_examples_gtlabel(y,unique[i]);

        // get distance with features indexed by iidxs and gtidxs separated
        CEuclideanDistance* euclidean = CLMNNImpl::setup_distance(lx,iidxs,gtidxs);
        euclidean->set_disable_sqrt(true);

        for (int32_t j = 0; j < k; ++j)
        {
            for (std::size_t ii = 0; ii < iidxs.size(); ++ii)
            {
                for (std::size_t jj = 0; jj < gtidxs.size(); ++jj)
                {
                    // FIXME study if using upper bounded distances can be an improvement
                    float64_t distance = euclidean->distance(ii,jj);

                    // check whether each example is an impostor for the other one
                    if (distance <= sqdists(j,iidxs[ii]))
                        N.insert( CImpostorNode(iidxs[ii], target_nn(j,iidxs[ii]), gtidxs[jj]) );

                    if (distance <= sqdists(j,gtidxs[jj]))
                        N.insert( CImpostorNode(gtidxs[jj], target_nn(j,gtidxs[jj]), iidxs[ii]) );
                }
            }
        }

        SG_UNREF(euclidean);
    }

    SG_UNREF(lx);

    SG_SDEBUG("Leaving CLMNNImpl::find_impostors_exact().\n")

    return N;
}

ImpostorsSetType CLMNNImpl::find_impostors_approx(MatrixXd& LX, const MatrixXd& sqdists,
        const ImpostorsSetType& Nexact, const SGMatrix<index_t> target_nn)
{
    SG_SDEBUG("Entering CLMNNImpl::find_impostors_approx().\n")

    // initialize empty impostors set
    ImpostorsSetType N = ImpostorsSetType();

    // compute square distances from examples to impostors
    SGVector<float64_t> impostors_sqdists = CLMNNImpl::compute_impostors_sqdists(LX,Nexact);

    // find in the exact set of impostors computed last, the triplets that remain impostors
    index_t i = 0;
    for (ImpostorsSetType::iterator it = Nexact.begin(); it != Nexact.end(); ++it)
    {
        // find in target_nn(:,it->example) the position of the target neighbor it->target;
        // the bounds check must come first to avoid reading past the end of the column
        index_t target_idx = 0;
        while (target_idx<target_nn.num_rows && target_nn(target_idx, it->example)!=it->target)
            ++target_idx;

        REQUIRE(target_idx<target_nn.num_rows, "The index of the target neighbour in the "
                "impostors set was not found in the target neighbours matrix. "
                "There must be a bug in find_impostors_exact.\n")

        if ( impostors_sqdists[i++] <= sqdists(target_idx, it->example) )
            N.insert(*it);
    }

    SG_SDEBUG("Leaving CLMNNImpl::find_impostors_approx().\n")

    return N;
}

SGVector<float64_t> CLMNNImpl::compute_impostors_sqdists(MatrixXd& LX, const ImpostorsSetType& Nexact)
{
    // get the number of examples
    int32_t n = LX.cols();
    // get the number of features
    int32_t d = LX.rows();
    // get the number of impostors
    size_t num_impostors = Nexact.size();

    // create Shogun features from LX and distance
    SGMatrix<float64_t> lx_mat(LX.data(), d, n, false);
    CDenseFeatures<float64_t>* lx = new CDenseFeatures<float64_t>(lx_mat);
    CEuclideanDistance* euclidean = new CEuclideanDistance(lx,lx);
    euclidean->set_disable_sqrt(true);

    // initialize vector of square distances
    SGVector<float64_t> sqdists(num_impostors);
    // compute square distances
    index_t i = 0;
    for (ImpostorsSetType::iterator it = Nexact.begin(); it != Nexact.end(); ++it)
        sqdists[i++] = euclidean->distance(it->example,it->impostor);

    // clean up distance
    SG_UNREF(euclidean);

    return sqdists;
}

std::vector<index_t> CLMNNImpl::get_examples_label(CMulticlassLabels* y,
        float64_t yi)
{
    // indices of the examples with label equal to yi
    std::vector<index_t> idxs;

    for (index_t i = 0; i < index_t(y->get_num_labels()); ++i)
    {
        if (y->get_label(i) == yi)
            idxs.push_back(i);
    }

    return idxs;
}

std::vector<index_t> CLMNNImpl::get_examples_gtlabel(CMulticlassLabels* y,
        float64_t yi)
{
    // indices of the examples with label greater than yi
    std::vector<index_t> idxs;

    for (index_t i = 0; i < index_t(y->get_num_labels()); ++i)
    {
        if (y->get_label(i) > yi)
            idxs.push_back(i);
    }

    return idxs;
}

CEuclideanDistance* CLMNNImpl::setup_distance(CDenseFeatures<float64_t>* x,
        std::vector<index_t>& a, std::vector<index_t>& b)
{
    // create new features only containing examples whose indices are in a
    x->add_subset(SGVector<index_t>(a.data(), a.size(), false));
    CDenseFeatures<float64_t>* afeats = new CDenseFeatures<float64_t>(x->get_feature_matrix());
    x->remove_subset();

    // create new features only containing examples whose indices are in b
    x->add_subset(SGVector<index_t>(b.data(), b.size(), false));
    CDenseFeatures<float64_t>* bfeats = new CDenseFeatures<float64_t>(x->get_feature_matrix());
    x->remove_subset();

    // create and return distance
    CEuclideanDistance* euclidean = new CEuclideanDistance(afeats,bfeats);
    return euclidean;
}