en/current/RescaleFeatures_8cpp_source.html

 /*

  * This program is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 3 of the License, or

  * (at your option) any later version.

  *

  * Written (W) 2013 Viktor Gal

  * Copyright (C) 2013 Viktor Gal

  */


 #include <shogun/preprocessor/RescaleFeatures.h>


 using namespace shogun;


 /** Default constructor.
  *
  *  Constructs the CDensePreprocessor<float64_t> base, starts in the
  *  un-initialized state (m_initialized == false) and then calls
  *  register_parameters().
  */
 CRescaleFeatures::CRescaleFeatures()
     : CDensePreprocessor<float64_t>(), m_initialized(false)
 {
     register_parameters();
 }


 /** Destructor: resets the preprocessor state through cleanup(). */
 CRescaleFeatures::~CRescaleFeatures()
 {
     /* cleanup() is virtual; inside a destructor the call always resolves to
      * this class's own version, which the qualified call spells out. */
     CRescaleFeatures::cleanup();
 }


 /** Learns the per-feature minimum and reciprocal range from a dense
  *  float64 feature matrix.
  *
  *  Row i of the feature matrix is scanned for its minimum and maximum.
  *  If (max - min) > 0, m_min[i] is set to the minimum and m_range[i] to
  *  1/(max - min). Otherwise m_min[i] = 0 and m_range[i] = 1, so that
  *  subtracting m_min and multiplying by m_range leaves the feature as is.
  *
  *  @param features features to learn from; must be non-NULL, report
  *         feature class C_DENSE and feature type F_DREAL, and contain at
  *         least two vectors
  *  @return true if the statistics were computed by this call; false if
  *          the preprocessor was already initialized (nothing is recomputed
  *          and features is not inspected)
  */
 bool CRescaleFeatures::init(CFeatures* features)
 {
     /* already initialized: keep the existing statistics */
     if (m_initialized)
         return false;

     /* fail with a message instead of dereferencing a NULL pointer below */
     REQUIRE(features, "features must not be NULL!\n");
     ASSERT(features->get_feature_class()==C_DENSE);
     ASSERT(features->get_feature_type()==F_DREAL);

     CDenseFeatures<float64_t>* simple_features=
         static_cast<CDenseFeatures<float64_t>*>(features);
     int32_t num_examples = simple_features->get_num_vectors();
     int32_t num_features = simple_features->get_num_features();
     REQUIRE(num_examples > 1,
                     "number of feature vectors should be at least 2!\n");

     SG_INFO("Extracting min and range values for each feature\n")

     m_min = SGVector<float64_t>(num_features);
     m_range = SGVector<float64_t>(num_features);

     /* reuse the pointer cast above rather than casting a second time */
     SGMatrix<float64_t> feature_matrix=simple_features->get_feature_matrix();
     for (index_t i = 0; i < num_features; i++)
     {
         /* row i holds the values of feature i */
         SGVector<float64_t> vec = feature_matrix.get_row_vector(i);
         float64_t cur_min = vec[0];
         float64_t cur_max = vec[0];

         /* find the max and min values in one loop */
         for (index_t j = 1; j < vec.vlen; j++)
         {
             cur_min = CMath::min(vec[j], cur_min);
             cur_max = CMath::max(vec[j], cur_max);
         }

         /* only rescale if range > 0 */
         const float64_t range = cur_max - cur_min;
         if (range > 0)
         {
             m_min[i] = cur_min;
             m_range[i] = 1.0/range;
         }
         else
         {
             /* identity transform: (x - 0) * 1 */
             m_min[i] = 0.0;
             m_range[i] = 1.0;
         }
     }

     m_initialized = true;
     return true;
 }


 /** Marks the preprocessor as un-initialized.
  *
  *  Only the m_initialized flag is reset; m_min and m_range are left
  *  untouched. A subsequent init() call will recompute them because it
  *  only does work while m_initialized is false.
  */
 void CRescaleFeatures::cleanup()
 {
     m_initialized = false;
 }


 /** Rescales all feature vectors of a dense float64 feature object.
  *
  *  The matrix obtained from get_feature_matrix() is modified through its
  *  column pointers: for every column, m_min is subtracted element-wise and
  *  entry j is then multiplied by m_range[j].
  *
  *  @param features features to rescale; must be non-NULL, report feature
  *         class C_DENSE and feature type F_DREAL, and have as many rows as
  *         m_min and m_range have entries. init() must have succeeded
  *         before (m_initialized is asserted).
  *  @return the rescaled feature matrix
  */
 SGMatrix<float64_t> CRescaleFeatures::apply_to_feature_matrix(CFeatures* features)
 {
     ASSERT(m_initialized);

     /* same validation as init(): the downcast below is unchecked */
     REQUIRE(features, "features must not be NULL!\n");
     ASSERT(features->get_feature_class()==C_DENSE);
     ASSERT(features->get_feature_type()==F_DREAL);

     SGMatrix<float64_t> feature_matrix=
         static_cast<CDenseFeatures<float64_t>*>(features)->get_feature_matrix();
     const index_t num_rows = feature_matrix.num_rows;
     ASSERT(num_rows == m_min.vlen);
     /* m_range is indexed up to num_rows below, so guard its length too */
     ASSERT(num_rows == m_range.vlen);

     for (index_t i = 0; i < feature_matrix.num_cols; i++)
     {
         float64_t* vec = feature_matrix.get_column_vector(i);

         /* vec = vec + (-1.0) * m_min */
         SGVector<float64_t>::vec1_plus_scalar_times_vec2(vec, -1.0, m_min.vector, num_rows);

         /* scale each entry by the reciprocal range of its feature */
         for (index_t j = 0; j < num_rows; j++)
             vec[j] *= m_range[j];
     }

     return feature_matrix;
 }


 /** Rescales a single feature vector.
  *
  *  Computes (vector[i] - m_min[i]) * m_range[i] for every entry and
  *  returns the result in a newly allocated vector; the input buffer is
  *  only read.
  *
  *  @param vector vector to rescale; its length must equal the length of
  *         m_min and m_range. init() must have succeeded before
  *         (m_initialized is asserted).
  *  @return new vector holding the rescaled values
  */
 SGVector<float64_t> CRescaleFeatures::apply_to_feature_vector(SGVector<float64_t> vector)
 {
     ASSERT(m_initialized);
     ASSERT(m_min.vlen == vector.vlen);
     /* m_range is indexed up to vector.vlen below, so guard its length too */
     ASSERT(m_range.vlen == vector.vlen);

     /* allocate the result as an SGVector so the buffer has an owner from
      * the moment it exists, instead of a raw SG_MALLOC pointer that is only
      * wrapped at the return statement */
     SGVector<float64_t> rescaled(vector.vlen);

     /* rescaled = 1.0 * vector + (-1.0) * m_min */
     SGVector<float64_t>::add(rescaled.vector, 1.0, vector.vector, -1.0, m_min.vector, vector.vlen);

     /* scale each entry by the reciprocal range of its feature */
     for (index_t i = 0; i < vector.vlen; i++)
         rescaled[i] *= m_range[i];

     return rescaled;
 }


 /** Registers the members m_min, m_range and m_initialized through SG_ADD
  *  under the names "min", "range" and "initialized", each flagged
  *  MS_NOT_AVAILABLE. Called from the constructor.
  */
 void CRescaleFeatures::register_parameters()
 {
     SG_ADD(&m_min,
            "min",
            "minimum values of each feature",
            MS_NOT_AVAILABLE);
     SG_ADD(&m_range,
            "range",
            "Reciprocal of the range of each feature",
            MS_NOT_AVAILABLE);
     SG_ADD(&m_initialized,
            "initialized",
            "Indicator of the state of the preprocessor.",
            MS_NOT_AVAILABLE);
 }

SG_INFO
#define SG_INFO(...)
Definition: SGIO.h:118

shogun::CDenseFeatures< float64_t >

index_t
int32_t index_t
Definition: common.h:62

shogun::CRescaleFeatures::~CRescaleFeatures
virtual ~CRescaleFeatures()
Definition: RescaleFeatures.cpp:22

shogun::CFeatures::get_num_vectors
virtual int32_t get_num_vectors() const =0

REQUIRE
#define REQUIRE(x,...)
Definition: SGIO.h:206

shogun::SGMatrix::num_cols
index_t num_cols
Definition: SGMatrix.h:378

shogun::SGMatrix::num_rows
index_t num_rows
Definition: SGMatrix.h:376

shogun::SGMatrix< float64_t >

shogun::MS_NOT_AVAILABLE
Definition: SGObject.h:89

shogun::CRescaleFeatures::apply_to_feature_vector
virtual SGVector< float64_t > apply_to_feature_vector(SGVector< float64_t > vector)
Definition: RescaleFeatures.cpp:101

shogun::CRescaleFeatures::CRescaleFeatures
CRescaleFeatures()
Definition: RescaleFeatures.cpp:15

shogun::SGVector::vlen
index_t vlen
Definition: SGVector.h:494

shogun::SGVector::vector
T * vector
Definition: SGVector.h:492

shogun::F_DREAL
Definition: FeatureTypes.h:32

ASSERT
#define ASSERT(x)
Definition: SGIO.h:201

shogun::CDensePreprocessor
Template class DensePreprocessor, base class for preprocessors (cf. CPreprocessor) that apply to CDen...
Definition: DensePreprocessor.h:33

RescaleFeatures.h

shogun::SGVector< float64_t >

float64_t
double float64_t
Definition: common.h:50

shogun::CRescaleFeatures::cleanup
virtual void cleanup()
Definition: RescaleFeatures.cpp:77

shogun::CRescaleFeatures::apply_to_feature_matrix
virtual SGMatrix< float64_t > apply_to_feature_matrix(CFeatures *features)
Definition: RescaleFeatures.cpp:82

shogun::CFeatures::get_feature_class
virtual EFeatureClass get_feature_class() const =0

shogun::SGMatrix::get_column_vector
T * get_column_vector(index_t col) const
Definition: SGMatrix.h:115

shogun::CMath::max
static T max(T a, T b)
Definition: Math.h:168

shogun::C_DENSE
Definition: FeatureTypes.h:41

shogun::SGVector::vec1_plus_scalar_times_vec2
static void vec1_plus_scalar_times_vec2(T *vec1, const T scalar, const T *vec2, int32_t n)
x=x+alpha*y
Definition: SGVector.cpp:531

shogun::CRescaleFeatures::m_min
SGVector< float64_t > m_min
Definition: RescaleFeatures.h:75

shogun::CRescaleFeatures::m_initialized
bool m_initialized
Definition: RescaleFeatures.h:79

shogun
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18

shogun::CRescaleFeatures::m_range
SGVector< float64_t > m_range
Definition: RescaleFeatures.h:77

shogun::CFeatures
The class Features is the base class of all feature objects.
Definition: Features.h:68

shogun::CMath::min
static T min(T a, T b)
Definition: Math.h:157

SG_ADD
#define SG_ADD(...)
Definition: SGObject.h:81

shogun::CFeatures::get_feature_type
virtual EFeatureType get_feature_type() const =0

shogun::SGVector::add
void add(const SGVector< T > x)
Definition: SGVector.cpp:281