en/current/ExplicitSpecFeatures_8cpp_source.html

 /*

  * This program is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 3 of the License, or

  * (at your option) any later version.

  *

  * Written (W) 2009 Soeren Sonnenburg

  * Copyright (C) 2009 Fraunhofer Institute FIRST and Max-Planck-Society

  */


 #include <shogun/features/ExplicitSpecFeatures.h>

 #include <shogun/mathematics/Math.h>

 #include <shogun/io/SGIO.h>


 using namespace shogun;


 CExplicitSpecFeatures::CExplicitSpecFeatures() :CDotFeatures()

 {

     SG_UNSTABLE("CExplicitSpecFeatures::CExplicitSpecFeatures()",

                 "\n");


     use_normalization = false;

     num_strings = 0;

     alphabet_size = 0;


     spec_size = 0;

     k_spectrum = NULL;

 }


 CExplicitSpecFeatures::CExplicitSpecFeatures(CStringFeatures<uint16_t>* str, bool normalize) : CDotFeatures()

 {

     ASSERT(str)


     use_normalization=normalize;

     num_strings = str->get_num_vectors();

     spec_size = str->get_num_symbols();


     obtain_kmer_spectrum(str);


     SG_DEBUG("SPEC size=%d, num_str=%d\n", spec_size, num_strings)

 }


 CExplicitSpecFeatures::CExplicitSpecFeatures(const CExplicitSpecFeatures& orig) : CDotFeatures(orig),

     num_strings(orig.num_strings), alphabet_size(orig.alphabet_size), spec_size(orig.spec_size)

 {

     k_spectrum= SG_MALLOC(float64_t*, num_strings);

     for (int32_t i=0; i<num_strings; i++)

         k_spectrum[i]=SGVector<float64_t>::clone_vector(k_spectrum[i], spec_size);

 }


 CExplicitSpecFeatures::~CExplicitSpecFeatures()

 {

     delete_kmer_spectrum();

 }


 int32_t CExplicitSpecFeatures::get_dim_feature_space() const

 {

     return spec_size;

 }


 float64_t CExplicitSpecFeatures::dot(int32_t vec_idx1, CDotFeatures* df, int32_t vec_idx2)

 {

     ASSERT(df)

     ASSERT(df->get_feature_type() == get_feature_type())

     ASSERT(df->get_feature_class() == get_feature_class())

     CExplicitSpecFeatures* sf = (CExplicitSpecFeatures*) df;


     ASSERT(vec_idx1 < num_strings)

     ASSERT(vec_idx2 < sf->num_strings)

     float64_t* vec1=k_spectrum[vec_idx1];

     float64_t* vec2=sf->k_spectrum[vec_idx2];


     return CMath::dot(vec1, vec2, spec_size);

 }


 float64_t CExplicitSpecFeatures::dense_dot(int32_t vec_idx1, const float64_t* vec2, int32_t vec2_len)

 {

     ASSERT(vec2_len == spec_size)

     ASSERT(vec_idx1 < num_strings)

     float64_t* vec1=k_spectrum[vec_idx1];

     float64_t result=0;


     for (int32_t i=0; i<spec_size; i++)

         result+=vec1[i]*vec2[i];


     return result;

 }


 void CExplicitSpecFeatures::add_to_dense_vec(float64_t alpha, int32_t vec_idx1, float64_t* vec2, int32_t vec2_len, bool abs_val)

 {

     ASSERT(vec2_len == spec_size)

     ASSERT(vec_idx1 < num_strings)

     float64_t* vec1=k_spectrum[vec_idx1];


     if (abs_val)

     {

         for (int32_t i=0; i<spec_size; i++)

             vec2[i]+=alpha*CMath::abs(vec1[i]);

     }

     else

     {

         for (int32_t i=0; i<spec_size; i++)

             vec2[i]+=alpha*vec1[i];

     }

 }


 void CExplicitSpecFeatures::obtain_kmer_spectrum(CStringFeatures<uint16_t>* str)

 {

     k_spectrum= SG_MALLOC(float64_t*, num_strings);


     for (int32_t i=0; i<num_strings; i++)

     {

         k_spectrum[i]=SG_MALLOC(float64_t, spec_size);

         memset(k_spectrum[i], 0, sizeof(float64_t)*spec_size);


         int32_t len=0;

         bool free_fv;

         uint16_t* fv=str->get_feature_vector(i, len, free_fv);


         for (int32_t j=0; j<len; j++)

             k_spectrum[i][fv[j]]++;


         str->free_feature_vector(fv, i, free_fv);


         if (use_normalization)

         {

             float64_t n=0;

             for (int32_t j=0; j<spec_size; j++)

                 n+=CMath::sq(k_spectrum[i][j]);


             n=CMath::sqrt(n);


             for (int32_t j=0; j<spec_size; j++)

                 k_spectrum[i][j]/=n;

         }

     }

 }


 void CExplicitSpecFeatures::delete_kmer_spectrum()

 {

     for (int32_t i=0; i<num_strings; i++)

         SG_FREE(k_spectrum[i]);


     SG_FREE(k_spectrum);

     k_spectrum=NULL;

 }


 CFeatures* CExplicitSpecFeatures::duplicate() const

 {

     return new CExplicitSpecFeatures(*this);

 }


 void* CExplicitSpecFeatures::get_feature_iterator(int32_t vector_index)

 {

     SG_NOTIMPLEMENTED

     return NULL;

 }


 bool CExplicitSpecFeatures::get_next_feature(int32_t& index, float64_t& value, void* iterator)

 {

     SG_NOTIMPLEMENTED

     return false;

 }


 void CExplicitSpecFeatures::free_feature_iterator(void* iterator)

 {

     SG_NOTIMPLEMENTED

 }


 int32_t CExplicitSpecFeatures::get_nnz_features_for_vector(int32_t num)

 {

     SG_NOTIMPLEMENTED

     return 0;

 }


 EFeatureType CExplicitSpecFeatures::get_feature_type() const

 {

     return F_UNKNOWN;

 }


 EFeatureClass CExplicitSpecFeatures::get_feature_class() const

 {

     return C_SPEC;

 }


 int32_t CExplicitSpecFeatures::get_num_vectors() const

 {

     return num_strings;

 }

shogun::CExplicitSpecFeatures::alphabet_size
int32_t alphabet_size
Definition: ExplicitSpecFeatures.h:183

ExplicitSpecFeatures.h

shogun::CStringFeatures::get_feature_vector
SGVector< ST > get_feature_vector(int32_t num)
Definition: StringFeatures.cpp:223

shogun::F_UNKNOWN
Definition: FeatureTypes.h:21

shogun::CExplicitSpecFeatures::delete_kmer_spectrum
void delete_kmer_spectrum()
Definition: ExplicitSpecFeatures.cpp:140

shogun::CExplicitSpecFeatures::k_spectrum
float64_t ** k_spectrum
Definition: ExplicitSpecFeatures.h:188

shogun::CStringFeatures< uint16_t >

Math.h

shogun::CExplicitSpecFeatures::obtain_kmer_spectrum
void obtain_kmer_spectrum(CStringFeatures< uint16_t > *str)
Definition: ExplicitSpecFeatures.cpp:108

shogun::CExplicitSpecFeatures::dot
virtual float64_t dot(int32_t vec_idx1, CDotFeatures *df, int32_t vec_idx2)
Definition: ExplicitSpecFeatures.cpp:62

SGIO.h

shogun::CExplicitSpecFeatures::get_next_feature
virtual bool get_next_feature(int32_t &index, float64_t &value, void *iterator)
Definition: ExplicitSpecFeatures.cpp:162

shogun::CExplicitSpecFeatures::get_dim_feature_space
virtual int32_t get_dim_feature_space() const
Definition: ExplicitSpecFeatures.cpp:57

shogun::CStringFeatures::get_num_vectors
virtual int32_t get_num_vectors() const
Definition: StringFeatures.cpp:420

shogun::CMath::sq
static T sq(T x)
Definition: Math.h:450

SG_NOTIMPLEMENTED
#define SG_NOTIMPLEMENTED
Definition: SGIO.h:139

shogun::CExplicitSpecFeatures::num_strings
int32_t num_strings
Definition: ExplicitSpecFeatures.h:181

shogun::CExplicitSpecFeatures::duplicate
virtual CFeatures * duplicate() const
Definition: ExplicitSpecFeatures.cpp:149

shogun::CStringFeatures::free_feature_vector
void free_feature_vector(ST *feat_vec, int32_t num, bool dofree)
Definition: StringFeatures.cpp:357

shogun::CDotFeatures
Features that support dot products among other operations.
Definition: DotFeatures.h:44

shogun::EFeatureClass
EFeatureClass
shogun feature class
Definition: FeatureTypes.h:38

shogun::CStringFeatures::get_num_symbols
floatmax_t get_num_symbols()
Definition: StringFeatures.cpp:425

ASSERT
#define ASSERT(x)
Definition: SGIO.h:201

shogun::CExplicitSpecFeatures::~CExplicitSpecFeatures
virtual ~CExplicitSpecFeatures()
Definition: ExplicitSpecFeatures.cpp:52

shogun::CExplicitSpecFeatures::spec_size
int32_t spec_size
Definition: ExplicitSpecFeatures.h:186

shogun::SGVector
shogun vector
Definition: base/Parameter.h:28

shogun::CExplicitSpecFeatures::add_to_dense_vec
virtual void add_to_dense_vec(float64_t alpha, int32_t vec_idx1, float64_t *vec2, int32_t vec2_len, bool abs_val=false)
Definition: ExplicitSpecFeatures.cpp:90

float64_t
double float64_t
Definition: common.h:50

shogun::CFeatures::get_feature_class
virtual EFeatureClass get_feature_class() const =0

shogun::CExplicitSpecFeatures::CExplicitSpecFeatures
CExplicitSpecFeatures()
Definition: ExplicitSpecFeatures.cpp:17

shogun::CExplicitSpecFeatures::get_num_vectors
virtual int32_t get_num_vectors() const
Definition: ExplicitSpecFeatures.cpp:189

shogun::CMath::dot
static float64_t dot(const bool *v1, const bool *v2, int32_t n)
Compute dot product between v1 and v2 (blas optimized)
Definition: Math.h:627

shogun::CExplicitSpecFeatures
Features that compute the Spectrum Kernel feature space explicitly.
Definition: ExplicitSpecFeatures.h:28

shogun::CExplicitSpecFeatures::get_feature_type
virtual EFeatureType get_feature_type() const
Definition: ExplicitSpecFeatures.cpp:179

shogun::EFeatureType
EFeatureType
shogun feature type
Definition: FeatureTypes.h:19

shogun::CExplicitSpecFeatures::free_feature_iterator
virtual void free_feature_iterator(void *iterator)
Definition: ExplicitSpecFeatures.cpp:168

SG_DEBUG
#define SG_DEBUG(...)
Definition: SGIO.h:107

shogun
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18

shogun::CFeatures
The class Features is the base class of all feature objects.
Definition: Features.h:68

shogun::CExplicitSpecFeatures::dense_dot
virtual float64_t dense_dot(int32_t vec_idx1, const float64_t *vec2, int32_t vec2_len)
Definition: ExplicitSpecFeatures.cpp:77

shogun::C_SPEC
Definition: FeatureTypes.h:47

shogun::CMath::sqrt
static float32_t sqrt(float32_t x)
Definition: Math.h:459

shogun::CExplicitSpecFeatures::get_nnz_features_for_vector
virtual int32_t get_nnz_features_for_vector(int32_t num)
Definition: ExplicitSpecFeatures.cpp:173

SG_UNSTABLE
#define SG_UNSTABLE(func,...)
Definition: SGIO.h:132

shogun::CExplicitSpecFeatures::use_normalization
bool use_normalization
Definition: ExplicitSpecFeatures.h:179

shogun::CFeatures::get_feature_type
virtual EFeatureType get_feature_type() const =0

shogun::CExplicitSpecFeatures::get_feature_class
virtual EFeatureClass get_feature_class() const
Definition: ExplicitSpecFeatures.cpp:184

shogun::CMath::abs
static T abs(T a)
Definition: Math.h:179

shogun::CExplicitSpecFeatures::get_feature_iterator
virtual void * get_feature_iterator(int32_t vector_index)
Definition: ExplicitSpecFeatures.cpp:156