OnlineLibLinear.cpp
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 3 of the License, or
 * (at your option) any later version.
 *
 * Written (W) 2007-2010 Soeren Sonnenburg
 * Written (W) 2011 Shashwat Lal Das
 * Modifications (W) 2013 Thoralf Klein
 * Copyright (c) 2007-2009 The LIBLINEAR Project.
 * Copyright (C) 2007-2010 Fraunhofer Institute FIRST and Max-Planck-Society
 */

#include <shogun/classifier/svm/OnlineLibLinear.h>
#include <shogun/features/streaming/StreamingDenseFeatures.h>
#include <shogun/features/streaming/StreamingSparseFeatures.h>
#include <shogun/lib/Time.h>

using namespace shogun;
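
// COnlineLibLinear implements a purely online variant of CLibLinear, using the
// L2R_L1LOSS_SVC_DUAL solver only: each example drawn from the stream triggers
// exactly one dual coordinate-descent step (see train_one() below).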

COnlineLibLinear::COnlineLibLinear()
	: COnlineLinearMachine()
{
	init();
}

COnlineLibLinear::COnlineLibLinear(float64_t C_reg)
{
	init();
	C1=C_reg;
	C2=C_reg;
	use_bias=true;
}

COnlineLibLinear::COnlineLibLinear(
	float64_t C_reg, CStreamingDotFeatures* traindat)
{
	init();
	C1=C_reg;
	C2=C_reg;
	use_bias=true;

	set_features(traindat);
}

COnlineLibLinear::COnlineLibLinear(COnlineLibLinear *mch)
{
	init();
	C1 = mch->C1;
	C2 = mch->C2;
	use_bias = mch->use_bias;

	set_features(mch->features);

	// deep-copy the learned weight vector, if any
	w_dim = mch->w_dim;
	if (w_dim > 0)
	{
		w = SG_MALLOC(float32_t, w_dim);
		memcpy(w, mch->w, w_dim*sizeof(float32_t));
	}
	else
	{
		w = NULL;
	}
	bias = mch->bias;
}


void COnlineLibLinear::init()
{
	C1=1;
	C2=1;
	Cp=1;
	Cn=1;
	use_bias=false;

	m_parameters->add(&C1, "C1", "C Cost constant 1.");
	m_parameters->add(&C2, "C2", "C Cost constant 2.");
	m_parameters->add(&use_bias, "use_bias", "Indicates if bias is used.");

	PG = 0;
	PGmax_old = CMath::INFTY;
	PGmin_old = -CMath::INFTY;
	PGmax_new = -CMath::INFTY;
	PGmin_new = CMath::INFTY;

	diag[0]=0; diag[1]=0; diag[2]=0;
	upper_bound[0]=Cn; upper_bound[1]=0; upper_bound[2]=Cp;

	v = 0;
	nSV = 0;

	// TODO: "local" variables only used in one method
	C = 0;
	d = 0;
	G = 0;
	QD = 0;
	alpha_current = 0;
}
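
/*
 * Note on the solver constants above: diag = {0, 0, 0} and
 * upper_bound = {Cn, 0, Cp} select the L1-loss (hinge) variant of
 * LIBLINEAR's dual coordinate-descent solver, where each dual variable is
 * box-constrained to [0, C]. The L2-loss variant would instead use
 * diag = {0.5/Cn, 0, 0.5/Cp} with an infinite upper bound; this class
 * implements only the L1-loss case, which is why the diag terms in
 * train_one() below vanish.
 */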

COnlineLibLinear::~COnlineLibLinear()
{
}

void COnlineLibLinear::start_train()
{
	Cp = C1;
	Cn = C2;
	bias = false;

	PGmax_old = CMath::INFTY;
	PGmin_old = -CMath::INFTY;
	PGmax_new = -CMath::INFTY;
	PGmin_new = CMath::INFTY;

	diag[0]=0; diag[1]=0; diag[2]=0;
	upper_bound[0]=Cn; upper_bound[1]=0; upper_bound[2]=Cp;

	v = 0;
	nSV = 0;
}

void COnlineLibLinear::stop_train()
{
	float64_t gap = PGmax_new - PGmin_new;

	SG_DONE()
	SG_INFO("Optimization finished.\n")

	// calculate the objective value: the alpha terms were accumulated
	// incrementally in train_one(); add ||w||^2 + b^2 here
	for (int32_t i=0; i<w_dim; i++)
		v += w[i]*w[i];
	v += bias*bias;

	SG_INFO("Objective value = %lf\n", v/2)
	SG_INFO("nSV = %d\n", nSV)
	SG_INFO("gap = %g\n", gap)
}
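
/*
 * Both train_one() overloads below perform a single coordinate-descent step
 * of the LIBLINEAR L2R_L1LOSS_SVC_DUAL solver on one fresh example (x, y),
 * y in {-1, +1}. In the dual problem
 *
 *     min_alpha  0.5 * alpha^T Q alpha - e^T alpha,   0 <= alpha_i <= C,
 *
 * with Q_ij = y_i y_j x_i . x_j, the new example's dual variable starts at
 * alpha = 0, its gradient is G = y * (w . x + b) - 1, and the projected
 * gradient PG decides whether the step can be skipped. The update clips
 * alpha - G/QD to [0, C] (QD = x . x plus the diagonal term) and folds the
 * change back into w via w += (alpha_new - alpha_old) * y * x.
 */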
void COnlineLibLinear::train_one(SGVector<float32_t> ex, float64_t label)
{
	alpha_current = 0;
	int32_t y_current = 0;
	if (label > 0)
		y_current = +1;
	else
		y_current = -1;

	QD = diag[y_current + 1];
	// Dot product of the example with itself
	QD += CMath::dot(ex.vector, ex.vector, ex.vlen);

	// Dot product of the example with the learned weights
	G = CMath::dot(ex.vector, w, w_dim);

	if (use_bias)
		G += bias;
	// gradient of the dual objective; the -1 is its linear term
	G = G*y_current - 1;

	C = upper_bound[y_current + 1];
	G += alpha_current*diag[y_current + 1]; // Can be eliminated, since diag = 0 vector

	PG = 0;
	if (alpha_current == 0) // This condition will always be true in the online version
	{
		if (G > PGmax_old)
		{
			return;
		}
		else if (G < 0)
			PG = G;
	}
	else if (alpha_current == C)
	{
		if (G < PGmin_old)
		{
			return;
		}
		else if (G > 0)
			PG = G;
	}
	else
		PG = G;

	PGmax_new = CMath::max(PGmax_new, PG);
	PGmin_new = CMath::min(PGmin_new, PG);

	if (fabs(PG) > 1.0e-12)
	{
		float64_t alpha_old = alpha_current;
		alpha_current = CMath::min(CMath::max(alpha_current - G/QD, 0.0), C);
		d = (alpha_current - alpha_old) * y_current;

		for (int32_t i=0; i < w_dim; ++i)
			w[i] += d*ex[i];

		if (use_bias)
			bias += d;
	}

	v += alpha_current*(alpha_current*diag[y_current + 1] - 2);
	if (alpha_current > 0)
		nSV++;
}
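
// The sparse overload is the same update; only the dot products and the
// weight update are restricted to the example's nonzero entries.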
void COnlineLibLinear::train_one(SGSparseVector<float32_t> ex, float64_t label)
{
	alpha_current = 0;
	int32_t y_current = 0;
	if (label > 0)
		y_current = +1;
	else
		y_current = -1;

	QD = diag[y_current + 1];
	// Dot product of the example with itself
	QD += ex.sparse_dot(ex);

	// Dot product of the example with the learned weights
	G = ex.dense_dot(1.0,w,w_dim,0.0);

	if (use_bias)
		G += bias;
	// gradient of the dual objective; the -1 is its linear term
	G = G*y_current - 1;

	C = upper_bound[y_current + 1];
	G += alpha_current*diag[y_current + 1]; // Can be eliminated, since diag = 0 vector

	PG = 0;
	if (alpha_current == 0) // This condition will always be true in the online version
	{
		if (G > PGmax_old)
		{
			return;
		}
		else if (G < 0)
			PG = G;
	}
	else if (alpha_current == C)
	{
		if (G < PGmin_old)
		{
			return;
		}
		else if (G > 0)
			PG = G;
	}
	else
		PG = G;

	PGmax_new = CMath::max(PGmax_new, PG);
	PGmin_new = CMath::min(PGmin_new, PG);

	if (fabs(PG) > 1.0e-12)
	{
		float64_t alpha_old = alpha_current;
		alpha_current = CMath::min(CMath::max(alpha_current - G/QD, 0.0), C);
		d = (alpha_current - alpha_old) * y_current;

		for (int32_t i=0; i < ex.num_feat_entries; i++)
			w[ex.features[i].feat_index] += d*ex.features[i].entry;

		if (use_bias)
			bias += d;
	}

	v += alpha_current*(alpha_current*diag[y_current + 1] - 2);
	if (alpha_current > 0)
		nSV++;
}

void COnlineLibLinear::train_example(CStreamingDotFeatures *feature, float64_t label)
{
	// grow w if the incoming example has more dimensions than seen so far
	feature->expand_if_required(w, w_dim);

	if (feature->get_feature_class() == C_STREAMING_DENSE) {
		CStreamingDenseFeatures<float32_t>* feat =
			dynamic_cast<CStreamingDenseFeatures<float32_t>*>(feature);
		if (feat == NULL)
			SG_ERROR("Expected streaming dense feature <float32_t>\n")

		train_one(feat->get_vector(), label);
	}
	else if (feature->get_feature_class() == C_STREAMING_SPARSE) {
		CStreamingSparseFeatures<float32_t>* feat =
			dynamic_cast<CStreamingSparseFeatures<float32_t>*>(feature);
		if (feat == NULL)
			SG_ERROR("Expected streaming sparse feature <float32_t>\n")

		train_one(feat->get_vector(), label);
	}
	else {
		SG_NOTIMPLEMENTED
	}
}
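
/*
 * Usage sketch: a minimal, self-contained program showing how this class is
 * typically driven. The training file name "train.dat" and its dense ASCII
 * format (label followed by feature values on each line) are assumptions for
 * illustration; the calls themselves are the public Shogun 4.x streaming API.
 * train(), inherited from COnlineLinearMachine, starts the parser and feeds
 * each streamed example to train_example() above.
 */
#include <shogun/base/init.h>
#include <shogun/io/streaming/StreamingAsciiFile.h>
#include <shogun/features/streaming/StreamingDenseFeatures.h>
#include <shogun/classifier/svm/OnlineLibLinear.h>

using namespace shogun;

int main()
{
	init_shogun_with_defaults();

	// stream labelled examples from an ASCII file (path is hypothetical)
	CStreamingAsciiFile* file = new CStreamingAsciiFile("train.dat");
	CStreamingDenseFeatures<float32_t>* features =
		new CStreamingDenseFeatures<float32_t>(file, true /*labelled*/, 1024 /*parser buffer*/);

	// C = 1.0 regularization; one dual coordinate-descent step per example
	COnlineLibLinear* svm = new COnlineLibLinear(1.0, features);
	svm->train();

	SG_UNREF(svm);
	exit_shogun();
	return 0;
}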