SHOGUN 3.2.1
StochasticSOSVM.cpp
/*
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 3 of the License, or
 * (at your option) any later version.
 *
 * Written (W) 2013 Shell Hu
 * Copyright (C) 2013 Shell Hu
 */

#include <shogun/structure/StochasticSOSVM.h>
#include <shogun/labels/LabelsFactory.h>
#include <shogun/mathematics/Math.h>
#include <shogun/lib/SGVector.h>

using namespace shogun;

CStochasticSOSVM::CStochasticSOSVM()
: CLinearStructuredOutputMachine()
{
	init();
}

CStochasticSOSVM::CStochasticSOSVM(
	CStructuredModel* model,
	CStructuredLabels* labs,
	bool do_weighted_averaging,
	bool verbose)
: CLinearStructuredOutputMachine(model, labs)
{
	REQUIRE(model != NULL && labs != NULL,
		"%s::CStochasticSOSVM(): model and labels cannot be NULL!\n", get_name());

	REQUIRE(labs->get_num_labels() > 0,
		"%s::CStochasticSOSVM(): number of labels should be greater than 0!\n", get_name());

	init();
	m_lambda = 1.0 / labs->get_num_labels();
	m_do_weighted_averaging = do_weighted_averaging;
	m_verbose = verbose;
}

void CStochasticSOSVM::init()
{
	SG_ADD(&m_lambda, "lambda", "Regularization constant", MS_NOT_AVAILABLE);
	SG_ADD(&m_num_iter, "num_iter", "Number of iterations", MS_NOT_AVAILABLE);
	SG_ADD(&m_do_weighted_averaging, "do_weighted_averaging", "Do weighted averaging", MS_NOT_AVAILABLE);
	SG_ADD(&m_debug_multiplier, "debug_multiplier", "Debug multiplier", MS_NOT_AVAILABLE);
	SG_ADD(&m_rand_seed, "rand_seed", "Random seed", MS_NOT_AVAILABLE);

	m_lambda = 1.0;
	m_num_iter = 50;
	m_do_weighted_averaging = true;
	m_debug_multiplier = 0;
	m_rand_seed = 1;
}

CStochasticSOSVM::~CStochasticSOSVM()
{
}

EMachineType CStochasticSOSVM::get_classifier_type()
{
	return CT_STOCHASTICSOSVM;
}

bool CStochasticSOSVM::train_machine(CFeatures* data)
{
	SG_DEBUG("Entering CStochasticSOSVM::train_machine.\n");
	if (data)
		set_features(data);

	// Initialize the model for training
	m_model->init_training();
	// Check that the scenario is correct to start with training
	m_model->check_training_setup();
	SG_DEBUG("The training setup is correct.\n");

	// Dimensionality of the joint feature space
	int32_t M = m_model->get_dim();
	// Number of training examples
	int32_t N = CLabelsFactory::to_structured(m_labels)->get_num_labels();

	SG_DEBUG("M=%d, N=%d.\n", M, N);

	// Initialize the weight vector
	m_w = SGVector<float64_t>(M);
	m_w.zero();

	SGVector<float64_t> w_avg;
	if (m_do_weighted_averaging)
		w_avg = m_w.clone();

	// logging
	if (m_verbose)
	{
		if (m_helper != NULL)
			SG_UNREF(m_helper);

		m_helper = new CSOSVMHelper();
		SG_REF(m_helper);
	}
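
	// Debug schedule: with m_debug_multiplier == 0 (the default), the first
	// snapshot is taken after one full pass (k == N) and the logging interval
	// then doubles each time (see the debug_iter update at the end of the loop)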
	int32_t debug_iter = 1;
	if (m_debug_multiplier == 0)
	{
		debug_iter = N;
		m_debug_multiplier = 100;
	}

	CMath::init_random(m_rand_seed);
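
	// The loop below performs stochastic subgradient descent (SSG) on the
	// regularized SO-SVM objective
	//   min_w  lambda/2 ||w||^2 + 1/N sum_i H_i(w),
	// where H_i(w) = max_y ( Delta(y_i,y) + <w, phi(x_i,y) - phi(x_i,y_i)> )
	// is the loss-augmented hinge term for example i; this is the SSG baseline
	// used, e.g., in Lacoste-Julien et al. (2013) for structural SVMs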
	// Main loop
	int32_t k = 0;
	for (int32_t pi = 0; pi < m_num_iter; ++pi)
	{
		for (int32_t si = 0; si < N; ++si)
		{
			// 1) pick a random example
			int32_t i = CMath::random(0, N-1);

			// 2) solve the loss-augmented inference for point i
			CResultSet* result = m_model->argmax(m_w, i);

			// 3) get the subgradient
			// psi_i(y) := phi(x_i,y_i) - phi(x_i,y)
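			// (so -psi_i is a subgradient of H_i at the current w, since
			// y here is the loss-augmented argmax computed above)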
			SGVector<float64_t> psi_i(M);
			SGVector<float64_t> w_s(M);

			if (result->psi_computed)
			{
				SGVector<float64_t>::add(psi_i.vector,
					1.0, result->psi_truth.vector, -1.0, result->psi_pred.vector,
					psi_i.vlen);
			}
			else if (result->psi_computed_sparse)
			{
				psi_i.zero();
				// psi_i = psi_truth - psi_pred, consistent with the dense branch
				result->psi_truth_sparse.add_to_dense(1.0, psi_i.vector, psi_i.vlen);
				result->psi_pred_sparse.add_to_dense(-1.0, psi_i.vector, psi_i.vlen);
			}
			else
			{
				SG_ERROR("model(%s) should have either psi_computed or psi_computed_sparse "
					"set to true\n", m_model->get_name());
			}

			w_s = psi_i.clone();
			w_s.scale(1.0 / (N*m_lambda));
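			// w_s = psi_i / (lambda*N); the factor N is undone by gamma*N in
			// the update below, so the net step on w is (gamma/lambda)*psi_i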

			// 4) step-size gamma
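			//    (the classic 1/k decay for SGD on a lambda-strongly-convex
			//    objective; the 1/lambda factor is folded into w_s above)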
			float64_t gamma = 1.0 / (k+1.0);

			// 5) finally update the weights
			SGVector<float64_t>::add(m_w.vector,
				1.0-gamma, m_w.vector, gamma*N, w_s.vector, m_w.vlen);

			// 6) optionally, update the weighted average
			if (m_do_weighted_averaging)
			{
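				// rho = 2/(k+2) makes w_avg a weighted average that weights
				// iterate w_t proportionally to t, which gives a better
				// guarantee than the plain uniform average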
				float64_t rho = 2.0 / (k+2.0);
				SGVector<float64_t>::add(w_avg.vector,
					1.0-rho, w_avg.vector, rho, m_w.vector, w_avg.vlen);
			}

			k += 1;
			SG_UNREF(result);

			// Debug: compute objective and training error
			if (m_verbose && k == debug_iter)
			{
				SGVector<float64_t> w_debug;
				if (m_do_weighted_averaging)
					w_debug = w_avg.clone();
				else
					w_debug = m_w.clone();

				float64_t primal = CSOSVMHelper::primal_objective(w_debug, m_model, m_lambda);
				float64_t train_error = CSOSVMHelper::average_loss(w_debug, m_model);

				SG_DEBUG("pass %d (iteration %d), SVM primal = %f, train_error = %f\n",
					pi, k, primal, train_error);

				m_helper->add_debug_info(primal, (1.0*k) / N, train_error);

				debug_iter = CMath::min(debug_iter+N, debug_iter*(1+m_debug_multiplier/100));
			}
		}
	}

	if (m_do_weighted_averaging)
		m_w = w_avg.clone();

	if (m_verbose)
		m_helper->terminate();

	SG_DEBUG("Leaving CStochasticSOSVM::train_machine.\n");
	return true;
}

float64_t CStochasticSOSVM::get_lambda() const
{
	return m_lambda;
}

void CStochasticSOSVM::set_lambda(float64_t lbda)
{
	m_lambda = lbda;
}

int32_t CStochasticSOSVM::get_num_iter() const
{
	return m_num_iter;
}

void CStochasticSOSVM::set_num_iter(int32_t num_iter)
{
	m_num_iter = num_iter;
}

int32_t CStochasticSOSVM::get_debug_multiplier() const
{
	return m_debug_multiplier;
}

void CStochasticSOSVM::set_debug_multiplier(int32_t multiplier)
{
	m_debug_multiplier = multiplier;
}

uint32_t CStochasticSOSVM::get_rand_seed() const
{
	return m_rand_seed;
}

void CStochasticSOSVM::set_rand_seed(uint32_t rand_seed)
{
	m_rand_seed = rand_seed;
}
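
A minimal usage sketch (not part of this source file), modeled on Shogun's
multiclass structured-output examples. The toy feature values, labels, and
parameter settings are made up for illustration; any compatible
CStructuredModel/CStructuredLabels pair can stand in for
CMulticlassModel/CMulticlassSOLabels:

	#include <shogun/base/init.h>
	#include <shogun/features/DenseFeatures.h>
	#include <shogun/structure/MulticlassModel.h>
	#include <shogun/structure/MulticlassSOLabels.h>
	#include <shogun/structure/StochasticSOSVM.h>

	using namespace shogun;

	int main()
	{
		init_shogun_with_defaults();

		// Toy data: four 2-D points, two classes.
		SGMatrix<float64_t> feats(2, 4);
		feats(0,0)=1;  feats(1,0)=1;
		feats(0,1)=2;  feats(1,1)=1;
		feats(0,2)=-1; feats(1,2)=-1;
		feats(0,3)=-2; feats(1,3)=-1;

		SGVector<float64_t> labs(4);
		labs[0]=0; labs[1]=0; labs[2]=1; labs[3]=1;

		CDenseFeatures<float64_t>* features = new CDenseFeatures<float64_t>(feats);
		CMulticlassSOLabels* labels = new CMulticlassSOLabels(labs);
		CMulticlassModel* model = new CMulticlassModel(features, labels);

		// weighted averaging on, verbose logging off
		CStochasticSOSVM* sosvm = new CStochasticSOSVM(model, labels, true, false);
		SG_REF(sosvm);
		sosvm->set_num_iter(100);   // passes over the data
		sosvm->set_rand_seed(42);   // reproducible sampling
		sosvm->train();             // runs train_machine() above

		sosvm->get_w().display_vector("learned w");

		SG_UNREF(sosvm);
		exit_shogun();
		return 0;
	}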