SHOGUN  4.1.0
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
FWSOSVM.cpp
Go to the documentation of this file.
1 /*
2  * This program is free software; you can redistribute it and/or modify
3  * it under the terms of the GNU General Public License as published by
4  * the Free Software Foundation; either version 3 of the License, or
5  * (at your option) any later version.
6  *
7  * Written (W) 2014 Shell Hu
8  * Copyright (C) 2014 Shell Hu
9  */
10 
#include <shogun/structure/FWSOSVM.h>
#include <shogun/labels/LabelsFactory.h>
#include <shogun/mathematics/Math.h>
#include <shogun/lib/SGVector.h>
15 
16 using namespace shogun;
17 
20 {
21  init();
22 }
23 
25  CStructuredModel* model,
26  CStructuredLabels* labs,
27  bool do_line_search,
28  bool verbose)
29 : CLinearStructuredOutputMachine(model, labs)
30 {
31  REQUIRE(model != NULL && labs != NULL,
32  "%s::CFWSOSVM(): model and labels cannot be NULL!\n", get_name());
33 
34  REQUIRE(labs->get_num_labels() > 0,
35  "%s::CFWSOSVM(): number of labels should be greater than 0!\n", get_name());
36 
37  init();
38  m_lambda = 1.0 / labs->get_num_labels();
39  m_do_line_search = do_line_search;
40  m_verbose = verbose;
41 }
42 
43 void CFWSOSVM::init()
44 {
45  SG_ADD(&m_lambda, "lambda", "Regularization constant", MS_NOT_AVAILABLE);
46  SG_ADD(&m_num_iter, "num_iter", "Number of iterations", MS_NOT_AVAILABLE);
47  SG_ADD(&m_do_line_search, "do_line_search", "Do line search", MS_NOT_AVAILABLE);
48  SG_ADD(&m_gap_threshold, "gap_threshold", "Gap threshold", MS_NOT_AVAILABLE);
49  SG_ADD(&m_ell, "ell", "Average loss", MS_NOT_AVAILABLE);
50 
51  m_lambda = 1.0;
52  m_num_iter = 50;
53  m_do_line_search = true;
54  m_gap_threshold = 0.1;
55  m_ell = 0;
56 }
57 
59 {
60 }
61 
63 {
64  return CT_FWSOSVM;
65 }
66 
68 {
69  SG_DEBUG("Entering CFWSOSVM::train_machine.\n");
70  if (data)
71  set_features(data);
72 
73  // Initialize the model for training
75  // Check that the scenary is correct to start with training
77  SG_DEBUG("The training setup is correct.\n");
78 
79  // Dimensionality of the joint feature space
80  int32_t M = m_model->get_dim();
81  // Number of training examples
83 
84  SG_DEBUG("M=%d, N =%d.\n", M, N);
85 
86  // Initialize the weight vector
88  m_w.zero();
89 
90  // Initialize the average loss
91  m_ell = 0;
92 
93  // logging
94  if (m_verbose)
95  {
96  if (m_helper != NULL)
98 
99  m_helper = new CSOSVMHelper();
100  SG_REF(m_helper);
101  }
102 
103  // Main loop
104  int32_t k = 0;
105  SGVector<float64_t> w_s(M);
106  float64_t ell_s = 0;
107  for (int32_t pi = 0; pi < m_num_iter; ++pi)
108  {
109  // init w_s and ell_s
110  k = pi;
111  w_s.zero();
112  ell_s = 0;
113 
114  for (int32_t si = 0; si < N; ++si)
115  {
116  // 1) solve the loss-augmented inference for point si
117  CResultSet* result = m_model->argmax(m_w, si);
118 
119  // 2) get the subgradient
120  // psi_i(y) := phi(x_i,y_i) - phi(x_i, y_pred)
121  SGVector<float64_t> psi_i(M);
122  if (result->psi_computed)
123  {
125  1.0, result->psi_truth.vector, -1.0, result->psi_pred.vector,
126  psi_i.vlen);
127  }
128  else if(result->psi_computed_sparse)
129  {
130  psi_i.zero();
131  result->psi_pred_sparse.add_to_dense(1.0, psi_i.vector, psi_i.vlen);
132  result->psi_truth_sparse.add_to_dense(-1.0, psi_i.vector, psi_i.vlen);
133  }
134  else
135  {
136  SG_ERROR("model(%s) should have either of psi_computed or psi_computed_sparse"
137  "to be set true\n", m_model->get_name());
138  }
139 
140  // 3) loss_i = L(y_i, y_pred)
141  float64_t loss_i = result->delta;
142  ASSERT(loss_i - CMath::dot(m_w.vector, psi_i.vector, m_w.vlen) >= -1e-12);
143 
144  // 4) update w_s and ell_s
145  w_s.add(psi_i);
146  ell_s += loss_i;
147 
148  SG_UNREF(result);
149 
150  } // end si
151 
152  w_s.scale(1.0 / (N*m_lambda));
153  ell_s /= N;
154 
155  // 5) duality gap
156  SGVector<float64_t> w_diff = m_w.clone();
157  SGVector<float64_t>::add(w_diff.vector, 1.0, m_w.vector, -1.0, w_s.vector, w_s.vlen);
158  float64_t dual_gap = m_lambda * CMath::dot(m_w.vector, w_diff.vector, m_w.vlen) - m_ell + ell_s;
159 
160  // Debug: compute primal and dual objectives and training error
161  if (m_verbose)
162  {
164  float64_t dual = CSOSVMHelper::dual_objective(m_w, m_ell, m_lambda);
165  ASSERT(CMath::fequals_abs(primal - dual, dual_gap, 1e-12));
166  float64_t train_error = CSOSVMHelper::average_loss(m_w, m_model); // Note train_error isn't ell_s
167 
168  SG_SPRINT("pass %d (iteration %d), primal = %f, dual = %f, duality gap = %f, train_error = %f \n",
169  pi, k, primal, dual, dual_gap, train_error);
170 
171  m_helper->add_debug_info(primal, (1.0*k) / N, train_error, dual, dual_gap);
172  }
173 
174  // 6) check duality gap
175  if (dual_gap <= m_gap_threshold)
176  {
177  SG_DEBUG("iteration %d...\n", k);
178  SG_DEBUG("current gap: %f, gap_threshold: %f\n", dual_gap, m_gap_threshold);
179  SG_DEBUG("Duality gap below threshold -- stopping!\n");
180  break; // stop main loop
181  }
182  else
183  {
184  SG_DEBUG("iteration %d...\n", k);
185  SG_DEBUG("current gap: %f.\n", dual_gap);
186  }
187 
188  // 7) step-size gamma
189  float64_t gamma = 1.0 / (k+1.0);
190  if (m_do_line_search)
191  {
192  gamma = dual_gap / (m_lambda \
193  * (CMath::dot(w_diff.vector, w_diff.vector, w_diff.vlen) + 1e-12));
194  gamma = ((gamma > 1 ? 1 : gamma) < 0) ? 0 : gamma; // clip to [0,1], or max(0,min(1,gamma))
195  }
196 
197  // 8) finally update w and ell
198  SGVector<float64_t>::add(m_w.vector, 1.0-gamma, m_w.vector, gamma, w_s.vector, m_w.vlen);
199  m_ell = (1.0-gamma) * m_ell + gamma * ell_s;
200 
201  } // end pi
202 
203  if (m_verbose)
204  m_helper->terminate();
205 
206  SG_DEBUG("Leaving CFWSOSVM::train_machine.\n");
207  return true;
208 }
209 
211 {
212  return m_lambda;
213 }
214 
216 {
217  m_lambda = lbda;
218 }
219 
220 int32_t CFWSOSVM::get_num_iter() const
221 {
222  return m_num_iter;
223 }
224 
225 void CFWSOSVM::set_num_iter(int32_t num_iter)
226 {
227  m_num_iter = num_iter;
228 }
229 
231 {
232  return m_gap_threshold;
233 }
234 
236 {
237  m_gap_threshold = gap_threshold;
238 }
239 
241 {
242  return m_ell;
243 }
244 
246 {
247  m_ell = ell;
248 }
249 
SGVector< float64_t > psi_truth
EMachineType
Definition: Machine.h:33
Base class of the labels used in Structured Output (SO) problems.
void set_ell(float64_t ell)
Definition: FWSOSVM.cpp:245
CLabels * m_labels
Definition: Machine.h:361
#define SG_ERROR(...)
Definition: SGIO.h:129
#define REQUIRE(x,...)
Definition: SGIO.h:206
static float64_t primal_objective(SGVector< float64_t > w, CStructuredModel *model, float64_t lbda)
Definition: SOSVMHelper.cpp:57
virtual int32_t get_dim() const =0
static bool fequals_abs(const T &a, const T &b, const float64_t eps)
Definition: Math.h:318
void scale(T alpha)
Scale vector inplace.
Definition: SGVector.cpp:843
#define SG_REF(x)
Definition: SGObject.h:51
float64_t get_lambda() const
Definition: FWSOSVM.cpp:210
int32_t get_num_iter() const
Definition: FWSOSVM.cpp:220
virtual bool train_machine(CFeatures *data=NULL)
Definition: FWSOSVM.cpp:67
index_t vlen
Definition: SGVector.h:494
#define SG_SPRINT(...)
Definition: SGIO.h:180
void set_lambda(float64_t lbda)
Definition: FWSOSVM.cpp:215
#define ASSERT(x)
Definition: SGIO.h:201
float64_t get_gap_threshold() const
Definition: FWSOSVM.cpp:230
void add_to_dense(T alpha, T *vec, int32_t dim, bool abs_val=false)
double float64_t
Definition: common.h:50
static float64_t dual_objective(SGVector< float64_t > w, float64_t aloss, float64_t lbda)
Definition: SOSVMHelper.cpp:83
class CSOSVMHelper contains helper functions to compute primal objectives, dual objectives, average training losses, duality gaps etc. These values will be recorded to check convergence. This class is inspired by the matlab implementation of the block coordinate Frank-Wolfe SOSVM solver [1].
Definition: SOSVMHelper.h:31
void set_gap_threshold(float64_t gap_threshold)
Definition: FWSOSVM.cpp:235
float64_t get_ell() const
Definition: FWSOSVM.cpp:240
static float64_t dot(const bool *v1, const bool *v2, int32_t n)
Compute dot product between v1 and v2 (blas optimized)
Definition: Math.h:627
virtual bool check_training_setup() const
static float64_t average_loss(SGVector< float64_t > w, CStructuredModel *model, bool is_ub=false)
Definition: SOSVMHelper.cpp:88
Class CStructuredModel that represents the application specific model and contains most of the applic...
#define SG_UNREF(x)
Definition: SGObject.h:52
#define SG_DEBUG(...)
Definition: SGIO.h:107
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18
virtual const char * get_name() const
Definition: FWSOSVM.h:46
virtual CResultSet * argmax(SGVector< float64_t > w, int32_t feat_idx, bool const training=true)=0
virtual void add_debug_info(float64_t primal, float64_t eff_pass, float64_t train_error, float64_t dual=-1, float64_t dgap=-1)
virtual int32_t get_num_labels() const
The class Features is the base class of all feature objects.
Definition: Features.h:68
SGVector< T > clone() const
Definition: SGVector.cpp:209
void set_num_iter(int32_t num_iter)
Definition: FWSOSVM.cpp:225
SGVector< float64_t > psi_pred
SGSparseVector< float64_t > psi_truth_sparse
static CStructuredLabels * to_structured(CLabels *base_labels)
#define SG_ADD(...)
Definition: SGObject.h:81
virtual const char * get_name() const
virtual EMachineType get_classifier_type()
Definition: FWSOSVM.cpp:62
SGSparseVector< float64_t > psi_pred_sparse
void add(const SGVector< T > x)
Definition: SGVector.cpp:281

SHOGUN Machine Learning Toolbox - Documentation