cn/current/PrimalMosekSOSVM_8cpp_source.html

 /*

  * This program is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 3 of the License, or

  * (at your option) any later version.

  *

  * Written (W) 2014 Shell Hu

  * Written (W) 2012 Fernando José Iglesias García

  * Copyright (C) 2012 Fernando José Iglesias García

  */


 #ifdef USE_MOSEK


 #include <shogun/lib/DynamicObjectArray.h>

 #include <shogun/lib/List.h>

 #include <shogun/mathematics/Math.h>

 #include <shogun/structure/PrimalMosekSOSVM.h>

 #include <shogun/loss/HingeLoss.h>


 using namespace shogun;


 /**
  * Default constructor. Builds the base machine without arguments, starts the
  * cached primal objective value at zero and lets init() register the
  * parameters and set their defaults.
  */
 CPrimalMosekSOSVM::CPrimalMosekSOSVM()
     : CLinearStructuredOutputMachine(), po_value(0.0)
 {
     init();
 }


 /**
  * Constructor taking the structured model and the training labels.
  *
  * @param model structured model forwarded to the base machine
  * @param labs  structured labels forwarded to the base machine
  */
 CPrimalMosekSOSVM::CPrimalMosekSOSVM(CStructuredModel* model, CStructuredLabels* labs)
     : CLinearStructuredOutputMachine(model, labs), po_value(0.0)
 {
     // Register parameters and set the default regularization / epsilon
     init();
 }


 /**
  * Shared constructor helper: sets the default regularization constant (1.0)
  * and violation tolerance (0.0) and registers the member parameters.
  */
 void CPrimalMosekSOSVM::init()
 {
     // Default hyper-parameters
     m_regularization = 1.0;
     m_epsilon = 0.0;

     // Parameter registration (order kept as-is)
     SG_ADD(&m_slacks, "slacks", "Slacks vector", MS_NOT_AVAILABLE);
     //FIXME model selection available for SO machines
     SG_ADD(&m_regularization, "regularization", "Regularization constant", MS_NOT_AVAILABLE);
     SG_ADD(&m_epsilon, "epsilon", "Violation tolerance", MS_NOT_AVAILABLE);
     SG_ADD(&m_lb, "lb", "Lower bounds", MS_NOT_AVAILABLE);
     SG_ADD(&m_ub, "ub", "Upper bounds", MS_NOT_AVAILABLE);
 }


 /** Destructor. Performs no explicit cleanup of its own. */
 CPrimalMosekSOSVM::~CPrimalMosekSOSVM() {}


 /**
  * Trains the SO-SVM with a cutting-plane scheme that uses MOSEK as QP solver.
  *
  * In every pass over the training set the model is asked for the
  * loss-augmented prediction of each example. The prediction becomes a new
  * constraint of the QP when the example has no stored constraint yet, or when
  * its hinge loss exceeds the largest hinge loss among the constraints already
  * stored for that example by more than m_epsilon. After each pass the QP is
  * solved again and the weights, auxiliary variables and slacks are read back
  * from the solution. The procedure stops when a pass adds no constraint or
  * when a result could not be stored.
  *
  * @param data training features; when non-NULL they replace the current ones
  * @return true if training ran to completion, false if it was aborted because
  *         a result set could not be inserted in its constraint list
  */
 bool CPrimalMosekSOSVM::train_machine(CFeatures* data)
 {
     SG_DEBUG("Entering CPrimalMosekSOSVM::train_machine.\n");
     if (data)
         set_features(data);

     CFeatures* model_features = get_features();
     // Initialize the model for training
     m_model->init_training();
     // Check that the scenario is correct to start with training
     m_model->check_training_setup();
     SG_DEBUG("The training setup is correct.\n");

     // Dimensionality of the joint feature space
     int32_t M = m_model->get_dim();
     // Number of auxiliary variables in the optimization vector
     int32_t num_aux = m_model->get_num_aux();
     // Number of auxiliary constraints
     int32_t num_aux_con = m_model->get_num_aux_con();
     // Number of training examples
     int32_t N = model_features->get_num_vectors();

     SG_DEBUG("M=%d, N =%d, num_aux=%d, num_aux_con=%d.\n", M, N, num_aux, num_aux_con);

     // Interface with MOSEK
     CMosek* mosek = new CMosek(0, M+num_aux+N);
     SG_REF(mosek);
     REQUIRE(mosek->get_rescode() == MSK_RES_OK, "Mosek object could not be properly created in PrimalMosekSOSVM training.\n");

     // Initialize the terms of the optimization problem
     SGMatrix< float64_t > A, B, C;
     SGVector< float64_t > a, b, lb, ub;
     m_model->init_primal_opt(m_regularization, A, a, B, b, lb, ub, C);

     REQUIRE(lb.vlen == 0 || lb.vlen == M,
         "%s::train_machine(): lb.vlen can only be 0 or w.vlen!\n", get_name());

     REQUIRE(ub.vlen == 0 || ub.vlen == M,
         "%s::train_machine(): ub.vlen can only be 0 or w.vlen!\n", get_name());

     // Bounds supplied by the model override the ones stored in the machine
     if (lb.vlen == M)
         set_lower_bounds(lb);

     if (ub.vlen == M)
         set_upper_bounds(ub);

     SG_DEBUG("Regularization used in PrimalMosekSOSVM equal to %.2f.\n", m_regularization);

     // Input terms of the problem that do not change between iterations
     REQUIRE(mosek->init_sosvm(M, N, num_aux, num_aux_con, C, m_lb, m_ub, A, b) == MSK_RES_OK,
         "Mosek error in PrimalMosekSOSVM initializing SO-SVM.\n");

     // Initialize the weight vector
     m_w = SGVector< float64_t >(M);
     m_w.zero();

     m_slacks = SGVector< float64_t >(N);
     m_slacks.zero();

     // Initialize the list of constraints
     // Each element in results is a list of CResultSet with the constraints
     // associated to each training example
     CDynamicObjectArray* results = new CDynamicObjectArray(N);
     SG_REF(results);
     for ( int32_t i = 0 ; i < N ; ++i )
     {
         CList* list = new CList(true);
         results->push_back(list);
     }

     // Initialize variables used in the loop
     int32_t     num_con     = num_aux_con;  // number of constraints
     int32_t     old_num_con = num_con;
     bool        exception   = false;
     index_t     iteration   = 0;

     // Layout of the solution vector: [ w (M) | aux (num_aux) | slacks (N) ]
     SGVector< float64_t > sol(M+num_aux+N);
     sol.zero();

     SGVector< float64_t > aux(num_aux);

     do
     {
         SG_DEBUG("Iteration #%d: Cutting plane training with num_con=%d and old_num_con=%d.\n",
                 iteration, num_con, old_num_con);

         old_num_con = num_con;

         for ( int32_t i = 0 ; i < N ; ++i )
         {
             // Predict the result of the ith training example (loss-aug)
             CResultSet* result = m_model->argmax(m_w, i);

             // Compute the loss associated with the prediction (surrogate loss, max(0, \tilde{H}))
             float64_t slack = CHingeLoss().loss( compute_loss_arg(result) );
             CList* cur_list = (CList*) results->get_element(i);

             // An example without stored constraints (first pass of the
             // do ... while) always contributes its prediction
             bool violated = true;

             if ( cur_list->get_num_elements() > 0 )
             {
                 // Find the maximum loss within the elements of
                 // the list of constraints
                 CResultSet* cur_res = (CResultSet*) cur_list->get_first_element();
                 float64_t max_slack = -CMath::INFTY;

                 while ( cur_res != NULL )
                 {
                     max_slack = CMath::max(max_slack, CHingeLoss().loss( compute_loss_arg(cur_res) ));

                     // Release each element once it has been inspected
                     SG_UNREF(cur_res);
                     cur_res = (CResultSet*) cur_list->get_next_element();
                 }

                 violated = slack > max_slack + m_epsilon;
             }

             if ( violated )
             {
                 // The current training example is a violated constraint
                 if ( insert_result(cur_list, result) )
                 {
                     // NOTE(review): the status returned by add_constraint is
                     // not checked here — confirm whether a MOSEK failure at
                     // this point should abort training as well
                     add_constraint(mosek, result, num_con, i);
                     ++num_con;
                 }
                 else
                 {
                     exception = true;
                 }
             }

             // Release the per-example references on every path, including
             // the abort path, so that nothing leaks when training stops early
             SG_UNREF(cur_list);
             SG_UNREF(result);

             if ( exception )
                 break;
         }

         // Solve the QP
         SG_DEBUG("Entering Mosek QP solver.\n");

         mosek->optimize(sol);

         // Split the solution into weights, auxiliary variables and slacks
         for ( int32_t i = 0 ; i < M+num_aux+N ; ++i )
         {
             if ( i < M )
                 m_w[i] = sol[i];
             else if ( i < M+num_aux )
                 aux[i-M] = sol[i];
             else
                 m_slacks[i-M-num_aux] = sol[i];
         }

         SG_DEBUG("QP solved. The primal objective value is %.4f.\n", mosek->get_primal_objective_value());

         ++iteration;

     } while ( old_num_con != num_con && ! exception );

     // Cache the objective so that compute_primal_objective() can report it
     po_value = mosek->get_primal_objective_value();

     // Free resources
     SG_UNREF(results);
     SG_UNREF(mosek);
     SG_UNREF(model_features);

     // Report an aborted training to the caller instead of claiming success
     return ! exception;
 }


 /**
  * Computes the argument handed to the hinge loss for a result set:
  * <w, psi_pred> + delta - <w, psi_truth>, using the current weights m_w.
  *
  * The dense joint feature vectors are used when result->psi_computed is set,
  * the sparse ones when result->psi_computed_sparse is set. If neither flag is
  * set an error is raised through SG_ERROR.
  *
  * @param result result set holding the predicted and true joint features and
  *               the delta loss
  * @return value of the loss argument
  */
 float64_t CPrimalMosekSOSVM::compute_loss_arg(CResultSet* result) const
 {
     // Dimensionality of the joint feature space
     int32_t M = m_w.vlen;

     if(result->psi_computed)
     {
         return  CMath::dot(m_w.vector, result->psi_pred.vector, M) +
             result->delta -
             CMath::dot(m_w.vector, result->psi_truth.vector, M);
     }
     else if(result->psi_computed_sparse)
     {
         return result->psi_pred_sparse.dense_dot(1.0, m_w.vector, M, 0) +
             result->delta -
             result->psi_truth_sparse.dense_dot(1.0, m_w.vector, M, 0);
     }
     else
     {
         // The two literals are concatenated, hence the trailing space
         SG_ERROR("model(%s) should have either of psi_computed or psi_computed_sparse "
                 "to be set true\n", m_model->get_name());
         return 0;
     }
 }


 /**
  * Inserts a result set in a list of constraints and prints a message when the
  * insertion fails.
  *
  * @param result_list list that receives the result
  * @param result      result set to insert
  * @return whether the insertion succeeded
  */
 bool CPrimalMosekSOSVM::insert_result(CList* result_list, CResultSet* result) const
 {
     if ( result_list->insert_element(result) )
         return true;

     SG_PRINT("ResultSet could not be inserted in the list..."
          "aborting training of PrimalMosekSOSVM\n");
     return false;
 }


 /**
  * Adds the constraint defined by a result set to the MOSEK problem.
  *
  * The constraint row is built from the difference psi_pred - psi_truth of the
  * joint feature vectors (dense or sparse, depending on which flag of the
  * result set is true) and passed to CMosek::add_constraint_sosvm together
  * with -delta. If neither psi_computed nor psi_computed_sparse is set an
  * error is raised through SG_ERROR.
  *
  * @param mosek     MOSEK interface that receives the constraint
  * @param result    result set the constraint is built from
  * @param con_idx   index of the new constraint
  * @param train_idx index of the training example the constraint belongs to
  * @return true if MOSEK reported MSK_RES_OK
  */
 bool CPrimalMosekSOSVM::add_constraint(
         CMosek* mosek,
         CResultSet* result,
         index_t con_idx,
         index_t train_idx) const
 {
     int32_t M = m_model->get_dim();
     SGVector< float64_t > dPsi(M);

     if (result->psi_computed)
     {
         for ( int32_t i = 0 ; i < M ; ++i )
             dPsi[i] = result->psi_pred[i] - result->psi_truth[i]; // -dPsi(y)
     }
     else if(result->psi_computed_sparse)
     {
         // Accumulate psi_pred - psi_truth into a zeroed dense vector
         dPsi.zero();
         result->psi_pred_sparse.add_to_dense(1.0, dPsi.vector, dPsi.vlen);
         result->psi_truth_sparse.add_to_dense(-1.0, dPsi.vector, dPsi.vlen);
     }
     else
     {
         // The two literals are concatenated, hence the trailing space
         SG_ERROR("model(%s) should have either of psi_computed or psi_computed_sparse "
                 "to be set true\n", m_model->get_name());
     }

     return ( mosek->add_constraint_sosvm(dPsi, con_idx, train_idx,
             m_model->get_num_aux(), -result->delta) == MSK_RES_OK );
 }


 /**
  * Returns the cached primal objective value (po_value); nothing is recomputed
  * here.
  */
 float64_t CPrimalMosekSOSVM::compute_primal_objective() const
 {
     return this->po_value;
 }


 /** Returns the machine type identifier of this class, CT_PRIMALMOSEKSOSVM. */
 EMachineType CPrimalMosekSOSVM::get_classifier_type()
 {
     const EMachineType machine_type = CT_PRIMALMOSEKSOSVM;
     return machine_type;
 }


 /**
  * Sets the regularization constant.
  *
  * @param C new value of the regularization constant
  */
 void CPrimalMosekSOSVM::set_regularization(float64_t C)
 {
     this->m_regularization = C;
 }


 /**
  * Sets the violation tolerance.
  *
  * @param epsilon new value of the violation tolerance
  */
 void CPrimalMosekSOSVM::set_epsilon(float64_t epsilon)
 {
     this->m_epsilon = epsilon;
 }


 /**
  * Stores a copy of the given lower bounds.
  *
  * @param lb lower bounds; the vector is cloned before being stored in m_lb
  */
 void CPrimalMosekSOSVM::set_lower_bounds(SGVector< float64_t > lb)
 {
     SGVector< float64_t > lb_copy = lb.clone();
     m_lb = lb_copy;
 }


 /**
  * Stores a copy of the given upper bounds.
  *
  * @param ub upper bounds; the vector is cloned before being stored in m_ub
  */
 void CPrimalMosekSOSVM::set_upper_bounds(SGVector< float64_t > ub)
 {
     SGVector< float64_t > ub_copy = ub.clone();
     m_ub = ub_copy;
 }


 #endif /* USE_MOSEK */

shogun::CResultSet::psi_truth
SGVector< float64_t > psi_truth
Definition: StructuredModel.h:72

shogun::CHingeLoss::loss
float64_t loss(float64_t prediction, float64_t label)
Definition: HingeLoss.cpp:22

shogun::EMachineType
EMachineType
Definition: Machine.h:33

shogun::CStructuredLabels
Base class of the labels used in Structured Output (SO) problems.
Definition: StructuredLabels.h:25

shogun::CPreprocessor::init
virtual bool init(CFeatures *features)=0

shogun::CList::get_next_element
CSGObject * get_next_element()
Definition: List.h:185

Math.h

index_t
int32_t index_t
Definition: common.h:62

shogun::CMath::INFTY
static const float64_t INFTY
infinity
Definition: Math.h:2048

shogun::CResultSet::psi_computed_sparse
bool psi_computed_sparse
Definition: StructuredModel.h:66

shogun::CFeatures::get_num_vectors
virtual int32_t get_num_vectors() const =0

SG_ERROR
#define SG_ERROR(...)
Definition: SGIO.h:129

DynamicObjectArray.h

REQUIRE
#define REQUIRE(x,...)
Definition: SGIO.h:206

SG_REF
#define SG_REF(x)
Definition: SGObject.h:51

shogun::SGMatrix< float64_t >

shogun::MS_NOT_AVAILABLE
Definition: SGObject.h:89

shogun::epsilon
static const float64_t epsilon
Definition: libbmrm.cpp:25

shogun::SGVector::vlen
index_t vlen
Definition: SGVector.h:494

shogun::CList::get_first_element
CSGObject * get_first_element()
Definition: List.h:151

shogun::SGVector::zero
void zero()
Definition: SGVector.cpp:138

shogun::SGVector::vector
T * vector
Definition: SGVector.h:492

SG_PRINT
#define SG_PRINT(...)
Definition: SGIO.h:137

shogun::SGVector< float64_t >

shogun::SGSparseVector::add_to_dense
void add_to_dense(T alpha, T *vec, int32_t dim, bool abs_val=false)
Definition: SGSparseVector.cpp:78

float64_t
double float64_t
Definition: common.h:50

PrimalMosekSOSVM.h

shogun::CList::get_num_elements
int32_t get_num_elements()
Definition: List.h:145

shogun::CMath::max
static T max(T a, T b)
Definition: Math.h:168

shogun::CDynamicObjectArray
Dynamic array class for CSGObject pointers that creates an array that can be used like a list or an a...
Definition: DynamicObjectArray.h:31

List.h

shogun::CMath::dot
static float64_t dot(const bool *v1, const bool *v2, int32_t n)
Compute dot product between v1 and v2 (blas optimized)
Definition: Math.h:627

shogun::SGSparseVector::dense_dot
T dense_dot(T alpha, T *vec, int32_t dim, T b)
Definition: SGSparseVector.cpp:58

shogun::CResultSet::psi_computed
bool psi_computed
Definition: StructuredModel.h:69

HingeLoss.h

shogun::CStructuredModel
Class CStructuredModel that represents the application specific model and contains most of the applic...
Definition: StructuredModel.h:101

shogun::CResultSet
Definition: StructuredModel.h:51

SG_UNREF
#define SG_UNREF(x)
Definition: SGObject.h:52

SG_DEBUG
#define SG_DEBUG(...)
Definition: SGIO.h:107

shogun
All classes and functions are contained in the shogun namespace.
Definition: class_list.h:18

shogun::CFeatures
The class Features is the base class of all feature objects.
Definition: Features.h:68

shogun::CT_PRIMALMOSEKSOSVM
Definition: Machine.h:85

shogun::SGVector::clone
SGVector< T > clone() const
Definition: SGVector.cpp:209

shogun::CResultSet::argmax
CStructuredData * argmax
Definition: StructuredModel.h:63

shogun::CResultSet::delta
float64_t delta
Definition: StructuredModel.h:88

shogun::CResultSet::psi_pred
SGVector< float64_t > psi_pred
Definition: StructuredModel.h:75

shogun::CDynamicObjectArray::get_element
CSGObject * get_element(int32_t index) const
Definition: DynamicObjectArray.h:194

shogun::CHingeLoss
CHingeLoss implements the hinge loss function.
Definition: HingeLoss.h:29

shogun::CResultSet::psi_truth_sparse
SGSparseVector< float64_t > psi_truth_sparse
Definition: StructuredModel.h:78

shogun::CDynamicObjectArray::push_back
void push_back(CSGObject *e)
Definition: DynamicObjectArray.h:299

set_epsilon
void set_epsilon(float *begin, float max)
Definition: JLCoverTree.h:512

SG_ADD
#define SG_ADD(...)
Definition: SGObject.h:81

shogun::CResultSet::psi_pred_sparse
SGSparseVector< float64_t > psi_pred_sparse
Definition: StructuredModel.h:81

shogun::CLinearStructuredOutputMachine
Definition: LinearStructuredOutputMachine.h:26

shogun::CList
Class List implements a doubly connected list for low-level-objects.
Definition: List.h:84

shogun::CList::insert_element
bool insert_element(CSGObject *data)
Definition: List.h:447