en/latest/GradientModelSelection_8cpp_source.html

 /*

  * This program is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 3 of the License, or

  * (at your option) any later version.

  *

  * Written (W) 2013 Roman Votyakov

  * Copyright (C) 2012 Jacob Walker

  */


 #include <shogun/modelselection/GradientModelSelection.h>

 #ifdef USE_GPL_SHOGUN


 #ifdef HAVE_NLOPT


 #include <shogun/evaluation/GradientResult.h>

 #include <shogun/modelselection/ParameterCombination.h>

 #include <shogun/modelselection/ModelSelectionParameters.h>

 #include <shogun/machine/Machine.h>

 #include <nlopt.h>


 using namespace shogun;


 #ifndef DOXYGEN_SHOULD_SKIP_THIS


 /** Bundle of state passed to nlopt_function through NLopt's opaque
  * func_data pointer.
  */
 struct nlopt_params

 {

     /** evaluation object; the callback fetches its machine and calls evaluate() on it */
     CMachineEvaluation* machine_eval;


     /** combination that receives the values of the optimizer's current point */
     CParameterCombination* current_combination;


     /** map from each optimized parameter to the object that owns it */
     CMap<TParameter*, CSGObject*>* parameter_dictionary;


     /** when true, the callback prints the combination and result of every evaluation */
     bool print_state;

 };


 double nlopt_function(unsigned n, const double* x, double* grad, void* func_data)

 {

     nlopt_params* params=(nlopt_params*)func_data;


     CMachineEvaluation* machine_eval=params->machine_eval;

     CParameterCombination* current_combination=params->current_combination;

     CMap<TParameter*, CSGObject*>* parameter_dictionary=params->parameter_dictionary;

     bool print_state=params->print_state;


     index_t offset=0;


     // set parameters from vector x

     for (index_t i=0; i<parameter_dictionary->get_num_elements(); i++)

     {

         CMapNode<TParameter*, CSGObject*>* node=parameter_dictionary->get_node_ptr(i);


         TParameter* param=node->key;

         CSGObject* parent=node->data;


         if (param->m_datatype.m_ctype==CT_VECTOR ||

                 param->m_datatype.m_ctype==CT_SGVECTOR ||

                 param->m_datatype.m_ctype==CT_SGMATRIX ||

                 param->m_datatype.m_ctype==CT_MATRIX)

         {


             for (index_t j=0; j<param->m_datatype.get_num_elements(); j++)

             {


                 bool result=current_combination->set_parameter(param->m_name,

                         (float64_t)x[offset++], parent, j);

                  REQUIRE(result, "Parameter %s not found in combination tree\n",

                          param->m_name)

             }

         }

         else

         {

             bool result=current_combination->set_parameter(param->m_name,

                     (float64_t)x[offset++], parent);

             REQUIRE(result, "Parameter %s not found in combination tree\n",

                     param->m_name)

         }

     }


     // apply current combination to the machine

     CMachine* machine=machine_eval->get_machine();

     current_combination->apply_to_machine(machine);

     if (print_state)

     {

         SG_SPRINT("Current combination\n");

         current_combination->print_tree();

     }

     SG_UNREF(machine);


     // evaluate the machine

     CEvaluationResult* evaluation_result=machine_eval->evaluate();

     CGradientResult* gradient_result=CGradientResult::obtain_from_generic(

             evaluation_result);

     SG_UNREF(evaluation_result);


     if (print_state)

     {

         SG_SPRINT("Current result\n");

         gradient_result->print_result();

     }


     // get value of the function, gradients and parameter dictionary

     SGVector<float64_t> value=gradient_result->get_value();

     CMap<TParameter*, SGVector<float64_t> >* gradient=gradient_result->get_gradient();

     CMap<TParameter*, CSGObject*>* gradient_dictionary=

         gradient_result->get_paramter_dictionary();

     SG_UNREF(gradient_result);


     offset=0;


     // set derivative for each parameter from parameter dictionary

     for (index_t i=0; i<parameter_dictionary->get_num_elements(); i++)

     {

         CMapNode<TParameter*, CSGObject*>* node=parameter_dictionary->get_node_ptr(i);


         SGVector<float64_t> derivative;


         for (index_t j=0; j<gradient_dictionary->get_num_elements(); j++)

         {

             CMapNode<TParameter*, CSGObject*>* gradient_node=

                 gradient_dictionary->get_node_ptr(j);


             if (gradient_node->data==node->data &&

                     !strcmp(gradient_node->key->m_name, node->key->m_name))

             {

                 derivative=gradient->get_element(gradient_node->key);

             }

         }


         REQUIRE(derivative.vlen, "Can't find gradient wrt %s parameter!\n",

                 node->key->m_name);


         memcpy(grad+offset, derivative.vector, sizeof(double)*derivative.vlen);


         offset+=derivative.vlen;

     }


     SG_UNREF(gradient);

     SG_UNREF(gradient_dictionary);


     return (double)(SGVector<float64_t>::sum(value));

 }


 #endif /* DOXYGEN_SHOULD_SKIP_THIS */


 /** Default constructor: builds the base class with its default constructor
  * and then runs init().
  */
 CGradientModelSelection::CGradientModelSelection()
     : CModelSelection()
 {
     init();
 }


 /** Constructor.
  *
  * Forwards both arguments to the CModelSelection base class and then runs
  * init().
  *
  * @param machine_eval machine evaluation object passed on to the base class
  * @param model_parameters model parameter tree passed on to the base class
  */
 CGradientModelSelection::CGradientModelSelection(
         CMachineEvaluation* machine_eval,
         CModelSelectionParameters* model_parameters)
     : CModelSelection(machine_eval, model_parameters)
 {
     init();
 }


 /** Destructor; this class performs no cleanup of its own here. */
 CGradientModelSelection::~CGradientModelSelection()
 {
 }


 /** Assigns the default optimizer settings (tolerance 1e-6, at most 1000
  * evaluations) and registers both members through SG_ADD.
  */
 void CGradientModelSelection::init()
 {
     // defaults used until the caller overrides them
     m_grad_tolerance=1e-6;
     m_max_evaluations=1000;

     // registration order is kept: tolerance first, evaluation limit second
     SG_ADD(&m_grad_tolerance, "gradient_tolerance", "Gradient tolerance",
             MS_NOT_AVAILABLE);
     SG_ADD(&m_max_evaluations, "max_evaluations",
             "Maximum number of evaluations", MS_NOT_AVAILABLE);
 }


 /** Selects machine parameters by gradient-based optimization with NLopt.
  *
  * Builds a parameter combination from the evaluated machine, unrolls it into
  * a flat vector and lets NLopt (MMA algorithm) minimize or maximize the
  * objective computed by nlopt_function, depending on the evaluation
  * direction. Selection over a user supplied parameter tree
  * (m_model_parameters set) is not implemented.
  *
  * All temporary resources are released before a failed optimization is
  * reported, so no NLopt handle or object reference is left behind on error.
  *
  * @param print_state if true, the initial and final combination as well as
  * the state of every evaluation are printed
  * @return the parameter combination the optimization worked on, carrying one
  * reference owned by the caller; NULL if m_model_parameters is set
  */
 CParameterCombination* CGradientModelSelection::select_model(bool print_state)
 {
     // optimization restricted to a given parameter tree is not supported
     if (m_model_parameters)
     {
         SG_NOTIMPLEMENTED
         return NULL;
     }

     // the default constructor path may leave the evaluation object unset
     REQUIRE(m_machine_eval, "Machine evaluation is not set!\n");

     CMachine* machine=m_machine_eval->get_machine();

     CParameterCombination* current_combination=new CParameterCombination(machine);
     SG_REF(current_combination);

     if (print_state)
     {
         SG_PRINT("Initial combination:\n");
         current_combination->print_tree();
     }

     // get total length of variables
     index_t total_variables=current_combination->get_parameters_length();

     // build parameter->value map
     CMap<TParameter*, SGVector<float64_t> >* argument=
         new CMap<TParameter*, SGVector<float64_t> >();
     current_combination->build_parameter_values_map(argument);

     // unroll current parameter combination into vector
     SGVector<double> x(total_variables);
     index_t offset=0;

     for (index_t i=0; i<argument->get_num_elements(); i++)
     {
         CMapNode<TParameter*, SGVector<float64_t> >* node=argument->get_node_ptr(i);
         memcpy(x.vector+offset, node->data.vector, sizeof(double)*node->data.vlen);
         offset+=node->data.vlen;
     }

     SG_UNREF(argument);

     // create nlopt object and choose MMA (Method of Moving Asymptotes)
     // optimization algorithm
     nlopt_opt opt=nlopt_create(NLOPT_LD_MMA, total_variables);

     // currently we assume all parameters are positive
     // (this is NOT true when inducing points and Full Matrix GaussianARDKernel are optimized)
     // bounds are therefore disabled; the previous setup is kept for reference:
     // create lower bound vector (lb=-inf)
     //SGVector<double> lower_bound(total_variables);
     //lower_bound.set_const(1e-6);

     // create upper bound vector (ub=inf)
     //SGVector<double> upper_bound(total_variables);
     //upper_bound.set_const(HUGE_VAL);

     // set upper and lower bound
     //nlopt_set_lower_bounds(opt, lower_bound.vector);
     //nlopt_set_upper_bounds(opt, upper_bound.vector);

     // set maximum number of evaluations
     nlopt_set_maxeval(opt, m_max_evaluations);

     // set absolute argument and function value tolerance
     nlopt_set_xtol_abs1(opt, m_grad_tolerance);
     nlopt_set_ftol_abs(opt, m_grad_tolerance);

     // build parameter->sgobject map from current parameter combination
     CMap<TParameter*, CSGObject*>* parameter_dictionary=
         new CMap<TParameter*, CSGObject*>();
     current_combination->build_parameter_parent_map(parameter_dictionary);

     // nlopt parameters
     nlopt_params params;

     params.current_combination=current_combination;
     params.machine_eval=m_machine_eval;
     params.print_state=print_state;
     params.parameter_dictionary=parameter_dictionary;

     // choose evaluation direction (minimize or maximize objective function)
     if (m_machine_eval->get_evaluation_direction()==ED_MINIMIZE)
     {
         if (print_state)
             SG_PRINT("Minimizing objective function:\n");

         nlopt_set_min_objective(opt, nlopt_function, &params);
     }
     else
     {
         if (print_state)
             SG_PRINT("Maximizing objective function:\n");

         nlopt_set_max_objective(opt, nlopt_function, &params);
     }

     // the optimal objective value, upon return
     double minf;

     // optimize our function
     nlopt_result result=nlopt_optimize(opt, x.vector, &minf);

     // clean up before reporting errors, so a failed run leaks neither the
     // optimizer handle nor any object reference
     nlopt_destroy(opt);
     SG_UNREF(machine);
     SG_UNREF(parameter_dictionary);

     if (result<=0)
     {
         // nothing is handed to the caller on failure
         SG_UNREF(current_combination);
         REQUIRE(result>0, "NLopt failed while optimizing objective function!\n");
         return NULL;
     }

     // NOTE(review): current_combination holds the values written by the last
     // objective evaluation, while the optimum reported by NLopt is in x;
     // confirm that these coincide for the chosen algorithm
     if (print_state)
     {
         SG_PRINT("Best combination:\n");
         current_combination->print_tree();
     }

     return current_combination;
 }


 #endif /* HAVE_NLOPT */


 #endif //USE_GPL_SHOGUN

GradientModelSelection.h

node
Definition: JLCoverTree.h:42

shogun::TParameter::m_name
char * m_name
Definition: base/Parameter.h:145

ModelSelectionParameters.h

index_t
int32_t index_t
Definition: common.h:62

shogun::CParameterCombination::set_parameter
bool set_parameter(const char *name, T value, CSGObject *parent, index_t index=-1)
Definition: ParameterCombination.h:141

GradientResult.h

shogun::CMap::get_element
T get_element(const K &key)
Definition: Map.h:171

shogun::ED_MINIMIZE
Definition: Evaluation.h:31

shogun::TParameter
parameter struct
Definition: base/Parameter.h:32

REQUIRE
#define REQUIRE(x,...)
Definition: SGIO.h:206

SG_NOTIMPLEMENTED
#define SG_NOTIMPLEMENTED
Definition: SGIO.h:139

shogun::TSGDataType::get_num_elements
int64_t get_num_elements()
Definition: DataType.cpp:464

shogun::CParameterCombination::print_tree
void print_tree(int prefix_num=0) const
Definition: ParameterCombination.cpp:307

SG_REF
#define SG_REF(x)
Definition: SGObject.h:54

shogun::CMachine
A generic learning machine interface.
Definition: Machine.h:143

shogun::CModelSelectionParameters
Class to select parameters and their ranges for model selection. The structure is organized as a tree...
Definition: ModelSelectionParameters.h:71

shogun::MS_NOT_AVAILABLE
Definition: SGObject.h:92

shogun::CGradientResult::print_result
virtual void print_result()
Definition: GradientResult.h:76

shogun::CMap::get_node_ptr
CMapNode< K, T > * get_node_ptr(int32_t index)
Definition: Map.h:247

shogun::CMachineEvaluation::evaluate
virtual CEvaluationResult * evaluate()=0

shogun::CModelSelection
Abstract base class for model selection.
Definition: ModelSelection.h:31

shogun::CGradientResult::obtain_from_generic
static CGradientResult * obtain_from_generic(CEvaluationResult *eval_result)
Definition: GradientResult.h:55

shogun::TParameter::m_datatype
TSGDataType m_datatype
Definition: base/Parameter.h:141

shogun::SGVector::vlen
index_t vlen
Definition: SGVector.h:494

shogun::SGVector::vector
T * vector
Definition: SGVector.h:492

SG_PRINT
#define SG_PRINT(...)
Definition: SGIO.h:137

SG_SPRINT
#define SG_SPRINT(...)
Definition: SGIO.h:180

shogun::CSGObject
Class SGObject is the base class of all shogun objects.
Definition: SGObject.h:115

shogun::CMachineEvaluation::get_machine
CMachine * get_machine() const
Definition: MachineEvaluation.cpp:104

shogun::SGVector< float64_t >

shogun::CGradientResult::get_paramter_dictionary
virtual CMap< TParameter *, CSGObject * > * get_paramter_dictionary()
Definition: GradientResult.h:206

float64_t
double float64_t
Definition: common.h:50

shogun::CEvaluationResult
Abstract class that contains the result generated by the MachineEvaluation class. ...
Definition: EvaluationResult.h:32

shogun::CMachineEvaluation
Machine Evaluation is an abstract class that evaluates a machine according to some criterion...
Definition: MachineEvaluation.h:36

shogun::CGradientResult::get_gradient
virtual CMap< TParameter *, SGVector< float64_t > > * get_gradient()
Definition: GradientResult.h:184

shogun::SGVector::sum
static T sum(T *vec, int32_t len)
Return sum(vec)
Definition: SGVector.h:354

shogun::CParameterCombination
Class that holds ONE combination of parameters for a learning machine. The structure is organized as ...
Definition: ParameterCombination.h:43

shogun::CParameterCombination::build_parameter_parent_map
virtual void build_parameter_parent_map(CMap< TParameter *, CSGObject * > *parent_map)
Definition: ParameterCombination.cpp:807

Machine.h

shogun::TSGDataType::m_ctype
EContainerType m_ctype
Definition: DataType.h:71

SG_UNREF
#define SG_UNREF(x)
Definition: SGObject.h:55

shogun
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18

shogun::CGradientResult
Container class that returns results from GradientEvaluation. It contains the function value as well ...
Definition: GradientResult.h:26

ParameterCombination.h

shogun::CGradientResult::get_value
virtual SGVector< float64_t > get_value()
Definition: GradientResult.h:153

shogun::CParameterCombination::get_parameters_length
virtual uint32_t get_parameters_length()
Definition: ParameterCombination.h:241

shogun::CParameterCombination::build_parameter_values_map
virtual void build_parameter_values_map(CMap< TParameter *, SGVector< float64_t > > *values_map)
Definition: ParameterCombination.cpp:768

shogun::CMap::get_num_elements
int32_t get_num_elements() const
Definition: Map.h:211

SG_ADD
#define SG_ADD(...)
Definition: SGObject.h:84

shogun::CParameterCombination::apply_to_machine
void apply_to_machine(CMachine *machine) const
Definition: ParameterCombination.cpp:707

shogun::CMap
the class CMap, a map based on the hash-table. w: http://en.wikipedia.org/wiki/Hash_table ...
Definition: SGObject.h:39