LBFGSMinimizer.cpp
/*
 * Copyright (c) The Shogun Machine Learning Toolbox
 * Written (w) 2015 Wu Lin
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice, this
 * list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * The views and conclusions contained in the software and documentation are those
 * of the authors and should not be interpreted as representing official policies,
 * either expressed or implied, of the Shogun Development Team.
 *
 */
#include <shogun/optimization/lbfgs/LBFGSMinimizer.h>
#include <shogun/optimization/FirstOrderBoundConstraintsCostFunction.h>
#include <shogun/base/Parameter.h>

namespace shogun
{
CLBFGSMinimizer::CLBFGSMinimizer()
    :FirstOrderMinimizer()
{
    init();
}

CLBFGSMinimizer::~CLBFGSMinimizer()
{
}

CLBFGSMinimizer::CLBFGSMinimizer(FirstOrderCostFunction *fun)
    :FirstOrderMinimizer(fun)
{
    FirstOrderBoundConstraintsCostFunction* bound_constraints_fun
        =dynamic_cast<FirstOrderBoundConstraintsCostFunction*>(m_fun);
    if (m_fun && bound_constraints_fun)
    {
        SG_SWARNING("The minimizer does not support constrained minimization. All constraints will be ignored.\n");
    }
    init();
}

void CLBFGSMinimizer::init()
{
    set_lbfgs_parameters(); /* start from the default L-BFGS settings */
    m_min_step=1e-6;
    m_xtol=1e-6;
    SG_ADD(&m_linesearch_id, "CLBFGSMinimizer__m_linesearch_id",
        "linesearch_id in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_m, "CLBFGSMinimizer__m_m",
        "m in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_max_linesearch, "CLBFGSMinimizer__m_max_linesearch",
        "max_linesearch in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_max_iterations, "CLBFGSMinimizer__m_max_iterations",
        "max_iterations in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_delta, "CLBFGSMinimizer__m_delta",
        "delta in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_past, "CLBFGSMinimizer__m_past",
        "past in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_epsilon, "CLBFGSMinimizer__m_epsilon",
        "epsilon in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_min_step, "CLBFGSMinimizer__m_min_step",
        "min_step in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_max_step, "CLBFGSMinimizer__m_max_step",
        "max_step in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_ftol, "CLBFGSMinimizer__m_ftol",
        "ftol in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_wolfe, "CLBFGSMinimizer__m_wolfe",
        "wolfe in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_gtol, "CLBFGSMinimizer__m_gtol",
        "gtol in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_xtol, "CLBFGSMinimizer__m_xtol",
        "xtol in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_orthantwise_c, "CLBFGSMinimizer__m_orthantwise_c",
        "orthantwise_c in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_orthantwise_start, "CLBFGSMinimizer__m_orthantwise_start",
        "orthantwise_start in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_orthantwise_end, "CLBFGSMinimizer__m_orthantwise_end",
        "orthantwise_end in CLBFGSMinimizer", MS_NOT_AVAILABLE);
    SG_ADD(&m_target_variable, "CLBFGSMinimizer__m_target_variable",
        "m_target_variable in CLBFGSMinimizer", MS_NOT_AVAILABLE);
}

void CLBFGSMinimizer::set_lbfgs_parameters(
    int32_t m,
    int32_t max_linesearch,
    ELBFGSLineSearch linesearch,
    int32_t max_iterations,
    float64_t delta,
    int32_t past,
    float64_t epsilon,
    float64_t min_step,
    float64_t max_step,
    float64_t ftol,
    float64_t wolfe,
    float64_t gtol,
    float64_t xtol,
    float64_t orthantwise_c,
    int32_t orthantwise_start,
    int32_t orthantwise_end)
{
    m_m = m;
    m_max_linesearch = max_linesearch;
    m_linesearch_id = LBFGSLineSearchHelper::get_lbfgs_linear_search_id(linesearch);
    m_max_iterations = max_iterations;
    m_delta = delta;
    m_past = past;
    m_epsilon = epsilon;
    m_min_step = min_step;
    m_max_step = max_step;
    m_ftol = ftol;
    m_wolfe = wolfe;
    m_gtol = gtol;
    m_xtol = xtol;
    m_orthantwise_c = orthantwise_c;
    m_orthantwise_start = orthantwise_start;
    m_orthantwise_end = orthantwise_end;
}

void CLBFGSMinimizer::init_minimization()
{
    REQUIRE(m_fun, "Cost function not set!\n");
    m_target_variable=m_fun->obtain_variable_reference();
    REQUIRE(m_target_variable.vlen>0, "Target variable from the cost function must not be empty!\n");
}

float64_t CLBFGSMinimizer::minimize()
{
    lbfgs_parameter_t lbfgs_param;
    lbfgs_param.m = m_m;
    lbfgs_param.max_linesearch = m_max_linesearch;
    lbfgs_param.linesearch = LBFGSLineSearchHelper::get_lbfgs_linear_search(m_linesearch_id);
    lbfgs_param.max_iterations = m_max_iterations;
    lbfgs_param.delta = m_delta;
    lbfgs_param.past = m_past;
    lbfgs_param.epsilon = m_epsilon;
    lbfgs_param.min_step = m_min_step;
    lbfgs_param.max_step = m_max_step;
    lbfgs_param.ftol = m_ftol;
    lbfgs_param.wolfe = m_wolfe;
    lbfgs_param.gtol = m_gtol;
    lbfgs_param.xtol = m_xtol;
    lbfgs_param.orthantwise_c = m_orthantwise_c;
    lbfgs_param.orthantwise_start = m_orthantwise_start;
    lbfgs_param.orthantwise_end = m_orthantwise_end;

    init_minimization();

    float64_t cost=0.0;
    int32_t error_code=lbfgs(m_target_variable.vlen, m_target_variable.vector,
        &cost, CLBFGSMinimizer::evaluate,
        NULL, this, &lbfgs_param);

    if (error_code!=0 && error_code!=LBFGS_ALREADY_MINIMIZED)
    {
        SG_SWARNING("Error(s) occurred during L-BFGS optimization (error code: %d)\n",
            error_code);
    }

    return cost;
}

float64_t CLBFGSMinimizer::evaluate(void *obj, const float64_t *variable,
    float64_t *gradient, const int32_t dim, const float64_t step)
{
    /* Note that parameters = parameters_pre_iter - step * gradient_pre_iter */
    CLBFGSMinimizer* obj_ptr
        = static_cast<CLBFGSMinimizer*>(obj);

    REQUIRE(obj_ptr, "The instance object passed to the L-BFGS optimizer must not be NULL\n");

    float64_t cost=obj_ptr->m_fun->get_cost();

    if (CMath::is_nan(cost) || CMath::is_infinity(cost))
        return cost;

    // get the gradient wrt the current variable
    SGVector<float64_t> grad=obj_ptr->m_fun->get_gradient();
    REQUIRE(grad.vlen==dim,
        "The length of the gradient (%d) and the length of the variable (%d) do not match\n",
        grad.vlen, dim);

    std::copy(grad.vector, grad.vector+dim, gradient);
    return cost;
}

}
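
The file above only defines the wrapper itself. As a rough illustration of how it is driven, the sketch below minimizes a simple quadratic through the interface used in this file (obtain_variable_reference(), get_cost(), get_gradient(), set_lbfgs_parameters() and minimize()). It is not part of LBFGSMinimizer.cpp: the QuadraticCost class, the run_example() function and the example's header paths are assumptions made for illustration, and Shogun's SG_REF/SG_UNREF reference counting is omitted for brevity.

/* Usage sketch (NOT part of LBFGSMinimizer.cpp); names and paths are illustrative. */
#include <shogun/optimization/lbfgs/LBFGSMinimizer.h>
#include <shogun/optimization/FirstOrderCostFunction.h>
#include <shogun/lib/SGVector.h>

using namespace shogun;

/* f(x) = 0.5 * x^T x, whose gradient is simply x */
class QuadraticCost: public FirstOrderCostFunction
{
public:
    QuadraticCost(SGVector<float64_t> x): m_x(x) { }

    /* the minimizer updates this vector in place */
    virtual SGVector<float64_t> obtain_variable_reference() { return m_x; }

    virtual float64_t get_cost()
    {
        float64_t cost=0.0;
        for (index_t i=0; i<m_x.vlen; i++)
            cost+=0.5*m_x[i]*m_x[i];
        return cost;
    }

    virtual SGVector<float64_t> get_gradient()
    {
        return m_x.clone();
    }

    virtual const char* get_name() const { return "QuadraticCost"; }

private:
    SGVector<float64_t> m_x;
};

void run_example()
{
    SGVector<float64_t> x(3);
    x.set_const(1.0);

    QuadraticCost* fun=new QuadraticCost(x);
    CLBFGSMinimizer* opt=new CLBFGSMinimizer(fun);

    /* optionally override the defaults set in init(), e.g. allow 200 iterations */
    opt->set_lbfgs_parameters(100, 1000, BACKTRACKING_STRONG_WOLFE, 200);

    float64_t cost=opt->minimize();
    SG_SPRINT("minimum value: %f\n", cost); /* x now holds the minimizer */
    /* SG_REF/SG_UNREF bookkeeping omitted for brevity */
}

Because the cost function hands out a reference to its own variable, minimize() writes the solution directly into that SGVector; the returned value is only the final cost.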