SHOGUN  4.1.0
 All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
AdaDeltaUpdater.cpp
Go to the documentation of this file.
1 /*
2  * Copyright (c) The Shogun Machine Learning Toolbox
3  * Written (w) 2015 Wu Lin
4  * All rights reserved.
5  *
6  * Redistribution and use in source and binary forms, with or without
7  * modification, are permitted provided that the following conditions are met:
8  *
9  * 1. Redistributions of source code must retain the above copyright notice, this
10  * list of conditions and the following disclaimer.
11  * 2. Redistributions in binary form must reproduce the above copyright notice,
12  * this list of conditions and the following disclaimer in the documentation
13  * and/or other materials provided with the distribution.
14  *
15  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
16  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
19  * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
20  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
21  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
22  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
23  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
24  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25  *
26  * The views and conclusions contained in the software and documentation are those
27  * of the authors and should not be interpreted as representing official policies,
28  * either expressed or implied, of the Shogun Development Team.
29  *
30  */
31 
33 #include <shogun/lib/config.h>
34 using namespace shogun;
35 
38 {
39  init();
40 }
41 
44 {
45  init();
46  set_learning_rate(learning_rate);
47  set_epsilon(epsilon);
48  set_decay_factor(decay_factor);
49 }
50 
52 {
53  REQUIRE(learning_rate>0,"Learning_rate (%f) must be positive\n",
54  learning_rate);
55  m_build_in_learning_rate=learning_rate;
56 }
57 
59 {
60  REQUIRE(epsilon>=0,"Epsilon (%f) must be non-negative\n",
61  epsilon);
63 }
64 
66 {
67  REQUIRE(decay_factor>=0.0 && decay_factor<1.0,
68  "Decay factor (%f) must in [0,1)\n",
69  decay_factor);
70  m_decay_factor=decay_factor;
71 }
72 
74 {
75 }
76 
77 void AdaDeltaUpdater::init()
78 {
79  m_decay_factor=0.9;
80  m_epsilon=1e-6;
84 }
85 
87 {
89  REQUIRE(context, "Context must set\n");
90 
92  std::copy(m_gradient_accuracy.vector,
94  value.vector);
95  std::string key="AdaDeltaUpdater::m_gradient_accuracy";
96  context->save_data(key, value);
97 
101  value.vector);
102  key="AdaDeltaUpdater::m_gradient_delta_accuracy";
103  context->save_data(key, value);
104 }
105 
107 {
109  REQUIRE(context, "context must set\n");
110 
111  std::string key="AdaDeltaUpdater::m_gradient_accuracy";
114  std::copy(value.vector, value.vector+value.vlen,
116 
117  key="AdaDeltaUpdater::m_gradient_delta_accuracy";
118  value=context->get_data_sgvector_float64(key);
120  std::copy(value.vector, value.vector+value.vlen,
122 }
123 
125  float64_t gradient, index_t idx, float64_t learning_rate)
126 {
127  REQUIRE(idx>=0 && idx<m_gradient_accuracy.vlen,
128  "Index (%d) is invalid\n", idx);
129  REQUIRE(idx>=0 && idx<m_gradient_delta_accuracy.vlen,
130  "Index (%d) is invalid\n", idx);
132  (1.0-m_decay_factor)*gradient*gradient;
136  return res;
137 
138 }
139 
141  SGVector<float64_t> raw_negative_descend_direction, float64_t learning_rate)
142 {
143  REQUIRE(variable_reference.vlen>0,"variable_reference must set\n");
144  REQUIRE(variable_reference.vlen==raw_negative_descend_direction.vlen,
145  "The length of variable_reference (%d) and the length of gradient (%d) do not match\n",
146  variable_reference.vlen,raw_negative_descend_direction.vlen);
148  {
149  m_gradient_accuracy=SGVector<float64_t>(variable_reference.vlen);
151 
154  }
155  if(m_correction)
156  {
157  MomentumCorrection* momentum_correction=dynamic_cast<MomentumCorrection *>(m_correction);
158  if(momentum_correction)
159  {
160  if(!momentum_correction->is_initialized())
161  momentum_correction->initialize_previous_direction(variable_reference.vlen);
162  }
163 
164  for(index_t idx=0; idx<variable_reference.vlen; idx++)
165  {
167  variable_reference[idx], raw_negative_descend_direction[idx], idx, learning_rate);
168 
170  neg_des_dir, idx);
171  float64_t delta=pair.delta;
172  variable_reference[idx]+=pair.descend_direction;
174  (1.0-m_decay_factor)*(delta*delta-neg_des_dir*neg_des_dir);
175  }
176  }
177  else
178  {
179  DescendUpdaterWithCorrection::update_variable(variable_reference, raw_negative_descend_direction, learning_rate);
180  }
181 }
virtual void save_data(const std::string &key, SGVector< float64_t > value)
virtual void set_decay_factor(float64_t decay_factor)
SGVector< float64_t > m_gradient_delta_accuracy
int32_t index_t
Definition: common.h:62
The class is used to serialize and deserialize variables for the optimization framework.
virtual void load_from_context(CMinimizerContext *context)
#define REQUIRE(x,...)
Definition: SGIO.h:206
virtual void initialize_previous_direction(index_t len)
virtual SGVector< float64_t > get_data_sgvector_float64(const std::string &key)
static const float64_t epsilon
Definition: libbmrm.cpp:25
index_t vlen
Definition: SGVector.h:494
virtual DescendPair get_corrected_descend_direction(float64_t negative_descend_direction, index_t idx)=0
double float64_t
Definition: common.h:50
virtual void update_context(CMinimizerContext *context)
virtual void load_from_context(CMinimizerContext *context)
virtual void set_epsilon(float64_t epsilon)
virtual void update_variable(SGVector< float64_t > variable_reference, SGVector< float64_t > raw_negative_descend_direction, float64_t learning_rate)
all of classes and functions are contained in the shogun namespace
Definition: class_list.h:18
This is a base class for momentum correction methods.
This is a base class for descend update with descend based correction.
void scale(Matrix A, Matrix B, typename Matrix::Scalar alpha)
Definition: Core.h:93
virtual void update_variable(SGVector< float64_t > variable_reference, SGVector< float64_t > raw_negative_descend_direction, float64_t learning_rate)
static float32_t sqrt(float32_t x)
Definition: Math.h:459
virtual float64_t get_negative_descend_direction(float64_t variable, float64_t gradient, index_t idx, float64_t learning_rate)
SGVector< float64_t > m_gradient_accuracy
#define delta
Definition: sfa.cpp:23
virtual void set_learning_rate(float64_t learning_rate)
void set_const(T const_elem)
Definition: SGVector.cpp:152
virtual void update_context(CMinimizerContext *context)

SHOGUN Machine Learning Toolbox - Documentation