nadamax_update.hpp
Go to the documentation of this file.
1 
13 #ifndef MLPACK_CORE_OPTIMIZERS_ADAM_NADAMAX_UPDATE_HPP
14 #define MLPACK_CORE_OPTIMIZERS_ADAM_NADAMAX_UPDATE_HPP
15 
16 #include <mlpack/prereqs.hpp>
17 
18 namespace mlpack {
19 namespace optimization {
20 
38 {
39  public:
49  NadaMaxUpdate(const double epsilon = 1e-8,
50  const double beta1 = 0.9,
51  const double beta2 = 0.99,
52  const double scheduleDecay = 4e-3) :
53  epsilon(epsilon),
54  beta1(beta1),
55  beta2(beta2),
56  scheduleDecay(scheduleDecay),
57  cumBeta1(1),
58  iteration(0)
59  {
60  // Nothing to do.
61  }
62 
70  void Initialize(const size_t rows, const size_t cols)
71  {
72  m = arma::zeros<arma::mat>(rows, cols);
73  u = arma::zeros<arma::mat>(rows, cols);
74  }
75 
83  void Update(arma::mat& iterate,
84  const double stepSize,
85  const arma::mat& gradient)
86  {
87  // Increment the iteration counter variable.
88  ++iteration;
89 
90  // And update the iterate.
91  m *= beta1;
92  m += (1 - beta1) * gradient;
93 
94  u = arma::max(u * beta2, arma::abs(gradient));
95 
96  double beta1T = beta1 * (1 - (0.5 *
97  std::pow(0.96, iteration * scheduleDecay)));
98 
99  double beta1T1 = beta1 * (1 - (0.5 *
100  std::pow(0.96, (iteration + 1) * scheduleDecay)));
101 
102  cumBeta1 *= beta1T;
103 
104  const double biasCorrection1 = 1.0 - cumBeta1;
105 
106  const double biasCorrection2 = 1.0 - (cumBeta1 * beta1T1);
107 
108  if ((biasCorrection1 != 0) && (biasCorrection2 != 0))
109  {
110  iterate -= (stepSize * (((1 - beta1T) / biasCorrection1) * gradient
111  + (beta1T1 / biasCorrection2) * m)) / (u + epsilon);
112  }
113  }
114 
116  double Epsilon() const { return epsilon; }
118  double& Epsilon() { return epsilon; }
119 
121  double CumBeta1() const { return cumBeta1; }
123  double& CumBeta1() { return cumBeta1; }
124 
126  double Beta1() const { return beta1; }
128  double& Beta1() { return beta1; }
129 
131  double Beta2() const { return beta2; }
133  double& Beta2() { return beta2; }
134 
136  double ScheduleDecay() const { return scheduleDecay; }
138  double& ScheduleDecay() { return scheduleDecay; }
139 
140  private:
141  // The epsilon value used to initialise the squared gradient parameter.
142  double epsilon;
143 
144  // The smoothing parameter.
145  double beta1;
146 
147  // The second moment coefficient.
148  double beta2;
149 
150  // The exponential moving average of gradient values.
151  arma::mat m;
152 
153  // The exponentially weighted infinity norm.
154  arma::mat u;
155 
156  // The decay parameter for decay coefficients
157  double scheduleDecay;
158 
159  // The cumulative product of decay coefficients
160  double cumBeta1;
161 
162  // The number of iterations.
163  double iteration;
164 };
165 
166 } // namespace optimization
167 } // namespace mlpack
168 
169 #endif
double ScheduleDecay() const
Get the decay parameter for decay coefficients.
double Epsilon() const
Get the value used to initialise the squared gradient parameter.
NadaMaxUpdate(const double epsilon=1e-8, const double beta1=0.9, const double beta2=0.99, const double scheduleDecay=4e-3)
Construct the NadaMax update policy with the given parameters.
.hpp
Definition: add_to_po.hpp:21
void Update(arma::mat &iterate, const double stepSize, const arma::mat &gradient)
Update step for NadaMax.
double & CumBeta1()
Modify the value of the cumulative product of decay coefficients.
The core includes that mlpack expects: standard C++ includes and Armadillo.
double & Epsilon()
Modify the value used to initialise the squared gradient parameter.
double & Beta1()
Modify the smoothing parameter.
double & ScheduleDecay()
Modify the decay parameter for decay coefficients.
void Initialize(const size_t rows, const size_t cols)
The Initialize() method is called by the optimizer before the start of the iteration update process...
double Beta2() const
Get the second moment coefficient.
double CumBeta1() const
Get the value of the cumulative product of decay coefficients.
double Beta1() const
Get the smoothing parameter.
double & Beta2()
Modify the second moment coefficient.
NadaMax is an optimizer that combines AdaMax with Nesterov accelerated gradient (NAG) momentum.