mlpack-3.3.2/doxygen/training__config_8hpp_source.html

 #ifndef MLPACK_METHODS_RL_TRAINING_CONFIG_HPP
 #define MLPACK_METHODS_RL_TRAINING_CONFIG_HPP

 namespace mlpack {
 namespace rl {

 /**
  * Collection of training settings: number of workers, update and target
  * network sync intervals, per-episode step limit, exploration steps,
  * optimizer step size, reward discount, gradient limit, and the double /
  * noisy q-learning indicators.  Each setting has a by-value getter and a
  * reference-returning modifier.
  */
 class TrainingConfig
 {
  public:
   /**
    * Create a configuration holding the default settings: 1 worker, update
    * interval 1, target network sync interval 100, step limit 0, 1
    * exploration step, step size 0.01, discount 0.99, gradient limit 40, and
    * both q-learning indicators set to false.
    */
   TrainingConfig() :
       TrainingConfig(1, 1, 100, 0, 1, 0.01, 0.99, 40, false, false)
   { /* The delegated constructor does all the work. */ }

   /**
    * Create a configuration from explicitly given settings.
    *
    * @param numWorkers The number of workers.
    * @param updateInterval The update interval.
    * @param targetNetworkSyncInterval The interval for syncing target network.
    * @param stepLimit The maximum steps of each episode.
    * @param explorationSteps The exploration steps.
    * @param stepSize The step size of the optimizer.
    * @param discount The discount rate for future reward.
    * @param gradientLimit The limit of update gradient.
    * @param doubleQLearning The indicator of double q-learning.
    * @param noisyQLearning The indicator of noisy q-learning.
    */
   TrainingConfig(size_t numWorkers,
                  size_t updateInterval,
                  size_t targetNetworkSyncInterval,
                  size_t stepLimit,
                  size_t explorationSteps,
                  double stepSize,
                  double discount,
                  double gradientLimit,
                  bool doubleQLearning,
                  bool noisyQLearning) :
       // Parameters shadow the members on purpose; inside each initializer the
       // parenthesized name refers to the parameter.
       numWorkers(numWorkers),
       updateInterval(updateInterval),
       targetNetworkSyncInterval(targetNetworkSyncInterval),
       stepLimit(stepLimit),
       explorationSteps(explorationSteps),
       stepSize(stepSize),
       discount(discount),
       gradientLimit(gradientLimit),
       doubleQLearning(doubleQLearning),
       noisyQLearning(noisyQLearning)
   { /* Every member is set in the initializer list. */ }

   //! Get the number of workers.
   size_t NumWorkers() const { return numWorkers; }
   //! Modify the number of workers.
   size_t& NumWorkers() { return numWorkers; }

   //! Get the update interval.
   size_t UpdateInterval() const { return updateInterval; }
   //! Modify the update interval.
   size_t& UpdateInterval() { return updateInterval; }

   //! Get the interval for syncing target network.
   size_t TargetNetworkSyncInterval() const
   {
     return targetNetworkSyncInterval;
   }
   //! Modify the interval for syncing target network.
   size_t& TargetNetworkSyncInterval()
   {
     return targetNetworkSyncInterval;
   }

   //! Get the maximum steps of each episode.
   size_t StepLimit() const { return stepLimit; }
   //! Modify the maximum steps of each episode.
   size_t& StepLimit() { return stepLimit; }

   //! Get the exploration steps.
   size_t ExplorationSteps() const { return explorationSteps; }
   //! Modify the exploration steps.
   size_t& ExplorationSteps() { return explorationSteps; }

   //! Get the step size of the optimizer.
   double StepSize() const { return stepSize; }
   //! Modify the step size of the optimizer.
   double& StepSize() { return stepSize; }

   //! Get the discount rate for future reward.
   double Discount() const { return discount; }
   //! Modify the discount rate for future reward.
   double& Discount() { return discount; }

   //! Get the limit of update gradient.
   double GradientLimit() const { return gradientLimit; }
   //! Modify the limit of update gradient.
   double& GradientLimit() { return gradientLimit; }

   //! Get the indicator of double q-learning.
   bool DoubleQLearning() const { return doubleQLearning; }
   //! Modify the indicator of double q-learning.
   bool& DoubleQLearning() { return doubleQLearning; }

   //! Get the indicator of noisy q-learning.
   bool NoisyQLearning() const { return noisyQLearning; }
   //! Modify the indicator of noisy q-learning.
   bool& NoisyQLearning() { return noisyQLearning; }

  private:
   //! Locally-stored number of workers.
   size_t numWorkers;

   //! Locally-stored update interval.
   size_t updateInterval;

   //! Locally-stored interval for syncing target network.
   size_t targetNetworkSyncInterval;

   //! Locally-stored maximum steps of each episode.
   size_t stepLimit;

   //! Locally-stored exploration steps.
   size_t explorationSteps;

   //! Locally-stored step size of the optimizer.
   double stepSize;

   //! Locally-stored discount rate for future reward.
   double discount;

   //! Locally-stored limit of update gradient.
   double gradientLimit;

   //! Locally-stored indicator of double q-learning.
   bool doubleQLearning;

   //! Locally-stored indicator of noisy q-learning.
   bool noisyQLearning;
 };

 } // namespace rl
 } // namespace mlpack

 #endif
mlpack::rl::TrainingConfig::Discount
double & Discount()
Modify the discount rate for future reward.
Definition: training_config.hpp:95

mlpack::rl::TrainingConfig::ExplorationSteps
size_t ExplorationSteps() const
Get the exploration steps.
Definition: training_config.hpp:83

mlpack
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: add_to_po.hpp:21

mlpack::rl::TrainingConfig::NoisyQLearning
bool NoisyQLearning() const
Get the indicator of noisy q-learning.
Definition: training_config.hpp:108

mlpack::rl::TrainingConfig::NumWorkers
size_t NumWorkers() const
Get the number of workers.
Definition: training_config.hpp:59

mlpack::rl::TrainingConfig::StepLimit
size_t StepLimit() const
Get the maximum steps of each episode.
Definition: training_config.hpp:75

mlpack::rl::TrainingConfig::TargetNetworkSyncInterval
size_t TargetNetworkSyncInterval() const
Get the interval for syncing target network.
Definition: training_config.hpp:69

mlpack::rl::TrainingConfig::StepLimit
size_t & StepLimit()
Modify the maximum steps of each episode.
Definition: training_config.hpp:80

mlpack::rl::TrainingConfig::TargetNetworkSyncInterval
size_t & TargetNetworkSyncInterval()
Modify the interval for syncing target network.
Definition: training_config.hpp:72

mlpack::rl::TrainingConfig
Definition: training_config.hpp:19

mlpack::rl::TrainingConfig::UpdateInterval
size_t UpdateInterval() const
Get the update interval.
Definition: training_config.hpp:64

mlpack::rl::TrainingConfig::Discount
double Discount() const
Get the discount rate for future reward.
Definition: training_config.hpp:93

mlpack::rl::TrainingConfig::NumWorkers
size_t & NumWorkers()
Modify the number of workers.
Definition: training_config.hpp:61

mlpack::rl::TrainingConfig::DoubleQLearning
bool DoubleQLearning() const
Get the indicator of double q-learning.
Definition: training_config.hpp:103

mlpack::rl::TrainingConfig::TrainingConfig
TrainingConfig()
Definition: training_config.hpp:22

mlpack::rl::TrainingConfig::ExplorationSteps
size_t & ExplorationSteps()
Modify the exploration steps.
Definition: training_config.hpp:85

mlpack::rl::TrainingConfig::TrainingConfig
TrainingConfig(size_t numWorkers, size_t updateInterval, size_t targetNetworkSyncInterval, size_t stepLimit, size_t explorationSteps, double stepSize, double discount, double gradientLimit, bool doubleQLearning, bool noisyQLearning)
Definition: training_config.hpp:35

mlpack::rl::TrainingConfig::DoubleQLearning
bool & DoubleQLearning()
Modify the indicator of double q-learning.
Definition: training_config.hpp:105

mlpack::rl::TrainingConfig::GradientLimit
double GradientLimit() const
Get the limit of update gradient.
Definition: training_config.hpp:98

mlpack::rl::TrainingConfig::UpdateInterval
size_t & UpdateInterval()
Modify the update interval.
Definition: training_config.hpp:66

mlpack::rl::TrainingConfig::GradientLimit
double & GradientLimit()
Modify the limit of update gradient.
Definition: training_config.hpp:100

mlpack::rl::TrainingConfig::StepSize
double StepSize() const
Get the step size of the optimizer.
Definition: training_config.hpp:88

mlpack::rl::TrainingConfig::StepSize
double & StepSize()
Modify the step size of the optimizer.
Definition: training_config.hpp:90

mlpack::rl::TrainingConfig::NoisyQLearning
bool & NoisyQLearning()
Modify the indicator of noisy q-learning.
Definition: training_config.hpp:110