Public Member Functions
	TrainingConfig ()

	TrainingConfig (size_t numWorkers, size_t updateInterval, size_t targetNetworkSyncInterval, size_t stepLimit, size_t explorationSteps, double stepSize, double discount, double gradientLimit, bool doubleQLearning, bool noisyQLearning)

double	Discount () const
	Get the discount rate for future reward. More...

double &	Discount ()
	Modify the discount rate for future reward. More...

bool	DoubleQLearning () const
	Get the indicator of double q-learning. More...

bool &	DoubleQLearning ()
	Modify the indicator of double q-learning. More...

size_t	ExplorationSteps () const
	Get the exploration steps. More...

size_t &	ExplorationSteps ()
	Modify the exploration steps. More...

double	GradientLimit () const
	Get the limit of the update gradient. More...

double &	GradientLimit ()
	Modify the limit of the update gradient. More...

bool	NoisyQLearning () const
	Get the indicator of noisy q-learning. More...

bool &	NoisyQLearning ()
	Modify the indicator of noisy q-learning. More...

size_t	NumWorkers () const
	Get the number of workers. More...

size_t &	NumWorkers ()
	Modify the number of workers. More...

size_t	StepLimit () const
	Get the maximum steps of each episode. More...

size_t &	StepLimit ()
	Modify the maximum steps of each episode. More...

double	StepSize () const
	Get the step size of the optimizer. More...

double &	StepSize ()
	Modify the step size of the optimizer. More...

size_t	TargetNetworkSyncInterval () const
	Get the interval for syncing target network. More...

size_t &	TargetNetworkSyncInterval ()
	Modify the interval for syncing target network. More...

size_t	UpdateInterval () const
	Get the update interval. More...

size_t &	UpdateInterval ()
	Modify the update interval. More...

Detailed Description

Definition at line 19 of file training_config.hpp.

Constructor & Destructor Documentation

◆ TrainingConfig() [1/2]

TrainingConfig ( )

inline

Definition at line 22 of file training_config.hpp.

◆ TrainingConfig() [2/2]

TrainingConfig	(	size_t	numWorkers,
		size_t	updateInterval,
		size_t	targetNetworkSyncInterval,
		size_t	stepLimit,
		size_t	explorationSteps,
		double	stepSize,
		double	discount,
		double	gradientLimit,
		bool	doubleQLearning,
		bool	noisyQLearning
	)

inline

Definition at line 35 of file training_config.hpp.

Member Function Documentation

◆ Discount() [1/2]

double Discount ( ) const

inline

Get the discount rate for future reward.

Definition at line 93 of file training_config.hpp.

Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().

◆ Discount() [2/2]

double& Discount ( )

inline

Modify the discount rate for future reward.

Definition at line 95 of file training_config.hpp.

◆ DoubleQLearning() [1/2]

bool DoubleQLearning ( ) const

inline

Get the indicator of double q-learning.

Definition at line 103 of file training_config.hpp.

◆ DoubleQLearning() [2/2]

bool& DoubleQLearning ( )

inline

Modify the indicator of double q-learning.

Definition at line 105 of file training_config.hpp.

◆ ExplorationSteps() [1/2]

size_t ExplorationSteps ( ) const

inline

Get the exploration steps.

Definition at line 83 of file training_config.hpp.

◆ ExplorationSteps() [2/2]

size_t& ExplorationSteps ( )

inline

Modify the exploration steps.

Definition at line 85 of file training_config.hpp.

◆ GradientLimit() [1/2]

double GradientLimit ( ) const

inline

Get the limit of the update gradient.

Definition at line 98 of file training_config.hpp.

Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().

◆ GradientLimit() [2/2]

double& GradientLimit ( )

inline

Modify the limit of the update gradient.

Definition at line 100 of file training_config.hpp.

◆ NoisyQLearning() [1/2]

bool NoisyQLearning ( ) const

inline

Get the indicator of noisy q-learning.

Definition at line 108 of file training_config.hpp.

◆ NoisyQLearning() [2/2]

bool& NoisyQLearning ( )

inline

Modify the indicator of noisy q-learning.

Definition at line 110 of file training_config.hpp.

◆ NumWorkers() [1/2]

size_t NumWorkers ( ) const

inline

Get the number of workers.

Definition at line 59 of file training_config.hpp.

◆ NumWorkers() [2/2]

size_t& NumWorkers ( )

inline

Modify the number of workers.

Definition at line 61 of file training_config.hpp.

◆ StepLimit() [1/2]

size_t StepLimit ( ) const

inline

Get the maximum steps of each episode.

Definition at line 75 of file training_config.hpp.

Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().

◆ StepLimit() [2/2]

size_t& StepLimit ( )

inline

Modify the maximum steps of each episode.

Setting it to 0 means no limit.

Definition at line 80 of file training_config.hpp.

◆ StepSize() [1/2]

double StepSize ( ) const

inline

Get the step size of the optimizer.

Definition at line 88 of file training_config.hpp.

Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().

◆ StepSize() [2/2]

double& StepSize ( )

inline

Modify the step size of the optimizer.

Definition at line 90 of file training_config.hpp.

◆ TargetNetworkSyncInterval() [1/2]

size_t TargetNetworkSyncInterval ( ) const

inline

Get the interval for syncing target network.

Definition at line 69 of file training_config.hpp.

Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().

◆ TargetNetworkSyncInterval() [2/2]

size_t& TargetNetworkSyncInterval ( )

inline

Modify the interval for syncing target network.

Definition at line 72 of file training_config.hpp.

◆ UpdateInterval() [1/2]

size_t UpdateInterval ( ) const

inline

Get the update interval.

Definition at line 64 of file training_config.hpp.

Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().

◆ UpdateInterval() [2/2]

size_t& UpdateInterval ( )

inline

Modify the update interval.

Definition at line 66 of file training_config.hpp.

The documentation for this class was generated from the following file:

/var/www/mlpack.ratml.org/mlpack.org/_src/mlpack-3.3.2/src/mlpack/methods/reinforcement_learning/training_config.hpp

Public Member Functions

Detailed Description

Constructor & Destructor Documentation

◆ TrainingConfig() [1/2]

◆ TrainingConfig() [2/2]

Member Function Documentation

◆ Discount() [1/2]

◆ Discount() [2/2]

◆ DoubleQLearning() [1/2]

◆ DoubleQLearning() [2/2]

◆ ExplorationSteps() [1/2]

◆ ExplorationSteps() [2/2]

◆ GradientLimit() [1/2]

◆ GradientLimit() [2/2]

◆ NoisyQLearning() [1/2]

◆ NoisyQLearning() [2/2]

◆ NumWorkers() [1/2]

◆ NumWorkers() [2/2]

◆ StepLimit() [1/2]

◆ StepLimit() [2/2]

◆ StepSize() [1/2]

◆ StepSize() [2/2]

◆ TargetNetworkSyncInterval() [1/2]

◆ TargetNetworkSyncInterval() [2/2]

◆ UpdateInterval() [1/2]

◆ UpdateInterval() [2/2]