Aakash-kaushik/mlpack/training__config_8hpp_source.html

 #ifndef MLPACK_METHODS_RL_TRAINING_CONFIG_HPP
 #define MLPACK_METHODS_RL_TRAINING_CONFIG_HPP

 namespace mlpack {
 namespace rl {

 /**
  * Plain holder for the settings of a reinforcement learning training run.
  *
  * Every setting is stored by value and exposed through a pair of accessors:
  * a const overload that returns a copy of the value and a non-const overload
  * that returns a reference through which the value can be modified.
  */
 class TrainingConfig
 {
  public:
   /**
    * Create a configuration in which every setting has its default value.
    * The defaults are supplied by the in-class initializers of the data
    * members declared at the bottom of this class.
    */
   TrainingConfig()
   { /* Nothing to do here. */ }

   /**
    * Create a configuration with an explicit value for every setting.
    *
    * @param numWorkers Number of workers.
    * @param updateInterval Update interval.
    * @param targetNetworkSyncInterval Interval for syncing target network.
    * @param stepLimit Maximum steps of each episode.
    * @param explorationSteps Exploration steps.
    * @param stepSize Step size of the optimizer.
    * @param discount Discount rate for future reward.
    * @param gradientLimit Limit of update gradient.
    * @param doubleQLearning Indicator of double q-learning.
    * @param noisyQLearning Indicator of noisy q-learning.
    * @param isCategorical Indicator of categorical q-learning.
    * @param atomSize Number of atoms.
    * @param vMin Minimum value for support.
    * @param vMax Maximum value for support.
    * @param rho Rho value for SAC.
    */
   TrainingConfig(
       size_t numWorkers,
       size_t updateInterval,
       size_t targetNetworkSyncInterval,
       size_t stepLimit,
       size_t explorationSteps,
       double stepSize,
       double discount,
       double gradientLimit,
       bool doubleQLearning,
       bool noisyQLearning,
       bool isCategorical,
       size_t atomSize,
       double vMin,
       double vMax,
       double rho) :
       // Listed in declaration order, which is the order they are initialized.
       numWorkers(numWorkers), updateInterval(updateInterval),
       targetNetworkSyncInterval(targetNetworkSyncInterval),
       stepLimit(stepLimit), explorationSteps(explorationSteps),
       stepSize(stepSize), discount(discount), gradientLimit(gradientLimit),
       doubleQLearning(doubleQLearning), noisyQLearning(noisyQLearning),
       isCategorical(isCategorical),
       atomSize(atomSize), vMin(vMin), vMax(vMax),
       rho(rho)
   { /* Nothing to do here. */ }

   //! Get the number of workers.
   size_t NumWorkers() const { return numWorkers; }
   //! Modify the number of workers.
   size_t& NumWorkers() { return numWorkers; }

   //! Get the update interval.
   size_t UpdateInterval() const { return updateInterval; }
   //! Modify the update interval.
   size_t& UpdateInterval() { return updateInterval; }

   //! Get the interval for syncing target network.
   size_t TargetNetworkSyncInterval() const
   { return targetNetworkSyncInterval; }
   //! Modify the interval for syncing target network.
   size_t& TargetNetworkSyncInterval() { return targetNetworkSyncInterval; }

   //! Get the maximum steps of each episode.
   size_t StepLimit() const { return stepLimit; }
   //! Modify the maximum steps of each episode.
   size_t& StepLimit() { return stepLimit; }

   //! Get the exploration steps.
   size_t ExplorationSteps() const { return explorationSteps; }
   //! Modify the exploration steps.
   size_t& ExplorationSteps() { return explorationSteps; }

   //! Get the step size of the optimizer.
   double StepSize() const { return stepSize; }
   //! Modify the step size of the optimizer.
   double& StepSize() { return stepSize; }

   //! Get the discount rate for future reward.
   double Discount() const { return discount; }
   //! Modify the discount rate for future reward.
   double& Discount() { return discount; }

   //! Get the limit of update gradient.
   double GradientLimit() const { return gradientLimit; }
   //! Modify the limit of update gradient.
   double& GradientLimit() { return gradientLimit; }

   //! Get the indicator of double q-learning.
   bool DoubleQLearning() const { return doubleQLearning; }
   //! Modify the indicator of double q-learning.
   bool& DoubleQLearning() { return doubleQLearning; }

   //! Get the indicator of noisy q-learning.
   bool NoisyQLearning() const { return noisyQLearning; }
   //! Modify the indicator of noisy q-learning.
   bool& NoisyQLearning() { return noisyQLearning; }

   //! Get the indicator of categorical q-learning.
   bool IsCategorical() const { return isCategorical; }
   //! Modify the indicator of categorical q-learning.
   bool& IsCategorical() { return isCategorical; }

   //! Get the number of atoms.
   size_t AtomSize() const { return atomSize; }
   //! Modify the number of atoms.
   size_t& AtomSize() { return atomSize; }

   //! Get the minimum value for support.
   double VMin() const { return vMin; }
   //! Modify the minimum value for support.
   double& VMin() { return vMin; }

   //! Get the maximum value for support.
   double VMax() const { return vMax; }
   //! Modify the maximum value for support.
   double& VMax() { return vMax; }

   //! Get the rho value for SAC.
   double Rho() const { return rho; }
   //! Modify the rho value for SAC.
   double& Rho() { return rho; }

  private:
   // The initializers below are the defaults used by the no-argument
   // constructor; the full constructor overrides every one of them.

   //! Number of workers.
   size_t numWorkers = 1;

   //! Update interval.
   size_t updateInterval = 1;

   //! Interval for syncing target network.
   size_t targetNetworkSyncInterval = 100;

   //! Maximum steps of each episode.
   size_t stepLimit = 200;

   //! Exploration steps.
   size_t explorationSteps = 1;

   //! Step size of the optimizer.
   double stepSize = 0.01;

   //! Discount rate for future reward.
   double discount = 0.99;

   //! Limit of update gradient.
   double gradientLimit = 40.0;

   //! Indicator of double q-learning.
   bool doubleQLearning = false;

   //! Indicator of noisy q-learning.
   bool noisyQLearning = false;

   //! Indicator of categorical q-learning.
   bool isCategorical = false;

   //! Number of atoms.
   size_t atomSize = 51;

   //! Minimum value for support.
   double vMin = 0.0;

   //! Maximum value for support.
   double vMax = 200.0;

   //! Rho value for SAC.
   double rho = 0.005;
 };

 } // namespace rl
 } // namespace mlpack

 #endif
mlpack::rl::TrainingConfig::UpdateInterval
size_t & UpdateInterval()
Modify the update interval.
Definition: training_config.hpp:81

mlpack::rl::TrainingConfig::DoubleQLearning
bool DoubleQLearning() const
Get the indicator of double q-learning.
Definition: training_config.hpp:118

mlpack::rl::TrainingConfig::TargetNetworkSyncInterval
size_t TargetNetworkSyncInterval() const
Get the interval for syncing target network.
Definition: training_config.hpp:84

mlpack
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: cv.hpp:1

mlpack::rl::TrainingConfig::NumWorkers
size_t NumWorkers() const
Get the number of workers.
Definition: training_config.hpp:74

mlpack::rl::TrainingConfig::VMin
double & VMin()
Modify the minimum value for support.
Definition: training_config.hpp:140

mlpack::rl::TrainingConfig::GradientLimit
double GradientLimit() const
Get the limit of update gradient.
Definition: training_config.hpp:113

mlpack::rl::TrainingConfig::VMax
double VMax() const
Get the maximum value for support.
Definition: training_config.hpp:143

mlpack::rl::TrainingConfig::NumWorkers
size_t & NumWorkers()
Modify the number of workers.
Definition: training_config.hpp:76

mlpack::rl::TrainingConfig::Discount
double & Discount()
Modify the discount rate for future reward.
Definition: training_config.hpp:110

mlpack::rl::TrainingConfig::UpdateInterval
size_t UpdateInterval() const
Get the update interval.
Definition: training_config.hpp:79

mlpack::rl::TrainingConfig::StepSize
double StepSize() const
Get the step size of the optimizer.
Definition: training_config.hpp:103

mlpack::rl::TrainingConfig::VMin
double VMin() const
Get the minimum value for support.
Definition: training_config.hpp:138

mlpack::rl::TrainingConfig::Rho
double Rho() const
Get the rho value for SAC.
Definition: training_config.hpp:148

mlpack::rl::TrainingConfig::StepLimit
size_t StepLimit() const
Get the maximum steps of each episode.
Definition: training_config.hpp:90

mlpack::rl::TrainingConfig::StepSize
double & StepSize()
Modify the step size of the optimizer.
Definition: training_config.hpp:105

mlpack::rl::TrainingConfig::TargetNetworkSyncInterval
size_t & TargetNetworkSyncInterval()
Modify the interval for syncing target network.
Definition: training_config.hpp:87

mlpack::rl::TrainingConfig::StepLimit
size_t & StepLimit()
Modify the maximum steps of each episode.
Definition: training_config.hpp:95

mlpack::rl::TrainingConfig::NoisyQLearning
bool NoisyQLearning() const
Get the indicator of noisy q-learning.
Definition: training_config.hpp:123

mlpack::rl::TrainingConfig
Definition: training_config.hpp:19

mlpack::rl::TrainingConfig::DoubleQLearning
bool & DoubleQLearning()
Modify the indicator of double q-learning.
Definition: training_config.hpp:120

mlpack::rl::TrainingConfig::Rho
double & Rho()
Modify the rho value for SAC.
Definition: training_config.hpp:150

mlpack::rl::TrainingConfig::NoisyQLearning
bool & NoisyQLearning()
Modify the indicator of noisy q-learning.
Definition: training_config.hpp:125

mlpack::rl::TrainingConfig::GradientLimit
double & GradientLimit()
Modify the limit of update gradient.
Definition: training_config.hpp:115

mlpack::rl::TrainingConfig::ExplorationSteps
size_t & ExplorationSteps()
Modify the exploration steps.
Definition: training_config.hpp:100

mlpack::rl::TrainingConfig::Discount
double Discount() const
Get the discount rate for future reward.
Definition: training_config.hpp:108

mlpack::rl::TrainingConfig::IsCategorical
bool & IsCategorical()
Modify the indicator of categorical q-learning.
Definition: training_config.hpp:130

mlpack::rl::TrainingConfig::ExplorationSteps
size_t ExplorationSteps() const
Get the exploration steps.
Definition: training_config.hpp:98

mlpack::rl::TrainingConfig::IsCategorical
bool IsCategorical() const
Get the indicator of categorical q-learning.
Definition: training_config.hpp:128

mlpack::rl::TrainingConfig::VMax
double & VMax()
Modify the maximum value for support.
Definition: training_config.hpp:145

mlpack::rl::TrainingConfig::AtomSize
size_t AtomSize() const
Get the number of atoms.
Definition: training_config.hpp:133

mlpack::rl::TrainingConfig::AtomSize
size_t & AtomSize()
Modify the number of atoms.
Definition: training_config.hpp:135