Aakash-kaushik/mlpack/async__learning_8hpp_source.html

 #ifndef MLPACK_METHODS_RL_ASYNC_LEARNING_HPP
 #define MLPACK_METHODS_RL_ASYNC_LEARNING_HPP

 #include <mlpack/prereqs.hpp>
 #include "worker/one_step_q_learning_worker.hpp"
 #include "worker/one_step_sarsa_worker.hpp"
 #include "worker/n_step_q_learning_worker.hpp"
 #include "training_config.hpp"

 namespace mlpack {
 namespace rl {

 /**
  * Wrapper class for asynchronous learning algorithms.  The concrete algorithm
  * is chosen through WorkerType; this class itself only stores the training
  * configuration, the learning network, the behavior policy, the updater and
  * the environment, and exposes them through accessors.
  *
  * The constructor and Train() are only declared here; their definitions are
  * pulled in from async_learning_impl.hpp at the end of this header.
  *
  * @tparam WorkerType Worker type that selects the learning algorithm.
  * @tparam EnvironmentType Type of the environment held by this object.
  * @tparam NetworkType Type of the learning network held by this object.
  * @tparam UpdaterType Type of the updater (optimizer) held by this object.
  * @tparam PolicyType Type of the behavior policy held by this object.
  */
 template <
   typename WorkerType,
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 class AsyncLearning
 {
  public:
   /**
    * Construct an instance of the given async learning algorithm.
    *
    * All arguments are taken by value.
    * NOTE(review): presumably each argument initializes the member of the same
    * role below -- confirm against async_learning_impl.hpp.
    *
    * @param config Training configuration.
    * @param network Learning network.
    * @param policy Behavior policy.
    * @param updater Updater (optimizer); defaults to a default-constructed
    *     UpdaterType.
    * @param environment Environment; defaults to a default-constructed
    *     EnvironmentType.
    */
   AsyncLearning(TrainingConfig config,
                 NetworkType network,
                 PolicyType policy,
                 UpdaterType updater = UpdaterType(),
                 EnvironmentType environment = EnvironmentType());

   /**
    * Start asynchronous training.  Defined in async_learning_impl.hpp.
    *
    * @tparam Measure Type of the measure argument.
    * @param measure Passed by non-const reference.
    *     NOTE(review): presumably a callable used to evaluate progress and/or
    *     decide when training stops -- confirm against the implementation.
    */
   template <typename Measure>
   void Train(Measure& measure);

   //! Modify the training config (returns a mutable reference).
   TrainingConfig& Config() { return config; }
   //! Get the training config (read-only).
   const TrainingConfig& Config() const { return config; }

   //! Modify the learning network (returns a mutable reference).
   NetworkType& Network() { return learningNetwork; }
   //! Get the learning network (read-only).
   const NetworkType& Network() const { return learningNetwork; }

   //! Modify the behavior policy (returns a mutable reference).
   PolicyType& Policy() { return policy; }
   //! Get the behavior policy (read-only).
   const PolicyType& Policy() const { return policy; }

   //! Modify the updater / optimizer (returns a mutable reference).
   UpdaterType& Updater() { return updater; }
   //! Get the updater / optimizer (read-only).
   const UpdaterType& Updater() const { return updater; }

   //! Modify the environment (returns a mutable reference).
   EnvironmentType& Environment() { return environment; }
   //! Get the environment (read-only).
   const EnvironmentType& Environment() const { return environment; }

  private:
   // NOTE: members are initialized in declaration order; do not reorder them
   // without checking the constructor in async_learning_impl.hpp.

   //! Training configuration.
   TrainingConfig config;

   //! The learning network.
   NetworkType learningNetwork;

   //! The behavior policy.
   PolicyType policy;

   //! The updater (optimizer).
   UpdaterType updater;

   //! The environment.
   EnvironmentType environment;
 };

 /**
  * Forward declaration of OneStepQLearningWorker.
  *
  * @tparam EnvironmentType Environment type.
  * @tparam NetworkType Learning network type.
  * @tparam UpdaterType Updater (optimizer) type.
  * @tparam PolicyType Behavior policy type.
  */
 template <
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 class OneStepQLearningWorker;

 /**
  * Forward declaration of OneStepSarsaWorker.
  *
  * @tparam EnvironmentType Environment type.
  * @tparam NetworkType Learning network type.
  * @tparam UpdaterType Updater (optimizer) type.
  * @tparam PolicyType Behavior policy type.
  */
 template <
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 class OneStepSarsaWorker;

 /**
  * Forward declaration of NStepQLearningWorker.
  *
  * @tparam EnvironmentType Environment type.
  * @tparam NetworkType Learning network type.
  * @tparam UpdaterType Updater (optimizer) type.
  * @tparam PolicyType Behavior policy type.
  */
 template <
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 class NStepQLearningWorker;

 /**
  * Convenience alias: AsyncLearning instantiated with OneStepQLearningWorker
  * as its worker type.  The four template arguments are passed unchanged to
  * both the worker and AsyncLearning.
  *
  * @tparam EnvironmentType Environment type.
  * @tparam NetworkType Learning network type.
  * @tparam UpdaterType Updater (optimizer) type.
  * @tparam PolicyType Behavior policy type.
  */
 template <
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 using OneStepQLearning = AsyncLearning<OneStepQLearningWorker<EnvironmentType,
     NetworkType, UpdaterType, PolicyType>, EnvironmentType, NetworkType,
     UpdaterType, PolicyType>;

 /**
  * Convenience alias: AsyncLearning instantiated with OneStepSarsaWorker as
  * its worker type.  The four template arguments are passed unchanged to both
  * the worker and AsyncLearning.
  *
  * @tparam EnvironmentType Environment type.
  * @tparam NetworkType Learning network type.
  * @tparam UpdaterType Updater (optimizer) type.
  * @tparam PolicyType Behavior policy type.
  */
 template <
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 using OneStepSarsa = AsyncLearning<OneStepSarsaWorker<EnvironmentType,
     NetworkType, UpdaterType, PolicyType>, EnvironmentType, NetworkType,
     UpdaterType, PolicyType>;

 /**
  * Convenience alias: AsyncLearning instantiated with NStepQLearningWorker as
  * its worker type.  The four template arguments are passed unchanged to both
  * the worker and AsyncLearning.
  *
  * @tparam EnvironmentType Environment type.
  * @tparam NetworkType Learning network type.
  * @tparam UpdaterType Updater (optimizer) type.
  * @tparam PolicyType Behavior policy type.
  */
 template <
   typename EnvironmentType,
   typename NetworkType,
   typename UpdaterType,
   typename PolicyType
 >
 using NStepQLearning = AsyncLearning<NStepQLearningWorker<EnvironmentType,
     NetworkType, UpdaterType, PolicyType>, EnvironmentType, NetworkType,
     UpdaterType, PolicyType>;

 } // namespace rl
 } // namespace mlpack

 // Include implementation
 #include "async_learning_impl.hpp"

 #endif
mlpack::rl::AsyncLearning::AsyncLearning
AsyncLearning(TrainingConfig config, NetworkType network, PolicyType policy, UpdaterType updater=UpdaterType(), EnvironmentType environment=EnvironmentType())
Construct an instance of the given async learning algorithm.
Definition: async_learning_impl.hpp:35

mlpack::rl::AsyncLearning::Updater
const UpdaterType & Updater() const
Get the optimizer (read-only access).
Definition: async_learning.hpp:109

mlpack
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: cv.hpp:1

mlpack::rl::AsyncLearning::Environment
const EnvironmentType & Environment() const
Get the environment (read-only access).
Definition: async_learning.hpp:114

prereqs.hpp
The core includes that mlpack expects; standard C++ includes and Armadillo.

n_step_q_learning_worker.hpp

mlpack::rl::AsyncLearning::Network
const NetworkType & Network() const
Get the learning network (read-only access).
Definition: async_learning.hpp:99

mlpack::rl::AsyncLearning::Updater
UpdaterType & Updater()
Modify the optimizer (returns a mutable reference).
Definition: async_learning.hpp:107

async_learning_impl.hpp

one_step_sarsa_worker.hpp

mlpack::rl::TrainingConfig
Definition: training_config.hpp:19

mlpack::rl::OneStepQLearningWorker
Forward declaration of OneStepQLearningWorker.
Definition: async_learning.hpp:147

mlpack::rl::AsyncLearning::Policy
const PolicyType & Policy() const
Get the behavior policy (read-only access).
Definition: async_learning.hpp:104

mlpack::rl::AsyncLearning::Policy
PolicyType & Policy()
Modify the behavior policy (returns a mutable reference).
Definition: async_learning.hpp:102

mlpack::rl::AsyncLearning::Config
const TrainingConfig & Config() const
Get the training config (read-only access).
Definition: async_learning.hpp:94

training_config.hpp

mlpack::rl::AsyncLearning::Environment
EnvironmentType & Environment()
Modify the environment (returns a mutable reference).
Definition: async_learning.hpp:112

mlpack::rl::AsyncLearning::Train
void Train(Measure &measure)
Start asynchronous training.
Definition: async_learning_impl.hpp:62

mlpack::rl::NStepQLearningWorker
Forward declaration of NStepQLearningWorker.
Definition: async_learning.hpp:179

mlpack::rl::AsyncLearning::Network
NetworkType & Network()
Modify the learning network (returns a mutable reference).
Definition: async_learning.hpp:97

mlpack::rl::AsyncLearning
Wrapper of various asynchronous learning algorithms, e.g. asynchronous one-step Q-learning, one-step SARSA, and n-step Q-learning.
Definition: async_learning.hpp:57

one_step_q_learning_worker.hpp

mlpack::rl::OneStepSarsaWorker
Forward declaration of OneStepSarsaWorker.
Definition: async_learning.hpp:163

mlpack::rl::AsyncLearning::Config
TrainingConfig & Config()
Modify the training config (returns a mutable reference).
Definition: async_learning.hpp:92