#include <aggregated_policy.hpp>
|
using | ActionType = typename PolicyType::ActionType |
| Convenience typedef for the action type.
|
|
|
| AggregatedPolicy (std::vector< PolicyType > policies, const arma::colvec &distribution) |
|
ActionType | Sample (const arma::colvec &actionValue, bool deterministic=false) |
| Sample an action based on given action values. More...
|
|
void | Anneal () |
| The exploration probability is annealed at each step.
|
|
template<typename PolicyType>
class mlpack::rl::AggregatedPolicy< PolicyType >
- Template Parameters
-
PolicyType | The type of the child policy. |
◆ AggregatedPolicy()
template<typename PolicyType >
- Parameters
-
policies | Child policies. |
distribution | Probability distribution over the child policies. The user should make sure that its size is the same as the number of policies and that the sum of its elements is equal to 1. |
◆ Sample()
template<typename PolicyType >
Sample an action based on given action values.
- Parameters
-
actionValue | Values for each action. |
deterministic | If true, always select the action greedily. |
- Returns
- Sampled action.
The documentation for this class was generated from the following file: