#include <aggregated_policy.hpp>
|
|
using | ActionType = typename PolicyType::ActionType |
| | Convenience typedef for the action type.
|
| |
|
| | AggregatedPolicy (std::vector< PolicyType > policies, const arma::colvec &distribution) |
| |
| ActionType | Sample (const arma::colvec &actionValue, bool deterministic=false) |
| | Sample an action based on given action values. More...
|
| |
|
void | Anneal () |
| | Exploration probability will anneal at each step.
|
| |
template<typename PolicyType>
class mlpack::rl::AggregatedPolicy< PolicyType >
- Template Parameters
-
| PolicyType | The type of the child policy. |
◆ AggregatedPolicy()
template<typename PolicyType >
- Parameters
-
| policies | Child policies. |
| distribution | Probability distribution for each child policy. The user should make sure that its size is the same as the number of policies and that the sum of its elements is equal to 1. |
◆ Sample()
template<typename PolicyType >
Sample an action based on given action values.
- Parameters
-
| actionValue | Values for each action. |
| deterministic | If true, always select the action greedily. |
- Returns
- Sampled action.
The documentation for this class was generated from the following file: