The EpsilonGreedyPolicy class.
More...
#include <epsilon_greedy_policy.h>
◆ output_type
The type returned when calling this->operator()
◆ EpsilonGreedyPolicy() [1/3]
| cuberl::rl::policies::EpsilonGreedyPolicy::EpsilonGreedyPolicy |
( |
real_t |
eps | ) |
|
|
inline |
Constructor. Creates an epsilon-greedy tabular policy.
◆ EpsilonGreedyPolicy() [2/3]
| cuberl::rl::policies::EpsilonGreedyPolicy::EpsilonGreedyPolicy |
( |
real_t |
eps, |
|
|
uint_t |
seed |
|
) |
| |
|
inline explicit |
Constructor. Creates an epsilon-greedy tabular policy.
◆ EpsilonGreedyPolicy() [3/3]
Constructor. Creates an epsilon-greedy policy with an epsilon decay strategy.
◆ decay_option()
Returns the decay option.
◆ eps_value()
| real_t cuberl::rl::policies::EpsilonGreedyPolicy::eps_value |
( |
| ) |
const |
|
inline noexcept |
Returns the value of the epsilon.
◆ get_action() [1/2]
template<typename MatType >
| output_type cuberl::rl::policies::EpsilonGreedyPolicy::get_action |
( |
const MatType & |
q_map, |
|
|
uint_t |
state_idx |
|
) |
| |
◆ get_action() [2/2]
template<typename VecTp >
get_action. Given a vector, always returns the position of the maximum element. If the given vector is empty, returns CubeAIConsts::invalid_size_type.
◆ on_episode()
| void cuberl::rl::policies::EpsilonGreedyPolicy::on_episode |
( |
uint_t |
episode_idx | ) |
|
|
noexcept |
Performs any actions the policy should take for the given episode index.
◆ operator()() [1/2]
template<typename MapType >
| output_type cuberl::rl::policies::EpsilonGreedyPolicy::operator() |
( |
const MapType & |
q_map, |
|
|
uint_t |
state |
|
) |
| const |
operator(). Selects an action for the given state.
◆ operator()() [2/2]
template<typename VecType >
Gets an action, i.e. an index, from the given values.
◆ reset()
| void cuberl::rl::policies::EpsilonGreedyPolicy::reset |
( |
| ) |
|
|
inline noexcept |
◆ set_eps_value()
| void cuberl::rl::policies::EpsilonGreedyPolicy::set_eps_value |
( |
real_t |
eps | ) |
|
Set the epsilon value.
- Parameters
- eps: The epsilon value to set.
◆ EPSILON_DECAY_FACTOR
| constexpr real_t cuberl::rl::policies::EpsilonGreedyPolicy::EPSILON_DECAY_FACTOR = 0.01 |
|
static constexpr |
◆ MAX_EPS
| constexpr real_t cuberl::rl::policies::EpsilonGreedyPolicy::MAX_EPS = 1.0 |
|
static constexpr |
◆ MIN_EPS
| constexpr real_t cuberl::rl::policies::EpsilonGreedyPolicy::MIN_EPS = 0.01 |
|
static constexpr |
The documentation for this class was generated from the following file: