|
bitrl & cuberl Documentation
Simulation engine for reinforcement learning agents
|
Forward declaration. More...
#include <vector_time_step.h>
Public Types | |
| typedef StateType | state_type |
| state_ Type of the state | |
Public Member Functions | |
| VectorTimeStep ()=default | |
| Default constructor. | |
| VectorTimeStep (const std::vector< TimeStepTp > &types, const std::vector< real_t > &rewards, const std::vector< state_type > &obs) | |
| VectorTimeStep. Constructor. | |
| VectorTimeStep (const std::vector< TimeStepTp > &types, const std::vector< real_t > &rewards, const std::vector< state_type > &obs, const std::vector< real_t > &discount_factors) | |
| VectorTimeStep. Constructor. | |
| VectorTimeStep (const std::vector< TimeStepTp > &types, const std::vector< real_t > &rewards, const std::vector< state_type > &obs, const std::vector< real_t > &discount_factors, std::unordered_map< std::string, std::any > &&extra) | |
| VectorTimeStep (const VectorTimeStep &other) | |
| Copy constructor. | |
| VectorTimeStep & | operator= (const VectorTimeStep &other) |
| Assignment operator. | |
| VectorTimeStep (VectorTimeStep &&other) noexcept | |
| Move constructor. | |
| VectorTimeStep & | operator= (VectorTimeStep &&other) noexcept |
| Move assignment operator. | |
| const std::vector< TimeStepTp > & | types () const noexcept |
| type | |
| const std::vector< state_type > & | observations () const |
| observation | |
| const std::vector< real_t > & | rewards () const noexcept |
| reward | |
| real_t | reward () const noexcept |
| Returns the sum of the rewards received. | |
| bool | done () const noexcept |
| Returns true if any time step is LAST. | |
| const std::vector< real_t > & | discounts () const noexcept |
| discount. Returns the discount factor | |
| bool | last () const noexcept |
| last | |
Forward declaration.
VectorTimeStep class.
| typedef StateType bitrl::VectorTimeStep< StateType >::state_type |
state_ Type of the state
|
default |
Default constructor.
| bitrl::VectorTimeStep< StateType >::VectorTimeStep | ( | const std::vector< TimeStepTp > & | types, |
| const std::vector< real_t > & | rewards, | ||
| const std::vector< state_type > & | obs | ||
| ) |
VectorTimeStep. Constructor.
| bitrl::VectorTimeStep< StateType >::VectorTimeStep | ( | const std::vector< TimeStepTp > & | types, |
| const std::vector< real_t > & | rewards, | ||
| const std::vector< state_type > & | obs, | ||
| const std::vector< real_t > & | discount_factors | ||
| ) |
VectorTimeStep. Constructor.
| bitrl::VectorTimeStep< StateType >::VectorTimeStep | ( | const std::vector< TimeStepTp > & | types, |
| const std::vector< real_t > & | rewards, | ||
| const std::vector< state_type > & | obs, | ||
| const std::vector< real_t > & | discount_factors, | ||
| std::unordered_map< std::string, std::any > && | extra | ||
| ) |
| bitrl::VectorTimeStep< StateType >::VectorTimeStep | ( | const VectorTimeStep< StateType > & | other | ) |
| other |
|
noexcept |
| other |
|
inline noexcept |
discount. Returns the discount factor
|
noexcept |
Returns true if any time step is LAST.
|
noexcept |
last
|
inline |
observation
| VectorTimeStep< StateType > & bitrl::VectorTimeStep< StateType >::operator= | ( | const VectorTimeStep< StateType > & | other | ) |
Assignment operator.
|
noexcept |
operator =
| other |
|
noexcept |
Returns the sum of the rewards received.
|
inline noexcept |
reward
|
inline noexcept |
type