4#include "cuberl/base/cubeai_config.h"
9#include "cuberl/data_structs/experience_buffer.h"
// Fragment of a class template parameterised on ActionType and StateType.
// NOTE(review): presumably the declaration of A2CMonitor, whose members are
// defined out of class further down; the class-head line is not visible here.
// NOTE(review): the leading numbers look like original line numbers fused into
// the text by an extraction step, and several original lines are absent, so
// this fragment does not compile as shown.
20template<
typename ActionType,
typename StateType>
// Alias exposing the ActionType template argument.
25 typedef ActionType action_type;
// Tail of a typedef that introduces the name experience_tuple_type; the
// aliased type itself sits on lines that are not visible here.
32 > experience_tuple_type;
// Alias for an ExperienceBuffer whose element type is experience_tuple_type.
34 typedef cuberl::containers::ExperienceBuffer<experience_tuple_type> experience_buffer_type;
// Data members: three real_t series and one uint_t series.
// NOTE(review): what a single entry represents (per step, per episode, ...)
// is not established by the visible code; confirm against the callers.
37 std::vector<real_t> rewards;
38 std::vector<real_t> policy_loss_values;
39 std::vector<real_t> critic_loss_values;
40 std::vector<uint_t> episode_duration;
// Declaration of a const member template taking a value type T and a
// compile-time index, applied to a vector of experience tuples.
// NOTE(review): the return type is on a line that is not visible here.
45 template<typename T, uint_t index>
47 get(const std::vector<experience_tuple_type>& experience)const;
// Out-of-class definition of the member template A2CMonitor::get<T, index>.
// NOTE(review): the return type, the loop header, the definition of `item`,
// the return statement and the closing brace are on lines that are not
// visible in this listing; the comments below cover only what is shown.
52template<typename ActionType, typename StateType>
53template<typename T, uint_t index>
55A2CMonitor<ActionType, StateType>::get(const std::vector<experience_tuple_type>& experience)
const{
// Output container, pre-sized to hold one entry per element of `experience`.
57 std::vector<T> result;
58 result.reserve(experience.size());
// Iterator pair delimiting the input range.
60 auto b = experience.begin();
61 auto e = experience.end();
// Appends the element at compile-time position `index` of `item` to the output.
// NOTE(review): presumably `item` is the tuple currently referred to by `b`;
// verify against the full source.
65 result.push_back(std::get<index>(item));
// Out-of-class definition of A2CMonitor::reset, declared noexcept.
// NOTE(review): the return type, the original lines numbered 74 and 76, and
// the closing brace are not visible in this listing. Whether `rewards` and
// `critic_loss_values` are also cleared cannot be confirmed from here.
71template<
typename ActionType,
typename StateType>
73A2CMonitor<ActionType, StateType>::reset()noexcept{
// Empties the recorded policy-loss series.
75 policy_loss_values.clear();
// Empties the recorded episode-duration series.
77 episode_duration.clear();
double real_t
real_t
Definition bitrl_types.h:23
Various utilities used when working with RL problems.
Definition cuberl_types.h:16
std::pair< uint_t, uint_t > state_type
Definition example_15.cpp:28