1#ifndef UNIFORM_DISCRETE_POLICY_H
2#define UNIFORM_DISCRETE_POLICY_H
35 std::vector<std::pair<uint_t, real_t>>
operator()(
uint_t sidx)
const{
return (*
this)[sidx];}
45 void update(
uint_t sidx,
const std::vector<std::pair<uint_t, real_t>>& vals);
62 std::pair<uint_t, uint_t>
shape()
const{
return {n_states_, n_actions_};}
75 std::ostream&
print(std::ostream& out)
const;
97 std::vector<std::vector<std::pair<uint_t, real_t>>> state_actions_prob_;
// real_t: declared as `double real_t` (definition: bitrl_types.h:23)
// uint_t: declared as `std::size_t uint_t` (definition: bitrl_types.h:43)
// bool operator==(const UniformDiscretePolicy &p1, const UniformDiscretePolicy &p2) (definition: uniform_discrete_policy.h:106)
// bool operator!=(const UniformDiscretePolicy &p1, const UniformDiscretePolicy &p2) (definition: uniform_discrete_policy.h:111)
// Various utilities used when working with RL problems. (definition: cuberl_types.h:16)