|
bitrl & cuberl Documentation
Simulation engine for reinforcement learning agents
|
Base class for nodes in a Monte Carlo (MC) tree search. More...
#include <mcts_node.h>

Public Types | |
| typedef ActionTp | action_type |
| typedef StateTp | state_type |
Public Member Functions | |
| MCTSNodeBase (std::shared_ptr< MCTSNodeBase > parent, action_type action) | |
| MCTSNodeBase. | |
| virtual | ~MCTSNodeBase ()=default |
| void | add_child (std::shared_ptr< MCTSNodeBase< ActionTp, StateTp > > child) |
| add_child | |
| void | add_child (std::shared_ptr< MCTSNodeBase< ActionTp, StateTp > > parent, action_type action) |
| add_child | |
| bool | has_children () const noexcept |
| has_children | |
| std::shared_ptr< MCTSNodeBase > | get_child (uint_t cidx) |
| get_child | |
| uint_t | n_children () const noexcept |
| n_children | |
| void | shuffle_children () noexcept |
| shuffle_children | |
| uint_t | n_explored_children () const noexcept |
| n_explored_children | |
| void | update_visits () noexcept |
| update_visits | |
| void | update_explored_children () noexcept |
| void | update_total_score (real_t score) noexcept |
| update_total_score | |
| real_t | ucb (real_t temperature) const |
| ucb | |
| std::shared_ptr< MCTSNodeBase > | max_ucb_child (real_t temperature) const |
| max_ucb_child | |
| real_t | win_pct () const |
| win_pct | |
| uint_t | total_visits () const noexcept |
| total_visits | |
| uint_t | get_action () const noexcept |
| get_action | |
| std::shared_ptr< MCTSNodeBase > | parent () |
| parent | |
Protected Attributes | |
| real_t | total_score_ |
| total_score_ | |
| uint_t | total_visits_ |
| total_visits_ | |
| uint_t | explored_children_ |
| explored_children_ | |
| action_type | action_ |
| action_ | |
| std::shared_ptr< MCTSNodeBase > | parent_ |
| parent_ | |
| std::vector< std::shared_ptr< MCTSNodeBase > > | children_ |
| children_ | |
Base class for nodes in a Monte Carlo (MC) tree search.
| typedef ActionTp cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::action_type |
| typedef StateTp cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::state_type |
| cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::MCTSNodeBase | ( | std::shared_ptr< MCTSNodeBase< ActionTp, StateTp > > | parent, |
| action_type | action | ||
| ) |
MCTSNodeBase.
| parent | |
| action |
|
virtual default |
| void cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::add_child | ( | std::shared_ptr< MCTSNodeBase< ActionTp, StateTp > > | child | ) |
add_child
| child |
| void cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::add_child | ( | std::shared_ptr< MCTSNodeBase< ActionTp, StateTp > > | parent, |
| action_type | action | ||
| ) |
add_child
| parent | |
| action |
|
inline noexcept |
get_action
|
inline |
get_child
| cidx |
|
inline noexcept |
has_children
| std::shared_ptr< MCTSNodeBase< ActionTp, StateTp > > cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::max_ucb_child | ( | real_t | temperature | ) | const |
max_ucb_child
|
inline noexcept |
n_children
|
inline noexcept |
n_explored_children
|
inline |
parent
|
noexcept |
shuffle_children
|
inline noexcept |
total_visits
| real_t cubeai::rl::algos::mc::MCTSNodeBase< ActionTp, StateTp >::ucb | ( | real_t | temperature | ) | const |
ucb
| temperature |
|
inline noexcept |
|
inline noexcept |
update_total_score
| score |
|
inline noexcept |
update_visits
|
inline |
win_pct
|
protected |
action_
|
protected |
children_
|
protected |
explored_children_
|
protected |
parent_
|
protected |
total_score_
|
protected |
total_visits_