bitrl_cuberl_docs/reinforce__loss_8h_source.html

#ifndef REINFORCE_LOSS_H

#define REINFORCE_LOSS_H


#include "cuberl/base/cuberl_config.h"


#ifdef USE_PYTORCH


#include "cuberl/base/cuberl_types.h"

#include "bitrl/bitrl_consts.h"


#include <vector>


namespace cuberl {

namespace rl {

namespace algos {

namespace pg {


    // using namespace bitrl::consts;  -- left disabled: this header spells out bitrl::consts:: explicitly where needed


/// @brief Declaration of the loss-item helper of this REINFORCE loss header.
///
/// Only the prototype lives here; the definition is in another translation
/// unit, so the exact formula is not visible from this file.
///
/// @param rewards    Read-only sequence of scalar values (real_t).
/// @param log_probs  Read-only sequence of tensors. Presumably the
///                   log-probabilities of the taken actions, aligned
///                   element-wise with @p rewards -- TODO confirm against
///                   the definition.
/// @return A vector of tensors. Presumably one loss term per input entry
///         -- TODO confirm against the definition.
std::vector<torch_tensor_t>
compute_loss_item(const std::vector<real_t>& rewards,
                  const std::vector<torch_tensor_t>& log_probs);


/// @brief Declaration of the constant-baseline helper.
///
/// Only the prototype lives here; the definition is in another translation
/// unit.
///
/// @param rewards   Read-only sequence of scalar values (real_t).
/// @param constant  Scalar passed by value. Presumably the baseline that is
///                  combined with (e.g. subtracted from) every reward
///                  -- TODO confirm against the definition.
/// @return A vector of real_t. Presumably the baselined rewards, one per
///         input entry -- TODO confirm against the definition.
std::vector<real_t>
compute_baseline_with_constant(const std::vector<real_t>& rewards,
                               real_t constant);


/// @brief Declaration of the mean-baseline helper.
///
/// Only the prototype lives here; the definition is in another translation
/// unit.
///
/// @param rewards  Read-only sequence of scalar values (real_t).
/// @return A vector of real_t. Presumably the rewards with their mean used
///         as the baseline -- TODO confirm against the definition.
std::vector<real_t>
compute_baseline_with_mean(const std::vector<real_t>& rewards);


/// @brief Declaration of the standardization-baseline helper.
///
/// Only the prototype lives here; the definition is in another translation
/// unit.
///
/// @param rewards  Read-only sequence of scalar values (real_t).
/// @param eps      Scalar passed by value; defaults to
///                 bitrl::consts::TOLERANCE when omitted. Presumably a small
///                 term guarding the division by the standard deviation
///                 -- TODO confirm against the definition.
/// @return A vector of real_t. Presumably the standardized rewards, one per
///         input entry -- TODO confirm against the definition.
std::vector<real_t>
compute_baseline_with_standardization(const std::vector<real_t>& rewards,
                                      real_t eps = bitrl::consts::TOLERANCE);


}

}

}

}


#endif

#endif

bitrl_consts.h

cuberl_types.h

bitrl::consts::TOLERANCE
const real_t TOLERANCE
Tolerance used around the library.
Definition bitrl_consts.h:31

bitrl::real_t
double real_t
real_t
Definition bitrl_types.h:23

cuberl
Various utilities used when working with RL problems.
Definition cuberl_types.h:16