aggregated_policy.hpp
/**
 * @file aggregated_policy.hpp
 *
 * Aggregated behavior policy: samples actions from one of several child
 * policies, chosen at random according to a fixed discrete distribution.
 */
#ifndef MLPACK_METHODS_RL_POLICY_AGGREGATED_POLICY_HPP
#define MLPACK_METHODS_RL_POLICY_AGGREGATED_POLICY_HPP

#include <mlpack/prereqs.hpp>
#include <mlpack/core/dists/discrete_distribution.hpp>

namespace mlpack {
namespace rl {
/**
 * A policy that aggregates several child policies: each time an action is
 * sampled, one child policy is selected according to a fixed probability
 * distribution and used to produce the action.
 *
 * @tparam PolicyType The type of the child policies.
 */
template <typename PolicyType>
class AggregatedPolicy
{
 public:
  //! Convenient typedef for action.
  using ActionType = typename PolicyType::ActionType;

  /**
   * Construct an aggregated policy.
   *
   * @param policies The child policies to aggregate.
   * @param distribution Probability of selecting each child policy; its size
   *     should equal the number of policies and its elements should sum to 1.
   */
  AggregatedPolicy(std::vector<PolicyType> policies,
                   const arma::colvec& distribution) :
      policies(std::move(policies)),
      sampler({distribution})
  { /* Nothing to do here. */ }
  /**
   * Sample an action based on given action values.
   *
   * @param actionValue Values for each action.
   * @param deterministic If true, always sample greedily from the first policy.
   * @return Sampled action.
   */
  ActionType Sample(const arma::colvec& actionValue, bool deterministic = false)
  {
    if (deterministic)
      return policies.front().Sample(actionValue, true);

    // Draw a child policy index from the discrete distribution, then let that
    // policy sample the action.
    size_t selected = arma::as_scalar(sampler.Random());
    return policies[selected].Sample(actionValue, false);
  }
  /**
   * Exploration probability will anneal at each step, for every child policy.
   */
  void Anneal()
  {
    for (PolicyType& policy : policies)
      policy.Anneal();
  }
 private:
  //! Locally-stored child policies.
  std::vector<PolicyType> policies;

  //! Sampler used to select which child policy acts at each step.
  distribution::DiscreteDistribution sampler;
};

} // namespace rl
} // namespace mlpack

#endif
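
Below is a minimal usage sketch, not taken from mlpack itself. ToyPolicy is a hypothetical child policy written only to satisfy the interface AggregatedPolicy expects (an ActionType typedef plus Sample() and Anneal()), and the include path for this header, as well as the availability of mlpack::math::Random() and mlpack::math::RandInt(), are assumed for an mlpack 3.x-style build.

// Usage sketch (assumptions noted above): aggregate two exploration policies,
// picking the first 70% of the time and the second 30% of the time.
#include <iostream>
#include <vector>

#include <mlpack/core.hpp>
#include <mlpack/methods/reinforcement_learning/policy/aggregated_policy.hpp>

// Hypothetical child policy: greedy with probability (1 - epsilon),
// uniformly random otherwise.
struct ToyPolicy
{
  using ActionType = size_t;

  explicit ToyPolicy(const double epsilon) : epsilon(epsilon) { }

  ActionType Sample(const arma::colvec& actionValue, bool deterministic = false)
  {
    if (!deterministic && mlpack::math::Random() < epsilon)
      return (size_t) mlpack::math::RandInt(0, (int) actionValue.n_elem);
    return actionValue.index_max();
  }

  // Decay the exploration rate.
  void Anneal() { epsilon *= 0.99; }

  double epsilon;
};

int main()
{
  // Two child policies with different amounts of exploration.
  std::vector<ToyPolicy> children = { ToyPolicy(0.5), ToyPolicy(0.05) };

  // Probability of selecting each child policy; must sum to 1.
  arma::colvec distribution = { 0.7, 0.3 };

  mlpack::rl::AggregatedPolicy<ToyPolicy> policy(children, distribution);

  arma::colvec actionValue = { 0.1, 0.9, 0.3 };
  size_t action = policy.Sample(actionValue);        // Stochastic sampling.
  size_t greedy = policy.Sample(actionValue, true);  // Greedy via first child.

  policy.Anneal();  // Anneals every child policy.

  std::cout << "sampled: " << action << ", greedy: " << greedy << std::endl;
  return 0;
}

Note that the deterministic path always delegates to the first child policy, so the ordering of the policies vector matters when greedy evaluation is requested.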