mlpack-git/doxygen/mountain__car_8hpp_source.html

 #ifndef MLPACK_METHODS_RL_ENVIRONMENT_MOUNTAIN_CAR_HPP
 #define MLPACK_METHODS_RL_ENVIRONMENT_MOUNTAIN_CAR_HPP

 #include <mlpack/prereqs.hpp>
 #include <mlpack/core/math/clamp.hpp>

 namespace mlpack {
 namespace rl {

 /**
  * Implementation of the Mountain Car task.
  *
  * The environment state is a two-element vector (velocity, position).  At
  * every step the agent chooses one of three discrete actions (backward, stop,
  * forward); the action contributes a fixed push to the velocity, a
  * position-dependent cosine term is subtracted, and both velocity and
  * position are clamped to the ranges given at construction time.
  *
  * An episode ends when the position reaches `positionGoal` or when the
  * configured number of steps has been performed.
  */
 class MountainCar
 {
  public:
   /**
    * Implementation of the state of Mountain Car.  The state is stored as a
    * column vector whose element 0 is the velocity and whose element 1 is the
    * position.
    */
   class State
   {
    public:
     /**
      * Construct a state instance with all elements set to zero.
      */
     State(): data(dimension, arma::fill::zeros)
     { /* Nothing to do here. */ }

     /**
      * Construct a state based on the given data.
      *
      * @param data Column vector holding the state; element 0 is read as the
      *     velocity and element 1 as the position.
      */
     State(const arma::colvec& data): data(data)
     { /* Nothing to do here. */ }

     //! Modify the internal representation of the state.
     arma::colvec& Data() { return data; }

     //! Get the velocity (element 0 of the state vector).
     double Velocity() const { return data[0]; }
     //! Modify the velocity (element 0 of the state vector).
     double& Velocity() { return data[0]; }

     //! Get the position (element 1 of the state vector).
     double Position() const { return data[1]; }
     //! Modify the position (element 1 of the state vector).
     double& Position() { return data[1]; }

     //! Encode the state to a column vector.
     const arma::colvec& Encode() const { return data; }

     //! Dimension of the encoded state.
     static constexpr size_t dimension = 2;

    private:
     //! Locally-stored (velocity, position) vector.
     arma::colvec data;
   };

   /**
    * Implementation of the action of Mountain Car.
    */
   class Action
   {
    public:
     // The enumerator values matter: Sample() subtracts 1 from the chosen
     // action to obtain a push direction of -1 (backward), 0 (stop) or
     // +1 (forward).
     enum actions
     {
       backward,
       stop,
       forward
     };
     // To store the action.  Not initialized by default; callers are expected
     // to assign it before passing the Action to Sample().
     Action::actions action;

     // Track the size of the action space.
     static const size_t size = 3;
   };

   /**
    * Construct a Mountain Car instance using the given constants.
    *
    * @param maxSteps The number of steps after which the episode terminates.
    *     If the value is 0, there is no limit on the number of steps.
    * @param positionMin Minimum legal position.
    * @param positionMax Maximum legal position.
    * @param positionGoal Position at (or beyond) which the episode terminates
    *     successfully.
    * @param velocityMin Minimum legal velocity.
    * @param velocityMax Maximum legal velocity.
    * @param doneReward Reward returned when the goal is reached before the
    *     step limit is hit.
    */
   MountainCar(const size_t maxSteps = 200,
               const double positionMin = -1.2,
               const double positionMax = 0.6,
               const double positionGoal = 0.5,
               const double velocityMin = -0.07,
               const double velocityMax = 0.07,
               const double doneReward = 0) :
       maxSteps(maxSteps),
       positionMin(positionMin),
       positionMax(positionMax),
       positionGoal(positionGoal),
       velocityMin(velocityMin),
       velocityMax(velocityMax),
       doneReward(doneReward),
       stepsPerformed(0)
   { /* Nothing to do here */ }

   /**
    * Dynamics of Mountain Car.  Get the reward and the next state based on the
    * current state and the current action.  Every call increments the
    * internal step counter.
    *
    * @param state The current state.
    * @param action The current action.
    * @param nextState The next state (output).
    * @return 0 if the step limit has been reached, `doneReward` if the goal
    *     was reached before the step limit, and -1 otherwise.
    */
   double Sample(const State& state,
                 const Action& action,
                 State& nextState)
   {
     // Update the number of steps performed.
     stepsPerformed++;

     // Map the action {backward, stop, forward} onto a push of {-1, 0, +1}.
     const int direction = action.action - 1;

     // Calculate the new velocity and keep it within the legal range.
     nextState.Velocity() = state.Velocity() + 0.001 * direction - 0.0025 *
         std::cos(3 * state.Position());
     nextState.Velocity() = math::ClampRange(nextState.Velocity(),
         velocityMin, velocityMax);

     // Update the position using the *new* velocity, then clamp it as well.
     nextState.Position() = state.Position() + nextState.Velocity();
     nextState.Position() = math::ClampRange(nextState.Position(),
         positionMin, positionMax);

     // The car stops when it is pushed against the lower position bound.  The
     // exact comparison is intentional: after clamping, a position at the
     // bound is exactly equal to positionMin.
     if (nextState.Position() == positionMin && nextState.Velocity() < 0)
       nextState.Velocity() = 0.0;

     // Check if the episode has terminated.
     const bool done = IsTerminal(nextState);

     // Do not reward the agent if time ran out.
     if (done && maxSteps != 0 && stepsPerformed >= maxSteps)
       return 0;
     else if (done)
       return doneReward;

     return -1;
   }

   /**
    * Dynamics of Mountain Car.  Get the reward based on the current state and
    * the current action; the resulting next state is discarded.
    *
    * @param state The current state.
    * @param action The current action.
    * @return The reward, as described for the three-argument overload.
    */
   double Sample(const State& state, const Action& action)
   {
     State nextState;
     return Sample(state, action, nextState);
   }

   /**
    * Reset the step counter and return a fresh initial state: zero velocity
    * and a position drawn uniformly at random from [-0.6, -0.4].
    *
    * @return Initial state for each episode.
    */
   State InitialSample()
   {
     State state;
     stepsPerformed = 0;
     state.Velocity() = 0.0;
     state.Position() = arma::as_scalar(arma::randu(1)) * 0.2 - 0.6;
     return state;
   }

   /**
    * Check whether the given state is terminal, logging the reason to
    * Log::Info when it is.
    *
    * @param state The state to check.
    * @return true if the step limit (when non-zero) has been reached or the
    *     position is at or beyond the goal; false otherwise.
    */
   bool IsTerminal(const State& state) const
   {
     if (maxSteps != 0 && stepsPerformed >= maxSteps)
     {
       // Adjacent string literals are concatenated verbatim, so the trailing
       // space on the first literal is required to separate the words.
       Log::Info << "Episode terminated due to the maximum number of steps "
           "being taken.";
       return true;
     }
     else if (state.Position() >= positionGoal)
     {
       Log::Info << "Episode terminated due to agent succeeding.";
       return true;
     }
     return false;
   }

   //! Get the number of steps performed.
   size_t StepsPerformed() const { return stepsPerformed; }

   //! Get the maximum number of steps allowed.
   size_t MaxSteps() const { return maxSteps; }
   //! Set the maximum number of steps allowed.
   size_t& MaxSteps() { return maxSteps; }

  private:
   //! Locally-stored maximum number of steps (0 means no limit).
   size_t maxSteps;

   //! Locally-stored minimum legal position.
   double positionMin;

   //! Locally-stored maximum legal position.
   double positionMax;

   //! Locally-stored goal position.
   double positionGoal;

   //! Locally-stored minimum legal velocity.
   double velocityMin;

   //! Locally-stored maximum legal velocity.
   double velocityMax;

   //! Locally-stored reward returned when the goal is reached.
   double doneReward;

   //! Locally-stored number of steps performed in the current episode.
   size_t stepsPerformed;
 };

 } // namespace rl
 } // namespace mlpack

 #endif
mlpack::rl::MountainCar::Action
Implementation of action of Mountain Car.
Definition: mountain_car.hpp:79

mlpack::rl::MountainCar::IsTerminal
bool IsTerminal(const State &state) const
This function checks if the car has reached the terminal state.
Definition: mountain_car.hpp:202

mlpack::rl::MountainCar::MaxSteps
size_t MaxSteps() const
Get the maximum number of steps allowed.
Definition: mountain_car.hpp:222

mlpack
Linear algebra utility functions, generally performed on matrices or vectors.
Definition: add_to_cli11.hpp:21

mlpack::rl::MountainCar::InitialSample
State InitialSample()
Initial position is randomly generated within [-0.6, -0.4].
Definition: mountain_car.hpp:187

prereqs.hpp
The core includes that mlpack expects; standard C++ includes and Armadillo.

mlpack::rl::MountainCar::State::Encode
const arma::colvec & Encode() const
Encode the state to a column vector.
Definition: mountain_car.hpp:66

mlpack::rl::MountainCar::State::Position
double & Position()
Modify the position.
Definition: mountain_car.hpp:63

mlpack::rl::MountainCar::State::Velocity
double & Velocity()
Modify the velocity.
Definition: mountain_car.hpp:58

clamp.hpp
Miscellaneous math clamping routines.

mlpack::rl::MountainCar::Sample
double Sample(const State &state, const Action &action)
Dynamics of Mountain Car.
Definition: mountain_car.hpp:175

mlpack::Log::Info
static MLPACK_EXPORT util::PrefixedOutStream Info
Prints informational messages if --verbose is specified, prefixed with [INFO ].
Definition: log.hpp:84

mlpack::rl::MountainCar::State::State
State(const arma::colvec &data)
Construct a state based on the given data.
Definition: mountain_car.hpp:49

mlpack::rl::MountainCar::State::Data
arma::colvec & Data()
Modify the internal representation of the state.
Definition: mountain_car.hpp:53

mlpack::rl::MountainCar::MountainCar
MountainCar(const size_t maxSteps=200, const double positionMin=-1.2, const double positionMax=0.6, const double positionGoal=0.5, const double velocityMin=-0.07, const double velocityMax=0.07, const double doneReward=0)
Construct a Mountain Car instance using the given constants.
Definition: mountain_car.hpp:107

mlpack::rl::MountainCar::Action::stop
Definition: mountain_car.hpp:85

mlpack::rl::MountainCar::State
Implementation of state of Mountain Car.
Definition: mountain_car.hpp:35

mlpack::rl::MountainCar::State::State
State()
Construct a state instance.
Definition: mountain_car.hpp:41

mlpack::rl::MountainCar::Action::action
Action::actions action
Definition: mountain_car.hpp:89

mlpack::rl::MountainCar
Implementation of Mountain Car task.
Definition: mountain_car.hpp:28

mlpack::rl::MountainCar::StepsPerformed
size_t StepsPerformed() const
Get the number of steps performed.
Definition: mountain_car.hpp:219

mlpack::rl::MountainCar::MaxSteps
size_t & MaxSteps()
Set the maximum number of steps allowed.
Definition: mountain_car.hpp:224

mlpack::rl::MountainCar::Sample
double Sample(const State &state, const Action &action, State &nextState)
Dynamics of Mountain Car.
Definition: mountain_car.hpp:133

mlpack::rl::MountainCar::State::Position
double Position() const
Get the position.
Definition: mountain_car.hpp:61

mlpack::rl::MountainCar::State::dimension
static constexpr size_t dimension
Dimension of the encoded state.
Definition: mountain_car.hpp:69

mlpack::rl::MountainCar::State::Velocity
double Velocity() const
Get the velocity.
Definition: mountain_car.hpp:56

mlpack::rl::MountainCar::Action::backward
Definition: mountain_car.hpp:84

mlpack::math::ClampRange
double ClampRange(double value, const double rangeMin, const double rangeMax)
Clamp a number between a particular range.
Definition: clamp.hpp:53

mlpack::rl::MountainCar::Action::actions
actions
Definition: mountain_car.hpp:82