Forward declaration of NStepQLearningWorker.
Public Types
| using | ActionType = typename EnvironmentType::Action |
| using | StateType = typename EnvironmentType::State |
| using | TransitionType = std::tuple< StateType, ActionType, double, StateType > |
Public Member Functions
| NStepQLearningWorker (const UpdaterType &updater, const EnvironmentType &environment, const TrainingConfig &config, bool deterministic) | |
| Construct N-step Q-Learning worker with the given parameters and environment. | |
| NStepQLearningWorker (const NStepQLearningWorker &other) | |
| Copy another NStepQLearningWorker. | |
| NStepQLearningWorker (NStepQLearningWorker &&other) | |
| Take ownership of another NStepQLearningWorker. | |
| ~NStepQLearningWorker () | |
| Clean up allocated memory. | |
| void | Initialize (NetworkType &learningNetwork) |
| Initialize the worker. | |
| NStepQLearningWorker & | operator= (const NStepQLearningWorker &other) |
| Copy another NStepQLearningWorker. | |
| NStepQLearningWorker & | operator= (NStepQLearningWorker &&other) |
| Take ownership of another NStepQLearningWorker. | |
| bool | Step (NetworkType &learningNetwork, NetworkType &targetNetwork, size_t &totalSteps, PolicyType &policy, double &totalReward) |
| The agent will execute one step. | |
N-step Q-Learning worker.

Template Parameters
| EnvironmentType | The type of the reinforcement learning task. |
| NetworkType | The type of the network model. |
| UpdaterType | The type of the optimizer. |
| PolicyType | The type of the behavior policy. |
Definition at line 179 of file async_learning.hpp.
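To make the template parameters concrete, the following is a minimal sketch of one way they might be filled in. The CartPole environment, the FFN network with MeanSquaredError and GaussianInitialization, GreedyPolicy, ensmallen's AdamUpdate, and the header paths are assumptions drawn from mlpack's wider API, not requirements stated on this page:

```cpp
// Hypothetical instantiation of the four template parameters (header
// paths are approximate and follow mlpack's usual layout).
#include <mlpack/methods/ann/ffn.hpp>
#include <mlpack/methods/reinforcement_learning/environment/cart_pole.hpp>
#include <mlpack/methods/reinforcement_learning/policy/greedy_policy.hpp>
#include <mlpack/methods/reinforcement_learning/worker/n_step_q_learning_worker.hpp>
#include <ensmallen.hpp>

using EnvironmentType = mlpack::rl::CartPole;
using NetworkType = mlpack::ann::FFN<mlpack::ann::MeanSquaredError<>,
                                     mlpack::ann::GaussianInitialization>;
using UpdaterType = ens::AdamUpdate;
using PolicyType = mlpack::rl::GreedyPolicy<EnvironmentType>;

using WorkerType = mlpack::rl::NStepQLearningWorker<
    EnvironmentType, NetworkType, UpdaterType, PolicyType>;
```

The later sketches on this page reuse these aliases.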
using ActionType = typename EnvironmentType::Action

Definition at line 40 of file n_step_q_learning_worker.hpp.

using StateType = typename EnvironmentType::State

Definition at line 39 of file n_step_q_learning_worker.hpp.

using TransitionType = std::tuple<StateType, ActionType, double, StateType>

Definition at line 41 of file n_step_q_learning_worker.hpp.
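The tuple layout is (state, action, reward, next state). A self-contained sketch with stand-in state and action types (the real types come from EnvironmentType) showing how the elements are accessed:

```cpp
#include <tuple>

// Stand-ins for EnvironmentType::State and EnvironmentType::Action,
// purely for illustration.
using StateType = int;
using ActionType = int;
using TransitionType = std::tuple<StateType, ActionType, double, StateType>;

int main()
{
  // Taking action 1 in state 3 yields reward 1.0 and next state 4.
  TransitionType transition(3, 1, 1.0, 4);

  double reward = std::get<2>(transition);       // third element: reward
  StateType nextState = std::get<3>(transition); // fourth element: next state
  return (reward == 1.0 && nextState == 4) ? 0 : 1;
}
```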
NStepQLearningWorker (const UpdaterType &updater, const EnvironmentType &environment, const TrainingConfig &config, bool deterministic)  [inline]

Construct N-step Q-Learning worker with the given parameters and environment.

Parameters
| updater | The optimizer. |
| environment | The reinforcement learning task. |
| config | Hyper-parameters. |
| deterministic | Whether the worker should act deterministically. |
Definition at line 52 of file n_step_q_learning_worker.hpp.
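A hedged construction sketch, reusing the hypothetical aliases from the sketch above. The setter-style TrainingConfig mutators mirror the getters that Step() is documented to reference below, but their exact form here is an assumption:

```cpp
// Continuing the earlier sketch; the config mutators are assumptions.
ens::AdamUpdate updater;
EnvironmentType environment;

mlpack::rl::TrainingConfig config;
config.StepSize() = 0.01;                 // optimizer step size
config.Discount() = 0.99;                 // discount factor
config.UpdateInterval() = 5;              // n: steps per n-step update
config.TargetNetworkSyncInterval() = 100; // how often to sync the target

// deterministic = false: the worker explores via the behavior policy.
WorkerType worker(updater, environment, config, /* deterministic */ false);
```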
NStepQLearningWorker (const NStepQLearningWorker &other)  [inline]

Copy another NStepQLearningWorker.

Parameters
| other | NStepQLearningWorker to copy. |
Definition at line 72 of file n_step_q_learning_worker.hpp.
NStepQLearningWorker (NStepQLearningWorker &&other)  [inline]

Take ownership of another NStepQLearningWorker.

Parameters
| other | NStepQLearningWorker to take ownership of. |
Definition at line 102 of file n_step_q_learning_worker.hpp.
~NStepQLearningWorker ()  [inline]

Clean up allocated memory.
Definition at line 204 of file n_step_q_learning_worker.hpp.
void Initialize (NetworkType &learningNetwork)  [inline]

Initialize the worker.

Parameters
| learningNetwork | The shared network. |
Definition at line 215 of file n_step_q_learning_worker.hpp.
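Usage sketch: before stepping, the worker receives the shared learning network so it can set up its own working copy. In practice the async learning driver is expected to call this; doing it by hand is shown only for illustration:

```cpp
// Continuing the earlier sketch. Layer setup of the network is omitted.
NetworkType learningNetwork;
worker.Initialize(learningNetwork);
```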
NStepQLearningWorker & operator= (const NStepQLearningWorker &other)  [inline]

Copy another NStepQLearningWorker.

Parameters
| other | NStepQLearningWorker to copy. |
Definition at line 132 of file n_step_q_learning_worker.hpp.
NStepQLearningWorker & operator= (NStepQLearningWorker &&other)  [inline]

Take ownership of another NStepQLearningWorker.

Parameters
| other | NStepQLearningWorker to take ownership of. |
Definition at line 169 of file n_step_q_learning_worker.hpp.
bool Step (NetworkType &learningNetwork, NetworkType &targetNetwork, size_t &totalSteps, PolicyType &policy, double &totalReward)  [inline]

The agent will execute one step.

Parameters
| learningNetwork | The shared learning network. |
| targetNetwork | The shared target network. |
| totalSteps | The shared counter for total steps. |
| policy | The shared behavior policy. |
| totalReward | Set to the episode return if the episode ends after this step; otherwise its value is meaningless. |
Definition at line 244 of file n_step_q_learning_worker.hpp.
References TrainingConfig::Discount(), TrainingConfig::GradientLimit(), TrainingConfig::StepLimit(), TrainingConfig::StepSize(), TrainingConfig::TargetNetworkSyncInterval(), and TrainingConfig::UpdateInterval().
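Putting the pieces together, a hedged sketch of a driver loop around Step(). In mlpack this loop normally lives inside the async learning machinery; the GreedyPolicy constructor arguments and the reading of the bool return value as "episode ended" are assumptions, not guarantees made by this page:

```cpp
#include <iostream>

// Continuing the earlier sketches.
NetworkType targetNetwork = learningNetwork;  // worker's shared target copy
PolicyType policy(/* initialEpsilon */ 1.0,
                  /* annealInterval */ 1000,
                  /* minEpsilon */ 0.1);
size_t totalSteps = 0;
double totalReward = 0.0;

const size_t maxSteps = 10000;  // arbitrary training budget for the sketch
while (totalSteps < maxSteps)
{
  // totalSteps is advanced through the shared reference; totalReward is
  // only meaningful when this step ends an episode (assumed to be what
  // the return value flags).
  const bool episodeEnded = worker.Step(learningNetwork, targetNetwork,
                                        totalSteps, policy, totalReward);
  if (episodeEnded)
    std::cout << "Episode return: " << totalReward << std::endl;
}
```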