Public Member Functions | |
TrainingConfig () | |
TrainingConfig (size_t numWorkers, size_t updateInterval, size_t targetNetworkSyncInterval, size_t stepLimit, size_t explorationSteps, double stepSize, double discount, double gradientLimit, bool doubleQLearning, bool noisyQLearning, bool isCategorical, size_t atomSize, double vMin, double vMax, double rho) | |
size_t | AtomSize () const |
Get the number of atoms. More... | |
size_t & | AtomSize () |
Modify the number of atoms. More... | |
double | Discount () const |
Get the discount rate for future reward. More... | |
double & | Discount () |
Modify the discount rate for future reward. More... | |
bool | DoubleQLearning () const |
Get the indicator of double q-learning. More... | |
bool & | DoubleQLearning () |
Modify the indicator of double q-learning. More... | |
size_t | ExplorationSteps () const |
Get the exploration steps. More... | |
size_t & | ExplorationSteps () |
Modify the exploration steps. More... | |
double | GradientLimit () const |
Get the limit of update gradient. More... | |
double & | GradientLimit () |
Modify the limit of update gradient. More... | |
bool | IsCategorical () const |
Get the indicator of categorical q-learning. More... | |
bool & | IsCategorical () |
Modify the indicator of categorical q-learning. More... | |
bool | NoisyQLearning () const |
Get the indicator of noisy q-learning. More... | |
bool & | NoisyQLearning () |
Modify the indicator of double q-learning. More... | |
size_t | NumWorkers () const |
Get the amount of workers. More... | |
size_t & | NumWorkers () |
Modify the amount of workers. More... | |
double | Rho () const |
Get the rho value for sac. More... | |
double & | Rho () |
Modify the rho value for sac. More... | |
size_t | StepLimit () const |
Get the maximum steps of each episode. More... | |
size_t & | StepLimit () |
Modify the maximum steps of each episode. More... | |
double | StepSize () const |
Get the step size of the optimizer. More... | |
double & | StepSize () |
Modify the step size of the optimizer. More... | |
size_t | TargetNetworkSyncInterval () const |
Get the interval for syncing target network. More... | |
size_t & | TargetNetworkSyncInterval () |
Modify the interval for syncing target network. More... | |
size_t | UpdateInterval () const |
Get the update interval. More... | |
size_t & | UpdateInterval () |
Modify the update interval. More... | |
double | VMax () const |
Get the maximum value for support. More... | |
double & | VMax () |
Modify the maximum value for support. More... | |
double | VMin () const |
Get the minimum value for support. More... | |
double & | VMin () |
Modify the minimum value for support. More... | |
Definition at line 19 of file training_config.hpp.
|
inline |
Definition at line 22 of file training_config.hpp.
|
inline |
Definition at line 40 of file training_config.hpp.
|
inline |
Get the number of atoms.
Definition at line 133 of file training_config.hpp.
|
inline |
Modify the number of atoms.
Definition at line 135 of file training_config.hpp.
|
inline |
Get the discount rate for future reward.
Definition at line 108 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
|
inline |
Modify the discount rate for future reward.
Definition at line 110 of file training_config.hpp.
|
inline |
Get the indicator of double q-learning.
Definition at line 118 of file training_config.hpp.
|
inline |
Modify the indicator of double q-learning.
Definition at line 120 of file training_config.hpp.
|
inline |
Get the exploration steps.
Definition at line 98 of file training_config.hpp.
|
inline |
Modify the exploration steps.
Definition at line 100 of file training_config.hpp.
|
inline |
Get the limit of update gradient.
Definition at line 113 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
|
inline |
Modify the limit of update gradient.
Definition at line 115 of file training_config.hpp.
|
inline |
Get the indicator of categorical q-learning.
Definition at line 128 of file training_config.hpp.
|
inline |
Modify the indicator of categorical q-learning.
Definition at line 130 of file training_config.hpp.
|
inline |
Get the indicator of noisy q-learning.
Definition at line 123 of file training_config.hpp.
|
inline |
Modify the indicator of double q-learning.
Definition at line 125 of file training_config.hpp.
|
inline |
Get the amount of workers.
Definition at line 74 of file training_config.hpp.
|
inline |
Modify the amount of workers.
Definition at line 76 of file training_config.hpp.
|
inline |
Get the rho value for sac.
Definition at line 148 of file training_config.hpp.
|
inline |
Modify the rho value for sac.
Definition at line 150 of file training_config.hpp.
|
inline |
Get the maximum steps of each episode.
Definition at line 90 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
|
inline |
Modify the maximum steps of each episode.
Setting it to 0 means no limit.
Definition at line 95 of file training_config.hpp.
|
inline |
Get the step size of the optimizer.
Definition at line 103 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
|
inline |
Modify the step size of the optimizer.
Definition at line 105 of file training_config.hpp.
|
inline |
Get the interval for syncing target network.
Definition at line 84 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
|
inline |
Modify the interval for syncing target network.
Definition at line 87 of file training_config.hpp.
|
inline |
Get the update interval.
Definition at line 79 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
|
inline |
Modify the update interval.
Definition at line 81 of file training_config.hpp.
|
inline |
Get the maximum value for support.
Definition at line 143 of file training_config.hpp.
|
inline |
Modify the maximum value for support.
Definition at line 145 of file training_config.hpp.
|
inline |
Get the minimum value for support.
Definition at line 138 of file training_config.hpp.
|
inline |
Modify the minimum value for support.
Definition at line 140 of file training_config.hpp.