| Public Member Functions | |
| TrainingConfig () | |
| TrainingConfig (size_t numWorkers, size_t updateInterval, size_t targetNetworkSyncInterval, size_t stepLimit, size_t explorationSteps, double stepSize, double discount, double gradientLimit, bool doubleQLearning, bool noisyQLearning, bool isCategorical, size_t atomSize, double vMin, double vMax, double rho) | |
| size_t | AtomSize () const | 
| Get the number of atoms.  More... | |
| size_t & | AtomSize () | 
| Modify the number of atoms.  More... | |
| double | Discount () const | 
| Get the discount rate for future reward.  More... | |
| double & | Discount () | 
| Modify the discount rate for future reward.  More... | |
| bool | DoubleQLearning () const | 
| Get the indicator of double q-learning.  More... | |
| bool & | DoubleQLearning () | 
| Modify the indicator of double q-learning.  More... | |
| size_t | ExplorationSteps () const | 
| Get the exploration steps.  More... | |
| size_t & | ExplorationSteps () | 
| Modify the exploration steps.  More... | |
| double | GradientLimit () const | 
| Get the limit of update gradient.  More... | |
| double & | GradientLimit () | 
| Modify the limit of update gradient.  More... | |
| bool | IsCategorical () const | 
| Get the indicator of categorical q-learning.  More... | |
| bool & | IsCategorical () | 
| Modify the indicator of categorical q-learning.  More... | |
| bool | NoisyQLearning () const | 
| Get the indicator of noisy q-learning.  More... | |
| bool & | NoisyQLearning () | 
| Modify the indicator of double q-learning.  More... | |
| size_t | NumWorkers () const | 
| Get the amount of workers.  More... | |
| size_t & | NumWorkers () | 
| Modify the amount of workers.  More... | |
| double | Rho () const | 
| Get the rho value for sac.  More... | |
| double & | Rho () | 
| Modify the rho value for sac.  More... | |
| size_t | StepLimit () const | 
| Get the maximum steps of each episode.  More... | |
| size_t & | StepLimit () | 
| Modify the maximum steps of each episode.  More... | |
| double | StepSize () const | 
| Get the step size of the optimizer.  More... | |
| double & | StepSize () | 
| Modify the step size of the optimizer.  More... | |
| size_t | TargetNetworkSyncInterval () const | 
| Get the interval for syncing target network.  More... | |
| size_t & | TargetNetworkSyncInterval () | 
| Modify the interval for syncing target network.  More... | |
| size_t | UpdateInterval () const | 
| Get the update interval.  More... | |
| size_t & | UpdateInterval () | 
| Modify the update interval.  More... | |
| double | VMax () const | 
| Get the maximum value for support.  More... | |
| double & | VMax () | 
| Modify the maximum value for support.  More... | |
| double | VMin () const | 
| Get the minimum value for support.  More... | |
| double & | VMin () | 
| Modify the minimum value for support.  More... | |
Definition at line 19 of file training_config.hpp.
| 
 | inline | 
Definition at line 22 of file training_config.hpp.
| 
 | inline | 
Definition at line 40 of file training_config.hpp.
| 
 | inline | 
Get the number of atoms.
Definition at line 133 of file training_config.hpp.
| 
 | inline | 
Modify the number of atoms.
Definition at line 135 of file training_config.hpp.
| 
 | inline | 
Get the discount rate for future reward.
Definition at line 108 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
| 
 | inline | 
Modify the discount rate for future reward.
Definition at line 110 of file training_config.hpp.
| 
 | inline | 
Get the indicator of double q-learning.
Definition at line 118 of file training_config.hpp.
| 
 | inline | 
Modify the indicator of double q-learning.
Definition at line 120 of file training_config.hpp.
| 
 | inline | 
Get the exploration steps.
Definition at line 98 of file training_config.hpp.
| 
 | inline | 
Modify the exploration steps.
Definition at line 100 of file training_config.hpp.
| 
 | inline | 
Get the limit of update gradient.
Definition at line 113 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
| 
 | inline | 
Modify the limit of update gradient.
Definition at line 115 of file training_config.hpp.
| 
 | inline | 
Get the indicator of categorical q-learning.
Definition at line 128 of file training_config.hpp.
| 
 | inline | 
Modify the indicator of categorical q-learning.
Definition at line 130 of file training_config.hpp.
| 
 | inline | 
Get the indicator of noisy q-learning.
Definition at line 123 of file training_config.hpp.
| 
 | inline | 
Modify the indicator of double q-learning.
Definition at line 125 of file training_config.hpp.
| 
 | inline | 
Get the amount of workers.
Definition at line 74 of file training_config.hpp.
| 
 | inline | 
Modify the amount of workers.
Definition at line 76 of file training_config.hpp.
| 
 | inline | 
Get the rho value for sac.
Definition at line 148 of file training_config.hpp.
| 
 | inline | 
Modify the rho value for sac.
Definition at line 150 of file training_config.hpp.
| 
 | inline | 
Get the maximum steps of each episode.
Definition at line 90 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
| 
 | inline | 
Modify the maximum steps of each episode.
Setting it to 0 means no limit.
Definition at line 95 of file training_config.hpp.
| 
 | inline | 
Get the step size of the optimizer.
Definition at line 103 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
| 
 | inline | 
Modify the step size of the optimizer.
Definition at line 105 of file training_config.hpp.
| 
 | inline | 
Get the interval for syncing target network.
Definition at line 84 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
| 
 | inline | 
Modify the interval for syncing target network.
Definition at line 87 of file training_config.hpp.
| 
 | inline | 
Get the update interval.
Definition at line 79 of file training_config.hpp.
Referenced by NStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), OneStepQLearningWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step(), and OneStepSarsaWorker< EnvironmentType, NetworkType, UpdaterType, PolicyType >::Step().
| 
 | inline | 
Modify the update interval.
Definition at line 81 of file training_config.hpp.
| 
 | inline | 
Get the maximum value for support.
Definition at line 143 of file training_config.hpp.
| 
 | inline | 
Modify the maximum value for support.
Definition at line 145 of file training_config.hpp.
| 
 | inline | 
Get the minimum value for support.
Definition at line 138 of file training_config.hpp.
| 
 | inline | 
Modify the minimum value for support.
Definition at line 140 of file training_config.hpp.