14 #ifndef MLPACK_METHODS_RL_ASYNC_LEARNING_HPP
15 #define MLPACK_METHODS_RL_ASYNC_LEARNING_HPP
52 typename EnvironmentType,
72 UpdaterType updater = UpdaterType(),
73 EnvironmentType environment = EnvironmentType());
88 template <
typename Measure>
97 NetworkType&
Network() {
return learningNetwork; }
99 const NetworkType&
Network()
const {
return learningNetwork; }
104 const PolicyType&
Policy()
const {
return policy; }
109 const UpdaterType&
Updater()
const {
return updater; }
114 const EnvironmentType&
Environment()
const {
return environment; }
121 NetworkType learningNetwork;
130 EnvironmentType environment;
142 typename EnvironmentType,
143 typename NetworkType,
144 typename UpdaterType,
147 class OneStepQLearningWorker;
158 typename EnvironmentType,
159 typename NetworkType,
160 typename UpdaterType,
163 class OneStepSarsaWorker;
174 typename EnvironmentType,
175 typename NetworkType,
176 typename UpdaterType,
179 class NStepQLearningWorker;
190 typename EnvironmentType,
191 typename NetworkType,
192 typename UpdaterType,
196 NetworkType, UpdaterType, PolicyType>, EnvironmentType, NetworkType,
197 UpdaterType, PolicyType>;
208 typename EnvironmentType,
209 typename NetworkType,
210 typename UpdaterType,
214 NetworkType, UpdaterType, PolicyType>, EnvironmentType, NetworkType,
215 UpdaterType, PolicyType>;
226 typename EnvironmentType,
227 typename NetworkType,
228 typename UpdaterType,
232 NetworkType, UpdaterType, PolicyType>, EnvironmentType, NetworkType,
233 UpdaterType, PolicyType>;
239 #include "async_learning_impl.hpp"