|
Mungojerrie
1.0
Mungojerrie
|
Go to the documentation of this file.
53 saveStratFilename =
"";
57 std::string dotLearnFilename;
59 std::string prismLearnFilename;
60 Verbosity::Level verbosity;
62 std::string saveQFilename;
63 std::string loadQFilename;
64 double checkpointFreq;
65 std::string saveStratFilename;
67 bool parallelizedUpdate;
72 friend std::ostream & operator<<(std::ostream & os, Qtype
const & Q);
91 void SarsaLambda(
double lambda,
bool replacingTrace,
unsigned int numEpisodes,
92 double alpha,
double linearAlphaDecay,
double discount,
93 double epsilon,
double linearExploreDecay,
double initValue);
107 void DoubleQLearning(
unsigned int numEpisodes,
double alpha,
double linearAlphaDecay,
108 double discount,
double epsilon,
double linearExploreDecay,
double initValue);
122 void QLearning(
unsigned int numEpisodes,
double alpha,
double linearAlphaDecay,
123 double discount,
double epsilon,
double linearExploreDecay,
double initValue);
141 double epsilon,
double linearExploreDecay,
double eta,
148 std::string dotLearnFilename;
149 std::string prismLearnFilename;
150 Verbosity::Level verbosity;
152 std::string saveQFilename;
153 std::string loadQFilename;
154 double checkpointFreq;
155 std::string saveStratFilename;
157 bool parallelizedUpdate;
158 static int constexpr progressBarLength = 25;
Interface between learner and model/objective.
Definition: Learner.hh:48
void DifferentialQLearning(unsigned int numEpisodes, double alpha, double linearAlphaDecay, double epsilon, double linearExploreDecay, double eta, double initValue)
Runs the Differential Q-learning algorithm.
Definition: Learner.cc:854
Learner(Gym gym, LearnerOptions options)
Constructor for learner.
Definition: Learner.cc:47
void QLearning(unsigned int numEpisodes, double alpha, double linearAlphaDecay, double discount, double epsilon, double linearExploreDecay, double initValue)
Runs the Q-learning algorithm.
Definition: Learner.cc:609
Class for a learning interface.
Definition: Gym.hh:253
Definition: Learner.hh:70
void SarsaLambda(double lambda, bool replacingTrace, unsigned int numEpisodes, double alpha, double linearAlphaDecay, double discount, double epsilon, double linearExploreDecay, double initValue)
Runs the Sarsa(λ) algorithm.
Definition: Learner.cc:225
void DoubleQLearning(unsigned int numEpisodes, double alpha, double linearAlphaDecay, double discount, double epsilon, double linearExploreDecay, double initValue)
Runs the Double Q-learning algorithm.
Definition: Learner.cc:406