A | AIToolbox::MDP::OffPolicyBase | protected |
alpha_ | AIToolbox::MDP::OffPolicyBase | protected |
clearTraces() | AIToolbox::MDP::OffPolicyBase | |
discount_ | AIToolbox::MDP::OffPolicyBase | protected |
getA() const | AIToolbox::MDP::OffPolicyBase | |
getDiscount() const | AIToolbox::MDP::OffPolicyBase | |
getLambda() const | AIToolbox::MDP::TreeBackupLEvaluation | inline |
getLearningRate() const | AIToolbox::MDP::OffPolicyBase | |
getQFunction() const | AIToolbox::MDP::OffPolicyBase | |
getS() const | AIToolbox::MDP::OffPolicyBase | |
getTolerance() const | AIToolbox::MDP::OffPolicyBase | |
getTraces() const | AIToolbox::MDP::OffPolicyBase | |
OffPolicyBase(size_t s, size_t a, double discount=1.0, double alpha=0.1, double tolerance=0.001) | AIToolbox::MDP::OffPolicyBase | |
OffPolicyEvaluation(const PolicyInterface &target, double discount=1.0, double alpha=0.1, double tolerance=0.001) | AIToolbox::MDP::OffPolicyEvaluation< TreeBackupLEvaluation > | |
Parent typedef | AIToolbox::MDP::TreeBackupLEvaluation | |
q_ | AIToolbox::MDP::OffPolicyBase | protected |
S | AIToolbox::MDP::OffPolicyBase | protected |
setDiscount(double d) | AIToolbox::MDP::OffPolicyBase | |
setLambda(double l) | AIToolbox::MDP::TreeBackupLEvaluation | inline |
setLearningRate(double a) | AIToolbox::MDP::OffPolicyBase | |
setQFunction(const QFunction &qfun) | AIToolbox::MDP::OffPolicyBase | |
setTolerance(double t) | AIToolbox::MDP::OffPolicyBase | |
setTraces(const Traces &t) | AIToolbox::MDP::OffPolicyBase | |
stepUpdateQ(const size_t s, const size_t a, const size_t s1, const double rew) | AIToolbox::MDP::OffPolicyEvaluation< TreeBackupLEvaluation > | |
target_ | AIToolbox::MDP::OffPolicyEvaluation< TreeBackupLEvaluation > | protected |
tolerance_ | AIToolbox::MDP::OffPolicyBase | protected |
Trace typedef | AIToolbox::MDP::OffPolicyBase | |
Traces typedef | AIToolbox::MDP::OffPolicyBase | |
traces_ | AIToolbox::MDP::OffPolicyBase | protected |
TreeBackupLEvaluation(const PolicyInterface &target, const double discount, const double alpha, const double lambda, const double tolerance) | AIToolbox::MDP::TreeBackupLEvaluation | inline |
updateTraces(size_t s, size_t a, double error, double traceDiscount) | AIToolbox::MDP::OffPolicyBase | protected |