A | AIToolbox::PolicyInterface< void, void, size_t > | protected |
Base typedef | AIToolbox::Bandit::PolicyInterface | |
ESRLPolicy(size_t A, double a, unsigned timesteps, unsigned explorationPhases, unsigned window) | AIToolbox::Bandit::ESRLPolicy | |
getA() const | AIToolbox::PolicyInterface< void, void, size_t > | |
getActionProbability(const size_t &a) const override | AIToolbox::Bandit::ESRLPolicy | virtual |
AIToolbox::Bandit::PolicyInterface::getActionProbability(const void &s, const size_t &a) const=0 | AIToolbox::PolicyInterface< void, void, size_t > | pure virtual |
getAParam() const | AIToolbox::Bandit::ESRLPolicy | |
getExplorationPhases() const | AIToolbox::Bandit::ESRLPolicy | |
getPolicy() const override | AIToolbox::Bandit::ESRLPolicy | virtual |
getS() const | AIToolbox::PolicyInterface< void, void, size_t > | |
getTimesteps() const | AIToolbox::Bandit::ESRLPolicy | |
getWindowSize() const | AIToolbox::Bandit::ESRLPolicy | |
isExploiting() const | AIToolbox::Bandit::ESRLPolicy | |
PolicyInterface(void s, size_t a) | AIToolbox::PolicyInterface< void, void, size_t > | |
rand_ | AIToolbox::PolicyInterface< void, void, size_t > | mutable protected |
S | AIToolbox::PolicyInterface< void, void, size_t > | protected |
sampleAction() const override | AIToolbox::Bandit::ESRLPolicy | virtual |
AIToolbox::Bandit::PolicyInterface::sampleAction(const void &s) const=0 | AIToolbox::PolicyInterface< void, void, size_t > | pure virtual |
setAParam(double a) | AIToolbox::Bandit::ESRLPolicy | |
setExplorationPhases(unsigned p) | AIToolbox::Bandit::ESRLPolicy | |
setTimesteps(unsigned t) | AIToolbox::Bandit::ESRLPolicy | |
setWindowSize(unsigned window) | AIToolbox::Bandit::ESRLPolicy | |
stepUpdateP(size_t a, bool result) | AIToolbox::Bandit::ESRLPolicy | |
~PolicyInterface() | AIToolbox::PolicyInterface< void, void, size_t > | virtual |