Scheduler
|
#include <eligibilityTraceAlgo.h>
Public Member Functions | |
EligibilityTraceAlgo (std::shared_ptr< Context > c, TabularActionValues *av) | |
virtual void | init () |
virtual void | end () |
virtual void | updateActionValues (state_t previousState, state_t nextState, action_t previousAction, double reward)=0 |
Public Member Functions inherited from Mdp::RlBackupAlgorithm | |
RlBackupAlgorithm (std::shared_ptr< Context > c, ActionValuesFunction *av) | |
virtual | ~RlBackupAlgorithm () |
virtual double | getMaxQ (state_t state) |
virtual std::pair< action_t, double > | getBestActionAndQ (state_t state) |
virtual action_t | getBestAction (state_t state) |
virtual void | updateBestActionAndQ (state_t state) |
virtual void | notifyUpdateNeeded () |
Protected Member Functions | |
void | updateState (state_t previousState, action_t previousAction, double reward) |
Protected Member Functions inherited from Mdp::RlBackupAlgorithm | |
virtual void | initAlpha () |
virtual void | updateAlpha () |
virtual void | updateIfNeeded (state_t state) |
Protected Attributes | |
TabularActionValues * | tabularAv {nullptr} |
state_t | previousPreviousState {0} |
action_t | previousPreviousAction {0} |
double | previousReward {0.0} |
std::vector< std::vector< double > > | e |
double | lambda {0.5} |
double | discountFactor {0.5} |
size_t | stateSize {0} |
size_t | actionSize {0} |
Protected Attributes inherited from Mdp::RlBackupAlgorithm | |
std::shared_ptr< Context > | context {nullptr} |
ActionValuesFunction * | actionValues {nullptr} |
double | alpha {-1.0} |
double | alpha0 {0.1} |
double | alphaCounter {1.0} |
double | alphaDecaySpeed {1.0} |
bool | hyperbolic {false} |
bool | stepwise {false} |
unsigned long long | stepwiseCounter {0} |
unsigned long long int | stepLength {0} |
std::vector< double > | bestQ |
std::vector< action_t > | bestAction |
std::vector< bool > | needsUpdate |
Definition at line 19 of file eligibilityTraceAlgo.h.
|
EligibilityTraceAlgo (std::shared_ptr< Context > c, TabularActionValues *av) | inline |
Definition at line 22 of file eligibilityTraceAlgo.h.
|
void end () | virtual |
Implements Mdp::RlBackupAlgorithm.
Definition at line 32 of file eligibilityTraceAlgo.cpp.
|
void init () | virtual |
Implements Mdp::RlBackupAlgorithm.
Definition at line 21 of file eligibilityTraceAlgo.cpp.
|
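void updateActionValues (state_t previousState, state_t nextState, action_t previousAction, double reward) | pure virtual |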
Implements Mdp::RlBackupAlgorithm.
Implemented in Mdp::WatkinsQLambda, Mdp::DelayedQLearning, Mdp::NaiveQLambda, and Mdp::SarsaLambda.
|
void updateState (state_t previousState, action_t previousAction, double reward) | protected |
Definition at line 36 of file eligibilityTraceAlgo.cpp.
|
size_t actionSize {0} | protected |
Definition at line 39 of file eligibilityTraceAlgo.h.
|
double discountFactor {0.5} | protected |
Definition at line 37 of file eligibilityTraceAlgo.h.
|
std::vector< std::vector< double > > e | protected |
Definition at line 35 of file eligibilityTraceAlgo.h.
|
double lambda {0.5} | protected |
Definition at line 36 of file eligibilityTraceAlgo.h.
|
action_t previousPreviousAction {0} | protected |
Definition at line 33 of file eligibilityTraceAlgo.h.
|
state_t previousPreviousState {0} | protected |
Definition at line 32 of file eligibilityTraceAlgo.h.
|
double previousReward {0.0} | protected |
Definition at line 34 of file eligibilityTraceAlgo.h.
|
size_t stateSize {0} | protected |
Definition at line 38 of file eligibilityTraceAlgo.h.
|
TabularActionValues * tabularAv {nullptr} | protected |
Definition at line 31 of file eligibilityTraceAlgo.h.