Scheduler
Public Member Functions | Protected Member Functions | Protected Attributes | List of all members
Mdp::RlBackupAlgorithm Class Reference (abstract)

#include <rlBackupAlgorithm.h>

Inheritance diagram for Mdp::RlBackupAlgorithm:
Mdp::EligibilityTraceAlgo Mdp::QLearning Mdp::DelayedQLearning Mdp::NaiveQLambda Mdp::SarsaLambda Mdp::WatkinsQLambda

Public Member Functions

 RlBackupAlgorithm (std::shared_ptr< Context > c, ActionValuesFunction *av)
 
virtual ~RlBackupAlgorithm ()
 
virtual void init ()=0
 
virtual void updateActionValues (state_t previousState, state_t nextState, action_t previousAction, double reward)=0
 
virtual void end ()=0
 
virtual double getMaxQ (state_t state)
 
virtual std::pair< action_t, double > getBestActionAndQ (state_t state)
 
virtual action_t getBestAction (state_t state)
 
virtual void updateBestActionAndQ (state_t state)
 
virtual void notifyUpdateNeeded ()
 

Protected Member Functions

virtual void initAlpha ()
 
virtual void updateAlpha ()
 
virtual void updateIfNeeded (state_t state)
 

Protected Attributes

std::shared_ptr< Context > context {nullptr}
 
ActionValuesFunction * actionValues {nullptr}
 
double alpha {-1.0}
 
double alpha0 {0.1}
 
double alphaCounter {1.0}
 
double alphaDecaySpeed {1.0}
 
bool hyperbolic {false}
 
bool stepwise {false}
 
unsigned long long stepwiseCounter {0}
 
unsigned long long int stepLength {0}
 
std::vector< double > bestQ
 
std::vector< action_t > bestAction
 
std::vector< bool > needsUpdate
 

Detailed Description

Definition at line 31 of file rlBackupAlgorithm.h.

Constructor & Destructor Documentation

RlBackupAlgorithm::RlBackupAlgorithm ( std::shared_ptr< Context > c,
ActionValuesFunction * av
)

Definition at line 26 of file rlBackupAlgorithm.cpp.

virtual Mdp::RlBackupAlgorithm::~RlBackupAlgorithm ( )
inline virtual

Definition at line 35 of file rlBackupAlgorithm.h.

Member Function Documentation

virtual void Mdp::RlBackupAlgorithm::end ( )
pure virtual
action_t RlBackupAlgorithm::getBestAction ( state_t  state)
virtual

Definition at line 91 of file rlBackupAlgorithm.cpp.

std::pair< action_t, double > RlBackupAlgorithm::getBestActionAndQ ( state_t  state)
virtual

Definition at line 75 of file rlBackupAlgorithm.cpp.

double RlBackupAlgorithm::getMaxQ ( state_t  state)
virtual

Definition at line 41 of file rlBackupAlgorithm.cpp.

virtual void Mdp::RlBackupAlgorithm::init ( )
pure virtual
void RlBackupAlgorithm::initAlpha ( )
protected virtual

Definition at line 97 of file rlBackupAlgorithm.cpp.

void RlBackupAlgorithm::notifyUpdateNeeded ( )
virtual

Definition at line 35 of file rlBackupAlgorithm.cpp.

virtual void Mdp::RlBackupAlgorithm::updateActionValues ( state_t  previousState,
state_t  nextState,
action_t  previousAction,
double  reward 
)
pure virtual
void RlBackupAlgorithm::updateAlpha ( )
protected virtual

Definition at line 113 of file rlBackupAlgorithm.cpp.

void RlBackupAlgorithm::updateBestActionAndQ ( state_t  state)
virtual

Definition at line 51 of file rlBackupAlgorithm.cpp.

void RlBackupAlgorithm::updateIfNeeded ( state_t  state)
protected virtual

Definition at line 81 of file rlBackupAlgorithm.cpp.

Member Data Documentation

ActionValuesFunction* Mdp::RlBackupAlgorithm::actionValues {nullptr}
protected

Definition at line 53 of file rlBackupAlgorithm.h.

double Mdp::RlBackupAlgorithm::alpha {-1.0}
protected

Definition at line 54 of file rlBackupAlgorithm.h.

double Mdp::RlBackupAlgorithm::alpha0 {0.1}
protected

Definition at line 55 of file rlBackupAlgorithm.h.

double Mdp::RlBackupAlgorithm::alphaCounter {1.0}
protected

Definition at line 56 of file rlBackupAlgorithm.h.

double Mdp::RlBackupAlgorithm::alphaDecaySpeed {1.0}
protected

Definition at line 57 of file rlBackupAlgorithm.h.

std::vector<action_t> Mdp::RlBackupAlgorithm::bestAction
protected

Definition at line 65 of file rlBackupAlgorithm.h.

std::vector<double> Mdp::RlBackupAlgorithm::bestQ
protected

Definition at line 64 of file rlBackupAlgorithm.h.

std::shared_ptr<Context> Mdp::RlBackupAlgorithm::context {nullptr}
protected

Definition at line 52 of file rlBackupAlgorithm.h.

bool Mdp::RlBackupAlgorithm::hyperbolic {false}
protected

Definition at line 58 of file rlBackupAlgorithm.h.

std::vector<bool> Mdp::RlBackupAlgorithm::needsUpdate
protected

Definition at line 66 of file rlBackupAlgorithm.h.

unsigned long long int Mdp::RlBackupAlgorithm::stepLength {0}
protected

Definition at line 61 of file rlBackupAlgorithm.h.

bool Mdp::RlBackupAlgorithm::stepwise {false}
protected

Definition at line 59 of file rlBackupAlgorithm.h.

unsigned long long Mdp::RlBackupAlgorithm::stepwiseCounter {0}
protected

Definition at line 60 of file rlBackupAlgorithm.h.


The documentation for this class was generated from the following files: