Scheduler
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Pages
delayedQLearning.cpp
Go to the documentation of this file.
1 
10 #include "delayedQLearning.h"
11 
12 using namespace Mdp;
13 
/**
 * Handles one observed transition: computes a local delta from
 * previousReward, discountFactor, getMaxQ(previousState) and av, then
 * forwards the transition to updateState().
 *
 * @param previousState   state passed to getMaxQ() and to updateState()
 * @param previousAction  action forwarded to updateState()
 * @param reward          reward forwarded to updateState()
 *
 * The second parameter (nextState) is left unnamed and is not used here.
 *
 * NOTE(review): previousReward, discountFactor and av are not declared in
 * this block; presumably they are members of DelayedQLearning or a base
 * class - confirm against delayedQLearning.h.
 */
14 void DelayedQLearning::updateActionValues(state_t previousState, state_t /*nextState*/, action_t previousAction, double reward)
15 {
    // Discounted estimate built from the stored previousReward, not from the
    // `reward` argument.
    // NOTE(review): the max-Q term is evaluated on previousState while
    // nextState is ignored - confirm this is intended.
16  double delta = previousReward + discountFactor * getMaxQ(previousState);
    // Subtract av from the estimate.
    // NOTE(review): delta is not read again in the lines visible here (listing
    // lines 17 and 19 are not shown) - verify whether this computation is
    // still needed or whether its result was meant to be passed on.
18  delta -= av;
    // Forward the transition, with the `reward` argument, to updateState().
20  updateState(previousState, previousAction, reward);
21 }
22 
23 
24 
25 
26 
27 
28 
29 
30 
31 
32 
33 
34 
35 
36 
37 
38 
39 
40 
41 
42 
43 
44 
45 
46 
47 
48 
49 
50 
virtual double getValue(state_t state, action_t action)=0
TabularActionValues * tabularAv
void updateState(state_t previousState, action_t previousAction, double reward)
void updateValue(state_t state, action_t action, double value)
virtual void updateActionValues(state_t previousState, state_t nextState, action_t previousAction, double reward)
size_t action_t
Definition: action_impl.h:18
Definition: action.h:18
size_t state_t
Definition: state.h:19
ActionValuesFunction * actionValues
virtual double getMaxQ(state_t state)
Definition: reward.py:1