Scheduler
eligibilityTraceAlgo.cpp
Go to the documentation of this file.
1 
10 #include "eligibilityTraceAlgo.h"
11 
12 
13 #include <mdp/context.h>
14 #include <mdp/stateSpace.h>
15 #include <mdp/actionSpace.h>
16 #include <mdp/mdpConfiguration.h>
17 
18 
19 using namespace Mdp;
20 
22 {
// NOTE(review): the signature line for this body is missing from this listing;
// presumably this is the EligibilityTraceAlgo constructor — confirm against the original file.
// Build the table `e` with one row per state and one column per action, every entry set to 0.0.
23  e = std::vector<std::vector<double>>(context->stateSpace->size(),
24  std::vector<double>(context->actionSpace->size(), 0.0));
// Read "discountFactor" from the "mdp" configuration section.
25  discountFactor = context->conf->getDoubleValue("mdp","discountFactor");
// Read "lambda" from the "reinforcementLearning" configuration section.
26  lambda = context->conf->getDoubleValue("reinforcementLearning","lambda");
// Store the state-space and action-space sizes reported by the context.
27  stateSize = context->stateSpace->size();
28  actionSize = context->actionSpace->size();
// initAlpha() is invoked last, after every assignment above has been made.
29  initAlpha();
30 }
31 
33 {
// NOTE(review): the signature line for this body is missing from this listing;
// presumably this is the EligibilityTraceAlgo destructor — confirm. The body executes no statements.
34 }
35 
36 void EligibilityTraceAlgo::updateState(state_t previousState, action_t previousAction, double reward)
37 {
38  previousPreviousState = previousState;
39  previousPreviousAction = previousAction;
40  previousReward = reward;
41  updateAlpha();
42 }
43 
void updateState(state_t previousState, action_t previousAction, double reward)
std::vector< std::vector< double > > e
size_t action_t
Definition: action_impl.h:18
Definition: action.h:18
size_t state_t
Definition: state.h:19
std::shared_ptr< Context > context
Definition: reward.py:1