MdpModel is the main class of the MDP framework. The relevant header excerpt (forward declarations and key signatures):

    class LearningStrategy;
    class MdpConfiguration;

    MdpModel(std::shared_ptr<StateSpace> stateSpace,
             std::shared_ptr<ActionSpace> actionSpace,
             std::shared_ptr<MdpConfiguration> conf);

    void setRewards(std::shared_ptr<Rewards> rewards);

    virtual void constructContext(std::shared_ptr<StateSpace> stateSpace,
                                  std::shared_ptr<ActionSpace> actionSpace,
                                  std::shared_ptr<MdpConfiguration> conf);
Member function and data member documentation:

virtual void setLearningStrategy()
    Sets up the learning strategy (virtual; overridable by subclasses).

virtual void constructContext(std::shared_ptr<StateSpace> stateSpace, std::shared_ptr<ActionSpace> actionSpace, std::shared_ptr<MdpConfiguration> conf)
    Builds the shared context from the state space, action space, and configuration.

void printPolicy(std::ostream &stream)
    Prints the current policy to the given stream.

std::vector<action_t> actionHistory
    The actions taken so far, one per timestep.

LearningStrategy *learningStrategy
    The learning strategy in use.

void record(state_t state, action_t action, double reward)
    Records an observed (state, action, reward) triple for the current timestep.

Action *selectAction(bool updateModel = true)
    Returns the optimal action for the current timestep.
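Taken together, selectAction() and record() imply a per-timestep decision loop. A minimal sketch, assuming hypothetical application helpers applyToEnvironment(), observeState(), computeReward(), and toActionId() (an Action*-to-action_t mapping) that are not part of this API:

    const int horizon = 1000;                  // hypothetical episode length
    for (int t = 0; t < horizon; ++t) {
        Action *a = model.selectAction();      // optimal action; also updates the model
        applyToEnvironment(a);                 // hypothetical: actuate the chosen action
        state_t s = observeState();            // hypothetical: read the resulting state
        double  r = computeReward(s);          // hypothetical: reward for this step
        model.record(s, toActionId(a), r);     // toActionId() is a hypothetical mapping
    }

To query the policy without changing the model, pass selectAction(false) or call selectActionWithoutUpdate() below.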
std::shared_ptr<Context> context
    The shared context built by constructContext().

std::vector<state_t> stateHistory
    The states observed so far, one per timestep.

std::vector<double> rewardHistory
    The rewards received so far, one per timestep.

Action *selectActionWithoutUpdate()
    Similar to selectAction(), but does not update the model.
void setConstraintList(std::shared_ptr<ConstraintList> list)
    Sets the constraint list used by the model.

MdpModel(std::shared_ptr<StateSpace> stateSpace, std::shared_ptr<ActionSpace> actionSpace, std::shared_ptr<MdpConfiguration> conf)
    Constructs the model from a state space, an action space, and a configuration.

void printSummary(std::ostream &stream)
    Prints a summary of the model to the given stream.

void init()
    Call this function first, before using the rest of the interface.
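A typical setup might look like the sketch below. How the state space, action space, and configuration are constructed is application-specific and assumed here; only the MdpModel calls come from this API:

    auto states  = std::make_shared<StateSpace>(/* ... */);        // hypothetical construction
    auto actions = std::make_shared<ActionSpace>(/* ... */);       // hypothetical construction
    auto conf    = std::make_shared<MdpConfiguration>(/* ... */);  // hypothetical construction

    MdpModel model(states, actions, conf);
    model.init();    // documented as the first call to make on the model

Whether setRewards() and setConstraintList() belong before or after init() is not stated here; treat their placement as an assumption when adapting this sketch.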
void printReportsToFile(std::string folder)
    Prints reports to files in the given folder.

void end()
    Call this function at the end of the run.

void setRewards(std::shared_ptr<Rewards> rewards)
    Sets the rewards used by the model.
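At the end of a run, end() closes out the model and the print members emit diagnostics. A sketch of a plausible wrap-up; the ordering of the print calls relative to end(), and the folder name, are assumptions:

    model.printSummary(std::cout);          // run summary to a stream
    model.printPolicy(std::cout);           // learned policy to a stream
    model.printReportsToFile("reports");    // "reports" is a hypothetical folder name
    model.end();                            // documented: call this at the end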