24 size_t S = c->stateSpace->size();
25 size_t A = c->actionSpace->size();
26 occurences = std::vector<std::vector<std::vector<int>>>(
S,
27 std::vector<std::vector<int>>(
A, std::vector<int>(
S, 0)));
35 previousState =
context->stateSpace->getState();
44 occurences[previousState][previousAction][state]++;
48 previousState = state;
49 previousAction =
context->policy->getAction(previousState);
54 void MatrixLearning::updateMatrix()
56 size_t S =
context->stateSpace->size();
57 size_t A =
context->actionSpace->size();
65 N += (double) occurences[
i][j][k];
69 context->matrix->set(
i, k, j, ((
double)occurences[
i][j][k])/N);
MatrixLearning(std::shared_ptr< Context > context)
std::shared_ptr< Context > context