Representation of MDPs - Githubissues

MDPs and their associated concepts may be represented using the following class structure:

/// A single action, identified by a textual description.
///
/// The constructor and destructor are private, so objects are presumably meant
/// to be created through getObject() and released through deleteObject().
class Action
{
private:
    /// Textual description of this action.
    std::string description;

    /// Private constructor; see getObject().
    /// @param description Text stored as the description (empty by default).
    explicit Action(const std::string& description = "");

    /// Private destructor; see deleteObject().
    ~Action();

public:
    /// Factory counterpart of the private constructor.
    /// NOTE(review): the design sketch gave no return type; a pointer to the
    /// new object is assumed here -- confirm before implementing.
    /// @param description Text to use as the action's description.
    static Action* getObject(const std::string& description = "");

    /// Public counterpart of the private destructor.
    /// NOTE(review): presumably destroys this object -- confirm.
    void deleteObject();

    /// @return The description of this action.
    std::string getDescription() const;
};

// Only pointers and references to Action are used below, so a forward
// declaration is sufficient.
class Action;

/// A state, holding its available actions together with per-action values.
///
/// @tparam _type Type used for the transition probabilities and the rewards.
///
/// The constructor is private, so objects are presumably meant to be created
/// through getObject().
template <class _type>
class State
{
private:
    /// Textual description of this state.
    std::string description;

    /// Actions registered for this state.
    std::vector<Action*> actions;

    /// Value of type _type stored per action (see setTransitionProb()).
    std::unordered_map<Action*, _type> transitionProbs;

    /// Value of type _type stored per action (see setITransitionRewards()).
    /// NOTE(review): the meaning of the "i" prefix is not stated -- confirm.
    std::unordered_map<Action*, _type> iTransitionRewards;

    /// Private constructor; see getObject().
    /// @param description Text stored as the description (empty by default).
    explicit State(const std::string& description = "");

public:
    /// Factory counterpart of the private constructor.
    /// NOTE(review): the design sketch gave no return type; a pointer to the
    /// new object is assumed here -- confirm before implementing.
    /// @param description Text to use as the state's description.
    static State* getObject(const std::string& description = "");

    /// Registers an action for this state.
    /// @param action Action to add.
    void addAction(Action& action);

    /// Sets the transition probability associated with an action.
    /// @param action         Action the probability belongs to.
    /// @param transitionProb Probability value to store.
    void setTransitionProb(Action& action, _type transitionProb);

    /// Sets the transition reward associated with an action.
    /// @param action Action the reward belongs to.
    /// @param reward Reward value to store.
    void setITransitionRewards(Action& action, _type reward);
};

// Only pointers and references to these types are used below, so forward
// declarations are sufficient.
class Action;
template <class _type>
class State;

/// A Markov decision process: a collection of states plus a policy that maps
/// a state to an action.
///
/// @tparam _type Value type shared with the State objects it holds.
///
/// The constructor is private, so objects are presumably meant to be created
/// through getObject().
template <class _type>
class MarkovDecisionProcess
{
private:
    /// States that make up this process.
    std::vector<State<_type>*> stateSpace;

    /// Action currently associated with each state.
    std::unordered_map<State<_type>*, Action*> policy;

    /// Private constructor; see getObject().
    MarkovDecisionProcess();

    // NOTE(review): this befriends a non-template free function that takes no
    // arguments, so every instantiation declares a performanceMetric() that
    // differs only in return type. Instantiating the class with two different
    // _type values would therefore conflict -- revisit the signature.
    friend _type performanceMetric();

public:
    /// Factory counterpart of the private constructor.
    /// NOTE(review): the design sketch gave no return type; a pointer to the
    /// new object is assumed here -- confirm before implementing.
    static MarkovDecisionProcess* getObject();

    /// Adds a state to the state space.
    /// @param state State to add.
    void addState(State<_type>& state);

    /// Sets the action the policy associates with a state.
    /// @param state  State whose policy entry is updated.
    /// @param action Action to associate with that state.
    void updatePolicy(State<_type>& state, Action& action);
};

codezonediitj / reinforce

Representation of MDPs #1

Description of the problem

Example of the problem

References/Other comments