code/craam/State_8hpp_source.html

 #pragma once

 #include "Action.hpp"

 #include <utility>
 #include <tuple>
 #include <vector>
 #include <stdexcept>
 #include <limits>
 #include <string>

 #include "cpp11-range-master/range.hpp"


 namespace craam {

 using namespace std;


 // **************************************************************************************
 //  SA State (SA rectangular, also used for a regular MDP)
 // **************************************************************************************

 template<class AType>
 class SAState{
 protected:
     vector<AType> actions;
     vector<bool> valid;

 public:

     SAState() : actions(0), valid(0) {};

     SAState(const vector<AType>& actions) : actions(actions), valid(actions.size(),true) { };

     size_t action_count() const { return actions.size();};

     size_t size() const { return action_count();};

     AType& create_action(long actionid){
         assert(actionid >= 0);

         // assumes that the default constructor makes the actions invalid
         if(actionid >= (long) actions.size()){
             actions.resize(actionid+1);
             valid.resize(actionid+1, false);
         }

         // set only the action that is being added as valid
         valid[actionid] = true;
         return actions[actionid];
     }

     AType& create_action() {return create_action(actions.size());};

     const AType& get_action(long actionid) const
                 {assert(actionid >= 0 && size_t(actionid) < action_count());
                  return actions[actionid];};

     const AType& operator[](long actionid) const {return get_action(actionid);}

     AType& get_action(long actionid)
                 {assert(actionid >= 0 && size_t(actionid) < action_count());
                  return actions[actionid];};

     AType& operator[](long actionid) {return get_action(actionid);}

     bool is_valid(long actionid) const {
         assert(actionid < long(valid.size()) && actionid >= 0);
         return valid[actionid];
     };

     void set_valid(long actionid, bool value = true){
         assert(actionid < long(valid.size()) && actionid >= 0);
         valid[actionid] = value;
     };


     const vector<AType>& get_actions() const {return actions;};

     bool is_terminal() const {return actions.empty();};

     void normalize(){
         for(AType& a : actions)
             a.normalize();
     }

     bool is_action_correct(long aid, numvec nataction) const{
         if( (aid < 0) || ((size_t)aid >= actions.size()))
             return false;

         return actions[aid].is_nature_correct(nataction);
     }

     bool is_action_correct(long aid) const{
         if( (aid < 0) || ((size_t)aid >= actions.size()))
             return false;
         else
             return true;
     }

     prec_t mean_reward(long actionid, numvec nataction) const{
         if(is_terminal()) return 0;
         else return get_action(actionid).mean_reward(nataction);
     }

     prec_t mean_reward(long actionid) const{
         if(is_terminal()) return 0;
         else return get_action(actionid).mean_reward();
     }

     Transition mean_transition(long action, numvec nataction) const{
         if(is_terminal()) return Transition();
         else return get_action(action).mean_transition(nataction);
     }

     Transition mean_transition(long action) const{
         if(is_terminal()) return Transition();
         else return get_action(action).mean_transition();
     }

     string to_json(long stateid = -1) const{
         string result{"{"};
         result += "\"stateid\" : ";
         result += std::to_string(stateid);
         result += ",\"actions\" : [";
         for(auto ai : indices(actions)){
             const auto& a = actions[ai];
             result += a.to_json(ai);
             result += ",";
         }
         if(!actions.empty()) result.pop_back(); // remove last comma
         result += ("]}");
         return result;
     }
 };

 // **********************************************************************
 // *********************    SPECIFIC STATE DEFINITIONS    ***************
 // **********************************************************************

 /// Regular MDP state with no outcomes.
 using RegularState = SAState<RegularAction>;
 /// State with uncertain outcomes with L1 constraints on the distribution.
 using WeightedRobustState = SAState<WeightedOutcomeAction>;
 }


 namespace internal{
     using namespace craam;

     /// Checks state and policy with a policy of nature: forwards the entries
     /// at position stateid of both policy vectors to the state's
     /// is_action_correct. The index stateid is not range checked here.
     template<class SType>
     bool is_action_correct(const SType& state, long stateid, const std::pair<indvec,vector<numvec>>& policies){
         const auto& chosen_action = policies.first[stateid];
         const auto& chosen_nature = policies.second[stateid];
         return state.is_action_correct(chosen_action, chosen_nature);
     }

     /// Checks state and policy: forwards the entry at position stateid of
     /// the policy to the state's is_action_correct. The index stateid is
     /// not range checked here.
     template<class SType>
     bool is_action_correct(const SType& state, long stateid, const indvec& policy){
         const auto& chosen_action = policy[stateid];
         return state.is_action_correct(chosen_action);
     }
 }
craam::SAState
State for sa-rectangular uncertainty (or no uncertainty) in an MDP.
Definition: State.hpp:38

craam::SAState::operator[]
const AType & operator[](long actionid) const
Returns an existing action.
Definition: State.hpp:89

craam::SAState::size
size_t size() const
Number of actions.
Definition: State.hpp:57

craam::SAState::is_terminal
bool is_terminal() const
True if the state is considered terminal (no actions).
Definition: State.hpp:119

craam::RegularState
SAState< RegularAction > RegularState
Regular MDP state with no outcomes.
Definition: State.hpp:197

craam::SAState::create_action
AType & create_action()
Creates an action at the last position of the state.
Definition: State.hpp:81

std

craam::prec_t
double prec_t
Default precision used throughout the code.
Definition: definitions.hpp:25

craam::SAState::mean_transition
Transition mean_transition(long action) const
Returns the mean transition probabilities following the action and outcome.
Definition: State.hpp:169

craam::SAState::action_count
size_t action_count() const
Number of actions.
Definition: State.hpp:54

craam::numvec
vector< prec_t > numvec
Default numerical vector.
Definition: definitions.hpp:28

craam::SAState::mean_transition
Transition mean_transition(long action, numvec nataction) const
Returns the mean transition probabilities following the action and outcome.
Definition: State.hpp:161

craam::WeightedRobustState
SAState< WeightedOutcomeAction > WeightedRobustState
State with uncertain outcomes with L1 constraints on the distribution.
Definition: State.hpp:199

craam::SAState::mean_reward
prec_t mean_reward(long actionid, numvec nataction) const
Returns the mean reward following the action (and outcome).
Definition: State.hpp:144

craam::SAState::valid
vector< bool > valid
whether actions can be used in computation. If false, that means that they should not be used in algo...
Definition: State.hpp:44

craam::SAState::set_valid
void set_valid(long actionid, bool value=true)
Set action validity.
Definition: State.hpp:109

craam::SAState::is_valid
bool is_valid(long actionid) const
Returns whether the action is valid.
Definition: State.hpp:100

craam::SAState::actions
vector< AType > actions
list of actions
Definition: State.hpp:41

craam::SAState::is_action_correct
bool is_action_correct(long aid) const
Checks whether the prescribed action is correct.
Definition: State.hpp:136

craam::Transition
Represents sparse transition probabilities and rewards from a single state.
Definition: Transition.hpp:31

craam::SAState::mean_reward
prec_t mean_reward(long actionid) const
Returns the mean reward following the action.
Definition: State.hpp:150

craam::SAState::get_action
const AType & get_action(long actionid) const
Returns an existing action.
Definition: State.hpp:84

craam::SAState::operator[]
AType & operator[](long actionid)
Returns an existing action.
Definition: State.hpp:97

craam::SAState::normalize
void normalize()
Normalizes transition probabilities to sum to one.
Definition: State.hpp:122

internal
helper functions
Definition: State.hpp:204

craam::SAState::is_action_correct
bool is_action_correct(long aid, numvec nataction) const
Checks whether the prescribed action and outcome are correct.
Definition: State.hpp:128

craam::SAState::get_action
AType & get_action(long actionid)
Returns an existing action.
Definition: State.hpp:92

craam::SAState::get_actions
const vector< AType > & get_actions() const
Returns set of all actions.
Definition: State.hpp:116

craam::SAState::create_action
AType & create_action(long actionid)
Creates an action given by actionid if it does not exist.
Definition: State.hpp:66

internal::is_action_correct
bool is_action_correct(const SType &state, long stateid, const std::pair< indvec, vector< numvec >> &policies)
checks state and policy with a policy of nature
Definition: State.hpp:209

craam::SAState::to_json
string to_json(long stateid=-1) const
Returns json representation of the state.
Definition: State.hpp:176

craam::SAState::SAState
SAState(const vector< AType > &actions)
Initializes state with actions and sets them all to valid.
Definition: State.hpp:51

craam::indvec
vector< long > indvec
Default index vector.
Definition: definitions.hpp:31

craam
Main namespace which includes modeling and solving functionality.
Definition: Action.hpp:18