Class sdm::NetworkedDistributedPOMDP
#include <networked_distributed_pomdp.hpp>
Inherits the following classes: sdm::MPOMDP
Classes
Type | Name |
---|---|
class | Node |
Public Types
Type | Name |
---|---|
typedef number | action |
typedef number | agent |
typedef number | observation |
typedef number | state |
Public Attributes
Type | Name |
---|---|
std::ifstream | input_file |
Node * | n |
std::unordered_map< std::string, std::discrete_distribution< number > > | ndpomdp_dynamics_generator The dynamics generator. |
agent * | nodes |
std::map< std::string, std::unordered_set< observation > > | observationSuccessor |
std::map< std::string, double > | observationsmatrix |
double | rMax = 45 |
agent | root |
std::unordered_set< state > * | stateSuccessor |
std::map< int, int > | transitionmatrix |
Public Functions
Type | Name |
---|---|
NetworkedDistributedPOMDP (std::string) | |
void | createDAG () |
void | getData (std::string) |
std::tuple< std::vector< double >, observation, state > | getDynamicsGenerator (number x, number a) |
double | getInitialBelief (std::shared_ptr< State >) |
double | getObservation (agent, action, state, observation) |
double | getRewardF (state, agent, agent, action, action) |
std::vector< std::pair< number, number > > | getUniqueValidNeighbors () |
virtual std::shared_ptr< State > | init () |
void | printDAG (agent) |
void | setupDynamicsGenerator () Set up the dynamics generator. |
Public Functions inherited from sdm::MPOMDP
See sdm::MPOMDP
Type | Name |
---|---|
MPOMDP () | |
MPOMDP (const std::shared_ptr< Space > & state_space, const std::shared_ptr< Space > & action_space, const std::shared_ptr< Space > & obs_space, const std::shared_ptr< RewardInterface > & reward, const std::shared_ptr< StateDynamicsInterface > & state_dynamics, const std::shared_ptr< ObservationDynamicsInterface > & obs_dynamics, const std::shared_ptr< Distribution< std::shared_ptr< State >>> & start_distrib, number horizon=0, double discount=0.99, Criterion criterion=Criterion::REW_MAX) | |
virtual std::shared_ptr< Space > | getObservationSpace (number agent_id, number t) const Get the observation space of agent i at timestep t. |
virtual std::shared_ptr< Space > | getObservationSpace (number t=0) const Get the observation space at timestep t. |
virtual std::string | toStdFormat () Encodes MDP class into a string (standard .posg or .dpomdp or .zsposg format). |
virtual | ~MPOMDP () |
Public Functions inherited from sdm::MPOMDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getObservationSpace (number agent_id, number t) const = 0 Get the observation space of agent i at timestep t. |
virtual std::shared_ptr< Space > | getObservationSpace (number t) const = 0 Get the observation space at timestep t. |
Public Functions inherited from sdm::MMDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number agent_id, number t) const = 0 Get the action space of agent i at timestep t. |
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
Public Functions inherited from sdm::MDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
virtual double | getDiscount (number t) const = 0 Get the discount factor at timestep t. |
virtual number | getHorizon () const = 0 Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const = 0 |
virtual double | getMaxReward (number t) const = 0 |
virtual double | getMinReward (number t) const = 0 |
virtual number | getNumAgents () const = 0 Get the number of agents. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get reachable states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get the reward at timestep t when executing an action in a specific state. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const = 0 Get the initial distribution over states. |
virtual std::shared_ptr< Space > | getStateSpace (number t) const = 0 Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get the transition probability, i.e. p(s'\|s, a). |
virtual void | setInternalState (std::shared_ptr< State > state) = 0 |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) = 0 |
Public Functions inherited from sdm::GymInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) = 0 Get the action space. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) = 0 Get random action. |
virtual std::shared_ptr< Observation > | reset () = 0 Reset the environment and return initial observation. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
Public Functions inherited from sdm::POMDPInterface
Type | Name |
---|---|
virtual double | getDynamics (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, const std::shared_ptr< Observation > & observation, number t) const = 0 Get the dynamics, i.e. p(s', o\|s, a). |
virtual double | getObservationProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, const std::shared_ptr< Observation > & observation, number t) const = 0 Get the observation probability, i.e. p(o\|s', a). |
virtual std::shared_ptr< Space > | getObservationSpace (number t) const = 0 Get the observation space at timestep t. |
virtual std::set< std::shared_ptr< Observation > > | getReachableObservations (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get reachable observations. |
Public Functions inherited from sdm::MDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
virtual double | getDiscount (number t) const = 0 Get the discount factor at timestep t. |
virtual number | getHorizon () const = 0 Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const = 0 |
virtual double | getMaxReward (number t) const = 0 |
virtual double | getMinReward (number t) const = 0 |
virtual number | getNumAgents () const = 0 Get the number of agents. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get reachable states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get the reward at timestep t when executing an action in a specific state. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const = 0 Get the initial distribution over states. |
virtual std::shared_ptr< Space > | getStateSpace (number t) const = 0 Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get the transition probability, i.e. p(s'\|s, a). |
virtual void | setInternalState (std::shared_ptr< State > state) = 0 |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) = 0 |
Public Functions inherited from sdm::GymInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) = 0 Get the action space. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) = 0 Get random action. |
virtual std::shared_ptr< Observation > | reset () = 0 Reset the environment and return initial observation. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
Public Functions inherited from sdm::POMDP
See sdm::POMDP
Type | Name |
---|---|
POMDP () | |
POMDP (const std::shared_ptr< Space > & state_space, const std::shared_ptr< Space > & action_space, const std::shared_ptr< Space > & obs_space, const std::shared_ptr< RewardInterface > & reward, const std::shared_ptr< StateDynamicsInterface > & state_dynamics, const std::shared_ptr< ObservationDynamicsInterface > & obs_dynamics, const std::shared_ptr< Distribution< std::shared_ptr< State >>> & start_distrib, number horizon=0, double discount=0.99, Criterion criterion=Criterion::REW_MAX) | |
virtual double | getDynamics (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, const std::shared_ptr< Observation > & observation, number t=0) const Get the dynamics, i.e. p(s', o\|s, a). |
std::shared_ptr< ObservationDynamicsInterface > | getObservationDynamics () const |
virtual double | getObservationProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, const std::shared_ptr< Observation > & observation, number t=0) const Get the observation probability, i.e. p(o\|s', a). |
virtual std::shared_ptr< Space > | getObservationSpace (number t=0) const Get the observation space at timestep t. |
virtual std::set< std::shared_ptr< Observation > > | getReachableObservations (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const Get reachable observations. |
virtual std::shared_ptr< Observation > | sampleNextObservation (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) |
Public Functions inherited from sdm::MDP
See sdm::MDP
Type | Name |
---|---|
MDP () | |
MDP (const std::shared_ptr< Space > & state_space, const std::shared_ptr< Space > & action_space, const std::shared_ptr< RewardInterface > & reward_space, const std::shared_ptr< StateDynamicsInterface > & state_dynamics, const std::shared_ptr< Distribution< std::shared_ptr< State >>> & start_distribution, number horizon=0, double discount=0.99, Criterion criterion=Criterion::REW_MAX) | |
void | generateFile (std::string) Save problem in file with given format (.xml, .json or .{dpomdp, posg, zsposg}). |
virtual std::shared_ptr< Space > | getActionSpace (number t=0) const Get the action space at timestep t. |
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) Get the action space. |
virtual double | getDiscount (number t=0) const Get the discount factor at timestep t. |
virtual number | getHorizon () const Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const |
virtual double | getMaxReward (number t=0) const |
virtual double | getMinReward (number t=0) const |
virtual number | getNumAgents () const Get the number of agents. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) Get random action. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t=0) const Get the reachable next states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t=0) const Get the reward of executing action a in state s at timestep t. |
virtual std::shared_ptr< RewardInterface > | getRewardSpace () const Get the reward function. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const Get the initial distribution over states. |
virtual std::shared_ptr< StateDynamicsInterface > | getStateDynamics () const Get the state dynamics. |
virtual std::shared_ptr< Space > | getStateSpace (number t=0) const Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t=0) const Get the Transition Probability object. |
virtual std::shared_ptr< Observation > | reset () Reset the environment and return initial observation. |
virtual std::shared_ptr< Observation > | sampleNextObservation (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) |
void | setDiscount (double discount) Set the discount factor. |
void | setHorizon (number horizon) Set the planning horizon. |
virtual void | setInternalState (std::shared_ptr< State >) |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) |
virtual std::string | toJSON () Encodes MDP class into a string (JSON format). |
virtual std::string | toStdFormat () Encodes MDP class into a string (standard .posg or .dpomdp or .zsposg format). |
virtual std::string | toXML () Encodes MDP class into a string (XML format). |
virtual | ~MDP () |
Public Functions inherited from sdm::MDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
virtual double | getDiscount (number t) const = 0 Get the discount factor at timestep t. |
virtual number | getHorizon () const = 0 Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const = 0 |
virtual double | getMaxReward (number t) const = 0 |
virtual double | getMinReward (number t) const = 0 |
virtual number | getNumAgents () const = 0 Get the number of agents. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get reachable states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get the reward at timestep t when executing an action in a specific state. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const = 0 Get the initial distribution over states. |
virtual std::shared_ptr< Space > | getStateSpace (number t) const = 0 Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get the transition probability, i.e. p(s'\|s, a). |
virtual void | setInternalState (std::shared_ptr< State > state) = 0 |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) = 0 |
Public Functions inherited from sdm::GymInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) = 0 Get the action space. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) = 0 Get random action. |
virtual std::shared_ptr< Observation > | reset () = 0 Reset the environment and return initial observation. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
Public Functions inherited from sdm::POMDPInterface
Type | Name |
---|---|
virtual double | getDynamics (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, const std::shared_ptr< Observation > & observation, number t) const = 0 Get the dynamics, i.e. p(s', o\|s, a). |
virtual double | getObservationProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, const std::shared_ptr< Observation > & observation, number t) const = 0 Get the observation probability, i.e. p(o\|s', a). |
virtual std::shared_ptr< Space > | getObservationSpace (number t) const = 0 Get the observation space at timestep t. |
virtual std::set< std::shared_ptr< Observation > > | getReachableObservations (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get reachable observations. |
Public Functions inherited from sdm::MDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
virtual double | getDiscount (number t) const = 0 Get the discount factor at timestep t. |
virtual number | getHorizon () const = 0 Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const = 0 |
virtual double | getMaxReward (number t) const = 0 |
virtual double | getMinReward (number t) const = 0 |
virtual number | getNumAgents () const = 0 Get the number of agents. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get reachable states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get the reward at timestep t when executing an action in a specific state. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const = 0 Get the initial distribution over states. |
virtual std::shared_ptr< Space > | getStateSpace (number t) const = 0 Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get the transition probability, i.e. p(s'\|s, a). |
virtual void | setInternalState (std::shared_ptr< State > state) = 0 |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) = 0 |
Public Functions inherited from sdm::GymInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) = 0 Get the action space. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) = 0 Get random action. |
virtual std::shared_ptr< Observation > | reset () = 0 Reset the environment and return initial observation. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
Public Functions inherited from sdm::MMDP
See sdm::MMDP
Type | Name |
---|---|
MMDP () | |
MMDP (const std::shared_ptr< Space > & state_space, const std::shared_ptr< Space > & action_space, const std::shared_ptr< RewardInterface > & reward, const std::shared_ptr< StateDynamicsInterface > & state_dynamics, const std::shared_ptr< Distribution< std::shared_ptr< State >>> & start_distrib, number horizon=0, double discount=0.99, Criterion criterion=Criterion::REW_MAX) | |
virtual std::shared_ptr< Space > | getActionSpace (number t=0) const Get the action space at timestep t. |
virtual std::shared_ptr< Space > | getActionSpace (number agent_id, number t) const Get the action space of agent i at timestep t. |
virtual std::string | toStdFormat () Encodes MDP class into a string (standard .posg or .dpomdp or .zsposg format). |
Public Functions inherited from sdm::MDP
See sdm::MDP
Type | Name |
---|---|
MDP () | |
MDP (const std::shared_ptr< Space > & state_space, const std::shared_ptr< Space > & action_space, const std::shared_ptr< RewardInterface > & reward_space, const std::shared_ptr< StateDynamicsInterface > & state_dynamics, const std::shared_ptr< Distribution< std::shared_ptr< State >>> & start_distribution, number horizon=0, double discount=0.99, Criterion criterion=Criterion::REW_MAX) | |
void | generateFile (std::string) Save problem in file with given format (.xml, .json or .{dpomdp, posg, zsposg}). |
virtual std::shared_ptr< Space > | getActionSpace (number t=0) const Get the action space at timestep t. |
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) Get the action space. |
virtual double | getDiscount (number t=0) const Get the discount factor at timestep t. |
virtual number | getHorizon () const Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const |
virtual double | getMaxReward (number t=0) const |
virtual double | getMinReward (number t=0) const |
virtual number | getNumAgents () const Get the number of agents. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) Get random action. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t=0) const Get the reachable next states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t=0) const Get the reward of executing action a in state s at timestep t. |
virtual std::shared_ptr< RewardInterface > | getRewardSpace () const Get the reward function. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const Get the initial distribution over states. |
virtual std::shared_ptr< StateDynamicsInterface > | getStateDynamics () const Get the state dynamics. |
virtual std::shared_ptr< Space > | getStateSpace (number t=0) const Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t=0) const Get the Transition Probability object. |
virtual std::shared_ptr< Observation > | reset () Reset the environment and return initial observation. |
virtual std::shared_ptr< Observation > | sampleNextObservation (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) |
void | setDiscount (double discount) Set the discount factor. |
void | setHorizon (number horizon) Set the planning horizon. |
virtual void | setInternalState (std::shared_ptr< State >) |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) |
virtual std::string | toJSON () Encodes MDP class into a string (JSON format). |
virtual std::string | toStdFormat () Encodes MDP class into a string (standard .posg or .dpomdp or .zsposg format). |
virtual std::string | toXML () Encodes MDP class into a string (XML format). |
virtual | ~MDP () |
Public Functions inherited from sdm::MDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
virtual double | getDiscount (number t) const = 0 Get the discount factor at timestep t. |
virtual number | getHorizon () const = 0 Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const = 0 |
virtual double | getMaxReward (number t) const = 0 |
virtual double | getMinReward (number t) const = 0 |
virtual number | getNumAgents () const = 0 Get the number of agents. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get reachable states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get the reward at timestep t when executing an action in a specific state. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const = 0 Get the initial distribution over states. |
virtual std::shared_ptr< Space > | getStateSpace (number t) const = 0 Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get the transition probability, i.e. p(s'\|s, a). |
virtual void | setInternalState (std::shared_ptr< State > state) = 0 |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) = 0 |
Public Functions inherited from sdm::GymInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) = 0 Get the action space. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) = 0 Get random action. |
virtual std::shared_ptr< Observation > | reset () = 0 Reset the environment and return initial observation. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
Public Functions inherited from sdm::MMDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number agent_id, number t) const = 0 Get the action space of agent i at timestep t. |
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
Public Functions inherited from sdm::MDPInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpace (number t) const = 0 Get the action space at timestep t. |
virtual double | getDiscount (number t) const = 0 Get the discount factor at timestep t. |
virtual number | getHorizon () const = 0 Get the planning horizon. |
virtual std::shared_ptr< State > | getInternalState () const = 0 |
virtual double | getMaxReward (number t) const = 0 |
virtual double | getMinReward (number t) const = 0 |
virtual number | getNumAgents () const = 0 Get the number of agents. |
virtual std::set< std::shared_ptr< State > > | getReachableStates (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get reachable states. |
virtual double | getReward (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, number t) const = 0 Get the reward at timestep t when executing an action in a specific state. |
virtual std::shared_ptr< Distribution< std::shared_ptr< State > > > | getStartDistribution () const = 0 Get the initial distribution over states. |
virtual std::shared_ptr< Space > | getStateSpace (number t) const = 0 Get the state space at timestep t. |
virtual double | getTransitionProbability (const std::shared_ptr< State > & state, const std::shared_ptr< Action > & action, const std::shared_ptr< State > & next_state, number t) const = 0 Get the transition probability, i.e. p(s'\|s, a). |
virtual void | setInternalState (std::shared_ptr< State > state) = 0 |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action, bool increment_timestep) = 0 |
Public Functions inherited from sdm::GymInterface
Type | Name |
---|---|
virtual std::shared_ptr< Space > | getActionSpaceAt (const std::shared_ptr< Observation > & observation, number t) = 0 Get the action space. |
virtual std::shared_ptr< Action > | getRandomAction (const std::shared_ptr< Observation > & observation, number t) = 0 Get random action. |
virtual std::shared_ptr< Observation > | reset () = 0 Reset the environment and return initial observation. |
virtual std::tuple< std::shared_ptr< Observation >, std::vector< double >, bool > | step (std::shared_ptr< Action > action) = 0 Do a step on the environment. |
Protected Attributes inherited from sdm::POMDP
See sdm::POMDP
Type | Name |
---|---|
std::shared_ptr< ObservationDynamicsInterface > | observation_dynamics_ |
std::shared_ptr< Space > | observation_space_ |
Protected Attributes inherited from sdm::MDP
See sdm::MDP
Type | Name |
---|---|
std::shared_ptr< Space > | action_space_ |
Criterion | criterion_ |
int | current_timestep_ |
double | discount_ |
number | horizon_ |
std::shared_ptr< State > | internal_state_ |
number | num_agents_ |
std::shared_ptr< RewardInterface > | reward_space_ |
std::shared_ptr< Distribution< std::shared_ptr< State > > > | start_distribution_ |
std::shared_ptr< StateDynamicsInterface > | state_dynamics_ |
std::shared_ptr< Space > | state_space_ |
Public Types Documentation
typedef action
using sdm::NetworkedDistributedPOMDP::action = number;
typedef agent
using sdm::NetworkedDistributedPOMDP::agent = number;
typedef observation
using sdm::NetworkedDistributedPOMDP::observation = number;
typedef state
using sdm::NetworkedDistributedPOMDP::state = number;
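All four aliases resolve to the same integral type (number), so agents, states, actions and observations are handled as plain numeric identifiers. A minimal illustration (the concrete values are arbitrary):

```cpp
sdm::NetworkedDistributedPOMDP::agent i = 0;        // agent index
sdm::NetworkedDistributedPOMDP::state x = 3;        // state identifier
sdm::NetworkedDistributedPOMDP::action a = 1;       // action identifier
sdm::NetworkedDistributedPOMDP::observation o = 2;  // observation identifier
```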
Public Attributes Documentation
variable input_file
std::ifstream sdm::NetworkedDistributedPOMDP::input_file;
variable n
Node* sdm::NetworkedDistributedPOMDP::n;
variable ndpomdp_dynamics_generator
std::unordered_map<std::string, std::discrete_distribution<number> > sdm::NetworkedDistributedPOMDP::ndpomdp_dynamics_generator;
variable nodes
agent* sdm::NetworkedDistributedPOMDP::nodes;
variable observationSuccessor
std::map<std::string, std::unordered_set<observation> > sdm::NetworkedDistributedPOMDP::observationSuccessor;
variable observationsmatrix
std::map<std::string, double> sdm::NetworkedDistributedPOMDP::observationsmatrix;
variable rMax
double sdm::NetworkedDistributedPOMDP::rMax;
variable root
agent sdm::NetworkedDistributedPOMDP::root;
variable stateSuccessor
std::unordered_set<state>* sdm::NetworkedDistributedPOMDP::stateSuccessor;
variable transitionmatrix
std::map<int, int> sdm::NetworkedDistributedPOMDP::transitionmatrix;
Public Functions Documentation
function NetworkedDistributedPOMDP
sdm::NetworkedDistributedPOMDP::NetworkedDistributedPOMDP (
std::string
)
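A minimal construction sketch, assuming a valid NDPOMDP problem file is available (the file name below is hypothetical); the constructor takes the path as a std::string, and the accessors inherited from sdm::MDP / sdm::MPOMDP can then be queried directly:

```cpp
#include <iostream>
#include <memory>
#include <sdm/world/networked_distributed_pomdp.hpp>

int main()
{
    // Hypothetical problem file path; replace with a real benchmark file.
    auto ndpomdp = std::make_shared<sdm::NetworkedDistributedPOMDP>("tiger.ndpomdp");

    // Accessors inherited from sdm::MDP / sdm::MPOMDP.
    std::cout << "agents   : " << ndpomdp->getNumAgents() << "\n"
              << "horizon  : " << ndpomdp->getHorizon() << "\n"
              << "discount : " << ndpomdp->getDiscount() << "\n";
    return 0;
}
```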
function createDAG
void sdm::NetworkedDistributedPOMDP::createDAG ()
function getData
void sdm::NetworkedDistributedPOMDP::getData (
std::string
)
function getDynamicsGenerator
std::tuple< std::vector< double >, observation , state > sdm::NetworkedDistributedPOMDP::getDynamicsGenerator (
number x,
number a
)
Parameters:
state: the current state
jaction: the joint action
Returns:
a tuple containing reward, next_observation and next_state
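A usage sketch, assuming ndpomdp was constructed as in the sketch above and that x and a are valid numeric indices for the current state and the joint action; the binding order follows the declared return type std::tuple< std::vector< double >, observation, state >:

```cpp
// Illustrative indices for the current state and the joint action.
sdm::NetworkedDistributedPOMDP::state  x = 0;
sdm::NetworkedDistributedPOMDP::action a = 0;

auto [rewards, next_observation, next_state] = ndpomdp->getDynamicsGenerator(x, a);

// `rewards` is a std::vector<double>; the other two are numeric identifiers.
for (double r : rewards)
    std::cout << r << ' ';
std::cout << "-> o' = " << next_observation << ", s' = " << next_state << "\n";
```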
function getInitialBelief
double sdm::NetworkedDistributedPOMDP::getInitialBelief (
std::shared_ptr< State >
)
function getObservation
double sdm::NetworkedDistributedPOMDP::getObservation (
agent,
action,
state,
observation
)
function getRewardF
double sdm::NetworkedDistributedPOMDP::getRewardF (
state,
agent,
agent,
action,
action
)
function getUniqueValidNeighbors
std::vector< std::pair< number , number > > sdm::NetworkedDistributedPOMDP::getUniqueValidNeighbors ()
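Continuing the sketch above, a way to inspect the interaction structure; interpreting each returned pair as two neighboring agent indices in the network is an assumption based on the method name:

```cpp
// Each pair holds two agent indices assumed to be neighbors in the network.
for (const auto &edge : ndpomdp->getUniqueValidNeighbors())
{
    std::cout << "agents " << edge.first << " and " << edge.second
              << " are neighbors\n";
}
```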
function init
virtual std::shared_ptr< State > sdm::NetworkedDistributedPOMDP::init ()
function printDAG
void sdm::NetworkedDistributedPOMDP::printDAG (
agent
)
function setupDynamicsGenerator
void sdm::NetworkedDistributedPOMDP::setupDynamicsGenerator ()
The documentation for this class was generated from the following file: src/sdm/world/networked_distributed_pomdp.hpp