# Source code for pomdp_belief_tracking.types

"""Defines some types for ease of reading"""

from typing import Any, Dict, Tuple

from typing_extensions import Protocol


class Action(Protocol):
    """The abstract type representing actions

    This protocol declares no members: it only serves as a name for the
    action type in the signatures of this module.
    """


class Observation(Protocol):
    """The abstract type representing observations

    This protocol declares no members: it only serves as a name for the
    observation type in the signatures of this module.
    """


class State(Protocol):
    """The abstract type representing states

    This protocol declares no members: it only serves as a name for the
    state type in the signatures of this module.
    """


class TransitionFunction(Protocol):
    """The signature for transition functions

    Any callable that accepts a state and an action and returns a state
    matches this protocol.
    """

    def __call__(self, s: State, a: Action) -> State:
        """A transition function is a (stochastic) mapping from s x a -> s

        :param s: state at time step t
        :param a: action at time step t
        :return: state at time step t + 1
        """
        ...


class Simulator(Protocol):
    """The abstract type representing simulators

    We expect simulators to map a state and action into a next state and
    observation.

    .. automethod:: __call__
    """

    def __call__(self, s: State, a: Action) -> Tuple[State, Observation]:
        """Simulate a transition

        :param s: the current state
        :param a: the executed action
        :return: next state and observation
        """
        ...


class StateDistribution(Protocol):
    """The abstract type representing state distributions

    We expect to be able to sample states: calling the distribution without
    arguments returns a state.

    .. automethod:: __call__
    """

    def __call__(self) -> State:
        """Required implementation of distribution: the ability to sample states

        :return: state sampled according to distribution
        """
        ...


# Type alias: a dictionary with string keys and values of any type.
Info = Dict[str, Any]
"""The datatype used for information flow from implementation to caller"""


class BeliefUpdate(Protocol):
    """The signature for belief updates

    Any callable that accepts a state distribution, an action and an
    observation, and returns a pair of (state distribution, info), matches
    this protocol.
    """

    def __call__(
        self, p: StateDistribution, a: Action, o: Observation
    ) -> Tuple[StateDistribution, Info]:
        """Updates the distribution ``p`` given an action and observation

        :param p: current distribution
        :param a: taken action
        :param o: perceived observation
        :return: next distribution and run-time info
        """
        ...


class Belief:
    """A belief is the combination of an update function and current distribution

    The current distribution is stored in ``distribution`` and is replaced
    on every call to :meth:`update`; the update function is stored in
    ``update_function``.
    """

    def __init__(
        self, initial_distribution: StateDistribution, update_function: BeliefUpdate
    ) -> None:
        """Stores the starting distribution and the update function

        :param initial_distribution: distribution held until the first update
        :param update_function: called by :meth:`update` to compute the next distribution
        """
        self.distribution = initial_distribution
        self.update_function = update_function

    def update(self, a: Action, o: Observation) -> Info:
        """Updates (in place) the state distribution given an action and observation

        :param a: the executed action
        :param o: the perceived observation
        :return: Side effect: updates in place, returns run-time info
        """
        # The update function returns (next distribution, info): keep the
        # former as the new current distribution and hand the latter back.
        self.distribution, info = self.update_function(self.distribution, a, o)
        return info

    def sample(self) -> State:
        """Samples from its distribution

        :return: state sampled according to distribution
        """
        return self.distribution()