Merge pull request #13 from sibange/main

Addition of a Transition Model class
fgnt · Mar 7, 2024 · 4dc1f2a · 4dc1f2a
2 parents 05e3c0e + 57f3d9d
commit 4dc1f2a
Show file tree

Hide file tree

Showing 3 changed files with 330 additions and 0 deletions.
diff --git a/mms_msg/sampling/pattern/meeting/__init__.py b/mms_msg/sampling/pattern/meeting/__init__.py
@@ -1 +1,2 @@
 from .meeting_sampler import MeetingSampler
+from . import state_based
diff --git a/mms_msg/sampling/pattern/meeting/state_based/__init__.py b/mms_msg/sampling/pattern/meeting/state_based/__init__.py
@@ -0,0 +1 @@
+from . import transition_model
diff --git a/mms_msg/sampling/pattern/meeting/state_based/transition_model.py b/mms_msg/sampling/pattern/meeting/state_based/transition_model.py
@@ -0,0 +1,328 @@
+import numpy as np
+from typing import Optional, List, Union, Generic, TypeVar, Tuple, Any, Set
+from abc import ABC, abstractmethod
+from copy import deepcopy
+
+
+class StateTransitionModel(ABC):
+    """
+    Abstract class that can be used to implement models which determine a sequence of previously defined states.
+    """
+
+    @abstractmethod
+    def next(self, rng: np.random.random = np.random.default_rng()) -> Any:
+        """
+        Returns the next state according to the implemented model.
+
+        Args:
+            rng: rng that can be used in the determination of the next state
+
+        Returns: Next state
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def step_back(self) -> bool:
+        """
+        Attempt to revert the last step of the model. Only one successful step back is guaranteed.
+
+        Returns: True when successful, False otherwise
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def reset(self) -> None:
+        """
+        Resets the transition model to its starting state.
+        """
+        raise NotImplementedError
+
+
+MST = TypeVar('MST')  # MarkovStateType
+
+
+class MarkovModel(StateTransitionModel, Generic[MST]):
+    """
+    StateTransitionModel which uses a markov model for the state transitions.
+
+    Properties:
+        s0: Name or index of the starting state
+        size: Number of states in the model
+        states: (read-only) Names of the states
+        current_state_index: Index of the current state
+        last_state_index: Index of the previous state
+    """
+
+    def __init__(self, probability_matrix: np.ndarray, s0: Optional[Union[int, MST]] = 0,
+                 state_names: Optional[List[MST]] = None) -> None:
+        """
+        Initialize a Markov Model with n states. The states can be named with the state_names parameter.
+        Default naming is a simple enumeration.
+
+        Args:
+            probability_matrix: transition matrix for the markov model.
+                It must be a stochastic matrix of the dimensions n x n.
+            s0: index of the starting state or name of the starting state.
+                When s0 is an integer s0 it is interpreted as the index of the starting state.
+            state_names: (optional) names of the states, if used all states have to be named.
+                As name every type except integer can be used,
+                this type is reserved for the default enumeration.
+        """
+
+        # Assert correct dimensions and correct probabilities
+        if not probability_matrix.shape[0] > 0:
+            raise ValueError('The markov model requires at least one state')
+        if probability_matrix.shape[0] != probability_matrix.shape[1]:
+            raise ValueError(f'Probability matrix has wrong dimensions: Expecting a square matrix, '
+                             f'but got {probability_matrix.shape}.')
+        if not np.allclose(np.sum(probability_matrix, axis=1), np.ones(probability_matrix.shape[0]),
+                           rtol=0.0, atol=1e-06):
+            raise ValueError('The probabilities in some row, are not adding up to 1')
+
+        # Assert that when states are named, all states have names
+        if not (state_names is None or len(state_names) == probability_matrix.shape[0]):
+            raise ValueError('When the states parameter is used, there has to be names for all states.')
+
+        # Assert that no integers are used as names
+        if state_names is not None and type(state_names[0]) is int:
+            raise TypeError('Integers are not allowed as names for states')
+
+        self.s0 = s0
+        self._size = probability_matrix.shape[0]
+        self.probability_matrix = probability_matrix
+        if state_names is None:
+            self._state_names = [*range(self.size)]
+        else:
+            self._state_names = deepcopy(state_names)
+
+        if isinstance(s0, int):
+            self.current_state_index = s0
+        else:
+            self.current_state_index = self.state_names.index(s0)
+
+        self.last_state_index = None
+
+    def next(self, rng: np.random.random = np.random.default_rng()) -> Union[int, MST]:
+        """
+        Simulates a step in the markov model and returns the state after the step
+
+        Args:
+            rng: The numpy rng that should be used should generate a number in the interval [0,1).
+                When not set a uniform rng is used.
+
+        Returns: Name of the state of the model after the step is executed
+        """
+
+        self.last_state_index = self.current_state_index
+
+        self.current_state_index = self._simulate_step(self.current_state_index, rng)
+
+        return self.state_names[self.current_state_index]
+
+    def step_back(self) -> bool:
+        """
+        Attempt to revert the last step of the model. Only the last previous state is saved and can be restored.
+
+        Returns: True when successful, False otherwise
+        """
+        if self.last_state_index is not None:
+            self.current_state_index = self.last_state_index
+            self.last_state_index = None
+            return True
+        else:
+            return False
+
+    def reset(self) -> None:
+        """
+        Resets the current state of the model to the starting state.
+        """
+        if isinstance(self.s0, int):
+            self.current_state_index = self.s0
+        else:
+            self.current_state_index = self.state_names.index(self.s0)
+
+    def simulate_step(self, state: Union[int, MST], rng: np.random.random = np.random.default_rng()) -> Union[int, MST]:
+        """
+        Simulates a step from a single state, without changing to current state.
+
+        Args:
+            state: Index or name of the starting state for the single step
+            rng: The numpy rng that should be used, the rng should generate a number in the interval [0,1).
+                If not set a uniform rng is used.
+
+        Returns: State after a single step from the starting state
+        """
+
+        index = self.state_names.index(state)
+        return self.state_names[self._simulate_step(index, rng)]
+
+    def _simulate_step(self, index: int, rng: np.random.random = np.random.default_rng()) -> int:
+        """
+        Internal function that simulates one step from the given starting state, without changing the current state.
+        In the input and output of this function, only the index of the states is used to identify them.
+
+        Args:
+            index: Index of the starting state for the single step
+            rng: The numpy rng that should be used should generate a number in the interval [0,1).
+                 If not set a uniform rng is used.
+
+        Returns: Index of the State after a single step from the starting state
+        """
+
+        row = self.probability_matrix[index]
+        random = rng.random()
+
+        row_sum = 0
+        for i, v in enumerate(row):
+            row_sum += v
+            if row_sum >= random:
+                return i
+
+    @property
+    def size(self) -> int:
+        return self._size
+
+    @property
+    def state_names(self) -> List[Union[int, MST]]:
+        return self._state_names
+
+    def __repr__(self):
+        return (
+            "Markov model: "
+            f"Number of states: {self._size} "
+            f"State names: {self._state_names}\n"
+            f"Probability matrix:\n {self.probability_matrix}"
+        )
+
+
+class SpeakerTransitionModel(ABC):
+    """
+    Abstract class that can be used to implement a model that can sample a sequence of active speakers,
+    along with an action for each speaker. For example, the action can be used  to determine the type of transition
+    between the speakers.
+    """
+    @abstractmethod
+    def start(self, env_state: Optional[Any] = None, **kwargs) -> Tuple[int, Any]:
+        """
+        Returns the speaker that should start speaking.
+        This method should be called when a new sequence is sampled.
+
+        Args:
+            env_state: env_state: (optional) Additional information about the state of the environment
+
+        Returns: Tuple consisting of the starting state of the next sequence and environment state
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def next(self, rng: np.random.random = np.random.default_rng(), last_action_success: bool = True,
+             env_state: Optional[Any] = None, **kwargs) -> Tuple[str, int, Any]:
+        """
+        Returns the next action and the next speaker according to the implemented transition model.
+        When the model cannot find an action that can be executed a StopIteration error is raised.
+
+        Args:
+            rng: rng that can be used in the determination of the next state
+            last_action_success: (optional) status of the execution of the last action,
+                                  can be used when the actions can fail.
+            env_state: (optional) Additional information about the state of the environment
+
+        Returns: Next action (state), the index of the next active speaker and the current environment state
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def reset(self) -> None:
+        """
+        Resets the transition model to its initial state.
+        """
+        raise NotImplementedError
+
+    @property
+    @abstractmethod
+    def tags(self) -> Set[str]:
+        """
+        Tag of the transition model, the tag consists of a set of all actions that can be returned.
+
+        Returns: Set of all possible actions.
+        """
+        pass
+
+
+class TwoSpeakerTransitionModel(SpeakerTransitionModel):
+    """SpeakerTransitionModel which implements the transition between two speakers.
+     For the transition of the states a transitionModel is used.
+     Supports four possible actions:
+        - TH: Turn-hold     (no speaker change with silence)
+        - TS: Turn-switch   (speaker change with silence)
+        - OV: Overlap       (speaker change with overlap)
+        - BC: Backchannel   (speaker in backchannel, totally overlapped from foreground speaker)
+
+    Corresponding paper: Improving the Naturalness of Simulated Conversations for End-to-End Neural Diarization,
+                         https://arxiv.org/abs/2204.11232
+
+    Properties:
+        transition_model: StateTransitionModel used for the selection of the action
+        current_active_index: Index of current active speaker
+        tries: Current number of tries for finding an action that can be successfully executed
+        max_tries: Maximum number of tries to find a valid action,
+                   after this is surpassed a StopIteration Exception is returned
+        tags: Set of all actions that can be returned by the model.
+    """
+    def __init__(self, transition_model: StateTransitionModel, max_tries: int = 50) -> None:
+        """
+        Initialization with a StateTransitionModel and the number of maximal tries for a successful action.
+        When it is not possible to execute the action, the StateTransitionModel is reverted
+        and the selection of the next step is done again.
+        When more than max_tries are required a StopIteration Exception is returned
+
+        Args:
+            transition_model: Underlying transition model, that is internally used to determine the next action.
+            max_tries: Maximum number of tries
+        """
+
+        self.transition_model = transition_model
+        self.current_active_index = 0
+        self.tries = 0
+        self.max_tries = max_tries
+
+    def start(self, env_state: Optional[Any] = None, **kwargs) -> Tuple[int, Any]:
+        self.reset()
+        return self.current_active_index, env_state
+
+    def next(self, rng: np.random.random = np.random.default_rng(), last_action_success: bool = True,
+             env_state: Optional[Any] = None, **kwargs) -> Tuple[str, int, Any]:
+        if last_action_success:
+            self.tries = 0
+        elif self.tries < self.max_tries:
+            self.transition_model.step_back()
+            self.tries += 1
+        else:
+            raise StopIteration('Number of max tries exceeded')
+
+        action = self.transition_model.next(rng)
+
+        # In the case of a backchannel, the next speaker changes, but the active speaker in the foreground does not.
+        if action == "BC":
+            return action, (self.current_active_index + 1) % 2, None
+
+        # Speaker changes in the case of a turn-switch or overlap
+        if action in ("TS", "OV"):
+            self.current_active_index = (self.current_active_index + 1) % 2
+
+        return action, self.current_active_index, env_state
+
+    def reset(self) -> None:
+        self.transition_model.reset()
+        self.current_active_index = 0
+
+    @property
+    def tags(self) -> Set[str]:
+        return {"TS", "TH", "OV", "BC"}
+
+    def __repr__(self):
+        return (
+            f"TwoSpeakerTransitionModel: "
+            f"Current state: {self.current_active_index}\n"
+            f"TransitionModel:\n{self.transition_model}"
+        )
Original file line number	Diff line number	Diff line change
		@@ -1 +1,2 @@
		from .meeting_sampler import MeetingSampler
		from . import state_based