Source code for yawning_titan.envs.generic.core.blue_interface

from typing import Tuple

from yawning_titan.envs.generic.core.blue_action_set import BlueActionSet
from yawning_titan.envs.generic.core.network_interface import NetworkInterface
from yawning_titan.networks.node import Node


[docs]class BlueInterface(BlueActionSet):
    """The interface used by the Blue Agents to act within the environment."""

[docs]    def __init__(self, network_interface: NetworkInterface):
        """
        Initialise the blue interface.

        Args:
            network_interface: Object from the NetworkInterface class
        """
        super().__init__(network_interface)

        # standard actions (apply to a single node)
        self.action_dict = {}
        action_number = 0
        self.deceptive_actions = 0
        # all of the actions that blue can do
        if self.network_interface.game_mode.blue.action_set.reduce_vulnerability.value:
            # Checks if the action is enabled in the settings file
            self.action_dict[action_number] = self.reduce_node_vulnerability
            action_number += 1
        if self.network_interface.game_mode.blue.action_set.restore_node.value:
            self.action_dict[action_number] = self.restore_node
            action_number += 1
        if self.network_interface.game_mode.blue.action_set.make_node_safe.use.value:
            self.action_dict[action_number] = self.make_safe_node
            action_number += 1
        if self.network_interface.game_mode.blue.action_set.isolate_node.value:
            self.action_dict[action_number] = self.isolate_node
            action_number += 1
        if self.network_interface.game_mode.blue.action_set.reconnect_node.value:
            self.action_dict[action_number] = self.reconnect_node
            action_number += 1

        # deceptive actions -> since the number of edges is not equal to the number of nodes this has to be done
        # separately
        if self.network_interface.game_mode.blue.action_set.deceptive_nodes.use.value:
            self.deceptive_actions = self.network_interface.base_graph.number_of_edges()

        # global actions (don't apply to a single node)
        self.global_action_dict = {}
        global_action_number = 0
        if self.network_interface.game_mode.blue.action_set.scan.value:
            # scans all of the nodes in the network
            self.global_action_dict[global_action_number] = self.scan_all_nodes
            global_action_number += 1
        if self.network_interface.game_mode.blue.action_set.do_nothing.value:
            # does nothing
            self.global_action_dict[global_action_number] = self.do_nothing
            global_action_number += 1
        self.number_of_actions = action_number
        self.number_global_action = global_action_number

[docs]    def perform_action(self, action: int) -> Tuple[str, Node]:
        """
        Perform an action within the environment.

        Takes in an action number and then maps this to the correct action to perform. There are 3 different item_types of
        actions:
            - standard actions
            - deceptive actions
            - global actions

        --standard actions--
        Standard actions are actions that can apply to all nodes. For each standard action there are n actions (where n
        is the number of nodes in the network). An example of this action would be to isolate a node. The agent has to
        pick the isolate action and then the node it is being applied to.

        --deceptive actions--
        Actions relating to deceptive nodes. Since the number of deceptive actions relate to the edges not the nodes
        (see deceptive nodes for more info), the deceptive actions cannot come under the standard actions. An example
        would be to place a deceptive node. The deceptive nodes can only be placed on an edge so the agent has to pick
        the "place deceptive node" action and then the edge to place it on.

        --global actions--
        Global actions are actions where the agent does not need to pick any sub action other than the action. For
        example an action that applies to all nodes so the agent does not need to pick a specific node to apply the
        action to. "Do nothing" is an example of a global action as there is no secondary choice to be made.


        The function also maps any actions outside of the action space to the "do nothing" action.

        Order of operations:
        1- check if the action is inside the action space --> perform "do nothing"
        2- check if the action is a deceptive action --> perform action
        3- check if the action is a global action --> perform action
        4- perform the standard action

        Args:
            action: the action to perform

        Returns:
            The action that has been taken
            The node the action was performed on
        """
        if action >= self.get_number_of_actions():
            blue_action, blue_node = self.do_nothing()
        elif action < self.deceptive_actions:
            # use a deceptive action
            blue_action, blue_node = self.add_deceptive_node(action)
        # global actions
        else:
            action = action - self.deceptive_actions
            # global actions
            if action < self.number_global_action:
                blue_action, blue_node = self.global_action_dict[action]()
            else:
                # standard actions
                action = action - self.number_global_action
                action_node_number = int(action / self.number_of_actions)

                if (
                    action_node_number
                    >= self.network_interface.current_graph.number_of_nodes()
                ):
                    blue_action, blue_node = self.do_nothing()
                else:
                    nodes = self.network_interface.current_graph.get_nodes()
                    action_node = sorted(nodes)[action_node_number]
                    action_taken = int(action % self.number_of_actions)

                    blue_action, blue_node = self.action_dict[action_taken](action_node)

        return blue_action, blue_node

[docs]    def get_number_of_actions(self) -> int:
        """
        Get the number of actions that this blue agent can perform.

        There are three item_types of actions:
            - global actions (apply to all nodes) - need 1 action space
            - deceptive actions (Add new nodes to environment)
            - standard actions (apply to a single node) - need 2 action space (action and node to perform on)

        Returns:
            The number of actions that this agent can perform
        """
        return (
            (self.number_of_actions * self.network_interface.get_total_num_nodes())
            + self.number_global_action
            + self.deceptive_actions
        )