PyPI - mal-toolbox - Versions diffs - 0.1.12__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

mal-toolbox 0.1.12 (py3-none-any.whl) → 0.3.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30)

{mal_toolbox-0.1.12.dist-info → mal_toolbox-0.3.0.dist-info}/METADATA +43 -25
mal_toolbox-0.3.0.dist-info/RECORD +29 -0
mal_toolbox-0.3.0.dist-info/entry_points.txt +2 -0
maltoolbox/__init__.py +38 -57
maltoolbox/__main__.py +43 -14
maltoolbox/attackgraph/__init__.py +1 -1
maltoolbox/attackgraph/analyzers/apriori.py +10 -6
maltoolbox/attackgraph/attacker.py +26 -13
maltoolbox/attackgraph/attackgraph.py +431 -355
maltoolbox/attackgraph/node.py +72 -54
maltoolbox/attackgraph/query.py +4 -2
maltoolbox/file_utils.py +4 -8
maltoolbox/ingestors/neo4j.py +146 -157
maltoolbox/language/__init__.py +10 -2
maltoolbox/language/compiler/__init__.py +485 -17
maltoolbox/language/compiler/mal_lexer.py +172 -152
maltoolbox/language/compiler/mal_parser.py +1370 -663
maltoolbox/language/languagegraph.py +1096 -545
maltoolbox/model.py +312 -485
maltoolbox/translators/securicad.py +164 -163
maltoolbox/translators/updater.py +231 -108
mal_toolbox-0.1.12.dist-info/RECORD +0 -32
maltoolbox/default.conf +0 -17
maltoolbox/language/classes_factory.py +0 -243
maltoolbox/language/compiler/mal_visitor.py +0 -416
maltoolbox/wrappers.py +0 -62
{mal_toolbox-0.1.12.dist-info → mal_toolbox-0.3.0.dist-info}/AUTHORS +0 -0
{mal_toolbox-0.1.12.dist-info → mal_toolbox-0.3.0.dist-info}/LICENSE +0 -0
{mal_toolbox-0.1.12.dist-info → mal_toolbox-0.3.0.dist-info}/WHEEL +0 -0
{mal_toolbox-0.1.12.dist-info → mal_toolbox-0.3.0.dist-info}/top_level.txt +0 -0

maltoolbox/attackgraph/attackgraph.py (changed)

@@ -5,221 +5,112 @@ from __future__ import annotations
 import copy
 import logging
 import json
+import sys
+import zipfile
+from itertools import chain
 from typing import TYPE_CHECKING
+from .analyzers.apriori import calculate_viability_and_necessity
 from .node import AttackGraphNode
 from .attacker import Attacker
-from ..exceptions import AttackGraphStepExpressionError
+from .. import log_configs
+from ..exceptions import AttackGraphStepExpressionError, AttackGraphException
+from ..exceptions import LanguageGraphException
 from ..model import Model
-from ..exceptions import AttackGraphException
+from ..language import (LanguageGraph, ExpressionsChain,
+    LanguageGraphAttackStep, disaggregate_attack_step_full_name)
 from ..file_utils import (
     load_dict_from_json_file,
     load_dict_from_yaml_file,
     save_dict_to_file
 )
 if TYPE_CHECKING:
     from typing import Any, Optional
-    from ..language import LanguageGraph
+    from ..model import ModelAsset
 logger = logging.getLogger(__name__)
-# TODO see if (part of) this can be incorporated into the LanguageGraph, so that
-# the LanguageGraph's _lang_spec private property does not need to be accessed
-def _process_step_expression(
-        lang_graph: LanguageGraph,
-        model: Model,
-        target_assets: list[Any],
-        step_expression: dict[str, Any]
-    ) -> tuple[list, Optional[str]]:
-    """
-    Recursively process an attack step expression.
-    Arguments:
-    lang_graph      - a language graph representing the MAL language
-                      specification
-    model           - a maltoolbox.model.Model instance from which the attack
-                      graph was generated
-    target_assets   - the list of assets that this step expression should apply
-                      to. Initially it will contain the asset to which the
-                      attack step belongs
-    step_expression - a dictionary containing the step expression
-    Return:
-    A tuple pair containing a list of all of the target assets and the name of
-    the attack step.
+def create_attack_graph(
+        lang_file: str,
+        model_file: str,
+        attach_attackers=True,
+        calc_viability_and_necessity=True
+    ) -> AttackGraph:
+    """Create and return an attack graph
+    Args:
+    lang_file                       - path to language file (.mar or .mal)
+    model_file                      - path to model file (yaml or json)
+    attach_attackers                - whether to run attach_attackers or not
+    calc_viability_and_necessity    - whether run apriori calculations or not
     """
+    try:
+        lang_graph = LanguageGraph.from_mar_archive(lang_file)
+    except zipfile.BadZipFile:
+        lang_graph = LanguageGraph.from_mal_spec(lang_file)
-    if logger.isEnabledFor(logging.DEBUG):
-        # Avoid running json.dumps when not in debug
-        logger.debug(
-            'Processing Step Expression:\n%s',
-            json.dumps(step_expression, indent = 2)
-        )
+    if log_configs['langspec_file']:
+        lang_graph.save_to_file(log_configs['langspec_file'])
-    match (step_expression['type']):
-        case 'attackStep':
-            # The attack step expression just adds the name of the attack
-            # step. All other step expressions only modify the target assets.
-            return (target_assets, step_expression['name'])
-        case 'union' | 'intersection' | 'difference':
-            # The set operators are used to combine the left hand and right
-            # hand targets accordingly.
-            lh_targets, lh_attack_steps = _process_step_expression(
-                lang_graph, model, target_assets, step_expression['lhs'])
-            rh_targets, rh_attack_steps = _process_step_expression(
-                lang_graph, model, target_assets, step_expression['rhs'])
-            new_target_assets = []
-            match (step_expression['type']):
-                case 'union':
-                    new_target_assets = lh_targets
-                    for ag_node in rh_targets:
-                        if next((lnode for lnode in new_target_assets \
-                            if lnode.id != ag_node.id), None):
-                            new_target_assets.append(ag_node)
-                case 'intersection':
-                    for ag_node in rh_targets:
-                        if next((lnode for lnode in lh_targets \
-                            if lnode.id == ag_node.id), None):
-                            new_target_assets.append(ag_node)
-                case 'difference':
-                    new_target_assets = lh_targets
-                    for ag_node in lh_targets:
-                        if next((rnode for rnode in rh_targets \
-                            if rnode.id != ag_node.id), None):
-                            new_target_assets.remove(ag_node)
-            return (new_target_assets, None)
-        case 'variable':
-            # Fetch the step expression associated with the variable from
-            # the language specification and resolve that.
-            for target_asset in target_assets:
-                if (hasattr(target_asset, 'type')):
-                    # TODO how can this info be accessed in the lang_graph
-                    # directly without going through the private method?
-                    variable_step_expr = lang_graph._get_variable_for_asset_type_by_name(
-                        target_asset.type, step_expression['name'])
-                    return _process_step_expression(
-                        lang_graph, model, target_assets, variable_step_expr)
+    instance_model = Model.load_from_file(model_file, lang_graph)
-                else:
-                    logger.error(
-                        'Requested variable from non-asset target node:'
-                        '%s which cannot be resolved.', target_asset
-                    )
-            return ([], None)
-        case 'field':
-            # Change the target assets from the current ones to the associated
-            # assets given the specified field name.
-            new_target_assets = []
-            for target_asset in target_assets:
-                new_target_assets.extend(model.\
-                    get_associated_assets_by_field_name(target_asset,
-                        step_expression['name']))
-            return (new_target_assets, None)
-        case 'transitive':
-            # The transitive expression is very similar to the field
-            # expression, but it proceeds recursively until no target is
-            # found and it and it sets the new targets to the entire list
-            # of assets identified during the entire transitive recursion.
-            new_target_assets = []
-            for target_asset in target_assets:
-                new_target_assets.extend(model.\
-                    get_associated_assets_by_field_name(target_asset,
-                        step_expression['stepExpression']['name']))
-            if new_target_assets:
-                (additional_assets, _) = _process_step_expression(
-                    lang_graph, model, new_target_assets, step_expression)
-                new_target_assets.extend(additional_assets)
-                return (new_target_assets, None)
-            else:
-                return ([], None)
-        case 'subType':
-            new_target_assets = []
-            for target_asset in target_assets:
-                (assets, _) = _process_step_expression(
-                    lang_graph, model, target_assets,
-                    step_expression['stepExpression'])
-                new_target_assets.extend(assets)
-            selected_new_target_assets = []
-            for asset in new_target_assets:
-                lang_graph_asset = lang_graph.get_asset_by_name(
-                    asset.type
-                )
-                if not lang_graph_asset:
-                    raise LookupError(
-                        f'Failed to find asset \"{asset.type}\" in the '
-                        'language graph.'
-                    )
-                lang_graph_subtype_asset = lang_graph.get_asset_by_name(
-                    step_expression['subType']
-                )
-                if not lang_graph_subtype_asset:
-                    raise LookupError(
-                        'Failed to find asset '
-                        f'\"{step_expression["subType"]}\" in the '
-                        'language graph.'
-                    )
-                if lang_graph_asset.is_subasset_of(lang_graph_subtype_asset):
-                    selected_new_target_assets.append(asset)
+    if log_configs['model_file']:
+        instance_model.save_to_file(log_configs['model_file'])
+    try:
+        attack_graph = AttackGraph(lang_graph, instance_model)
+    except AttackGraphStepExpressionError:
+        logger.error(
+            'Attack graph generation failed when attempting '
+            'to resolve attack step expression!'
+        )
+        sys.exit(1)
-            return (selected_new_target_assets, None)
+    if attach_attackers:
+        attack_graph.attach_attackers()
-        case 'collect':
-            # Apply the right hand step expression to left hand step
-            # expression target assets.
-            lh_targets, _ = _process_step_expression(
-                lang_graph, model, target_assets, step_expression['lhs'])
-            return _process_step_expression(lang_graph, model, lh_targets,
-                step_expression['rhs'])
+    if calc_viability_and_necessity:
+        calculate_viability_and_necessity(attack_graph)
+    return attack_graph
-        case _:
-            logger.error(
-                'Unknown attack step type: %s', step_expression["type"]
-            )
-            return ([], None)
 class AttackGraph():
     """Graph representation of attack steps"""
-    def __init__(self, lang_graph = None, model: Optional[Model] = None):
-        self.nodes: list[AttackGraphNode] = []
-        self.attackers: list[Attacker] = []
+    def __init__(self, lang_graph, model: Optional[Model] = None):
+        self.nodes: dict[int, AttackGraphNode] = {}
+        self.attackers: dict[int, Attacker] = {}
         # Dictionaries used in optimization to get nodes and attackers by id
         # or full name faster
-        self._id_to_node: dict[int, AttackGraphNode] = {}
         self._full_name_to_node: dict[str, AttackGraphNode] = {}
-        self._id_to_attacker: dict[int, Attacker] = {}
         self.model = model
         self.lang_graph = lang_graph
         self.next_node_id = 0
         self.next_attacker_id = 0
-        if self.model is not None and self.lang_graph is not None:
+        if self.model is not None:
             self._generate_graph()
     def __repr__(self) -> str:
-        return f'AttackGraph({len(self.nodes)} nodes)'
+        """Return a one-line summary: node count, model and language."""
+        # The closing parenthesis balances the opening 'AttackGraph('.
+        return (f'AttackGraph(Number of nodes: {len(self.nodes)}, '
+            f'model: {self.model}, language: {self.lang_graph})')
     def _to_dict(self) -> dict:
         """Convert AttackGraph to dict"""
         serialized_attack_steps = {}
         serialized_attackers = {}
-        for ag_node in self.nodes:
+        for ag_node in self.nodes.values():
             serialized_attack_steps[ag_node.full_name] =\
                 ag_node.to_dict()
-        for attacker in self.attackers:
+        for attacker in self.attackers.values():
             serialized_attackers[attacker.name] = attacker.to_dict()
+        logger.debug('Serialized %d attack steps and %d attackers.' %
+            (len(self.nodes), len(self.attackers))
+        )
         return {
             'attack_steps': serialized_attack_steps,
             'attackers': serialized_attackers,
@@ -234,34 +125,32 @@ class AttackGraph():
         copied_attackgraph = AttackGraph(self.lang_graph)
         copied_attackgraph.model = self.model
-        copied_attackgraph.nodes = []
+        copied_attackgraph.nodes = {}
         # Deep copy nodes
-        for node in self.nodes:
+        for node_id, node in self.nodes.items():
             copied_node = copy.deepcopy(node, memo)
-            copied_attackgraph.nodes.append(copied_node)
+            copied_attackgraph.nodes[node_id] = copied_node
         # Re-link node references
-        for node in self.nodes:
+        for node in self.nodes.values():
             if node.parents:
                 memo[id(node)].parents = copy.deepcopy(node.parents, memo)
             if node.children:
                 memo[id(node)].children = copy.deepcopy(node.children, memo)
-        # Deep copy attackers and references to them
-        copied_attackgraph.attackers = copy.deepcopy(self.attackers, memo)
+        # Deep copy attackers
+        for attacker_id, attacker in self.attackers.items():
+            copied_attacker = copy.deepcopy(attacker, memo)
+            copied_attackgraph.attackers[attacker_id] = copied_attacker
         # Re-link attacker references
-        for node in self.nodes:
+        for node in self.nodes.values():
             if node.compromised_by:
                 memo[id(node)].compromised_by = copy.deepcopy(
                     node.compromised_by, memo)
         # Copy lookup dicts
-        copied_attackgraph._id_to_attacker = \
-            copy.deepcopy(self._id_to_attacker, memo)
-        copied_attackgraph._id_to_node = \
-            copy.deepcopy(self._id_to_node, memo)
         copied_attackgraph._full_name_to_node = \
             copy.deepcopy(self._full_name_to_node, memo)
@@ -280,6 +169,7 @@ class AttackGraph():
     def _from_dict(
             cls,
             serialized_object: dict,
+            lang_graph: LanguageGraph,
             model: Optional[Model]=None
         ) -> AttackGraph:
         """Create AttackGraph from dict
@@ -288,30 +178,38 @@ class AttackGraph():
         model               - Optional Model to add connections to
         """
-        attack_graph = AttackGraph()
+        attack_graph = AttackGraph(lang_graph)
         attack_graph.model = model
         serialized_attack_steps = serialized_object['attack_steps']
         serialized_attackers = serialized_object['attackers']
         # Create all of the nodes in the imported attack graph.
-        for node_full_name, node_dict in serialized_attack_steps.items():
+        for node_dict in serialized_attack_steps.values():
             # Recreate asset links if model is available.
             node_asset = None
             if model and 'asset' in node_dict:
                 node_asset = model.get_asset_by_name(node_dict['asset'])
                 if node_asset is None:
-                    msg = ('Failed to find asset with id %s'
-                            'when loading from attack graph dict')
+                    msg = ('Failed to find asset with name "%s"'
+                            ' when loading from attack graph dict')
                     logger.error(msg, node_dict["asset"])
                     raise LookupError(msg % node_dict["asset"])
-            ag_node = AttackGraphNode(
-                type=node_dict['type'],
-                name=node_dict['name'],
-                ttc=node_dict['ttc'],
-                asset=node_asset
+            lg_asset_name, lg_attack_step_name = \
+                disaggregate_attack_step_full_name(
+                    node_dict['lang_graph_attack_step'])
+            lg_attack_step = lang_graph.assets[lg_asset_name].\
+                attack_steps[lg_attack_step_name]
+            ag_node = attack_graph.add_node(
+                lg_attack_step = lg_attack_step,
+                node_id = node_dict['id'],
+                model_asset = node_asset,
+                defense_status = node_dict.get('defense_status', None),
+                existence_status = node_dict.get('existence_status', None)
             )
+            ag_node.tags = set(node_dict.get('tags', []))
+            ag_node.extras = node_dict.get('extras', {})
             if node_asset:
                 # Add AttackGraphNode to attack_step_nodes of asset
@@ -322,26 +220,10 @@ class AttackGraph():
                 else:
                     node_asset.attack_step_nodes = [ag_node]
-            ag_node.defense_status = float(node_dict['defense_status']) if \
-                'defense_status' in node_dict else None
-            ag_node.existence_status = node_dict['existence_status'] \
-                == 'True' if 'existence_status' in node_dict else None
-            ag_node.is_viable = node_dict['is_viable'] == 'True' if \
-                'is_viable' in node_dict else True
-            ag_node.is_necessary = node_dict['is_necessary'] == 'True' if \
-                'is_necessary' in node_dict else True
-            ag_node.mitre_info = str(node_dict['mitre_info']) if \
-                'mitre_info' in node_dict else None
-            ag_node.tags = node_dict['tags'] if \
-                'tags' in node_dict else []
-            ag_node.extras = node_dict.get('extras', {})
-            # Add AttackGraphNode to AttackGraph
-            attack_graph.add_node(ag_node, node_id=node_dict['id'])
         # Re-establish links between nodes.
-        for node_full_name, node_dict in serialized_attack_steps.items():
-            _ag_node = attack_graph.get_node_by_id(node_dict['id'])
+        for node_dict in serialized_attack_steps.values():
+            _ag_node = attack_graph.nodes[node_dict['id']]
             if not isinstance(_ag_node, AttackGraphNode):
                 msg = ('Failed to find node with id %s when loading'
                        ' attack graph from dict')
@@ -349,33 +231,36 @@ class AttackGraph():
                 raise LookupError(msg % node_dict["id"])
             else:
                 for child_id in node_dict['children']:
-                    child = attack_graph.get_node_by_id(int(child_id))
+                    child = attack_graph.nodes[int(child_id)]
                     if child is None:
                         msg = ('Failed to find child node with id %s'
                                ' when loading from attack graph from dict')
                         logger.error(msg, child_id)
                         raise LookupError(msg % child_id)
-                    _ag_node.children.append(child)
+                    _ag_node.children.add(child)
                 for parent_id in node_dict['parents']:
-                    parent = attack_graph.get_node_by_id(int(parent_id))
+                    parent = attack_graph.nodes[int(parent_id)]
                     if parent is None:
                         msg = ('Failed to find parent node with id %s '
                                'when loading from attack graph from dict')
                         logger.error(msg, parent_id)
                         raise LookupError(msg % parent_id)
-                    _ag_node.parents.append(parent)
+                    _ag_node.parents.add(parent)
-        for attacker_name, attacker in serialized_attackers.items():
+        for attacker in serialized_attackers.values():
             ag_attacker = Attacker(
                 name = attacker['name'],
-                entry_points = [],
-                reached_attack_steps = []
+                entry_points = set(),
+                reached_attack_steps = set()
             )
             attack_graph.add_attacker(
                 attacker = ag_attacker,
                 attacker_id = int(attacker['id']),
-                entry_points = attacker['entry_points'].keys(),
+                entry_points = [
+                    int(node_id) # Convert to int since they can be strings
+                    for node_id in attacker['entry_points'].keys()
+                ],
                 reached_attack_steps = [
                     int(node_id) # Convert to int since they can be strings
                     for node_id in attacker['reached_attack_steps'].keys()
@@ -388,7 +273,8 @@ class AttackGraph():
     def load_from_file(
             cls,
             filename: str,
-            model: Optional[Model]=None
+            lang_graph: LanguageGraph,
+            model: Optional[Model] = None
         ) -> AttackGraph:
         """Create from json or yaml file depending on file extension"""
         if model is not None:
@@ -404,21 +290,8 @@ class AttackGraph():
             serialized_attack_graph = load_dict_from_json_file(filename)
         else:
             raise ValueError('Unknown file extension, expected json/yml/yaml')
-        return cls._from_dict(serialized_attack_graph, model=model)
-    def get_node_by_id(self, node_id: int) -> Optional[AttackGraphNode]:
-        """
-        Return the attack node that matches the id provided.
-        Arguments:
-        node_id     - the id of the attack graph node we are looking for
-        Return:
-        The attack step node that matches the given id.
-        """
-        logger.debug('Looking up node with id %s', node_id)
-        return self._id_to_node.get(node_id)
+        return cls._from_dict(serialized_attack_graph,
+            lang_graph, model = model)
     def get_node_by_full_name(self, full_name: str) -> Optional[AttackGraphNode]:
         """
@@ -432,23 +305,9 @@ class AttackGraph():
         The attack step node that matches the given full name.
         """
-        logger.debug(f'Looking up node with full name "{full_name}"')
+        logger.debug(f'Looking up node with full name "%s"', full_name)
         return self._full_name_to_node.get(full_name)
-    def get_attacker_by_id(self, attacker_id: int) -> Optional[Attacker]:
-        """
-        Return the attacker that matches the id provided.
-        Arguments:
-        attacker_id     - the id of the attacker we are looking for
-        Return:
-        The attacker that matches the given id.
-        """
-        logger.debug(f'Looking up attacker with id {attacker_id}')
-        return self._id_to_attacker.get(attacker_id)
     def attach_attackers(self) -> None:
         """
         Create attackers and their entry point nodes and attach them to the
@@ -473,8 +332,8 @@ class AttackGraph():
             attacker = Attacker(
                 name = attacker_info.name,
-                entry_points = [],
-                reached_attack_steps = []
+                entry_points = set(),
+                reached_attack_steps = set()
             )
             self.add_attacker(attacker)
@@ -491,7 +350,170 @@ class AttackGraph():
                         continue
                     attacker.compromise(ag_node)
-            attacker.entry_points = list(attacker.reached_attack_steps)
+            attacker.entry_points = set(attacker.reached_attack_steps)
+    def _follow_expr_chain(
+            self,
+            model: Model,
+            target_assets: set[ModelAsset],
+            expr_chain: Optional[ExpressionsChain]
+        ) -> set[Any]:
+        """
+        Recursively follow a language graph expressions chain on an instance
+        model.
+        Arguments:
+        model           - a maltoolbox.model.Model on which to follow the
+                          expressions chain; it is only forwarded to the
+                          recursive calls
+        target_assets   - the set of assets that this expressions chain
+                          should apply to. Initially it will contain the
+                          asset to which the attack step belongs. This set
+                          is never modified by this method
+        expr_chain      - the expressions chain we are following, or None
+                          when there is no link left to follow
+        Return:
+        A new set containing all of the target assets.
+        Raises:
+        LanguageGraphException          - if a link, field name required by
+                                          the chain type is missing
+        LookupError                     - if a 'subType' chain has no
+                                          subtype to compare against
+        AttackGraphStepExpressionError  - if the chain type is unknown
+        """
+        if expr_chain is None:
+            # There is no expressions chain link left to follow, so return
+            # a copy of the current target assets.
+            return set(target_assets)
+        if logger.isEnabledFor(logging.DEBUG):
+            # Avoid running json.dumps when not in debug
+            logger.debug(
+                'Following Expressions Chain:\n%s',
+                json.dumps(expr_chain.to_dict(), indent = 2)
+            )
+        match (expr_chain.type):
+            case 'union' | 'intersection' | 'difference':
+                # The set operators are used to combine the left hand and
+                # right hand targets accordingly.
+                if not expr_chain.left_link:
+                    raise LanguageGraphException('"%s" step expression chain'
+                        ' is missing the left link.' % expr_chain.type)
+                if not expr_chain.right_link:
+                    raise LanguageGraphException('"%s" step expression chain'
+                        ' is missing the right link.' % expr_chain.type)
+                # Both sides start from the same target assets, which is why
+                # no branch of this method may modify that set in place.
+                lh_targets = self._follow_expr_chain(
+                    model,
+                    target_assets,
+                    expr_chain.left_link
+                )
+                rh_targets = self._follow_expr_chain(
+                    model,
+                    target_assets,
+                    expr_chain.right_link
+                )
+                match (expr_chain.type):
+                    # The targets are sets, so the native set operations
+                    # are used; each of them returns a new set.
+                    case 'union':
+                        new_target_assets = lh_targets.union(rh_targets)
+                    case 'intersection':
+                        new_target_assets = lh_targets.intersection(rh_targets)
+                    case 'difference':
+                        new_target_assets = lh_targets.difference(rh_targets)
+                return new_target_assets
+            case 'field':
+                # Change the target assets from the current ones to the
+                # associated assets given the specified field name.
+                if not expr_chain.fieldname:
+                    raise LanguageGraphException('"field" step expression '
+                        'chain is missing fieldname.')
+                new_target_assets = set()
+                # Assets that do not have the field contribute nothing.
+                new_target_assets.update(
+                    *(
+                        asset.associated_assets.get(
+                            expr_chain.fieldname, set()
+                        ) for asset in target_assets
+                      )
+                )
+                return new_target_assets
+            case 'transitive':
+                if not expr_chain.sub_link:
+                    raise LanguageGraphException('"transitive" step '
+                        'expression chain is missing sub link.')
+                # Accumulate into a copy: the caller may hand the very same
+                # set to a sibling link (e.g. both sides of a union), so the
+                # argument must not be updated in place.
+                reached_assets = set(target_assets)
+                new_assets = reached_assets
+                # Keep following the sub link from the newly found assets
+                # until it yields nothing that was not already reached.
+                while new_assets := self._follow_expr_chain(
+                    model, new_assets, expr_chain.sub_link
+                ):
+                    if not (new_assets := new_assets.difference(
+                            reached_assets)):
+                        break
+                    reached_assets.update(new_assets)
+                return reached_assets
+            case 'subType':
+                if not expr_chain.sub_link:
+                    raise LanguageGraphException('"subType" step '
+                        'expression chain is missing sub link.')
+                new_target_assets = set()
+                new_target_assets.update(
+                    self._follow_expr_chain(
+                        model, target_assets, expr_chain.sub_link
+                    )
+                )
+                # Keep only the assets whose language graph asset is a
+                # subasset of the requested subtype.
+                selected_new_target_assets = set()
+                for asset in new_target_assets:
+                    lang_graph_asset = self.lang_graph.assets[asset.type]
+                    if not lang_graph_asset:
+                        raise LookupError(
+                            f'Failed to find asset \"{asset.type}\" in the '
+                            'language graph.'
+                        )
+                    lang_graph_subtype_asset = expr_chain.subtype
+                    if not lang_graph_subtype_asset:
+                        raise LookupError(
+                            'Failed to find asset "%s" in the '
+                            'language graph.' % expr_chain.subtype
+                        )
+                    if lang_graph_asset.is_subasset_of(
+                            lang_graph_subtype_asset):
+                        selected_new_target_assets.add(asset)
+                return selected_new_target_assets
+            case 'collect':
+                if not expr_chain.left_link:
+                    raise LanguageGraphException('"collect" step expression chain'
+                        ' is missing the left link.')
+                if not expr_chain.right_link:
+                    raise LanguageGraphException('"collect" step expression chain'
+                        ' is missing the right link.')
+                # Apply the right hand link to the targets produced by the
+                # left hand link.
+                lh_targets = self._follow_expr_chain(
+                    model,
+                    target_assets,
+                    expr_chain.left_link
+                )
+                rh_targets = self._follow_expr_chain(
+                    model,
+                    lh_targets,
+                    expr_chain.right_link
+                )
+                return rh_targets
+            case _:
+                msg = 'Unknown attack expressions chain type: %s'
+                logger.error(
+                    msg,
+                    expr_chain.type
+                )
+                raise AttackGraphStepExpressionError(
+                    msg % expr_chain.type
+                )
     def _generate_graph(self) -> None:
         """
@@ -505,7 +527,7 @@ class AttackGraph():
             raise AttackGraphException(msg)
         # First, generate all of the nodes of the attack graph.
-        for asset in self.model.assets:
+        for asset in self.model.assets.values():
             logger.debug(
                 'Generating attack steps for asset %s which is of class %s.',
@@ -514,104 +536,128 @@ class AttackGraph():
             attack_step_nodes = []
-            # TODO probably part of what happens here is already done in lang_graph
-            attack_steps = self.lang_graph._get_attacks_for_asset_type(asset.type)
-            for attack_step_name, attack_step_attribs in attack_steps.items():
+            for attack_step in asset.lg_asset.attack_steps.values():
                 logger.debug(
-                    'Generating attack step node for %s.', attack_step_name
+                    'Generating attack step node for %s.', attack_step.name
                 )
                 defense_status = None
                 existence_status = None
-                node_name = asset.name + ':' + attack_step_name
+                node_name = asset.name + ':' + attack_step.name
-                match (attack_step_attribs['type']):
+                match (attack_step.type):
                     case 'defense':
                         # Set the defense status for defenses
-                        defense_status = getattr(asset, attack_step_name)
+                        defense_status = asset.defenses[attack_step.name]
                         logger.debug(
-                            'Setting the defense status of %s to %s.',
+                            'Setting the defense status of \"%s\" to "%s".',
                             node_name, defense_status
                         )
                     case 'exist' | 'notExist':
-                        # Resolve step expression associated with (non-)existence
-                        # attack steps.
-                        (target_assets, attack_step) = _process_step_expression(
-                            self.lang_graph,
-                            self.model,
-                            [asset],
-                            attack_step_attribs['requires']['stepExpressions'][0])
-                        # If the step expression resolution yielded the target
-                        # assets then the required assets exist in the model.
-                        existence_status = target_assets != []
-                mitre_info = attack_step_attribs['meta']['mitre'] if 'mitre' in\
-                    attack_step_attribs['meta'] else None
-                ag_node = AttackGraphNode(
-                    type = attack_step_attribs['type'],
-                    asset = asset,
-                    name = attack_step_name,
-                    ttc = attack_step_attribs['ttc'],
-                    children = [],
-                    parents = [],
+                        # Resolve step expression associated with
+                        # (non-)existence attack steps.
+                        existence_status = False
+                        for requirement in attack_step.requires:
+                            target_assets = self._follow_expr_chain(
+                                    self.model,
+                                    set([asset]),
+                                    requirement
+                                )
+                            # If the step expression resolution yielded
+                            # the target assets then the required assets
+                            # exist in the model.
+                            if target_assets:
+                                existence_status = True
+                                break
+                        logger.debug(
+                            'Setting the existence status of \"%s\" to '
+                            '%s.',
+                            node_name, existence_status
+                        )
+                    case _:
+                        pass
+                ag_node = self.add_node(
+                    lg_attack_step = attack_step,
+                    model_asset = asset,
                     defense_status = defense_status,
-                    existence_status = existence_status,
-                    is_viable = True,
-                    is_necessary = True,
-                    mitre_info = mitre_info,
-                    tags = attack_step_attribs['tags'],
-                    compromised_by = []
+                    existence_status = existence_status
                 )
-                ag_node.attributes = attack_step_attribs
                 attack_step_nodes.append(ag_node)
-                self.add_node(ag_node)
             asset.attack_step_nodes = attack_step_nodes
         # Then, link all of the nodes according to their associations.
-        for ag_node in self.nodes:
+        for ag_node in self.nodes.values():
             logger.debug(
                 'Determining children for attack step "%s"(%d)',
                 ag_node.full_name,
                 ag_node.id
             )
-            step_expressions = \
-                ag_node.attributes['reaches']['stepExpressions'] if \
-                    isinstance(ag_node.attributes, dict) and ag_node.attributes['reaches'] else []
-            for step_expression in step_expressions:
-                # Resolve each of the attack step expressions listed for this
-                # attack step to determine children.
-                (target_assets, attack_step) = _process_step_expression(
-                    self.lang_graph,
-                    self.model,
-                    [ag_node.asset],
-                    step_expression)
-                for target in target_assets:
-                    target_node_full_name = target.name + ':' + attack_step
-                    target_node = self.get_node_by_full_name(
-                        target_node_full_name
-                    )
-                    if not target_node:
-                        msg = ('Failed to find target node '
-                               '"%s" to link with for attack step "%s"(%d)!')
-                        logger.error(
-                            msg,
-                            target_node_full_name,
-                            ag_node.full_name,
-                            ag_node.id
-                        )
-                        raise AttackGraphStepExpressionError(
-                            msg % (
-                                target_node_full_name,
-                                ag_node.full_name,
-                                ag_node.id
-                            )
+            if not ag_node.model_asset:
+                raise AttackGraphException('Attack graph node is missing '
+                    'asset link')
+            lang_graph_asset = self.lang_graph.assets[
+                ag_node.model_asset.type]
+            lang_graph_attack_step = lang_graph_asset.attack_steps[
+                ag_node.name]
+            while lang_graph_attack_step:
+                for child in lang_graph_attack_step.children.values():
+                    for target_attack_step, expr_chain in child:
+                        target_assets = self._follow_expr_chain(
+                            self.model,
+                            set([ag_node.model_asset]),
+                            expr_chain
                         )
-                    ag_node.children.append(target_node)
-                    target_node.parents.append(ag_node)
+                        for target_asset in target_assets:
+                            if target_asset is not None:
+                                target_node_full_name = target_asset.name + \
+                                    ':' + target_attack_step.name
+                                target_node = self.get_node_by_full_name(
+                                    target_node_full_name)
+                                if target_node is None:
+                                    msg = ('Failed to find target node '
+                                           '"%s" to link with for attack '
+                                           'step "%s"(%d)!')
+                                    logger.error(
+                                        msg,
+                                        target_node_full_name,
+                                        ag_node.full_name,
+                                        ag_node.id
+                                    )
+                                    raise AttackGraphStepExpressionError(
+                                        msg % (
+                                            target_node_full_name,
+                                            ag_node.full_name,
+                                            ag_node.id
+                                        )
+                                    )
+                                assert ag_node.id is not None
+                                assert target_node.id is not None
+                                logger.debug('Linking attack step "%s"(%d) '
+                                    'to attack step "%s"(%d)' %
+                                    (
+                                        ag_node.full_name,
+                                        ag_node.id,
+                                        target_node.full_name,
+                                        target_node.id
+                                    )
+                                )
+                                ag_node.children.add(target_node)
+                                target_node.parents.add(ag_node)
+                if lang_graph_attack_step.overrides:
+                    break
+                lang_graph_attack_step = lang_graph_attack_step.inherits
     def regenerate_graph(self) -> None:
         """
@@ -619,37 +665,68 @@ class AttackGraph():
         the MAL language specification provided at initialization.
         """
-        self.nodes = []
-        self.attackers = []
+        self.nodes = {}
+        self.attackers = {}
         self._generate_graph()
     def add_node(
             self,
-            node: AttackGraphNode,
-            node_id: Optional[int] = None
-        ) -> None:
-        """Add a node to the graph
+            lg_attack_step: LanguageGraphAttackStep,
+            node_id: Optional[int] = None,
+            model_asset: Optional[ModelAsset] = None,
+            defense_status: Optional[float] = None,
+            existence_status: Optional[bool] = None
+        ) -> AttackGraphNode:
+        """Create and add a node to the graph
         Arguments:
-        node    - the node to add
-        node_id - the id to assign to this node, usually used when loading
-                  an attack graph from a file
-        """
-        if logger.isEnabledFor(logging.DEBUG):
-            # Avoid running json.dumps when not in debug
-            logger.debug(f'Add node \"{node.full_name}\" '
-                f'with id:{node_id}:\n' \
-                + json.dumps(node.to_dict(), indent = 2))
+        lg_attack_step      - the language graph attack step that corresponds
+                              to the attack graph node to create
+        node_id             - id to assign to the newly created node, usually
+                              provided only when loading an existing attack
+                              graph from a file. If not provided the id will
+                              be set to the next highest id available.
+        model_asset         - the model asset that corresponds to the attack
+                              step node. While optional it is highly
+                              recommended that this be provided. It should
+                              only be omitted if the model which was used to
+                              generate the attack graph is not available when
+                              loading an attack graph from a file.
+        defense_status      - the defense status of the node. Only relevant
+                              for defense type nodes. A value between 0.0 and
+                              1.0 is expected.
+        existence_status    - the existence status of the node. Only relevant
+                              for exist and notExist type nodes.
-        if node.id in self._id_to_node:
+        Return:
+        The newly created attack step node.
+        """
+        node_id = node_id if node_id is not None else self.next_node_id
+        if node_id in self.nodes:
             raise ValueError(f'Node index {node_id} already in use.')
+        self.next_node_id = max(node_id + 1, self.next_node_id)
-        node.id = node_id if node_id is not None else self.next_node_id
-        self.next_node_id = max(node.id + 1, self.next_node_id)
+        if logger.isEnabledFor(logging.DEBUG):
+            # Avoid formatting the debug message when not in debug
+            logger.debug('Create and add to attackgraph node of type "%s" '
+                'with id:%d.\n' % (
+                    lg_attack_step.full_name,
+                    node_id
+                ))
+        node = AttackGraphNode(
+            node_id = node_id,
+            lg_attack_step = lg_attack_step,
+            model_asset = model_asset,
+            defense_status = defense_status,
+            existence_status = existence_status
+        )
-        self.nodes.append(node)
-        self._id_to_node[node.id] = node
+        self.nodes[node_id] = node
         self._full_name_to_node[node.full_name] = node
+        return node
     def remove_node(self, node: AttackGraphNode) -> None:
         """Remove node from attack graph
         Arguments:
@@ -662,11 +739,10 @@ class AttackGraph():
             child.parents.remove(node)
         for parent in node.parents:
             parent.children.remove(node)
-        self.nodes.remove(node)
         if not isinstance(node.id, int):
             raise ValueError(f'Invalid node id.')
-        del self._id_to_node[node.id]
+        del self.nodes[node.id]
         del self._full_name_to_node[node.full_name]
     def add_attacker(
@@ -687,24 +763,26 @@ class AttackGraph():
         reached_attack_steps    - list of ids of the attack steps that the
                                   attacker has reached
         """
         if logger.isEnabledFor(logging.DEBUG):
             # Avoid running json.dumps when not in debug
             if attacker_id is not None:
                 logger.debug('Add attacker "%s" with id:%d.',
                     attacker.name,
-                    attacker_id)
+                    attacker_id
+                )
             else:
                 logger.debug('Add attacker "%s" without id.',
-                    attacker.name)
+                    attacker.name
+                )
         attacker.id = attacker_id or self.next_attacker_id
-        if attacker.id in self._id_to_attacker:
+        if attacker.id in self.attackers:
             raise ValueError(f'Attacker index {attacker_id} already in use.')
         self.next_attacker_id = max(attacker.id + 1, self.next_attacker_id)
         for node_id in reached_attack_steps:
-            node = self.get_node_by_id(node_id)
+            node = self.nodes[node_id]
             if node:
                 attacker.compromise(node)
             else:
@@ -713,16 +791,15 @@ class AttackGraph():
                 logger.error(msg, node_id)
                 raise AttackGraphException(msg % node_id)
         for node_id in entry_points:
-            node = self.get_node_by_id(int(node_id))
+            node = self.nodes[node_id]
             if node:
-                attacker.entry_points.append(node)
+                attacker.entry_points.add(node)
             else:
                 msg = ("Could not find node with id %d"
                        "in attacker entrypoints.")
                 logger.error(msg, node_id)
                 raise AttackGraphException(msg % node_id)
-        self.attackers.append(attacker)
-        self._id_to_attacker[attacker.id] = attacker
+        self.attackers[attacker.id] = attacker
     def remove_attacker(self, attacker: Attacker):
         """Remove attacker from attack graph
@@ -736,7 +813,6 @@ class AttackGraph():
                 attacker.id)
         for node in attacker.reached_attack_steps:
             attacker.undo_compromise(node)
-        self.attackers.remove(attacker)
         if not isinstance(attacker.id, int):
             raise ValueError(f'Invalid attacker id.')
-        del self._id_to_attacker[attacker.id]
+        del self.attackers[attacker.id]

mal-toolbox 0.1.12__py3-none-any.whl → 0.3.0__py3-none-any.whl

mal-toolbox 0.1.12py3-none-any.whl → 0.3.0py3-none-any.whl