PyPI - mal-toolbox - Versions diffs - 2.0.0__py3-none-any.whl → 2.1.0__py3-none-any.whl - Mend

mal-toolbox 2.0.0__py3-none-any.whl → 2.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

{mal_toolbox-2.0.0.dist-info → mal_toolbox-2.1.0.dist-info}/METADATA +2 -2
mal_toolbox-2.1.0.dist-info/RECORD +51 -0
{mal_toolbox-2.0.0.dist-info → mal_toolbox-2.1.0.dist-info}/WHEEL +1 -1
maltoolbox/__init__.py +2 -2
maltoolbox/attackgraph/__init__.py +2 -2
maltoolbox/attackgraph/attackgraph.py +121 -549
maltoolbox/attackgraph/factories.py +68 -0
maltoolbox/attackgraph/file_utils.py +0 -0
maltoolbox/attackgraph/generate.py +338 -0
maltoolbox/attackgraph/node_getters.py +36 -0
maltoolbox/attackgraph/ttcs.py +28 -0
maltoolbox/language/__init__.py +2 -2
maltoolbox/language/compiler/mal_compiler.py +4 -3
maltoolbox/language/detector.py +43 -0
maltoolbox/language/expression_chain.py +218 -0
maltoolbox/language/language_graph_asset.py +180 -0
maltoolbox/language/language_graph_assoc.py +147 -0
maltoolbox/language/language_graph_attack_step.py +129 -0
maltoolbox/language/language_graph_builder.py +282 -0
maltoolbox/language/language_graph_loaders.py +7 -0
maltoolbox/language/language_graph_lookup.py +140 -0
maltoolbox/language/language_graph_serialization.py +5 -0
maltoolbox/language/languagegraph.py +244 -1537
maltoolbox/language/step_expression_processor.py +491 -0
mal_toolbox-2.0.0.dist-info/RECORD +0 -36
{mal_toolbox-2.0.0.dist-info → mal_toolbox-2.1.0.dist-info}/entry_points.txt +0 -0
{mal_toolbox-2.0.0.dist-info → mal_toolbox-2.1.0.dist-info}/licenses/AUTHORS +0 -0
{mal_toolbox-2.0.0.dist-info → mal_toolbox-2.1.0.dist-info}/licenses/LICENSE +0 -0
{mal_toolbox-2.0.0.dist-info → mal_toolbox-2.1.0.dist-info}/top_level.txt +0 -0

maltoolbox/attackgraph/factories.py ADDED Viewed

@@ -0,0 +1,68 @@
+from __future__ import annotations
+import logging
+import zipfile
+from maltoolbox.exceptions import AttackGraphStepExpressionError
+from maltoolbox.language.languagegraph import LanguageGraph
+from maltoolbox.model import Model
+from maltoolbox.attackgraph.attackgraph import AttackGraph
+from .. import log_configs
+logger = logging.getLogger(__name__)
+def create_attack_graph(
+        lang: str | LanguageGraph,
+        model: str | Model,
+    ) -> AttackGraph:
+    """Create and return an attack graph.
+
+    Args:
+    ----
+    lang    - path to language file (.mar or .mal) or a LanguageGraph object
+    model   - path to model file (yaml or json) or a Model object
+
+    Returns:
+    -------
+    The AttackGraph built from the language graph and the model.
+
+    Raises:
+    ------
+    TypeError - if `lang` or `model` is neither a string nor the
+        expected object type
+    AttackGraphStepExpressionError - re-raised, after logging, when the
+        AttackGraph constructor raises it
+
+    """
+    # Load language
+    if isinstance(lang, LanguageGraph):
+        lang_graph = lang
+    elif isinstance(lang, str):
+        # A path was given: try it as a .mar archive first and fall back
+        # to a .mal specification when it is not a valid zip file.
+        try:
+            lang_graph = LanguageGraph.from_mar_archive(lang)
+        except zipfile.BadZipFile:
+            lang_graph = LanguageGraph.from_mal_spec(lang)
+    else:
+        raise TypeError("`lang` must be either string or LanguageGraph")
+    # Optional dumps: all three settings are tested the same way, so a
+    # missing key and an empty value both mean "do not write the file".
+    if 'langspec_file' in log_configs and log_configs['langspec_file']:
+        lang_graph.save_language_specification_to_json(
+            log_configs['langspec_file']
+        )
+    if 'langgraph_file' in log_configs and log_configs['langgraph_file']:
+        lang_graph.save_to_file(log_configs['langgraph_file'])
+    # Load model
+    if isinstance(model, Model):
+        instance_model = model
+    elif isinstance(model, str):
+        # Load from path
+        instance_model = Model.load_from_file(model, lang_graph)
+    else:
+        raise TypeError("`model` must be either string or Model")
+    if 'model_file' in log_configs and log_configs['model_file']:
+        instance_model.save_to_file(log_configs['model_file'])
+    try:
+        attack_graph = AttackGraph(lang_graph, instance_model)
+    except AttackGraphStepExpressionError:
+        logger.error(
+            'Attack graph generation failed when attempting '
+            'to resolve attack step expression!'
+        )
+        # Bare raise keeps the original traceback untouched.
+        raise
+    return attack_graph

maltoolbox/attackgraph/file_utils.py ADDED Viewed

File without changes

maltoolbox/attackgraph/generate.py ADDED Viewed

@@ -0,0 +1,338 @@
+"""Graph generation functions"""
+from __future__ import annotations
+import json
+import logging
+from typing import TYPE_CHECKING, Optional
+from maltoolbox.attackgraph.node_getters import get_node_by_full_name
+from maltoolbox.attackgraph.ttcs import get_ttc_dist
+from ..exceptions import (
+    AttackGraphException,
+    AttackGraphStepExpressionError,
+    LanguageGraphException,
+)
+from ..language import ExpressionsChain, LanguageGraphAttackStep
+from ..model import Model
+from .node import AttackGraphNode
+if TYPE_CHECKING:
+    from typing import Any
+    from ..model import ModelAsset
+logger = logging.getLogger(__name__)
+def link_node_children(
+    model: Model,
+    ag_node: AttackGraphNode,
+    full_name_to_node: dict[str, AttackGraphNode]
+) -> None:
+    """Connect `ag_node` to every child its language attack step defines.
+
+    The attack step named like the node is looked up on the language graph
+    asset of the node's model asset. Its children are linked first, then
+    those of each inherited step in turn; the walk ends after the first
+    step flagged as overriding, or when there is nothing left to inherit.
+
+    Raises AttackGraphException if the node has no model asset.
+    """
+    model_asset = ag_node.model_asset
+    if not model_asset:
+        raise AttackGraphException('Attack graph node is missing asset link')
+    step: LanguageGraphAttackStep | None = (
+        model.lang_graph.assets[model_asset.type].attack_steps[ag_node.name]
+    )
+    while step:
+        for child_type, chains in step.children.items():
+            for chain in chains:
+                link_from_expr_chain(
+                    model, ag_node, child_type, chain, full_name_to_node
+                )
+        # An overriding step ends the walk up the inheritance chain.
+        step = None if step.overrides else step.inherits
+def link_from_expr_chain(
+    model: Model,
+    ag_node: AttackGraphNode,
+    child_type: LanguageGraphAttackStep,
+    expr_chain: ExpressionsChain | None,
+    full_name_to_node: dict[str, AttackGraphNode]
+) -> None:
+    """Link `ag_node` to the nodes one expression chain points at.
+
+    The chain is followed from the node's own model asset. For every
+    resulting asset the node named "<asset name>:<child step name>" is
+    looked up and the two nodes are connected in both directions
+    (children on `ag_node`, parents on the target).
+
+    Raises:
+    ------
+    AttackGraphException - if `ag_node` has no model asset
+    AttackGraphStepExpressionError - if the lookup returns a falsy node
+    """
+    source_asset = ag_node.model_asset
+    if not source_asset:
+        raise AttackGraphException(
+            "Need model asset connection to generate graph"
+        )
+    for target_asset in follow_expr_chain(model, {source_asset}, expr_chain):
+        if not target_asset:
+            continue
+        target_full_name = f"{target_asset.name}:{child_type.name}"
+        target_node = get_node_by_full_name(full_name_to_node, target_full_name)
+        # NOTE(review): get_node_by_full_name raises LookupError itself for
+        # an unknown name, so this guard only fires for a falsy stored node.
+        if not target_node:
+            raise AttackGraphStepExpressionError(
+                f'Failed to find target node "{target_full_name}" '
+                f'for "{ag_node.full_name}"({ag_node.id})'
+            )
+        logger.debug(
+            'Linking attack step "%s"(%d) to attack step "%s"(%d)',
+            ag_node.full_name, ag_node.id,
+            target_node.full_name, target_node.id
+        )
+        ag_node.children.add(target_node)
+        target_node.parents.add(ag_node)
+def follow_field_expr_chain(
+    target_assets: set[ModelAsset], expr_chain: ExpressionsChain
+):
+    """Step from each asset to the assets associated through one field.
+
+    Returns a new set holding, for every asset in `target_assets`, whatever
+    its `associated_assets` mapping stores under `expr_chain.fieldname`.
+    Assets without that field contribute nothing.
+
+    Raises LanguageGraphException if the chain has no fieldname.
+    """
+    field = expr_chain.fieldname
+    if not field:
+        raise LanguageGraphException(
+            '"field" step expression chain is missing fieldname.'
+        )
+    reached: set[ModelAsset] = set()
+    for asset in target_assets:
+        reached.update(asset.associated_assets.get(field, set()))
+    return reached
+def follow_transitive_expr_chain(
+    model: Model,
+    target_assets: set[ModelAsset],
+    expr_chain: ExpressionsChain
+):
+    """Follow `expr_chain.sub_link` repeatedly until no new asset appears.
+
+    Returns a new set containing the starting assets plus every asset
+    reachable from them by applying the sub link any number of times.
+    The caller's `target_assets` set is left untouched: callers such as
+    the union/intersection/difference handler reuse the same set for
+    their other operand.
+
+    Raises LanguageGraphException if the chain has no sub link.
+    """
+    if not expr_chain.sub_link:
+        raise LanguageGraphException(
+            '"transitive" step expression chain is missing sub link.'
+        )
+    # Work on copies so the input set is never mutated.
+    reached = set(target_assets)
+    frontier = set(reached)
+    while frontier:
+        # Only assets not seen before need to be expanded next round;
+        # this also guarantees termination on cyclic associations.
+        frontier = set(
+            follow_expr_chain(model, frontier, expr_chain.sub_link)
+        ) - reached
+        reached |= frontier
+    return reached
+def follow_subtype_expr_chain(
+    model: Model,
+    target_assets: set[ModelAsset],
+    expr_chain: ExpressionsChain
+):
+    """Follow the sub link and keep only assets of the requested subtype.
+
+    The sub link is followed from `target_assets`; an asset is kept when
+    its language graph asset reports `is_subasset_of(expr_chain.subtype)`.
+
+    Raises:
+    ------
+    LanguageGraphException - if the chain has no sub link
+    LookupError - if an asset's language graph entry or the chain's
+        subtype is falsy
+    """
+    if not expr_chain.sub_link:
+        raise LanguageGraphException(
+            '"subType" step expression chain is missing sub link.'
+        )
+    new_target_assets = set(
+        follow_expr_chain(model, target_assets, expr_chain.sub_link)
+    )
+    selected_new_target_assets = set()
+    for asset in new_target_assets:
+        lang_graph_asset = model.lang_graph.assets[asset.type]
+        if not lang_graph_asset:
+            raise LookupError(
+                f'Failed to find asset "{asset.type}" in the '
+                'language graph.'
+            )
+        lang_graph_subtype_asset = expr_chain.subtype
+        if not lang_graph_subtype_asset:
+            # f-string so the offending subtype value actually shows up
+            # in the message instead of the literal placeholder text.
+            raise LookupError(
+                f'Failed to find asset "{expr_chain.subtype}" in '
+                'the language graph.'
+            )
+        if lang_graph_asset.is_subasset_of(lang_graph_subtype_asset):
+            selected_new_target_assets.add(asset)
+    return selected_new_target_assets
+def follow_union_intersection_difference_expr_chain(
+    model: Model,
+    target_assets: set[ModelAsset],
+    expr_chain: ExpressionsChain
+) -> set[Any]:
+    """Combine the left and right link targets with a set operator.
+
+    Both links are followed from the same `target_assets`; the two results
+    are combined according to `expr_chain.type`, which must be 'union',
+    'intersection' or 'difference'.
+
+    Raises:
+    ------
+    LanguageGraphException - if the left or the right link is missing
+    ValueError - if `expr_chain.type` is none of the three operators
+    """
+    # Exceptions do not apply logging-style "%s" arguments, so the chain
+    # type is interpolated into the message here.
+    if not expr_chain.left_link:
+        raise LanguageGraphException(
+            f'"{expr_chain.type}" step expression chain is missing '
+            'the left link.'
+        )
+    if not expr_chain.right_link:
+        raise LanguageGraphException(
+            f'"{expr_chain.type}" step expression chain is missing '
+            'the right link.'
+        )
+    lh_targets = follow_expr_chain(
+        model, target_assets, expr_chain.left_link
+    )
+    rh_targets = follow_expr_chain(
+        model, target_assets, expr_chain.right_link
+    )
+    if expr_chain.type == 'union':
+        return lh_targets.union(rh_targets)
+    if expr_chain.type == 'intersection':
+        return lh_targets.intersection(rh_targets)
+    if expr_chain.type == 'difference':
+        return lh_targets.difference(rh_targets)
+    raise ValueError("Expr chain must be of type union, intersection or difference")
+def follow_collect_expr_chain(
+    model: Model,
+    target_assets: set[ModelAsset],
+    expr_chain: ExpressionsChain
+) -> set[Any]:
+    """Follow the left link, then the right link from each left result.
+
+    Returns the union of everything the right link reaches when started
+    separately from each asset produced by the left link.
+
+    Raises LanguageGraphException if either link is missing.
+    """
+    left, right = expr_chain.left_link, expr_chain.right_link
+    if not left:
+        raise LanguageGraphException(
+            '"collect" step expression chain missing the left link.'
+        )
+    if not right:
+        raise LanguageGraphException(
+            '"collect" step expression chain missing the right link.'
+        )
+    intermediate = follow_expr_chain(model, target_assets, left)
+    # Each intermediate asset is expanded on its own, as a one-element set.
+    return set().union(
+        *(follow_expr_chain(model, {step}, right) for step in intermediate)
+    )
+def follow_expr_chain(
+    model: Model,
+    target_assets: set[ModelAsset],
+    expr_chain: Optional[ExpressionsChain]
+):
+    """Resolve an expressions chain starting from `target_assets`.
+
+    Dispatches on `expr_chain.type` to the matching follow_* helper and
+    returns its result. With no chain (None) a copy of `target_assets`
+    is returned.
+
+    Raises AttackGraphStepExpressionError for an unknown chain type.
+    """
+    if expr_chain is None:
+        # Nothing left to follow: the current assets are the answer.
+        return set(target_assets)
+    if logger.isEnabledFor(logging.DEBUG):
+        # Serialising the chain is only worth it when debug output is on.
+        logger.debug(
+            'Following Expressions Chain:\n%s',
+            json.dumps(expr_chain.to_dict(), indent=2)
+        )
+    chain_type = expr_chain.type
+    if chain_type in ('union', 'intersection', 'difference'):
+        return follow_union_intersection_difference_expr_chain(
+            model, target_assets, expr_chain
+        )
+    if chain_type == 'field':
+        return follow_field_expr_chain(target_assets, expr_chain)
+    if chain_type == 'transitive':
+        return follow_transitive_expr_chain(model, target_assets, expr_chain)
+    if chain_type == 'subType':
+        return follow_subtype_expr_chain(model, target_assets, expr_chain)
+    if chain_type == 'collect':
+        return follow_collect_expr_chain(model, target_assets, expr_chain)
+    msg = 'Unknown attack expressions chain type: %s'
+    logger.error(msg, chain_type)
+    raise AttackGraphStepExpressionError(msg % chain_type)
+def link_nodes_by_language(
+    model: Model, full_name_to_node: dict[str, AttackGraphNode]
+):
+    """Link every node in `full_name_to_node` to its children."""
+    for node in full_name_to_node.values():
+        link_node_children(model, node, full_name_to_node)
+def create_nodes_from_model(model: Model):
+    """Create one attack graph node per attack step of every model asset.
+
+    Node ids are assigned sequentially starting at 0. Returns the tuple
+    (id_to_node, attack_steps, defense_steps, full_name_to_node), where
+    attack_steps holds the 'or'/'and' nodes and defense_steps the
+    'defense' nodes. Each asset's `attack_step_nodes` list is rebuilt
+    as a side effect.
+    """
+    nodes_by_id = {}
+    nodes_by_full_name = {}
+    attack_nodes = []
+    defense_nodes = []
+    next_id = 0
+    for asset in model.assets.values():
+        asset.attack_step_nodes = [] # TODO: deprecate this
+        for lg_step in asset.lg_asset.attack_steps.values():
+            ttc = get_ttc_dist(asset, lg_step)
+            existence = get_existance_status(model, asset, lg_step)
+            new_node = AttackGraphNode(
+                node_id=next_id,
+                lg_attack_step=lg_step,
+                model_asset=asset,
+                ttc_dist=ttc,
+                existence_status=existence,
+            )
+            next_id += 1
+            asset.attack_step_nodes.append(new_node) # TODO: deprecate this
+            nodes_by_id[new_node.id] = new_node
+            nodes_by_full_name[new_node.full_name] = new_node
+            if new_node.type in ('or', 'and'):
+                attack_nodes.append(new_node)
+            elif new_node.type == 'defense':
+                defense_nodes.append(new_node)
+    return nodes_by_id, attack_nodes, defense_nodes, nodes_by_full_name
+def generate_graph(model: Model):
+    """Create all nodes for `model`, link them, and return the lookups.
+
+    Returns (id_to_node, attack_steps, defense_steps, full_name_to_node)
+    as produced by create_nodes_from_model, after the nodes were linked.
+    """
+    created = create_nodes_from_model(model)
+    id_to_node, attack_steps, defense_steps, full_name_to_node = created
+    link_nodes_by_language(model, full_name_to_node)
+    return id_to_node, attack_steps, defense_steps, full_name_to_node
+def get_existance_status(
+        model: Model,
+        asset: ModelAsset,
+        lg_attack_step: LanguageGraphAttackStep
+    ):
+    """Tell whether any requirement of an exist/notExist step is met.
+
+    Returns None for steps of any other type. Otherwise returns True as
+    soon as one of the step's `requires` chains, followed from `asset`,
+    yields at least one asset, and False when none does.
+    """
+    if lg_attack_step.type not in ('exist', 'notExist'):
+        # Existence only applies to exist/notExist steps.
+        return None
+    # A non-empty result means the required assets are present in the
+    # model; any() stops at the first requirement that resolves.
+    return any(
+        follow_expr_chain(model, {asset}, requirement)
+        for requirement in lg_attack_step.requires
+    )

maltoolbox/attackgraph/node_getters.py ADDED Viewed

@@ -0,0 +1,36 @@
+"""MAL-Toolbox Attack Graph Module
+"""
+from __future__ import annotations
+import logging
+from ..str_utils import levenshtein_distance
+from .node import AttackGraphNode
+logger = logging.getLogger(__name__)
+def get_similar_full_names(
+    full_name_to_node: dict[str, AttackGraphNode], q: str
+):
+    """Return the known full names closest to `q`.
+
+    Closeness is the value of levenshtein_distance(q, name). All names
+    sharing the smallest distance are returned in dictionary order; names
+    more than 100 away are never suggested, so the list may be empty.
+    """
+    distances = {
+        name: levenshtein_distance(q, name) for name in full_name_to_node
+    }
+    closest = min(distances.values(), default=100)
+    if closest > 100:
+        return []
+    return [name for name, dist in distances.items() if dist == closest]
+def get_node_by_full_name(full_name_to_node: dict[str, AttackGraphNode], full_name: str):
+    """Return the node stored under `full_name`.
+
+    Raises LookupError, listing the most similar known names, when no
+    node has that full name.
+    """
+    logger.debug('Looking up node with full name "%s"', full_name)
+    if full_name in full_name_to_node:
+        return full_name_to_node[full_name]
+    suggestions = ", ".join(
+        get_similar_full_names(full_name_to_node, full_name)
+    )
+    raise LookupError(
+        f'Could not find node with name "{full_name}". '
+        f'Did you mean: {suggestions}?'
+    )

maltoolbox/attackgraph/ttcs.py ADDED Viewed

@@ -0,0 +1,28 @@
+import copy
+import logging
+from maltoolbox.language.language_graph_attack_step import LanguageGraphAttackStep
+from maltoolbox.model import ModelAsset
+logger = logging.getLogger(__name__)
+def get_ttc_dist(
+    asset: ModelAsset, attack_step: LanguageGraphAttackStep
+):
+    """Return the TTC distribution to use for a step on a given asset.
+
+    Normally this is a deep copy of the language step's `ttc`. For a
+    defense step whose name appears in `asset.defenses`, a Bernoulli
+    function description carrying that value (as a float) is returned
+    instead.
+    """
+    language_ttc = copy.deepcopy(attack_step.ttc)
+    is_defense = attack_step.type == 'defense'
+    if not is_defense or attack_step.name not in asset.defenses:
+        return language_ttc
+    # The model sets this defense explicitly, which overrides the language.
+    defense_value = float(asset.defenses[attack_step.name])
+    overridden_ttc = {
+        'arguments': [defense_value],
+        'name': 'Bernoulli',
+        'type': 'function'
+    }
+    logger.debug(
+        'Setting defense \"%s\" to "%s".',
+        asset.name + ":" + attack_step.name, defense_value
+    )
+    return overridden_ttc

maltoolbox/language/__init__.py CHANGED Viewed

@@ -1,8 +1,8 @@
 """Contains tools to process MAL languages"""
+from .detector import Context, Detector
 from .languagegraph import (
-    Context,
-    Detector,
     ExpressionsChain,
     LanguageGraph,
     LanguageGraphAsset,

maltoolbox/language/compiler/mal_compiler.py CHANGED Viewed

@@ -440,7 +440,8 @@ class MalCompiler(ParseTreeVisitor):
         detectors: dict[str, Any] = {}
         while assert_node(cursor.node).type == 'detector':
             detector = self.visit(cursor)
-            detector[detector['name']] = detector
+            detector_name = str(detector['name'])
+            detectors[detector_name] = detector
             if not go_to_sibling(cursor):  # in case there is nothing after the meta
                 break
@@ -536,8 +537,8 @@ class MalCompiler(ParseTreeVisitor):
         ###############
         # (type) (id) #
         ###############
-        asset = node_text(cursor, 'asset')
-        label = node_text(cursor, 'label')
+        asset = node_text(cursor, 'asset').decode('utf-8')
+        label = node_text(cursor, 'label').decode('utf-8')
         return (label, asset)

maltoolbox/language/detector.py ADDED Viewed

@@ -0,0 +1,43 @@
+"""Detector functionality
+- A detector represents a logging rule on an attack step
+- It includes a context and a name
+"""
+from __future__ import annotations
+from dataclasses import dataclass
+@dataclass(frozen=True, eq=True)
+class Detector:
+    """Immutable description of one detector: name, context, type, tprate."""
+    # Detector name, if any.
+    name: str | None
+    # Context object; must provide to_dict() for serialisation.
+    context: Context
+    # Detector type, if any.
+    type: str | None
+    # True-positive-rate description, stored and serialised as given.
+    tprate: dict | None
+    def to_dict(self) -> dict:
+        """Return the detector as a plain dict with the context serialised."""
+        serialized = {"context": self.context.to_dict()}
+        serialized["name"] = self.name
+        serialized["type"] = self.type
+        serialized["tprate"] = self.tprate
+        return serialized
+class Context(dict):
+    """Context is part of detectors to provide meta data about attackers.
+
+    Behaves as a dict mapping each label to an asset object and also
+    exposes every label as an attribute. Assets must have a `name`
+    attribute for `to_dict`, `str()` and `repr()` to work.
+    """
+    def __init__(self, context) -> None:
+        """Build the context from a label -> asset mapping."""
+        super().__init__(context)
+        # The mapping that was passed in is still stored under its
+        # original attribute name in case external code reads it.
+        self._context_dict = context
+        for label, asset in context.items():
+            setattr(self, label, asset)
+    def to_dict(self) -> dict:
+        """Return a plain dict mapping each label to its asset's name."""
+        return {label: asset.name for label, asset in self.items()}
+    def __str__(self) -> str:
+        # Same view as to_dict(), so str() always reflects the current
+        # dict contents rather than the mapping given at construction.
+        return str(self.to_dict())
+    def __repr__(self) -> str:
+        # Balanced parentheses: Context({...})
+        return f"Context({self!s})"

mal-toolbox 2.0.0__py3-none-any.whl → 2.1.0__py3-none-any.whl

mal-toolbox 2.0.0__py3-none-any.whl → 2.1.0__py3-none-any.whl