PyPI - mal-toolbox - Versions diffs - 0.0.28__py3-none-any.whl → 0.1.12__py3-none-any.whl - Mend

mal-toolbox 0.0.28__py3-none-any.whl → 0.1.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

{mal_toolbox-0.0.28.dist-info → mal_toolbox-0.1.12.dist-info}/METADATA +60 -28
mal_toolbox-0.1.12.dist-info/RECORD +32 -0
{mal_toolbox-0.0.28.dist-info → mal_toolbox-0.1.12.dist-info}/WHEEL +1 -1
maltoolbox/__init__.py +31 -31
maltoolbox/__main__.py +80 -4
maltoolbox/attackgraph/__init__.py +8 -0
maltoolbox/attackgraph/analyzers/__init__.py +0 -0
maltoolbox/attackgraph/analyzers/apriori.py +173 -27
maltoolbox/attackgraph/attacker.py +84 -25
maltoolbox/attackgraph/attackgraph.py +503 -215
maltoolbox/attackgraph/node.py +92 -31
maltoolbox/attackgraph/query.py +125 -19
maltoolbox/default.conf +8 -7
maltoolbox/exceptions.py +45 -0
maltoolbox/file_utils.py +66 -0
maltoolbox/ingestors/__init__.py +0 -0
maltoolbox/ingestors/neo4j.py +95 -84
maltoolbox/language/__init__.py +4 -0
maltoolbox/language/classes_factory.py +145 -64
maltoolbox/language/{lexer_parser/__main__.py → compiler/__init__.py} +5 -12
maltoolbox/language/{lexer_parser → compiler}/mal_lexer.py +1 -1
maltoolbox/language/{lexer_parser → compiler}/mal_parser.py +1 -1
maltoolbox/language/{lexer_parser → compiler}/mal_visitor.py +4 -5
maltoolbox/language/languagegraph.py +569 -168
maltoolbox/model.py +858 -0
maltoolbox/translators/__init__.py +0 -0
maltoolbox/translators/securicad.py +76 -52
maltoolbox/translators/updater.py +132 -0
maltoolbox/wrappers.py +62 -0
mal_toolbox-0.0.28.dist-info/RECORD +0 -26
maltoolbox/cl_parser.py +0 -89
maltoolbox/language/specification.py +0 -265
maltoolbox/main.py +0 -84
maltoolbox/model/model.py +0 -282
{mal_toolbox-0.0.28.dist-info → mal_toolbox-0.1.12.dist-info}/AUTHORS +0 -0
{mal_toolbox-0.0.28.dist-info → mal_toolbox-0.1.12.dist-info}/LICENSE +0 -0
{mal_toolbox-0.0.28.dist-info → mal_toolbox-0.1.12.dist-info}/top_level.txt +0 -0

maltoolbox/language/languagegraph.py CHANGED Viewed

@@ -2,30 +2,45 @@
 MAL-Toolbox Language Graph Module
 """
+from __future__ import annotations
+import copy
 import logging
 import json
-from dataclasses import dataclass
-from typing import Any, List, Optional, ForwardRef
-from maltoolbox.language import specification
+import zipfile
+from dataclasses import dataclass, field
+from typing import Any, Optional
+from maltoolbox.file_utils import (
+    load_dict_from_yaml_file, load_dict_from_json_file,
+    save_dict_to_file
+)
+from .compiler import MalCompiler
+from ..exceptions import (
+    LanguageGraphAssociationError,
+    LanguageGraphStepExpressionError,
+    LanguageGraphException,
+    LanguageGraphSuperAssetNotFoundError
+)
 logger = logging.getLogger(__name__)
 @dataclass
 class LanguageGraphAsset:
-    name: str = None
-    associations: List[ForwardRef('LanguageGraphAssociation')] = None
-    attack_steps: List[ForwardRef('LanguageGraphAttackStep')] = None
-    description: dict = None
+    name: Optional[str] = None
+    associations: list[LanguageGraphAssociation] = field(default_factory=lambda: [])
+    attack_steps: list[LanguageGraphAttackStep] = field(default_factory=lambda: [])
+    description: dict = field(default_factory=lambda: {})
     # MAL languages currently do not support multiple inheritance, but this is
     # futureproofing at its most hopeful.
-    super_assets: list = None
-    sub_assets: list = None
+    super_assets: list = field(default_factory=lambda: [])
+    sub_assets: list = field(default_factory=lambda: [])
+    is_abstract: Optional[bool] = None
-    def to_dict(self):
-        node_dict = {
+    def to_dict(self) -> dict:
+        """Convert LanguageGraphAsset to dictionary"""
+        node_dict: dict[str, Any] = {
             'name': self.name,
             'associations': [],
             'attack_steps': [],
@@ -46,7 +61,10 @@ class LanguageGraphAsset:
             node_dict['sub_assets'].append(sub_asset.name)
         return node_dict
-    def is_subasset_of(self, target_asset):
+    def __repr__(self) -> str:
+        return str(self.to_dict())
+    def is_subasset_of(self, target_asset: LanguageGraphAsset) -> bool:
         """
         Check if an asset extends the target asset through inheritance.
@@ -66,7 +84,7 @@ class LanguageGraphAsset:
             current_assets.extend(current_asset.super_assets)
         return False
-    def get_all_subassets(self):
+    def get_all_subassets(self) -> list[LanguageGraphAsset]:
         """
         Return a list of all of the assets that directly or indirectly extend
         this asset.
@@ -82,7 +100,7 @@ class LanguageGraphAsset:
             subassets.extend(current_asset.sub_assets)
         return subassets
-    def get_all_superassets(self):
+    def get_all_superassets(self) -> list[LanguageGraphAsset]:
         """
         Return a list of all of the assets that this asset directly or
         indirectly extends.
@@ -98,6 +116,20 @@ class LanguageGraphAsset:
             superassets.extend(current_asset.super_assets)
         return superassets
+    def get_all_common_superassets(
+            self, other: LanguageGraphAsset
+        ) -> set[Optional[str]]:
+        """Return a set of all common ancestors between this asset
+        and the other asset given as parameter"""
+        self_superassets = set(
+            asset.name for asset in self.get_all_superassets()
+        )
+        other_superassets = set(
+            asset.name for asset in other.get_all_superassets()
+        )
+        return self_superassets.intersection(other_superassets)
 @dataclass
 class LanguageGraphAssociationField:
     asset: LanguageGraphAsset
@@ -105,14 +137,16 @@ class LanguageGraphAssociationField:
     minimum: int
     maximum: int
 @dataclass
 class LanguageGraphAssociation:
     name: str
     left_field: LanguageGraphAssociationField
     right_field: LanguageGraphAssociationField
-    description: dict = None
+    description: Optional[dict] = None
-    def to_dict(self):
+    def to_dict(self) -> dict:
+        """Convert LanguageGraphAssociation to dictionary"""
         node_dict = {
             'name': self.name,
             'left': {
@@ -132,7 +166,10 @@ class LanguageGraphAssociation:
         return node_dict
-    def contains_fieldname(self, fieldname):
+    def __repr__(self) -> str:
+        return str(self.to_dict())
+    def contains_fieldname(self, fieldname: str) -> bool:
         """
         Check if the association contains the field name given as a parameter.
@@ -147,7 +184,7 @@ class LanguageGraphAssociation:
             return True
         return False
-    def contains_asset(self, asset):
+    def contains_asset(self, asset: Any) -> bool:
         """
         Check if the association matches the asset given as a parameter. A
         match can either be an explicit one or if the asset given subassets
@@ -164,7 +201,7 @@ class LanguageGraphAssociation:
             return True
         return False
-    def get_opposite_fieldname(self, fieldname):
+    def get_opposite_fieldname(self, fieldname: str) -> str:
         """
         Return the opposite field name if the association contains the field
         name given as a parameter.
@@ -179,11 +216,14 @@ class LanguageGraphAssociation:
         if self.right_field.fieldname == fieldname:
             return self.left_field.fieldname
-        logger.warning(f'Requested fieldname \"{fieldname}\" from '
-            f'association {self.name} which did not contain it!')
-        return None
+        msg = ('Requested fieldname "%s" from association '
+               '%s which did not contain it!')
+        logger.error(msg, fieldname, self.name)
+        raise LanguageGraphAssociationError(msg % (fieldname, self.name))
-    def get_opposite_asset(self, asset):
+    def get_opposite_asset(
+            self, asset: LanguageGraphAsset
+        ) -> Optional[LanguageGraphAsset]:
         """
         Return the opposite asset if the association matches the asset given
         as a parameter. A match can either be an explicit one or if the asset
@@ -203,22 +243,30 @@ class LanguageGraphAssociation:
         if asset.is_subasset_of(self.right_field.asset):
             return self.left_field.asset
-        logger.warning(f'Requested asset \"{asset.name}\" from '
-            f'association {self.name} which did not contain it!')
+        logger.warning(
+            'Requested asset "%s" from association %s'
+            'which did not contain it!', asset.name, self.name
+        )
         return None
 @dataclass
 class LanguageGraphAttackStep:
-    name: str = None
-    type: str = None
-    asset: List[ForwardRef('LanguageGraphAsset')] = None
-    ttc: dict = None
-    children: dict = None
-    parents: dict = None
-    description: dict = None
-    def to_dict(self):
-        node_dict = {
+    name: str
+    type: str
+    asset: LanguageGraphAsset
+    ttc: dict = field(default_factory = lambda: {})
+    children: dict = field(default_factory = lambda: {})
+    parents: dict = field(default_factory = lambda: {})
+    description: dict = field(default_factory = lambda: {})
+    attributes: Optional[dict] = None
+    @property
+    def qualified_name(self) -> str:
+        return f"{self.asset.name}:{self.name}"
+    def to_dict(self) -> dict:
+        node_dict: dict[Any, Any] = {
             'name': self.name,
             'type': self.type,
             'asset': self.asset.name,
@@ -248,11 +296,20 @@ class LanguageGraphAttackStep:
         return node_dict
+    def __repr__(self) -> str:
+        return str(self.to_dict())
 class DependencyChain:
-    def __init__(self, type, next_link):
+    def __init__(self, type: str, next_link: Optional[DependencyChain]):
         self.type = type
-        self.next_link = next_link
+        self.next_link: Optional[DependencyChain] = next_link
+        self.fieldname: str = ""
+        self.association: Optional[LanguageGraphAssociation] = None
+        self.left_chain: Optional[DependencyChain] = None
+        self.right_chain: Optional[DependencyChain] = None
+        self.subtype: Optional[Any] = None
+        self.current_link: Optional[DependencyChain] = None
     def __iter__(self):
         self.current_link = self
@@ -265,55 +322,97 @@ class DependencyChain:
             return dep_chain
         raise StopIteration
-    def to_dict(self):
+    def to_dict(self) -> dict:
+        """Convert DependencyChain to dictionary"""
         match (self.type):
             case 'union' | 'intersection' | 'difference':
                 return {self.type: {
-                    'left': self.left_chain.to_dict(),
+                    'left': self.left_chain.to_dict()
+                            if self.left_chain else {},
                     'right': self.right_chain.to_dict()
+                             if self.right_chain else {}
                     }
                 }
             case 'field':
-                association = self.association
-                return {association.name:
+                if not self.association:
+                    raise LanguageGraphAssociationError("Missing association for dep chain")
+                return {self.association.name:
                     {'fieldname': self.fieldname,
                      'next_association':
-                          self.next_link.to_dict() if self.next_link else None
+                            self.next_link.to_dict()
+                            if self.next_link else {}
+                        }
                     }
-                }
             case 'transitive':
                 return {'transitive':
                     self.next_link.to_dict()
+                    if self.next_link else {}
                 }
             case 'subType':
+                if not self.subtype:
+                    raise LanguageGraphException(
+                        "No subtype for dependency chain"
+                    )
+                if not self.next_link:
+                    raise LanguageGraphException(
+                        "No next link for subtype dependency chain"
+                    )
                 return {'subType': self.subtype.name,
                     'expression': self.next_link.to_dict()
                 }
             case _:
-                logger.error('Unknown associations chain element '
-                    f'{self.type}!')
-                return None
+                msg = 'Unknown associations chain element %s!'
+                logger.error(msg, self.type)
+                raise LanguageGraphAssociationError(msg % self.type)
+    def __repr__(self) -> str:
+        return str(self.to_dict())
+class LanguageGraph():
+    """Graph representation of a MAL language"""
+    def __init__(self, lang: dict):
+        self.assets: list = []
+        self.associations: list = []
+        self.attack_steps: list = []
+        self._lang_spec: dict = lang
+        self.metadata = {
+            "version": lang["defines"]["version"],
+            "id": lang["defines"]["id"],
+        }
+        self._generate_graph()
+    @classmethod
+    def from_mal_spec(cls, mal_spec_file: str) -> LanguageGraph:
+        """
+        Create a LanguageGraph from a .mal file (a MAL spec).
-class LanguageGraph:
-    def __init__(self):
-        self.assets = []
-        self.associations = []
-        self.attack_steps = []
+        Arguments:
+        mal_spec_file   -   the path to the .mal file
+        """
+        logger.info("Loading mal spec %s", mal_spec_file)
+        return LanguageGraph(MalCompiler().compile(mal_spec_file))
-    def save_to_file(self, filename: str):
+    @classmethod
+    def from_mar_archive(cls, mar_archive: str) -> LanguageGraph:
         """
-        Save the language graph to a json file.
+        Create a LanguageGraph from a ".mar" archive provided by malc
+        (https://github.com/mal-lang/malc).
         Arguments:
-        filename        - the name of the output file
+        mar_archive     -   the path to a ".mar" archive
         """
+        logger.info('Loading mar archive %s', mar_archive)
+        with zipfile.ZipFile(mar_archive, 'r') as archive:
+            langspec = archive.read('langspec.json')
+            return LanguageGraph(json.loads(langspec))
-        logger.info(f'Saving language graph to \"{filename}\" file.')
+    def _to_dict(self):
+        """Converts LanguageGraph into a dict"""
         serialized_assets = []
         for asset in self.assets:
             serialized_assets.append(asset.to_dict())
@@ -323,24 +422,67 @@ class LanguageGraph:
         serialized_attack_steps = []
         for attack_step in self.attack_steps:
             serialized_attack_steps.append(attack_step.to_dict())
-        logger.debug(f'Saving {len(serialized_assets)} assets, '
-            f'{len(serialized_associations)} associations, and '
-            f'{len(serialized_attack_steps)} attack steps to '
-            f'\"{filename}\" file')
+        logger.debug(
+            'Serializing %s assets, %s associations, and %s attack steps',
+            len(serialized_assets), len(serialized_associations),
+            len(serialized_attack_steps)
+        )
         serialized_graph = {
             'Assets': serialized_assets,
             'Associations': serialized_associations,
             'Attack Steps': serialized_attack_steps
         }
-        with open(filename, 'w', encoding='utf-8') as file:
-            json.dump(serialized_graph, file, indent=4)
+        return serialized_graph
+    def save_to_file(self, filename: str) -> None:
+        """Save to json/yml depending on extension"""
+        return save_dict_to_file(filename, self._to_dict())
+    @classmethod
+    def _from_dict(cls, serialized_object: dict) -> None:
+        raise NotImplementedError(
+            "Converting from dict feature is not implemented yet")
+    @classmethod
+    def load_from_file(cls, filename: str) -> LanguageGraph:
+        """Create LanguageGraph from mal, mar, yaml or json"""
+        lang_graph = None
+        if filename.endswith('.mal'):
+            lang_graph = cls.from_mal_spec(filename)
+        elif filename.endswith('.mar'):
+            lang_graph = cls.from_mar_archive(filename)
+        elif filename.endswith(('yaml', 'yml')):
+            lang_graph = cls._from_dict(load_dict_from_yaml_file(filename))
+        elif filename.endswith(('json')):
+            lang_graph = cls._from_dict(load_dict_from_json_file(filename))
+        if lang_graph:
+            return lang_graph
+        raise TypeError(
+            "Unknown file extension, expected json/mal/mar/yml/yaml"
+        )
+    def save_language_specification_to_json(self, filename: str) -> None:
+        """
+        Save a MAL language specification dictionary to a JSON file
+        Arguments:
+        filename        - the JSON filename where the language specification will be written
+        """
+        logger.info('Save language specification to %s', filename)
+        with open(filename, 'w', encoding='utf-8') as file:
+            json.dump(self._lang_spec, file, indent=4)
     def process_step_expression(self,
-        lang: dict,
-        target_asset,
-        dep_chain,
-        step_expression: dict):
+            lang: dict,
+            target_asset,
+            dep_chain,
+            step_expression: dict
+        ) -> tuple:
         """
         Recursively process an attack step expression.
@@ -363,8 +505,13 @@ class LanguageGraph:
         A tuple triplet containing the target asset, the resulting parent
         associations chain, and the name of the attack step.
         """
-        logger.debug('Processing Step Expression:\n' \
-            + json.dumps(step_expression, indent = 2))
+        if logger.isEnabledFor(logging.DEBUG):
+            # Avoid running json.dumps when not in debug
+            logger.debug(
+                'Processing Step Expression:\n%s',
+                json.dumps(step_expression, indent = 2)
+            )
         match (step_expression['type']):
             case 'attackStep':
@@ -383,10 +530,12 @@ class LanguageGraph:
                 rh_target_asset, rh_dep_chain, _ = self.process_step_expression(
                     lang, target_asset, dep_chain, step_expression['rhs'])
-                if lh_target_asset != rh_target_asset:
-                    logger.error('Set operation has different target asset '
-                        'types for each side of the expression: '
-                        f'{lh_target_asset.name} and {rh_target_asset.name}!')
+                if not lh_target_asset.get_all_common_superassets(rh_target_asset):
+                    logger.error(
+                        "Set operation attempted between targets that"
+                        " do not share any common superassets: %s and %s!",
+                        lh_target_asset.name, rh_target_asset.name
+                    )
                     return (None, None, None)
                 new_dep_chain = DependencyChain(
@@ -401,9 +550,8 @@ class LanguageGraph:
             case 'variable':
                 # Fetch the step expression associated with the variable from
                 # the language specification and resolve that.
-                variable_step_expr = specification.\
-                    get_variable_for_class_by_name(lang,
-                        target_asset.name, step_expression['name'])
+                variable_step_expr = self._get_variable_for_asset_type_by_name(
+                    target_asset.name, step_expression['name'])
                 if variable_step_expr:
                     return self.process_step_expression(
                         lang,
@@ -412,8 +560,10 @@ class LanguageGraph:
                         variable_step_expr)
                 else:
-                    logger.error('Failed to find variable '
-                        f'{step_expression["name"]} for {target_asset.name}')
+                    logger.error(
+                        'Failed to find variable %s for %s',
+                        step_expression["name"], target_asset.name
+                    )
                     return (None, None, None)
             case 'field':
@@ -422,7 +572,9 @@ class LanguageGraph:
                 # fieldname and association to the parent associations chain.
                 fieldname = step_expression['name']
                 if not target_asset:
-                    logger.error(f'Missing target asset for field \"{fieldname}\"!')
+                    logger.error(
+                        'Missing target asset for field "%s"!', fieldname
+                    )
                     return (None, None, None)
                 new_target_asset = None
@@ -447,8 +599,10 @@ class LanguageGraph:
                         return (new_target_asset,
                             new_dep_chain,
                             None)
-                logger.error(f'Failed to find field \"{fieldname}\" on '
-                    f'asset \"{target_asset.name}\"!')
+                logger.error(
+                    'Failed to find field "%s" on asset "%s"!',
+                    fieldname, target_asset.name
+                )
                 return (None, None, None)
             case 'transitive':
@@ -481,19 +635,23 @@ class LanguageGraph:
                         dep_chain,
                         step_expression['stepExpression'])
-                subtype_asset = next((asset for asset in self.assets \
-                    if asset.name == subtype_name), None)
+                subtype_asset = next((asset for asset in self.assets if asset.name == subtype_name), None)
                 if not subtype_asset:
-                    logger.error('Failed to find subtype attack step '
-                        f'\"{subtype_name}\"')
+                    msg = 'Failed to find subtype attackstep "{subtype_name}"'
+                    logger.error(msg)
+                    raise LanguageGraphException(msg)
                 if not subtype_asset.is_subasset_of(result_target_asset):
-                    logger.error(f'Found subtype \"{subtype_name}\" which '
-                        f'does not extend \"{result_target_asset.name}\". '
-                        'Therefore the subtype cannot be resolved.')
+                    logger.error(
+                        'Found subtype "%s" which does not extend "%s", '
+                        'therefore the subtype cannot be resolved.',
+                        subtype_name, result_target_asset.name
+                    )
                     return (None, None, None)
                 new_dep_chain = DependencyChain(
-                    type = 'subtype',
+                    type = 'subType',
                     next_link = result_dep_chain)
                 new_dep_chain.subtype = subtype_asset
                 return (subtype_asset,
@@ -519,11 +677,16 @@ class LanguageGraph:
                     rh_attack_step_name)
             case _:
-                logger.error('Unknown attack step type: '
-                    f'{step_expression["type"]}')
+                logger.error(
+                    'Unknown attack step type: "%s"', step_expression["type"]
+                )
                 return (None, None, None)
-    def reverse_dep_chain(self, dep_chain, reverse_chain):
+    def reverse_dep_chain(
+            self,
+            dep_chain: Optional[DependencyChain],
+            reverse_chain: Optional[DependencyChain]
+        ) -> Optional[DependencyChain]:
         """
         Recursively reverse the associations chain. From parent to child or
         vice versa.
@@ -566,94 +729,109 @@ class LanguageGraph:
                 case 'field':
                     association = dep_chain.association
+                    if not association:
+                        raise LanguageGraphException(
+                            "Missing association for dep chain"
+                        )
                     opposite_fieldname = association.get_opposite_fieldname(
                         dep_chain.fieldname)
                     new_dep_chain = DependencyChain(
                         type = 'field',
-                        next_link = reverse_chain)
+                        next_link = reverse_chain
+                    )
                     new_dep_chain.fieldname = opposite_fieldname
                     new_dep_chain.association = association
-                    return self.reverse_dep_chain(dep_chain.next_link,
-                        new_dep_chain)
+                    return self.reverse_dep_chain(
+                                dep_chain.next_link,
+                                new_dep_chain
+                            )
                 case 'subType':
                     result_reverse_chain = self.reverse_dep_chain(
-                        new_dep_chain.next_link,
-                        reverse_chain)
+                        dep_chain.next_link,
+                        reverse_chain
+                    )
                     new_dep_chain = DependencyChain(
-                        type = 'subtype',
-                        next_link = result_reverse_chain)
+                        type = 'subType',
+                        next_link = result_reverse_chain
+                    )
                     new_dep_chain.subtype = dep_chain.subtype
                     return new_dep_chain
+                    # return reverse_chain
                 case _:
-                    logger.error('Unknown associations chain element '
-                        f'{dep_chain.type}!')
-                    return None
+                    msg = 'Unknown assoc chain element "%s"'
+                    logger.error(msg, dep_chain.type)
+                    raise LanguageGraphAssociationError(msg % dep_chain.type)
-    def generate_graph(self, lang: dict):
+    def _generate_graph(self) -> None:
         """
-        Generate language graph starting from a MAL language specification
-        Arguments:
-        lang            - a dictionary representing the MAL language specification
+        Generate language graph starting from the MAL language specification
+        given in the constructor.
         """
         # Generate all of the asset nodes of the language graph.
-        for asset in lang['assets']:
-            logger.debug(f'Create asset language graph nodes for asset '
-                f'{asset["name"]}')
+        for asset in self._lang_spec['assets']:
+            logger.debug(
+                'Create asset language graph nodes for asset %s',
+                asset["name"]
+            )
             asset_node = LanguageGraphAsset(
                 name = asset['name'],
                 associations = [],
                 attack_steps = [],
                 description = asset['meta'],
                 super_assets = [],
-                sub_assets = []
+                sub_assets = [],
+                is_abstract = asset['isAbstract']
             )
             self.assets.append(asset_node)
         # Link assets based on inheritance
-        for asset_info in lang['assets']:
+        for asset_info in self._lang_spec['assets']:
             asset = next((asset for asset in self.assets \
                 if asset.name == asset_info['name']), None)
-            if not asset:
-                logger.error('Failed to find asset '
-                    f'\"{asset_info["name"]}\"!')
-                return 1
             if asset_info['superAsset']:
                 super_asset = next((asset for asset in self.assets \
                     if asset.name == asset_info['superAsset']), None)
                 if not super_asset:
-                    logger.error('Failed to find super asset '
-                        f'\"{asset_info["superAsset"]}\" '
-                        f'for asset \"{asset_info["name"]}\"!')
-                    return 1
+                    msg = 'Failed to find super asset "%s" for asset "%s"!'
+                    logger.error(
+                        msg, asset_info["superAsset"], asset_info["name"])
+                    raise LanguageGraphSuperAssetNotFoundError(
+                        msg % (asset_info["superAsset"], asset_info["name"]))
                 super_asset.sub_assets.append(asset)
                 asset.super_assets.append(super_asset)
         # Generate all of the association nodes of the language graph.
         for asset in self.assets:
-            logger.debug(f'Create association language graph nodes for asset '
-                f'{asset.name}')
-            associations_nodes = []
-            associations = specification.get_associations_for_class(lang,
-                asset.name)
+            logger.debug(
+                'Create association language graph nodes for asset %s',
+                asset.name
+            )
+            associations = self._get_associations_for_asset_type(asset.name)
             for association in associations:
                 left_asset = next((asset for asset in self.assets \
                     if asset.name == association['leftAsset']), None)
                 if not left_asset:
-                    logger.error('Failed to find left hand asset '
-                        f'\"{association["leftAsset"]}\" for '
-                        f'association \"{association["name"]}\"!')
-                    return 1
+                    msg = 'Left asset "%s" for association "%s" not found!'
+                    logger.error(
+                        msg, association["leftAsset"], association["name"])
+                    raise LanguageGraphAssociationError(
+                        msg % (association["leftAsset"], association["name"]))
                 right_asset = next((asset for asset in self.assets \
                     if asset.name == association['rightAsset']), None)
                 if not right_asset:
-                    logger.error('Failed to find right hand asset '
-                        f'\"{association["rightAsset"]}\" for '
-                        f'association \"{association["name"]}\"!')
-                    return 1
+                    msg = 'Right asset "%s" for association "%s" not found!'
+                    logger.error(
+                        msg, association["rightAsset"], association["name"])
+                    raise LanguageGraphAssociationError(
+                        msg % (association["rightAsset"], association["name"])
+                    )
                 # Technically we should be more exhaustive and check the
                 # flipped version too and all of the fieldnames as well.
@@ -694,17 +872,19 @@ class LanguageGraph:
         # Generate all of the attack step nodes of the language graph.
         for asset in self.assets:
-            logger.debug(f'Create attack steps language graph nodes for asset '
-                f'{asset.name}.')
-            attack_step_nodes = []
-            attack_steps = specification.get_attacks_for_class(lang,
-                asset.name)
+            logger.debug(
+                'Create attack steps language graph nodes for asset %s',
+                asset.name
+            )
+            attack_steps = self._get_attacks_for_asset_type(asset.name)
             for attack_step_name, attack_step_attribs in attack_steps.items():
-                logger.debug(f'Create attack step language graph nodes for '
-                    f'{attack_step_name}.')
+                logger.debug(
+                    'Create attack step language graph nodes for %s',
+                    attack_step_name
+                )
                 attack_step_node = LanguageGraphAttackStep(
-                    name = asset.name + ':' + attack_step_name,
+                    name = attack_step_name,
                     type = attack_step_attribs['type'],
                     asset = asset,
                     ttc = attack_step_attribs['ttc'],
@@ -718,8 +898,10 @@ class LanguageGraph:
         # Then, link all of the attack step nodes according to their associations.
         for attack_step in self.attack_steps:
-            logger.debug('Determining children for attack step '\
-                f'{attack_step.name}.')
+            logger.debug(
+                'Determining children for attack step %s',
+                attack_step.name
+            )
             step_expressions = \
                 attack_step.attributes['reaches']['stepExpressions'] if \
                     attack_step.attributes['reaches'] else []
@@ -728,36 +910,31 @@ class LanguageGraph:
                 # Resolve each of the attack step expressions listed for this
                 # attack step to determine children.
                 (target_asset, dep_chain, attack_step_name) = \
-                    self.process_step_expression(lang,
+                    self.process_step_expression(self._lang_spec,
                         attack_step.asset,
                         None,
                         step_expression)
                 if not target_asset:
-                    logger.error('Failed to find target asset ' \
-                    f'to link with for step expression:\n' +
-                    json.dumps(step_expression, indent = 2))
-                    print('Failed to find target asset ' \
-                    f'to link with for step expression:\n' +
-                    json.dumps(step_expression, indent = 2))
-                    return 1
-                attack_step_fullname = target_asset.name + ':' + attack_step_name
+                    msg = 'Failed to find target asset to link with for ' \
+                        'step expression:\n%s'
+                    raise LanguageGraphStepExpressionError(
+                        msg % json.dumps(step_expression, indent = 2)
+                    )
                 target_attack_step = next((attack_step \
                     for attack_step in target_asset.attack_steps \
-                        if attack_step.name == attack_step_fullname), None)
+                        if attack_step.name == attack_step_name), None)
                 if not target_attack_step:
-                    logger.error('Failed to find target attack step '
-                        f'{attack_step_fullname} on '
-                        f'{target_asset.name} to link with for step '
-                        'expression:\n' +
-                        json.dumps(step_expression, indent = 2))
-                    print('Failed to find target attack step '
-                        f'{attack_step_fullname} on '
-                        f'{target_asset.name} to link with for step '
-                        'expression:\n' +
-                        json.dumps(step_expression, indent = 2))
-                    return 1
+                    msg = 'Failed to find target attack step %s on %s to ' \
+                          'link with for step expression:\n%s'
+                    raise LanguageGraphStepExpressionError(
+                        msg % (
+                            attack_step_name,
+                            target_asset.name,
+                            json.dumps(step_expression, indent = 2)
+                        )
+                    )
                 # It is easier to create the parent associations chain due to
                 # the left-hand first progression.
@@ -780,4 +957,228 @@ class LanguageGraph:
                         self.reverse_dep_chain(dep_chain,
                             None))]
-        return 0
+    def _get_attacks_for_asset_type(self, asset_type: str) -> dict:
+        """
+        Get all attack steps for a specific asset type, inherited ones included
+        The attack steps of the super asset, if there is one, are collected
+        first (recursively). The asset's own attack steps are then merged on
+        top of them: a step with a new name is added, a step that overrides
+        replaces the inherited one, and any other step appends its step
+        expressions to the inherited one.
+        Arguments:
+        asset_type      - a string representing the asset type for which we
+                          want to list the possible attack steps
+        Return:
+        A dictionary that maps each attack step name to a copy of its entry
+        in the language specification (with the merged step expressions).
+        If the asset type is not found an error is logged and an empty
+        dictionary is returned.
+        """
+        attack_steps: dict = {}
+        asset = next(
+            (asset for asset in self._lang_spec['assets']
+                if asset['name'] == asset_type),
+            None
+        )
+        if asset is None:
+            logger.error(
+                'Failed to find asset type %s when looking '
+                'for attack steps.', asset_type
+            )
+            return attack_steps
+        logger.debug(
+            'Get attack steps for %s asset from '
+            'language specification.', asset["name"]
+        )
+        if asset['superAsset']:
+            logger.debug('Asset extends another one, fetch the superclass '
+                'attack steps for it.')
+            attack_steps = self._get_attacks_for_asset_type(asset['superAsset'])
+        for step in asset['attackSteps']:
+            step_name = step['name']
+            if step_name not in attack_steps:
+                # Not inherited: take the step over as it is.
+                attack_steps[step_name] = copy.deepcopy(step)
+                continue
+            reaches = step['reaches']
+            if not reaches:
+                # This attack step does not lead to any attack steps, so the
+                # inherited definition is kept untouched.
+                continue
+            if reaches['overrides']:
+                attack_steps[step_name] = copy.deepcopy(step)
+                continue
+            # The step adds children to the inherited ones. Work on a copy so
+            # that the result never shares lists with the language
+            # specification; otherwise a later merge for a sub-asset would
+            # extend the specification's own list in place.
+            added_expressions = copy.deepcopy(reaches['stepExpressions'])
+            inherited_reaches = attack_steps[step_name]['reaches']
+            if inherited_reaches is not None and \
+                    'stepExpressions' in inherited_reaches:
+                inherited_reaches['stepExpressions'].extend(added_expressions)
+            else:
+                attack_steps[step_name]['reaches'] = {
+                    'overrides': False,
+                    'stepExpressions': added_expressions
+                }
+        return attack_steps
+    def _get_associations_for_asset_type(self, asset_type: str) -> list:
+        """
+        Get all associations for a specific asset type, inherited ones included
+        Arguments:
+        asset_type      - a string representing the asset type for which we
+                          want to list the associations
+        Return:
+        A list of the association entries of the language specification that
+        have the asset type, or one of its super assets, as their left or
+        right asset. The associations of the super assets come first.
+        If the asset type is not found an error is logged and an empty list
+        is returned.
+        """
+        logger.debug(
+            'Get associations for %s asset from '
+            'language specification.', asset_type
+        )
+        associations: list = []
+        asset = next(
+            (asset for asset in self._lang_spec['assets']
+                if asset['name'] == asset_type),
+            None
+        )
+        if not asset:
+            logger.error(
+                'Failed to find asset type %s when '
+                'looking for associations.', asset_type
+            )
+            return associations
+        if asset['superAsset']:
+            logger.debug('Asset extends another one, fetch the superclass '
+                'associations for it.')
+            associations.extend(
+                self._get_associations_for_asset_type(asset['superAsset']))
+        # NOTE(review): an association between this asset type and one of its
+        # super assets is matched both by the recursive call above and by the
+        # scan below, so it ends up in the list twice. Confirm that callers
+        # tolerate the duplicate before changing this.
+        associations.extend(
+            assoc for assoc in self._lang_spec['associations']
+            if assoc['leftAsset'] == asset_type or
+                assoc['rightAsset'] == asset_type
+        )
+        return associations
+    def _get_variable_for_asset_type_by_name(
+            self, asset_type: str, variable_name: str) -> dict:
+        """
+        Get the step expression of a variable of a specific asset type.
+        NOTE: Variables are the ones specified in MAL through `let` statements
+        The variable is looked up on the asset type itself first and, if it
+        is not declared there, on its super asset (recursively).
+        Arguments:
+        asset_type      - a string representing the type of asset which
+                          contains the variable
+        variable_name   - the name of the variable to search for
+        Return:
+        The 'stepExpression' entry of the variable found.
+        Raises:
+        LanguageGraphException if the asset type is not part of the language
+        specification or if the variable cannot be found.
+        """
+        asset = next(
+            (candidate for candidate in self._lang_spec['assets']
+                if candidate['name'] == asset_type),
+            None
+        )
+        if not asset:
+            msg = 'Failed to find asset type %s when looking for variable.'
+            logger.error(msg, asset_type)
+            raise LanguageGraphException(msg % asset_type)
+        # Variables declared on the asset type itself take precedence.
+        for variable in asset['variables']:
+            if variable['name'] == variable_name:
+                return variable['stepExpression']
+        # Not declared here; the recursive call already yields the step
+        # expression, so it is handed back unchanged.
+        inherited_expression = None
+        if asset['superAsset']:
+            inherited_expression = self._get_variable_for_asset_type_by_name(
+                asset['superAsset'], variable_name)
+        if inherited_expression:
+            return inherited_expression
+        msg = 'Failed to find variable %s in %s lang specification.'
+        logger.error(msg, variable_name, asset_type)
+        raise LanguageGraphException(msg % (variable_name, asset_type))
+    def regenerate_graph(self) -> None:
+        """
+        Rebuild the language graph from scratch.
+        The asset, association and attack step lists are replaced by new
+        empty lists before the graph is generated again from the MAL
+        language specification given in the constructor.
+        """
+        self.assets, self.associations, self.attack_steps = [], [], []
+        self._generate_graph()
+    def get_asset_by_name(
+            self,
+            asset_name
+    ) -> Optional[LanguageGraphAsset]:
+        """
+        Look up an asset of the language graph by its name
+        Arguments:
+        asset_name  - a string containing the asset name
+        Return:
+        The first asset in the graph whose name equals asset_name.
+        None if there is no such asset.
+        """
+        return next(
+            (candidate for candidate in self.assets
+                if candidate.name == asset_name),
+            None
+        )
+    def get_association_by_fields_and_assets(
+            self,
+            first_field: str,
+            second_field: str,
+            first_asset_name: str,
+            second_asset_name: str
+        ) -> Optional[LanguageGraphAssociation]:
+        """
+        Find the association that links two asset types through two fields
+        An association matches when its left and right field names equal the
+        two given field names and each given asset is a subasset of the asset
+        on the corresponding side. Both orientations are tried.
+        Arguments:
+        first_field         - a string containing the first field
+        second_field        - a string containing the second field
+        first_asset_name    - a string representing the first asset type
+        second_asset_name   - a string representing the second asset type
+        Return:
+        The first association matching the fieldnames and asset types.
+        None if there is no match.
+        Raises:
+        LookupError if either asset name is not found in the language graph.
+        """
+        resolved_assets = []
+        for asset_name in (first_asset_name, second_asset_name):
+            resolved = self.get_asset_by_name(asset_name)
+            if resolved is None:
+                raise LookupError(
+                    f'Failed to find asset with name \"{asset_name}\" in '
+                    'the language graph.'
+                )
+            resolved_assets.append(resolved)
+        first_asset, second_asset = resolved_assets
+        # The two ways the given (field, asset) pairs can be laid over the
+        # left and right side of an association: as given first, flipped next.
+        orientations = (
+            ((first_field, first_asset), (second_field, second_asset)),
+            ((second_field, second_asset), (first_field, first_asset)),
+        )
+        for assoc in self.associations:
+            left = assoc.left_field
+            right = assoc.right_field
+            logger.debug(
+                'Compare ("%s", "%s", "%s", "%s") to ("%s", "%s", "%s", "%s").',
+                first_asset_name, first_field,
+                second_asset_name, second_field,
+                left.asset.name, left.fieldname,
+                right.asset.name, right.fieldname
+            )
+            # If the asset and fields match either way we accept it as a match.
+            for (left_name, left_asset), (right_name, right_asset) in \
+                    orientations:
+                if left.fieldname == left_name and \
+                        right.fieldname == right_name and \
+                        left_asset.is_subasset_of(left.asset) and \
+                        right_asset.is_subasset_of(right.asset):
+                    return assoc
+        return None

mal-toolbox 0.0.28__py3-none-any.whl → 0.1.12__py3-none-any.whl

mal-toolbox 0.0.28py3-none-any.whl → 0.1.12py3-none-any.whl