PyPI - synapse - Versions diffs - 2.169.0__py311-none-any.whl → 2.171.0__py311-none-any.whl - Mend

synapse 2.169.0__py311-none-any.whl → 2.171.0__py311-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synapse might be problematic. Click here for more details.

Files changed (41) hide show

synapse/cortex.py +99 -3
synapse/datamodel.py +5 -0
synapse/lib/ast.py +70 -12
synapse/lib/cell.py +76 -7
synapse/lib/layer.py +75 -6
synapse/lib/lmdbslab.py +17 -0
synapse/lib/node.py +7 -0
synapse/lib/snap.py +22 -4
synapse/lib/storm.py +1 -1
synapse/lib/stormlib/cortex.py +1 -1
synapse/lib/stormlib/model.py +339 -40
synapse/lib/stormtypes.py +58 -1
synapse/lib/types.py +36 -1
synapse/lib/version.py +2 -2
synapse/lib/view.py +94 -15
synapse/models/files.py +40 -0
synapse/models/inet.py +8 -4
synapse/models/infotech.py +355 -17
synapse/tests/files/cpedata.json +525034 -0
synapse/tests/test_cortex.py +108 -0
synapse/tests/test_lib_ast.py +66 -0
synapse/tests/test_lib_cell.py +112 -0
synapse/tests/test_lib_layer.py +52 -1
synapse/tests/test_lib_lmdbslab.py +36 -0
synapse/tests/test_lib_scrape.py +72 -71
synapse/tests/test_lib_snap.py +16 -1
synapse/tests/test_lib_storm.py +118 -0
synapse/tests/test_lib_stormlib_cortex.py +15 -0
synapse/tests/test_lib_stormlib_model.py +427 -0
synapse/tests/test_lib_stormtypes.py +147 -15
synapse/tests/test_lib_types.py +21 -0
synapse/tests/test_lib_view.py +77 -0
synapse/tests/test_model_files.py +52 -0
synapse/tests/test_model_inet.py +63 -1
synapse/tests/test_model_infotech.py +187 -26
synapse/tests/utils.py +42 -9
{synapse-2.169.0.dist-info → synapse-2.171.0.dist-info}/METADATA +1 -1
{synapse-2.169.0.dist-info → synapse-2.171.0.dist-info}/RECORD +41 -40
{synapse-2.169.0.dist-info → synapse-2.171.0.dist-info}/LICENSE +0 -0
{synapse-2.169.0.dist-info → synapse-2.171.0.dist-info}/WHEEL +0 -0
{synapse-2.169.0.dist-info → synapse-2.171.0.dist-info}/top_level.txt +0 -0

synapse/models/infotech.py CHANGED Viewed

@@ -1,6 +1,10 @@
+import copy
+import string
 import asyncio
 import logging
+import regex
 import synapse.exc as s_exc
 import synapse.data as s_data
@@ -9,10 +13,53 @@ import synapse.common as s_common
 import synapse.lib.chop as s_chop
 import synapse.lib.types as s_types
 import synapse.lib.module as s_module
+import synapse.lib.scrape as s_scrape
 import synapse.lib.version as s_version
 logger = logging.getLogger(__name__)
+# This is the regular expression pattern for CPE2.2. It's kind of a hybrid
+# between compatible binding and preferred binding. Differences are here:
+# - Use only the list of percent encoded values specified by preferred binding.
+#   This is to ensure it converts properly to CPE2.3.
+# - Add tilde (~) to the UNRESERVED list which removes the need to specify the
+#   PACKED encoding specifically.
+ALPHA = '[A-Za-z]'
+DIGIT = '[0-9]'
+UNRESERVED = r'[A-Za-z0-9\-\.\_~]'
+SPEC1 = '%01'
+SPEC2 = '%02'
+# This is defined in the ABNF but not actually referenced
+# SPECIAL = f'(?:{SPEC1}|{SPEC2})'
+SPEC_CHRS = f'(?:{SPEC1}+|{SPEC2})'
+PCT_ENCODED = '%(?:21|22|23|24|25|26|27|28|28|29|2a|2b|2c|2f|3a|3b|3c|3d|3e|3f|40|5b|5c|5d|5e|60|7b|7c|7d|7e)'
+STR_WO_SPECIAL = f'(?:{UNRESERVED}|{PCT_ENCODED})*'
+STR_W_SPECIAL = f'{SPEC_CHRS}? (?:{UNRESERVED}|{PCT_ENCODED})+ {SPEC_CHRS}?'
+STRING = f'(?:{STR_W_SPECIAL}|{STR_WO_SPECIAL})'
+REGION = f'(?:{ALPHA}{{2}}|{DIGIT}{{3}})'
+LANGTAG = rf'(?:{ALPHA}{{2,3}}(?:\-{REGION})?)'
+PART = '[hoa]?'
+VENDOR = STRING
+PRODUCT = STRING
+VERSION = STRING
+UPDATE = STRING
+EDITION = STRING
+LANG = f'{LANGTAG}?'
+COMPONENT_LIST = f'''
+    (?:
+        {PART}:{VENDOR}:{PRODUCT}:{VERSION}:{UPDATE}:{EDITION}:{LANG} |
+        {PART}:{VENDOR}:{PRODUCT}:{VERSION}:{UPDATE}:{EDITION} |
+        {PART}:{VENDOR}:{PRODUCT}:{VERSION}:{UPDATE} |
+        {PART}:{VENDOR}:{PRODUCT}:{VERSION} |
+        {PART}:{VENDOR}:{PRODUCT} |
+        {PART}:{VENDOR} |
+        {PART}
+    )
+'''
+cpe22_regex = regex.compile(f'cpe:/{COMPONENT_LIST}', regex.VERBOSE | regex.IGNORECASE)
+cpe23_regex = regex.compile(s_scrape._cpe23_regex, regex.VERBOSE | regex.IGNORECASE)
 def cpesplit(text):
     part = ''
     parts = []
@@ -36,7 +83,160 @@ def cpesplit(text):
     except StopIteration:
         parts.append(part)
-    return parts
+    return [part.strip() for part in parts]
+# Formatted String Binding characters that need to be escaped
+FSB_ESCAPE_CHARS = [
+    '!', '"', '#', '$', '%', '&', "'", '(', ')',
+    '+', ',', '/', ':', ';', '<', '=', '>', '@',
+    '[', ']', '^', '`', '{', '|', '}', '~',
+    '\\', '?', '*'
+]
+FSB_VALID_CHARS = ['-', '.', '_']
+FSB_VALID_CHARS.extend(string.ascii_letters)
+FSB_VALID_CHARS.extend(string.digits)
+FSB_VALID_CHARS.extend(FSB_ESCAPE_CHARS)
+def fsb_escape(text):
+    ret = ''
+    if text in ('*', '-'):
+        return text
+    # Check validity of text first
+    if (invalid := [char for char in text if char not in FSB_VALID_CHARS]):
+        badchars = ', '.join(invalid)
+        mesg = f'Invalid CPE 2.3 character(s) ({badchars}) detected.'
+        raise s_exc.BadTypeValu(mesg=mesg, valu=text)
+    textlen = len(text)
+    for idx, char in enumerate(text):
+        if char not in FSB_ESCAPE_CHARS:
+            ret += char
+            continue
+        escchar = f'\\{char}'
+        # The only character in the string
+        if idx == 0 and idx == textlen - 1:
+            ret += escchar
+            continue
+        # Handle the backslash as a special case
+        if char == '\\':
+            if idx == 0:
+                # It's the first character and it is escaping another special character
+                if text[idx + 1] in FSB_ESCAPE_CHARS:
+                    ret += char
+                else:
+                    ret += escchar
+                continue
+            if idx == textlen - 1:
+                # It's the last character and it is being escaped
+                if text[idx - 1] == '\\':
+                    ret += char
+                else:
+                    ret += escchar
+                continue
+            # The backslash is in the middle somewhere
+            # It's already escaped or it's escaping a special char
+            if text[idx - 1] == '\\' or text[idx + 1] in FSB_ESCAPE_CHARS:
+                ret += char
+                continue
+            # Lone backslash, escape it and move on
+            ret += escchar
+            continue
+        # First char, no look behind
+        if idx == 0:
+            # Escape the first character and go around
+            ret += escchar
+            continue
+        escaped = text[idx - 1] == '\\'
+        if not escaped:
+            ret += escchar
+            continue
+        ret += char
+    return ret
+def fsb_unescape(text):
+    ret = ''
+    textlen = len(text)
+    for idx, char in enumerate(text):
+        # The last character so we can't look ahead
+        if idx == textlen - 1:
+            ret += char
+            continue
+        if char == '\\' and text[idx + 1] in FSB_ESCAPE_CHARS:
+            continue
+        ret += char
+    return ret
+# URI Binding characters that can be encoded in percent format
+URI_PERCENT_CHARS = [
+    # Do the percent first so we don't double encode by accident
+    ('%25', '%'),
+    ('%21', '!'), ('%22', '"'), ('%23', '#'), ('%24', '$'), ('%26', '&'), ('%27', "'"),
+    ('%28', '('), ('%29', ')'), ('%2a', '*'), ('%2b', '+'), ('%2c', ','), ('%2f', '/'), ('%3a', ':'),
+    ('%3b', ';'), ('%3c', '<'), ('%3d', '='), ('%3e', '>'), ('%3f', '?'), ('%40', '@'), ('%5b', '['),
+    ('%5c', '\\'), ('%5d', ']'), ('%5e', '^'), ('%60', '`'), ('%7b', '{'), ('%7c', '|'), ('%7d', '}'),
+    ('%7e', '~'),
+]
+def uri_quote(text):
+    ret = ''
+    for (pct, char) in URI_PERCENT_CHARS:
+        text = text.replace(char, pct)
+    return text
+def uri_unquote(text):
+    # iterate backwards so we do the % last to avoid double unquoting
+    # example: "%2521" would turn into "%21" which would then replace into "!"
+    for (pct, char) in URI_PERCENT_CHARS[::-1]:
+        text = text.replace(pct, char)
+    return text
+UNSPECIFIED = ('', '*')
+def uri_pack(edition, sw_edition, target_sw, target_hw, other):
+    # If the four extended attributes are unspecified, only return the edition value
+    if (sw_edition in UNSPECIFIED and target_sw in UNSPECIFIED and target_hw in UNSPECIFIED and other in UNSPECIFIED):
+        return edition
+    ret = [edition, '', '', '', '']
+    if sw_edition not in UNSPECIFIED:
+        ret[1] = sw_edition
+    if target_sw not in UNSPECIFIED:
+        ret[2] = target_sw
+    if target_hw not in UNSPECIFIED:
+        ret[3] = target_hw
+    if other not in UNSPECIFIED:
+        ret[4] = other
+    return '~' + '~'.join(ret)
+def uri_unpack(edition):
+    if edition.startswith('~') and edition.count('~') == 5:
+        return edition[1:].split('~', 5)
+    return None
 class Cpe22Str(s_types.Str):
     '''
@@ -60,7 +260,14 @@ class Cpe22Str(s_types.Str):
             mesg = 'CPE 2.2 string is expected to start with "cpe:/"'
             raise s_exc.BadTypeValu(valu=valu, mesg=mesg)
-        return zipCpe22(parts), {}
+        v2_2 = zipCpe22(parts)
+        rgx = cpe22_regex.match(v2_2)
+        if rgx is None or rgx.group() != v2_2:
+            mesg = 'CPE 2.2 string appears to be invalid.'
+            raise s_exc.BadTypeValu(mesg=mesg, valu=valu)
+        return v2_2, {}
     def _normPyList(self, parts):
         return zipCpe22(parts), {}
@@ -77,7 +284,7 @@ def chopCpe22(text):
     CPE 2.2 Formatted String
     https://cpe.mitre.org/files/cpe-specification_2.2.pdf
     '''
-    if not text.startswith('cpe:/'):
+    if not text.startswith('cpe:/'): # pragma: no cover
         mesg = 'CPE 2.2 string is expected to start with "cpe:/"'
         raise s_exc.BadTypeValu(valu=text, mesg=mesg)
@@ -89,6 +296,18 @@ def chopCpe22(text):
     return parts
+PART_IDX_PART = 0
+PART_IDX_VENDOR = 1
+PART_IDX_PRODUCT = 2
+PART_IDX_VERSION = 3
+PART_IDX_UPDATE = 4
+PART_IDX_EDITION = 5
+PART_IDX_LANG = 6
+PART_IDX_SW_EDITION = 7
+PART_IDX_TARGET_SW = 8
+PART_IDX_TARGET_HW = 9
+PART_IDX_OTHER = 10
 class Cpe23Str(s_types.Str):
     '''
     CPE 2.3 Formatted String
@@ -119,31 +338,113 @@ class Cpe23Str(s_types.Str):
             extsize = 11 - len(parts)
             parts.extend(['*' for _ in range(extsize)])
+            v2_3 = 'cpe:2.3:' + ':'.join(parts)
+            v2_2 = copy.copy(parts)
+            for idx, part in enumerate(v2_2):
+                if part == '*':
+                    v2_2[idx] = ''
+                    continue
+                part = fsb_unescape(part)
+                v2_2[idx] = uri_quote(part)
+            v2_2[PART_IDX_EDITION] = uri_pack(
+                v2_2[PART_IDX_EDITION],
+                v2_2[PART_IDX_SW_EDITION],
+                v2_2[PART_IDX_TARGET_SW],
+                v2_2[PART_IDX_TARGET_HW],
+                v2_2[PART_IDX_OTHER]
+            )
+            v2_2 = v2_2[:7]
+            parts = [fsb_unescape(k) for k in parts]
         elif text.startswith('cpe:/'):
+            v2_2 = text
             # automatically normalize CPE 2.2 format to CPE 2.3
             parts = chopCpe22(text)
+            # Account for blank fields
+            for idx, part in enumerate(parts):
+                if not part:
+                    parts[idx] = '*'
             extsize = 11 - len(parts)
             parts.extend(['*' for _ in range(extsize)])
+            # URI bindings can pack extended attributes into the
+            # edition field, handle that here.
+            unpacked = uri_unpack(parts[PART_IDX_EDITION])
+            if unpacked:
+                (edition, sw_edition, target_sw, target_hw, other) = unpacked
+                if edition:
+                    parts[PART_IDX_EDITION] = edition
+                else:
+                    parts[PART_IDX_EDITION] = '*'
+                if sw_edition:
+                    parts[PART_IDX_SW_EDITION] = sw_edition
+                if target_sw:
+                    parts[PART_IDX_TARGET_SW] = target_sw
+                if target_hw:
+                    parts[PART_IDX_TARGET_HW] = target_hw
+                if other:
+                    parts[PART_IDX_OTHER] = other
+            parts = [uri_unquote(part) for part in parts]
+            # This feels a little unintuitive to escape parts for "escaped" and
+            # unescape parts for "parts" but values in parts could be incorrectly
+            # escaped or incorrectly unescaped so just do both.
+            escaped = [fsb_escape(part) for part in parts]
+            parts = [fsb_unescape(part) for part in parts]
+            v2_3 = 'cpe:2.3:' + ':'.join(escaped)
         else:
             mesg = 'CPE 2.3 string is expected to start with "cpe:2.3:"'
             raise s_exc.BadTypeValu(valu=valu, mesg=mesg)
+        rgx = cpe23_regex.match(v2_3)
+        if rgx is None or rgx.group() != v2_3:
+            mesg = 'CPE 2.3 string appears to be invalid.'
+            raise s_exc.BadTypeValu(mesg=mesg, valu=valu)
+        if isinstance(v2_2, list):
+            cpe22 = zipCpe22(v2_2)
+        else:
+            cpe22 = v2_2
+        rgx = cpe22_regex.match(cpe22)
+        if rgx is None or rgx.group() != cpe22:
+            v2_2 = None
         subs = {
-            'v2_2': parts,
-            'part': parts[0],
-            'vendor': parts[1],
-            'product': parts[2],
-            'version': parts[3],
-            'update': parts[4],
-            'edition': parts[5],
-            'language': parts[6],
-            'sw_edition': parts[7],
-            'target_sw': parts[8],
-            'target_hw': parts[9],
-            'other': parts[10],
+            'part': parts[PART_IDX_PART],
+            'vendor': parts[PART_IDX_VENDOR],
+            'product': parts[PART_IDX_PRODUCT],
+            'version': parts[PART_IDX_VERSION],
+            'update': parts[PART_IDX_UPDATE],
+            'edition': parts[PART_IDX_EDITION],
+            'language': parts[PART_IDX_LANG],
+            'sw_edition': parts[PART_IDX_SW_EDITION],
+            'target_sw': parts[PART_IDX_TARGET_SW],
+            'target_hw': parts[PART_IDX_TARGET_HW],
+            'other': parts[PART_IDX_OTHER],
         }
-        return 'cpe:2.3:' + ':'.join(parts), {'subs': subs}
+        if v2_2 is not None:
+            subs['v2_2'] = v2_2
+        return v2_3, {'subs': subs}
 class SemVer(s_types.Int):
     '''
@@ -412,6 +713,13 @@ class ItModule(s_module.CoreModule):
                     'doc': 'A MITRE ATT&CK Campaign ID.',
                     'ex': 'C0028',
                 }),
+                ('it:mitre:attack:datasource', ('str', {'regex': r'^DS[0-9]{4}$'}), {
+                    'doc': 'A MITRE ATT&CK Datasource ID.',
+                    'ex': 'DS0026',
+                }),
+                ('it:mitre:attack:data:component', ('guid', {}), {
+                        'doc': 'A MITRE ATT&CK data component.',
+                }),
                 ('it:mitre:attack:flow', ('guid', {}), {
                     'doc': 'A MITRE ATT&CK Flow diagram.',
                 }),
@@ -1216,6 +1524,10 @@ class ItModule(s_module.CoreModule):
                                            'uniq': True, 'sorted': True, 'split': ','}), {
                         'doc': 'An array of ATT&CK tactics that include this technique.',
                     }),
+                    ('data:components', ('array', {'type': 'it:mitre:attack:data:component',
+                                                   'uniq': True, 'sorted': True}), {
+                        'doc': 'An array of MITRE ATT&CK data components that detect the ATT&CK technique.',
+                    }),
                 )),
                 ('it:mitre:attack:software', {}, (
                     ('software', ('it:prod:soft', {}), {
@@ -1335,6 +1647,27 @@ class ItModule(s_module.CoreModule):
                     ('author:contact', ('ps:contact', {}), {
                         'doc': 'The contact information for the author of the ATT&CK Flow diagram.'}),
                 )),
+                ('it:mitre:attack:datasource', {}, (
+                    ('name', ('str', {'lower': True, 'onespace': True}), {
+                        'doc': 'The name of the datasource.'}),
+                    ('description', ('str', {}), {
+                        'disp': {'hint': 'text'},
+                        'doc': 'A description of the datasource.'}),
+                    ('references', ('array', {'type': 'inet:url', 'uniq': True, 'sorted': True}), {
+                        'doc': 'An array of URLs that document the datasource.',
+                    }),
+                )),
+                ('it:mitre:attack:data:component', {}, (
+                    ('name', ('str', {'lower': True, 'onespace': True}), {
+                        'ro': True,
+                        'doc': 'The name of the data component.'}),
+                    ('description', ('str', {}), {
+                        'disp': {'hint': 'text'},
+                        'doc': 'A description of the data component.'}),
+                    ('datasource', ('it:mitre:attack:datasource', {}), {
+                        'ro': True,
+                        'doc': 'The datasource this data component belongs to.'}),
+                )),
                 ('it:dev:int', {}, ()),
                 ('it:dev:pipe', {}, ()),
                 ('it:dev:mutex', {}, ()),
@@ -1573,8 +1906,13 @@ class ItModule(s_module.CoreModule):
                         'doc': 'A brief description of the hardware.'}),
                     ('cpe', ('it:sec:cpe', {}), {
                         'doc': 'The NIST CPE 2.3 string specifying this hardware.'}),
+                    ('manufacturer', ('ou:org', {}), {
+                        'doc': 'The organization that manufactures this hardware.'}),
+                    ('manufacturer:name', ('ou:name', {}), {
+                        'doc': 'The name of the organization that manufactures this hardware.'}),
                     ('make', ('ou:name', {}), {
-                        'doc': 'The name of the organization which manufactures this hardware.'}),
+                        'deprecated': True,
+                        'doc': 'Deprecated. Please use :manufacturer:name.'}),
                     ('model', ('str', {'lower': True, 'onespace': True}), {
                         'doc': 'The model name or number for this hardware specification.'}),
                     ('version', ('str', {'lower': True, 'onespace': True}), {

synapse 2.169.0__py311-none-any.whl → 2.171.0__py311-none-any.whl

Potentially problematic release.

synapse 2.169.0__py311-none-any.whl → 2.171.0__py311-none-any.whl