PyPI - contentctl - Versions diffs - 4.4.7__py3-none-any.whl → 5.0.0__py3-none-any.whl - Mend

contentctl 4.4.7__py3-none-any.whl → 5.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (123) hide show

contentctl/__init__.py +1 -1
contentctl/actions/build.py +102 -57
contentctl/actions/deploy_acs.py +29 -24
contentctl/actions/detection_testing/DetectionTestingManager.py +66 -42
contentctl/actions/detection_testing/GitService.py +134 -76
contentctl/actions/detection_testing/generate_detection_coverage_badge.py +48 -30
contentctl/actions/detection_testing/infrastructures/DetectionTestingInfrastructure.py +192 -147
contentctl/actions/detection_testing/infrastructures/DetectionTestingInfrastructureContainer.py +45 -32
contentctl/actions/detection_testing/progress_bar.py +9 -6
contentctl/actions/detection_testing/views/DetectionTestingView.py +16 -19
contentctl/actions/detection_testing/views/DetectionTestingViewCLI.py +1 -5
contentctl/actions/detection_testing/views/DetectionTestingViewFile.py +2 -2
contentctl/actions/detection_testing/views/DetectionTestingViewWeb.py +1 -4
contentctl/actions/doc_gen.py +9 -5
contentctl/actions/initialize.py +45 -33
contentctl/actions/inspect.py +118 -61
contentctl/actions/new_content.py +155 -108
contentctl/actions/release_notes.py +276 -146
contentctl/actions/reporting.py +23 -19
contentctl/actions/test.py +33 -28
contentctl/actions/validate.py +55 -34
contentctl/api.py +54 -45
contentctl/contentctl.py +124 -90
contentctl/enrichments/attack_enrichment.py +112 -72
contentctl/enrichments/cve_enrichment.py +34 -28
contentctl/enrichments/splunk_app_enrichment.py +38 -36
contentctl/helper/link_validator.py +101 -78
contentctl/helper/splunk_app.py +69 -41
contentctl/helper/utils.py +58 -53
contentctl/input/director.py +68 -36
contentctl/input/new_content_questions.py +27 -35
contentctl/input/yml_reader.py +28 -18
contentctl/objects/abstract_security_content_objects/detection_abstract.py +303 -259
contentctl/objects/abstract_security_content_objects/security_content_object_abstract.py +115 -52
contentctl/objects/alert_action.py +10 -9
contentctl/objects/annotated_types.py +1 -1
contentctl/objects/atomic.py +65 -54
contentctl/objects/base_test.py +5 -3
contentctl/objects/base_test_result.py +19 -11
contentctl/objects/baseline.py +62 -30
contentctl/objects/baseline_tags.py +30 -24
contentctl/objects/config.py +790 -597
contentctl/objects/constants.py +33 -56
contentctl/objects/correlation_search.py +150 -136
contentctl/objects/dashboard.py +55 -41
contentctl/objects/data_source.py +16 -17
contentctl/objects/deployment.py +43 -44
contentctl/objects/deployment_email.py +3 -2
contentctl/objects/deployment_notable.py +4 -2
contentctl/objects/deployment_phantom.py +7 -6
contentctl/objects/deployment_rba.py +3 -2
contentctl/objects/deployment_scheduling.py +3 -2
contentctl/objects/deployment_slack.py +3 -2
contentctl/objects/detection.py +5 -2
contentctl/objects/detection_metadata.py +1 -0
contentctl/objects/detection_stanza.py +7 -2
contentctl/objects/detection_tags.py +58 -103
contentctl/objects/drilldown.py +66 -34
contentctl/objects/enums.py +81 -100
contentctl/objects/errors.py +16 -24
contentctl/objects/integration_test.py +3 -3
contentctl/objects/integration_test_result.py +1 -0
contentctl/objects/investigation.py +59 -36
contentctl/objects/investigation_tags.py +30 -19
contentctl/objects/lookup.py +304 -101
contentctl/objects/macro.py +55 -39
contentctl/objects/manual_test.py +3 -3
contentctl/objects/manual_test_result.py +1 -0
contentctl/objects/mitre_attack_enrichment.py +17 -16
contentctl/objects/notable_action.py +2 -1
contentctl/objects/notable_event.py +1 -3
contentctl/objects/playbook.py +37 -35
contentctl/objects/playbook_tags.py +23 -13
contentctl/objects/rba.py +96 -0
contentctl/objects/risk_analysis_action.py +15 -11
contentctl/objects/risk_event.py +110 -160
contentctl/objects/risk_object.py +1 -0
contentctl/objects/savedsearches_conf.py +9 -7
contentctl/objects/security_content_object.py +5 -2
contentctl/objects/story.py +54 -49
contentctl/objects/story_tags.py +56 -45
contentctl/objects/test_attack_data.py +2 -1
contentctl/objects/test_group.py +5 -2
contentctl/objects/threat_object.py +1 -0
contentctl/objects/throttling.py +27 -18
contentctl/objects/unit_test.py +3 -4
contentctl/objects/unit_test_baseline.py +5 -5
contentctl/objects/unit_test_result.py +6 -6
contentctl/output/api_json_output.py +233 -220
contentctl/output/attack_nav_output.py +21 -21
contentctl/output/attack_nav_writer.py +29 -37
contentctl/output/conf_output.py +235 -172
contentctl/output/conf_writer.py +201 -125
contentctl/output/data_source_writer.py +38 -26
contentctl/output/doc_md_output.py +53 -27
contentctl/output/jinja_writer.py +19 -15
contentctl/output/json_writer.py +21 -11
contentctl/output/svg_output.py +56 -38
contentctl/output/templates/analyticstories_detections.j2 +2 -2
contentctl/output/templates/analyticstories_stories.j2 +1 -1
contentctl/output/templates/collections.j2 +1 -1
contentctl/output/templates/doc_detections.j2 +0 -5
contentctl/output/templates/es_investigations_investigations.j2 +1 -1
contentctl/output/templates/es_investigations_stories.j2 +1 -1
contentctl/output/templates/savedsearches_baselines.j2 +2 -2
contentctl/output/templates/savedsearches_detections.j2 +10 -11
contentctl/output/templates/savedsearches_investigations.j2 +2 -2
contentctl/output/templates/transforms.j2 +6 -8
contentctl/output/yml_writer.py +29 -20
contentctl/templates/detections/endpoint/anomalous_usage_of_7zip.yml +16 -34
contentctl/templates/stories/cobalt_strike.yml +1 -0
{contentctl-4.4.7.dist-info → contentctl-5.0.0.dist-info}/METADATA +5 -4
contentctl-5.0.0.dist-info/RECORD +168 -0
{contentctl-4.4.7.dist-info → contentctl-5.0.0.dist-info}/WHEEL +1 -1
contentctl/actions/initialize_old.py +0 -245
contentctl/objects/event_source.py +0 -11
contentctl/objects/observable.py +0 -37
contentctl/output/detection_writer.py +0 -28
contentctl/output/new_content_yml_output.py +0 -56
contentctl/output/yml_output.py +0 -66
contentctl-4.4.7.dist-info/RECORD +0 -173
{contentctl-4.4.7.dist-info → contentctl-5.0.0.dist-info}/LICENSE.md +0 -0
{contentctl-4.4.7.dist-info → contentctl-5.0.0.dist-info}/entry_points.txt +0 -0

contentctl/objects/investigation_tags.py CHANGED Viewed

@@ -1,34 +1,45 @@
 from __future__ import annotations
 from typing import List
-from pydantic import BaseModel, Field, field_validator, ValidationInfo, model_serializer
+from pydantic import (
+    BaseModel,
+    Field,
+    field_validator,
+    ValidationInfo,
+    model_serializer,
+    ConfigDict,
+)
 from contentctl.objects.story import Story
-from contentctl.objects.enums import SecurityContentInvestigationProductName, SecurityDomain
+from contentctl.objects.enums import (
+    SecurityContentInvestigationProductName,
+    SecurityDomain,
+)
 class InvestigationTags(BaseModel):
-    analytic_story: List[Story] = Field([],min_length=1)
-    product: List[SecurityContentInvestigationProductName] = Field(...,min_length=1)
-    required_fields: List[str] = Field(min_length=1)
+    model_config = ConfigDict(extra="forbid")
+    analytic_story: List[Story] = Field([], min_length=1)
+    product: List[SecurityContentInvestigationProductName] = Field(..., min_length=1)
     security_domain: SecurityDomain = Field(...)
-    @field_validator('analytic_story',mode="before")
+    @field_validator("analytic_story", mode="before")
     @classmethod
-    def mapStoryNamesToStoryObjects(cls, v:list[str], info:ValidationInfo)->list[Story]:
-        return Story.mapNamesToSecurityContentObjects(v, info.context.get("output_dto",None))
+    def mapStoryNamesToStoryObjects(
+        cls, v: list[str], info: ValidationInfo
+    ) -> list[Story]:
+        return Story.mapNamesToSecurityContentObjects(
+            v, info.context.get("output_dto", None)
+        )
     @model_serializer
     def serialize_model(self):
-        #All fields custom to this model
-        model= {
+        # All fields custom to this model
+        model = {
             "analytic_story": [story.name for story in self.analytic_story],
             "product": self.product,
-            "required_fields": self.required_fields,
             "security_domain": self.security_domain,
         }
-        #Combine fields from this model with fields from parent
-        #return the model
-        return model
+        # Combine fields from this model with fields from parent
+        # return the model
+        return model

contentctl/objects/lookup.py CHANGED Viewed

@@ -1,153 +1,356 @@
 from __future__ import annotations
-from pydantic import field_validator, ValidationInfo, model_validator, FilePath, model_serializer, Field, NonNegativeInt
-from typing import TYPE_CHECKING, Optional, Any, Union
-import re
+import abc
 import csv
-import uuid
-import datetime
+import pathlib
+import re
+from enum import StrEnum, auto
+from functools import cached_property
+from typing import TYPE_CHECKING, Annotated, Any, Literal, Optional, Self
+from pydantic import (
+    Field,
+    FilePath,
+    NonNegativeInt,
+    TypeAdapter,
+    ValidationInfo,
+    computed_field,
+    field_validator,
+    model_serializer,
+    model_validator,
+)
 if TYPE_CHECKING:
     from contentctl.input.director import DirectorOutputDto
     from contentctl.objects.config import validate
 from contentctl.objects.security_content_object import SecurityContentObject
 # This section is used to ignore lookups that are NOT  shipped with ESCU app but are used in the detections. Adding exclusions here will so that contentctl builds will not fail.
 LOOKUPS_TO_IGNORE = set(["outputlookup"])
-LOOKUPS_TO_IGNORE.add("ut_shannon_lookup") #In the URL toolbox app which is recommended for ESCU
-LOOKUPS_TO_IGNORE.add("identity_lookup_expanded") #Shipped with the Asset and Identity Framework
-LOOKUPS_TO_IGNORE.add("cim_corporate_web_domain_lookup") #Shipped with the Asset and Identity Framework
-LOOKUPS_TO_IGNORE.add("alexa_lookup_by_str") #Shipped with the Asset and Identity Framework
-LOOKUPS_TO_IGNORE.add("interesting_ports_lookup") #Shipped with the Asset and Identity Framework
-LOOKUPS_TO_IGNORE.add("admon_groups_def") #Shipped with the SA-admon addon
+LOOKUPS_TO_IGNORE.add(
+    "ut_shannon_lookup"
+)  # In the URL toolbox app which is recommended for ESCU
+LOOKUPS_TO_IGNORE.add(
+    "identity_lookup_expanded"
+)  # Shipped with the Asset and Identity Framework
+LOOKUPS_TO_IGNORE.add(
+    "cim_corporate_web_domain_lookup"
+)  # Shipped with the Asset and Identity Framework
+LOOKUPS_TO_IGNORE.add(
+    "cim_corporate_email_domain_lookup"
+)  # Shipped with the Enterprise Security
+LOOKUPS_TO_IGNORE.add("cim_cloud_domain_lookup")  # Shipped with the Enterprise Security
+LOOKUPS_TO_IGNORE.add(
+    "alexa_lookup_by_str"
+)  # Shipped with the Asset and Identity Framework
+LOOKUPS_TO_IGNORE.add(
+    "interesting_ports_lookup"
+)  # Shipped with the Asset and Identity Framework
+LOOKUPS_TO_IGNORE.add(
+    "asset_lookup_by_str"
+)  # Shipped with the Asset and Identity Framework
+LOOKUPS_TO_IGNORE.add("admon_groups_def")  # Shipped with the SA-admon addon
+LOOKUPS_TO_IGNORE.add(
+    "identity_lookup_expanded"
+)  # Shipped with the Enterprise Security
+# Special case for the Detection "Exploit Public Facing Application via Apache Commons Text"
+LOOKUPS_TO_IGNORE.add("=")
+LOOKUPS_TO_IGNORE.add("other_lookups")
-#Special case for the Detection "Exploit Public Facing Application via Apache Commons Text"
-LOOKUPS_TO_IGNORE.add("=")
-LOOKUPS_TO_IGNORE.add("other_lookups")
+class Lookup_Type(StrEnum):
+    csv = auto()
+    kvstore = auto()
+    mlmodel = auto()
 # TODO (#220): Split Lookup into 2 classes
-class Lookup(SecurityContentObject):
-    collection: Optional[str] = None
-    fields_list: Optional[str] = None
-    filename: Optional[FilePath] = None
+class Lookup(SecurityContentObject, abc.ABC):
     default_match: Optional[bool] = None
-    match_type: Optional[str] = None
-    min_matches: Optional[int] = None
-    case_sensitive_match: Optional[bool] = None
-    # TODO: Add id field to all lookup ymls
-    id: uuid.UUID = Field(default_factory=uuid.uuid4)
-    date: datetime.date = Field(datetime.date.today())
-    author: str = Field("NO AUTHOR DEFINED",max_length=255)
-    version: NonNegativeInt = 1
+    # Per the documentation for transforms.conf, EXACT should not be specified in this list,
+    # so we include only WILDCARD and CIDR
+    match_type: list[Annotated[str, Field(pattern=r"(^WILDCARD|CIDR)\(.+\)$")]] = Field(
+        default=[]
+    )
+    min_matches: None | NonNegativeInt = Field(default=None)
+    max_matches: None | Annotated[NonNegativeInt, Field(ge=1, le=1000)] = Field(
+        default=None
+    )
+    case_sensitive_match: None | bool = Field(default=None)
     @model_serializer
     def serialize_model(self):
-        #Call parent serializer
+        # Call parent serializer
         super_fields = super().serialize_model()
-        #All fields custom to this model
-        model= {
-            "filename": self.filename.name if self.filename is not None else None,
+        # All fields custom to this model
+        model = {
             "default_match": "true" if self.default_match is True else "false",
-            "match_type": self.match_type,
+            "match_type": self.match_type_to_conf_format,
             "min_matches": self.min_matches,
-            "case_sensitive_match": "true" if self.case_sensitive_match is True else "false",
-            "collection": self.collection,
-            "fields_list": self.fields_list
+            "max_matches": self.max_matches,
+            "case_sensitive_match": "true"
+            if self.case_sensitive_match is True
+            else "false",
         }
-        #return the model
+        # return the model
         model.update(super_fields)
         return model
     @model_validator(mode="before")
-    def fix_lookup_path(cls, data:Any, info: ValidationInfo)->Any:
+    def fix_lookup_path(cls, data: Any, info: ValidationInfo) -> Any:
         if data.get("filename"):
-            config:validate = info.context.get("config",None)
+            config: validate = info.context.get("config", None)
             if config is not None:
                 data["filename"] = config.path / "lookups/" / data["filename"]
             else:
-                raise ValueError("config required for constructing lookup filename, but it was not")
+                raise ValueError(
+                    "config required for constructing lookup filename, but it was not"
+                )
         return data
+    @computed_field
+    @cached_property
+    def match_type_to_conf_format(self) -> str:
+        return ", ".join(self.match_type)
+    @staticmethod
+    def get_lookups(
+        text_field: str,
+        director: DirectorOutputDto,
+        ignore_lookups: set[str] = LOOKUPS_TO_IGNORE,
+    ) -> list[Lookup]:
+        # Comprehensively match all kinds of lookups, including inputlookup and outputlookup
+        inputLookupsToGet = set(
+            re.findall(
+                r"[^\w]inputlookup(?:\s*(?:(?:append|strict|start|max)\s*=\s*(?:true|t|false|f))){0,4}\s+([\w]+)",
+                text_field,
+                re.IGNORECASE,
+            )
+        )
+        outputLookupsToGet = set(
+            re.findall(
+                r"[^\w]outputlookup(?:\s*(?:(?:append|create_empty|override_if_empty|max|key_field|allow_updates|createinapp|create_context|output_format)\s*=\s*[^\s]*))*\s+([\w]+)",
+                text_field,
+                re.IGNORECASE,
+            )
+        )
+        lookupsToGet = set(
+            re.findall(
+                r"[^\w](?:(?<!output)(?<!input))lookup(?:\s*(?:(?:local|update)\s*=\s*(?:true|t|false|f))){0,2}\s+([\w]+)",
+                text_field,
+                re.IGNORECASE,
+            )
+        )
+        input_lookups = Lookup.mapNamesToSecurityContentObjects(
+            list(inputLookupsToGet - LOOKUPS_TO_IGNORE), director
+        )
+        output_lookups = Lookup.mapNamesToSecurityContentObjects(
+            list(outputLookupsToGet - LOOKUPS_TO_IGNORE), director
+        )
+        lookups = Lookup.mapNamesToSecurityContentObjects(
+            list(lookupsToGet - LOOKUPS_TO_IGNORE), director
+        )
+        all_lookups = set(input_lookups + output_lookups + lookups)
-    def model_post_init(self, ctx:dict[str,Any]):
-        if not self.filename:
-            return
-        import pathlib
-        filenamePath = pathlib.Path(self.filename)
-        if filenamePath.suffix not in [".csv", ".mlmodel"]:
-            raise ValueError(f"All Lookup files must be CSV files and end in .csv.  The following file does not: '{filenamePath}'")
+        return list(all_lookups)
-        if filenamePath.suffix == ".mlmodel":
-            # Do not need any additional checks for an mlmodel file
-            return
+class FileBackedLookup(Lookup, abc.ABC):
+    # For purposes of the disciminated union, the child classes which
+    # inherit from this class must declare the typing of lookup_type
+    # themselves, hence it is not defined in the Lookup class
+    @model_validator(mode="after")
+    def ensure_lookup_file_exists(self) -> Self:
+        if not self.filename.exists():
+            raise ValueError(f"Expected lookup filename {self.filename} does not exist")
+        return self
+    @computed_field
+    @cached_property
+    @abc.abstractmethod
+    def filename(self) -> FilePath:
+        """
+        This function computes the backing file for the lookup. It is abstract because different types of lookups
+        (CSV for MlModel) backing files have different name format.
+        """
+        pass
+    @computed_field
+    @cached_property
+    @abc.abstractmethod
+    def app_filename(self) -> FilePath:
+        """
+        This function computes the filenames to write into the app itself.  This is abstract because
+        CSV and MLmodel requirements are different.
+        """
+        pass
+class CSVLookup(FileBackedLookup):
+    lookup_type: Literal[Lookup_Type.csv]
+    @model_serializer
+    def serialize_model(self):
+        # Call parent serializer
+        super_fields = super().serialize_model()
+        # All fields custom to this model
+        model = {"filename": self.app_filename.name}
+        # return the model
+        model.update(super_fields)
+        return model
+    @computed_field
+    @cached_property
+    def filename(self) -> FilePath:
+        """
+        This function computes the backing file for the lookup. The names of CSV files must EXACTLY match the
+        names of their lookup definitions except with the CSV file extension rather than the YML file extension.
+        """
+        if self.file_path is None:
+            raise ValueError(
+                f"Cannot get the filename of the lookup {self.lookup_type} because the YML file_path attribute is None"
+            )  # type: ignore
+        csv_file = self.file_path.parent / f"{self.file_path.stem}.{self.lookup_type}"  # type: ignore
+        return csv_file
+    @computed_field
+    @cached_property
+    def app_filename(self) -> FilePath:
+        """
+        This function computes the filenames to write into the app itself.  This is abstract because
+        CSV and MLmodel requirements are different.
+        """
+        return pathlib.Path(
+            f"{self.filename.stem}_{self.date.year}{self.date.month:02}{self.date.day:02}.{self.lookup_type}"
+        )
+    @model_validator(mode="after")
+    def ensure_correct_csv_structure(self) -> Self:
         # https://docs.python.org/3/library/csv.html#csv.DictReader
         # Column Names (fieldnames) determine by the number of columns in the first row.
         # If a row has MORE fields than fieldnames, they will be dumped in a list under the key 'restkey' - this should throw an Exception
-        # If a row has LESS fields than fieldnames, then the field should contain None by default. This should also throw an exception.
-        csv_errors:list[str] = []
-        with open(filenamePath, "r") as csv_fp:
+        # If a row has LESS fields than fieldnames, then the field should contain None by default. This should also throw an exception.
+        csv_errors: list[str] = []
+        with open(self.filename, "r") as csv_fp:
             RESTKEY = "extra_fields_in_a_row"
-            csv_dict = csv.DictReader(csv_fp, restkey=RESTKEY)
+            csv_dict = csv.DictReader(csv_fp, restkey=RESTKEY)
             if csv_dict.fieldnames is None:
-                raise ValueError(f"Error validating the CSV referenced by the lookup: {filenamePath}:\n\t"
-                                 "Unable to read fieldnames from CSV. Is the CSV empty?\n"
-                                 "  Please try opening the file with a CSV Editor to ensure that it is correct.")
+                raise ValueError(
+                    f"Error validating the CSV referenced by the lookup: {self.filename}:\n\t"
+                    "Unable to read fieldnames from CSV. Is the CSV empty?\n"
+                    "  Please try opening the file with a CSV Editor to ensure that it is correct."
+                )
             # Remember that row 1 has the headers and we do not iterate over it in the loop below
             # CSVs are typically indexed starting a row 1 for the header.
             for row_index, data_row in enumerate(csv_dict):
-                row_index+=2
-                if len(data_row.get(RESTKEY,[])) > 0:
-                    csv_errors.append(f"row [{row_index}] should have [{len(csv_dict.fieldnames)}] columns,"
-                                      f" but instead had [{len(csv_dict.fieldnames) + len(data_row.get(RESTKEY,[]))}].")
+                row_index += 2
+                if len(data_row.get(RESTKEY, [])) > 0:
+                    csv_errors.append(
+                        f"row [{row_index}] should have [{len(csv_dict.fieldnames)}] columns,"
+                        f" but instead had [{len(csv_dict.fieldnames) + len(data_row.get(RESTKEY, []))}]."
+                    )
                 for column_index, column_name in enumerate(data_row):
                     if data_row[column_name] is None:
-                        csv_errors.append(f"row [{row_index}] should have [{len(csv_dict.fieldnames)}] columns, "
-                                          f"but instead had [{column_index}].")
+                        csv_errors.append(
+                            f"row [{row_index}] should have [{len(csv_dict.fieldnames)}] columns, "
+                            f"but instead had [{column_index}]."
+                        )
         if len(csv_errors) > 0:
-            err_string = '\n\t'.join(csv_errors)
-            raise ValueError(f"Error validating the CSV referenced by the lookup: {filenamePath}:\n\t{err_string}\n"
-                             f"  Please try opening the file with a CSV Editor to ensure that it is correct.")
-        return
-    @field_validator('match_type')
+            err_string = "\n\t".join(csv_errors)
+            raise ValueError(
+                f"Error validating the CSV referenced by the lookup: {self.filename}:\n\t{err_string}\n"
+                f"  Please try opening the file with a CSV Editor to ensure that it is correct."
+            )
+        return self
+class KVStoreLookup(Lookup):
+    lookup_type: Literal[Lookup_Type.kvstore]
+    fields: list[str] = Field(
+        description="The names of the fields/headings for the KVStore.", min_length=1
+    )
+    @field_validator("fields", mode="after")
     @classmethod
-    def match_type_valid(cls, v: Union[str,None], info: ValidationInfo):
-        if not v:
-            #Match type can be None and that's okay
-            return v
+    def ensure_key(cls, values: list[str]):
+        if values[0] != "_key":
+            raise ValueError(f"fields MUST begin with '_key', not '{values[0]}'")
+        return values
+    @computed_field
+    @cached_property
+    def collection(self) -> str:
+        return self.name
+    @computed_field
+    @cached_property
+    def fields_to_fields_list_conf_format(self) -> str:
+        return ", ".join(self.fields)
+    @model_serializer
+    def serialize_model(self):
+        # Call parent serializer
+        super_fields = super().serialize_model()
+        # All fields custom to this model
+        model = {
+            "collection": self.collection,
+            "fields_list": self.fields_to_fields_list_conf_format,
+        }
+        # return the model
+        model.update(super_fields)
+        return model
-        if not (v.startswith("WILDCARD(") or v.endswith(")")) :
-            raise ValueError(f"All match_types must take the format 'WILDCARD(field_name)'. The following file does not: '{v}'")
-        return v
+class MlModel(FileBackedLookup):
+    lookup_type: Literal[Lookup_Type.mlmodel]
-    #Ensure that exactly one of location or filename are defined
-    @model_validator(mode='after')
-    def ensure_mutually_exclusive_fields(self)->Lookup:
-        if self.filename is not None and self.collection is not None:
-            raise ValueError("filename and collection cannot be defined in the lookup file.  Exactly one must be defined.")
-        elif self.filename is None and self.collection is None:
-            raise ValueError("Neither filename nor collection were defined in the lookup file.  Exactly one must "
-                             "be defined.")
+    @computed_field
+    @cached_property
+    def filename(self) -> FilePath:
+        """
+        This function computes the backing file for the lookup. The names of mlmodel files must EXACTLY match the
+        names of their lookup definitions except with:
+        - __mlspl_ prefix
+        - .mlmodel file extension rather than the YML file extension.
+        """
+        if self.file_path is None:
+            raise ValueError(
+                f"Cannot get the filename of the lookup {self.lookup_type} because the YML file_path attribute is None"
+            )  # type: ignore
+        if not self.file_path.stem.startswith("__mlspl_"):
+            raise ValueError(
+                f"The file_path for ML Model {self.name} MUST start with '__mlspl_', but it does not."
+            )
-        return self
-    @staticmethod
-    def get_lookups(text_field: str, director:DirectorOutputDto, ignore_lookups:set[str]=LOOKUPS_TO_IGNORE)->list[Lookup]:
-        lookups_to_get = set(re.findall(r'[^output]lookup (?:update=true)?(?:append=t)?\s*([^\s]*)', text_field))
-        lookups_to_ignore = set([lookup for lookup in lookups_to_get if any(to_ignore in lookups_to_get for to_ignore in ignore_lookups)])
-        lookups_to_get -= lookups_to_ignore
-        return Lookup.mapNamesToSecurityContentObjects(list(lookups_to_get), director)
+        return self.file_path.parent / f"{self.file_path.stem}.{self.lookup_type}"
+    @computed_field
+    @cached_property
+    def app_filename(self) -> FilePath:
+        """
+        This function computes the filenames to write into the app itself.  This is abstract because
+        CSV and MLmodel requirements are different.
+        """
+        return pathlib.Path(f"{self.filename.stem}.{self.lookup_type}")
+LookupAdapter = TypeAdapter(
+    Annotated[CSVLookup | KVStoreLookup | MlModel, Field(discriminator="lookup_type")]
+)

contentctl/objects/macro.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Used so that we can have a staticmethod that takes the class
+# Used so that we can have a staticmethod that takes the class
 # type Macro as an argument
 from __future__ import annotations
 from typing import TYPE_CHECKING, List
@@ -6,18 +6,21 @@ import re
 from pydantic import Field, model_serializer, NonNegativeInt
 import uuid
 import datetime
 if TYPE_CHECKING:
     from contentctl.input.director import DirectorOutputDto
 from contentctl.objects.security_content_object import SecurityContentObject
-#The following macros are included in commonly-installed apps.
-#As such, we will ignore if they are missing from our app.
-#Included in
-MACROS_TO_IGNORE = set(["drop_dm_object_name"]) # Part of CIM/Splunk_SA_CIM
-MACROS_TO_IGNORE.add("get_asset") #SA-IdentityManagement, part of Enterprise Security
-MACROS_TO_IGNORE.add("get_risk_severity") #SA-ThreatIntelligence, part of Enterprise Security
-MACROS_TO_IGNORE.add("cim_corporate_web_domain_search") #Part of CIM/Splunk_SA_CIM
-#MACROS_TO_IGNORE.add("prohibited_processes")
+# The following macros are included in commonly-installed apps.
+# As such, we will ignore if they are missing from our app.
+# Included in
+MACROS_TO_IGNORE = set(["drop_dm_object_name"])  # Part of CIM/Splunk_SA_CIM
+MACROS_TO_IGNORE.add("get_asset")  # SA-IdentityManagement, part of Enterprise Security
+MACROS_TO_IGNORE.add(
+    "get_risk_severity"
+)  # SA-ThreatIntelligence, part of Enterprise Security
+MACROS_TO_IGNORE.add("cim_corporate_web_domain_search")  # Part of CIM/Splunk_SA_CIM
+# MACROS_TO_IGNORE.add("prohibited_processes")
 class Macro(SecurityContentObject):
@@ -26,49 +29,62 @@ class Macro(SecurityContentObject):
     # TODO: Add id field to all macro ymls
     id: uuid.UUID = Field(default_factory=uuid.uuid4)
     date: datetime.date = Field(datetime.date.today())
-    author: str = Field("NO AUTHOR DEFINED",max_length=255)
+    author: str = Field("NO AUTHOR DEFINED", max_length=255)
     version: NonNegativeInt = 1
     @model_serializer
     def serialize_model(self):
-        #Call serializer for parent
+        # Call serializer for parent
         super_fields = super().serialize_model()
-        #All fields custom to this model
-        model= {
+        # All fields custom to this model
+        model = {
             "definition": self.definition,
             "description": self.description,
         }
-        #return the model
+        # return the model
         model.update(super_fields)
         return model
-    @staticmethod
-    def get_macros(text_field:str, director:DirectorOutputDto , ignore_macros:set[str]=MACROS_TO_IGNORE)->list[Macro]:
-        #Remove any comments, allowing there to be macros (which have a single backtick) inside those comments
-        #If a comment ENDS in a macro, for example ```this is a comment with a macro `macro_here````
-        #then there is a small edge case where the regex below does not work properly.  If that is
-        #the case, we edit the search slightly to insert a space
+    @staticmethod
+    def get_macros(
+        text_field: str,
+        director: DirectorOutputDto,
+        ignore_macros: set[str] = MACROS_TO_IGNORE,
+    ) -> list[Macro]:
+        # Remove any comments, allowing there to be macros (which have a single backtick) inside those comments
+        # If a comment ENDS in a macro, for example ```this is a comment with a macro `macro_here````
+        # then there is a small edge case where the regex below does not work properly.  If that is
+        # the case, we edit the search slightly to insert a space
         if re.findall(r"\`\`\`\`", text_field):
-            raise ValueError("Search contained four or more '`' characters in a row which is invalid SPL"
-                            "This may have occurred when a macro was commented out.\n"
-                            "Please ammend your search to remove the substring '````'")
+            raise ValueError(
+                "Search contained four or more '`' characters in a row which is invalid SPL"
+                "This may have occurred when a macro was commented out.\n"
+                "Please ammend your search to remove the substring '````'"
+            )
+        # Replace all the comments with a space. This prevents a comment from looking like a macro to the parser below
+        text_field = re.sub(r"\`\`\`[\s\S]*?\`\`\`", " ", text_field)
+        # Find all the macros, which start and end with a '`' character
+        macros_to_get = re.findall(r"`([^\s]+)`", text_field)
+        # If macros take arguments, stop at the first argument.  We just want the name of the macro
+        macros_to_get = set(
+            [
+                macro[: macro.find("(")] if macro.find("(") != -1 else macro
+                for macro in macros_to_get
+            ]
+        )
-        # replace all the macros with a space
-        text_field = re.sub(r"\`\`\`[\s\S]*?\`\`\`", " ", text_field)
-        macros_to_get = re.findall(r'`([^\s]+)`', text_field)
-        #If macros take arguments, stop at the first argument.  We just want the name of the macro
-        macros_to_get = set([macro[:macro.find('(')] if macro.find('(') != -1 else macro for macro in macros_to_get])
-        macros_to_ignore = set([macro for macro in macros_to_get if any(to_ignore in macro for to_ignore in ignore_macros)])
-        #remove the ones that we will ignore
+        macros_to_ignore = set(
+            [
+                macro
+                for macro in macros_to_get
+                if any(to_ignore in macro for to_ignore in ignore_macros)
+            ]
+        )
+        # remove the ones that we will ignore
         macros_to_get -= macros_to_ignore
         return Macro.mapNamesToSecurityContentObjects(list(macros_to_get), director)

contentctl 4.4.7__py3-none-any.whl → 5.0.0__py3-none-any.whl

contentctl 4.4.7__py3-none-any.whl → 5.0.0__py3-none-any.whl