cyvest 0.1.0__py3-none-any.whl → 5.1.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
cyvest/io_schema.py ADDED
@@ -0,0 +1,35 @@
1
+ """
2
+ JSON Schema definition for serialized Cyvest investigations.
3
+
4
+ The schema mirrors the structure emitted by `serialize_investigation` in
5
+ `cyvest.io_serialization` so consumers can validate exports or generate
6
+ typed bindings.
7
+
8
+ This module uses Pydantic's `model_json_schema(mode='serialization')` to generate
9
+ schemas that match the actual serialized output (respecting field_serializer decorators).
10
+ """
11
+
12
+ from __future__ import annotations
13
+
14
+ from typing import Any
15
+
16
+ from cyvest.model_schema import InvestigationSchema
17
+
18
+
19
def get_investigation_schema() -> dict[str, Any]:
    """
    Return the JSON Schema describing serialized investigations.

    The schema (JSON Schema Draft 2020-12) documents the output of
    `serialize_investigation()`. It is produced with Pydantic's
    `model_json_schema` in serialization mode, so `field_serializer`
    decorators are honored and the structure matches the actual
    `model_dump()` output. All referenced entity types (Observable,
    Check, ThreatIntel, Enrichment, Tag, InvestigationWhitelist) are
    included automatically in the `$defs` section.

    Returns:
        dict[str, Any]: Schema dictionary compliant with JSON Schema Draft 2020-12.
    """
    # by_alias=True keeps property names aligned with the serialized JSON keys.
    schema = InvestigationSchema.model_json_schema(mode="serialization", by_alias=True)
    return schema
@@ -0,0 +1,465 @@
1
+ """
2
+ Serialization and deserialization for Cyvest investigations.
3
+
4
+ Provides JSON export/import and Markdown generation for LLM consumption.
5
+ """
6
+
7
+ from __future__ import annotations
8
+
9
+ import json
10
+ from decimal import Decimal
11
+ from pathlib import Path
12
+ from typing import TYPE_CHECKING, Any
13
+
14
+ from cyvest.levels import Level, normalize_level
15
+ from cyvest.model import AuditEvent, Check, Enrichment, Observable, Relationship, Tag, ThreatIntel
16
+ from cyvest.model_enums import ObservableType
17
+ from cyvest.model_schema import InvestigationSchema
18
+ from cyvest.score import ScoreMode
19
+
20
+ if TYPE_CHECKING:
21
+ from cyvest.cyvest import Cyvest
22
+ from cyvest.investigation import Investigation
23
+
24
+
25
def serialize_investigation(inv: Investigation, *, include_audit_log: bool = True) -> InvestigationSchema:
    """
    Serialize a complete investigation to an InvestigationSchema.

    Uses InvestigationSchema for validation and automatic serialization via
    Pydantic's field_serializer decorators.

    Args:
        inv: Investigation to serialize
        include_audit_log: Include audit log in serialization (default: True).
            When False, audit_log is set to None for compact, deterministic output.

    Returns:
        InvestigationSchema instance (use .model_dump() for dict)
    """
    # Make sure check <-> observable links are consistent before snapshotting.
    inv._rebuild_all_check_links()

    # The root type and score mode are stored so a later load can rebuild the
    # investigation with the same configuration.
    root_observable = inv.get_root()
    extraction_config = {
        "root_type": root_observable.obs_type.value,
        "score_mode_obs": inv._score_engine._score_mode_obs.value,
    }

    # Build and validate the snapshot through the Pydantic model.
    return InvestigationSchema(
        investigation_id=inv.investigation_id,
        investigation_name=inv.investigation_name,
        score=inv.get_global_score(),
        level=inv.get_global_level(),
        whitelisted=inv.is_whitelisted(),
        whitelists=list(inv.get_whitelists()),
        audit_log=inv.get_audit_log() if include_audit_log else None,
        observables=dict(inv.get_all_observables()),
        checks=dict(inv.get_all_checks()),
        threat_intels=dict(inv.get_all_threat_intels()),
        enrichments=dict(inv.get_all_enrichments()),
        tags=dict(inv.get_all_tags()),
        stats=inv.get_statistics(),
        data_extraction=extraction_config,
    )
75
+
76
+
77
def save_investigation_json(inv: Investigation, filepath: str | Path, *, include_audit_log: bool = True) -> None:
    """
    Save an investigation to a JSON file.

    Args:
        inv: Investigation to save
        filepath: Path to save the JSON file
        include_audit_log: Include audit log in output (default: True).
            When False, audit_log is set to null for compact, deterministic output.
    """
    serialized = serialize_investigation(inv, include_audit_log=include_audit_log)
    # model_dump_json applies the same field serializers used by model_dump.
    payload = serialized.model_dump_json(indent=2, by_alias=True)
    with open(filepath, "w", encoding="utf-8") as handle:
        handle.write(payload)
90
+
91
+
92
def generate_markdown_report(
    inv: Investigation,
    include_tags: bool = False,
    include_enrichments: bool = False,
    include_observables: bool = True,
    exclude_levels: set[Level] | None = None,
) -> str:
    """
    Generate a Markdown report of the investigation for LLM consumption.

    Args:
        inv: Investigation
        include_tags: Include tags section in the report (default: False)
        include_enrichments: Include enrichments section in the report (default: False)
        include_observables: Include observables section in the report (default: True)
        exclude_levels: Set of levels to exclude from checks section (default: {Level.NONE})

    Returns:
        Markdown formatted report
    """
    skipped_levels = {Level.NONE} if exclude_levels is None else exclude_levels

    lines: list[str] = []
    emit = lines.append

    # Header
    emit("# Cybersecurity Investigation Report")
    emit("")
    if getattr(inv, "investigation_name", None):
        emit(f"**Investigation Name:** {inv.investigation_name}")
    emit(f"**Global Score:** {inv.get_global_score():.2f}")
    emit(f"**Global Level:** {inv.get_global_level().name}")
    whitelists = inv.get_whitelists()
    emit(f"**Whitelisted Investigation:** {'Yes' if whitelists else 'No'}")
    if whitelists:
        emit(f"**Whitelist Entries:** {len(whitelists)}")
    emit("")

    # Statistics
    stats = inv.get_statistics()
    emit("## Statistics")
    emit("")
    emit(f"- **Total Observables:** {stats.total_observables}")
    emit(f"- **Internal Observables:** {stats.internal_observables}")
    emit(f"- **External Observables:** {stats.external_observables}")
    emit(f"- **Whitelisted Observables:** {stats.whitelisted_observables}")
    emit(f"- **Total Checks:** {stats.total_checks}")
    emit(f"- **Applied Checks:** {stats.applied_checks}")
    emit(f"- **Total Threat Intel:** {stats.total_threat_intel}")
    emit("")

    # Whitelists
    if whitelists:
        emit("## Whitelists")
        emit("")
        for entry in whitelists:
            emit(f"- **{entry.identifier}** - {entry.name}")
            if entry.justification:
                emit(f"  - Justification: {entry.justification}")
        emit("")

    # Checks (the section header is emitted even when every check is filtered out)
    emit("## Checks")
    emit("")
    for check in inv.get_all_checks().values():
        if check.level in skipped_levels:
            continue
        emit(f"- **{check.check_name}**: Score: {check.score_display}, Level: {check.level.name}")
        emit(f"  - Description: {check.description}")
        if check.comment:
            emit(f"  - Comment: {check.comment}")
    emit("")

    # Observables
    if include_observables and inv.get_all_observables():
        emit("## Observables")
        emit("")
        for obs in inv.get_all_observables().values():
            emit(f"### {obs.obs_type}: {obs.value}")
            emit(f"- **Key:** {obs.key}")
            emit(f"- **Score:** {obs.score_display}")
            emit(f"- **Level:** {obs.level.name}")
            emit(f"- **Internal:** {obs.internal}")
            emit(f"- **Whitelisted:** {obs.whitelisted}")
            if obs.comment:
                emit(f"- **Comment:** {obs.comment}")
            if obs.relationships:
                emit("- **Relationships:**")
                for rel in obs.relationships:
                    # rel.direction may arrive as a plain string or an enum member.
                    raw_direction = rel.direction if isinstance(rel.direction, str) else rel.direction.value
                    arrow = {"outbound": "→", "inbound": "←", "bidirectional": "↔"}.get(raw_direction, "→")
                    emit(f"  - {rel.relationship_type} {arrow} {rel.target_key}")
            if obs.threat_intels:
                emit("- **Threat Intelligence:**")
                for ti in obs.threat_intels:
                    emit(f"  - {ti.source}: Score {ti.score_display}, Level {ti.level.name}")
                    if ti.comment:
                        emit(f"    - {ti.comment}")
            emit("")

    # Enrichments
    if include_enrichments and inv.get_all_enrichments():
        emit("## Enrichments")
        emit("")
        for enr in inv.get_all_enrichments().values():
            emit(f"### {enr.name}")
            if enr.context:
                emit(f"- **Context:** {enr.context}")
            emit(f"- **Data:** {json.dumps(enr.data, indent=2)}")
            emit("")

    # Tags
    if include_tags and inv.get_all_tags():
        emit("## Tags")
        emit("")
        for tag in inv.get_all_tags().values():
            emit(f"### {tag.name}")
            emit(f"- **Description:** {tag.description}")
            emit(f"- **Direct Score:** {tag.get_direct_score():.2f}")
            emit(f"- **Aggregated Score:** {inv.get_tag_aggregated_score(tag.name):.2f}")
            emit(f"- **Aggregated Level:** {inv.get_tag_aggregated_level(tag.name).name}")
            emit(f"- **Direct Checks:** {len(tag.checks)}")
            emit("")

    return "\n".join(lines)
220
+
221
+
222
def save_investigation_markdown(
    inv: Investigation,
    filepath: str | Path,
    include_tags: bool = False,
    include_enrichments: bool = False,
    include_observables: bool = True,
    exclude_levels: set[Level] | None = None,
) -> None:
    """
    Save an investigation as a Markdown report.

    Args:
        inv: Investigation to save
        filepath: Path to save the Markdown file
        include_tags: Include tags section in the report (default: False)
        include_enrichments: Include enrichments section in the report (default: False)
        include_observables: Include observables section in the report (default: True)
        exclude_levels: Set of levels to exclude from checks section (default: {Level.NONE})
    """
    report = generate_markdown_report(inv, include_tags, include_enrichments, include_observables, exclude_levels)
    Path(filepath).write_text(report, encoding="utf-8")
244
+
245
+
246
def load_investigation_dict(data: dict[str, Any]) -> Cyvest:
    """
    Load an investigation from a dictionary (parsed JSON) into a Cyvest object.

    Rebuilds whitelists, observables, threat intel, checks, enrichments, tags
    and the audit log from the structure produced by `serialize_investigation`.
    Missing or null sections are treated as empty, and malformed individual
    entries (whitelists, audit events) are skipped so a partially degraded
    export still loads.

    Args:
        data: Dictionary containing the serialized investigation data

    Returns:
        Reconstructed Cyvest investigation

    Raises:
        ValueError: If the payload lacks a non-empty 'investigation_id'.
    """
    # Imported here to avoid a circular import at module load time.
    from cyvest.cyvest import Cyvest
    from cyvest.investigation import Investigation

    investigation_id = data.get("investigation_id")
    if not isinstance(investigation_id, str) or not investigation_id.strip():
        raise ValueError("Serialized investigation must include 'investigation_id'.")

    root_data = data.get("root_data")
    # `or {}` / `or []` below normalizes both missing keys and explicit nulls.
    extraction = data.get("data_extraction") or {}

    root_type_raw = extraction.get("root_type")
    try:
        root_type = ObservableType.normalize_root_type(root_type_raw)
    except (TypeError, ValueError):
        # Unknown/legacy root types fall back to FILE instead of failing the load.
        root_type = ObservableType.FILE

    score_mode_raw = extraction.get("score_mode_obs")
    try:
        score_mode = ScoreMode(score_mode_raw) if score_mode_raw else ScoreMode.MAX
    except (TypeError, ValueError):
        score_mode = ScoreMode.MAX

    cv = Cyvest(root_data=root_data, root_type=root_type, score_mode_obs=score_mode)

    # Reset internal state to avoid default root pollution; auditing stays off
    # while rebuilding so the load itself is not recorded as events.
    cv._investigation = Investigation(
        root_data,
        root_type=root_type,
        score_mode_obs=score_mode,
        investigation_id=investigation_id,
    )
    cv._investigation._audit_enabled = False
    cv._investigation._audit_log = []

    investigation_name = data.get("investigation_name")
    if isinstance(investigation_name, str):
        cv._investigation.investigation_name = investigation_name

    # Whitelists: skip malformed entries rather than aborting the whole load.
    for whitelist_info in data.get("whitelists") or []:
        try:
            identifier = str(whitelist_info.get("identifier", "")).strip()
            name = str(whitelist_info.get("name", "")).strip()
            if identifier and name:
                cv._investigation.add_whitelist(
                    identifier,
                    name,
                    whitelist_info.get("justification"),
                )
        except ValueError:
            continue

    # Observables - leverage Pydantic model_validate. Two-pass so the
    # serialized root can merge into the live root after all others exist.
    new_root_key = cv._investigation.get_root().key
    root_obs_info: dict[str, Any] | None = None
    other_obs_infos: list[dict[str, Any]] = []
    for obs_info in (data.get("observables") or {}).values():
        if obs_info.get("key", "") == new_root_key:
            root_obs_info = obs_info
        else:
            other_obs_infos.append(obs_info)

    for obs_info in other_obs_infos:
        obs = Observable.model_validate(
            {
                "obs_type": obs_info.get("type", "unknown"),
                "value": obs_info.get("value", ""),
                "internal": obs_info.get("internal", True),
                "whitelisted": obs_info.get("whitelisted", False),
                "comment": obs_info.get("comment", ""),
                "extra": obs_info.get("extra", {}),
                "score": Decimal(str(obs_info.get("score", 0))),
                "level": obs_info.get("level", "INFO"),
                "key": obs_info.get("key", ""),
                "relationships": [Relationship.model_validate(rel) for rel in obs_info.get("relationships", [])],
            }
        )
        cv._investigation.add_observable(obs)

    if root_obs_info is not None:
        # Merge serialized root into the live root (preserves relationships, etc.).
        # Note: 'extra' deliberately falls back to the raw root_data payload.
        root_obs_payload = {
            "obs_type": root_obs_info.get("type", root_type),
            "value": "root",
            "internal": root_obs_info.get("internal", False),
            "whitelisted": root_obs_info.get("whitelisted", False),
            "comment": root_obs_info.get("comment", ""),
            "extra": root_obs_info.get("extra", root_data),
            "score": Decimal(str(root_obs_info.get("score", 0))),
            "level": root_obs_info.get("level", "INFO"),
            "key": new_root_key,
            "relationships": [Relationship.model_validate(rel) for rel in root_obs_info.get("relationships", [])],
        }
        cv._investigation.add_observable(Observable.model_validate(root_obs_payload))

    # Threat intel - attached only when the referenced observable exists.
    for ti_info in (data.get("threat_intels") or {}).values():
        normalized_taxonomies: list[Any] = []
        for taxonomy in ti_info.get("taxonomies", []) or []:
            if isinstance(taxonomy, dict) and "level" in taxonomy:
                taxonomy = dict(taxonomy)  # copy: don't mutate the caller's data
                taxonomy["level"] = normalize_level(taxonomy["level"])
            normalized_taxonomies.append(taxonomy)

        ti = ThreatIntel.model_validate(
            {
                "source": ti_info.get("source", ""),
                "observable_key": ti_info.get("observable_key", ""),
                "comment": ti_info.get("comment", ""),
                "extra": ti_info.get("extra", {}),
                "score": Decimal(str(ti_info.get("score", 0))),
                "level": ti_info.get("level", "INFO"),
                "taxonomies": normalized_taxonomies,
                "key": ti_info.get("key", ""),
            }
        )
        observable = cv._investigation.get_observable(ti.observable_key)
        if observable:
            cv._investigation.add_threat_intel(ti, observable)

    # Checks - accept both dict-shaped and pre-validated observable links.
    for check_info in (data.get("checks") or {}).values():
        normalized_links = []
        for link in check_info.get("observable_links", []) or []:
            if isinstance(link, dict):
                normalized_links.append(
                    {
                        "observable_key": link.get("observable_key", ""),
                        "propagation_mode": link.get("propagation_mode", "LOCAL_ONLY"),
                    }
                )
            else:
                normalized_links.append(link)
        check = Check.model_validate(
            {
                "check_name": check_info.get("check_name", ""),
                "description": check_info.get("description", ""),
                "comment": check_info.get("comment", ""),
                "extra": check_info.get("extra", {}),
                "score": Decimal(str(check_info.get("score", 0))),
                "level": check_info.get("level", "NONE"),
                "origin_investigation_id": check_info.get("origin_investigation_id")
                or cv._investigation.investigation_id,
                "observable_links": normalized_links,
                "key": check_info.get("key", ""),
            }
        )
        cv._investigation.add_check(check)

    # Enrichments
    for enr_info in (data.get("enrichments") or {}).values():
        enrichment = Enrichment.model_validate(
            {
                "name": enr_info.get("name", ""),
                "data": enr_info.get("data", {}),
                "context": enr_info.get("context", ""),
                "key": enr_info.get("key", ""),
            }
        )
        cv._investigation.add_enrichment(enrichment)

    # Tags, then re-link their checks (checks were loaded above).
    for tag_info in (data.get("tags") or {}).values():
        tag = Tag.model_validate(
            {
                "name": tag_info.get("name", ""),
                "description": tag_info.get("description", ""),
                "key": tag_info.get("key", ""),
            }
        )
        tag = cv._investigation.add_tag(tag)
        for check_key in tag_info.get("checks") or []:
            check = cv._investigation.get_check(check_key)
            if check:
                cv._investigation.add_check_to_tag(tag.key, check.key)

    cv._investigation._rebuild_all_check_links()

    # Restore the audit log last; events that no longer validate are dropped
    # (best-effort), then auditing is re-enabled for subsequent operations.
    audit_log = []
    for event_info in data.get("audit_log") or []:
        try:
            audit_log.append(AuditEvent.model_validate(event_info))
        except Exception:
            continue
    cv._investigation._audit_log = audit_log
    cv._investigation._audit_enabled = True

    return cv
450
+
451
+
452
def load_investigation_json(filepath: str | Path) -> Cyvest:
    """
    Load an investigation from a JSON file into a Cyvest object.

    Args:
        filepath: Path to the JSON file

    Returns:
        Reconstructed Cyvest investigation
    """
    raw = Path(filepath).read_text(encoding="utf-8")
    return load_investigation_dict(json.loads(raw))