ddeutil-workflow 0.0.78__py3-none-any.whl → 0.0.80__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ddeutil/workflow/__about__.py +1 -1
- ddeutil/workflow/__init__.py +2 -6
- ddeutil/workflow/api/routes/job.py +2 -2
- ddeutil/workflow/api/routes/logs.py +5 -5
- ddeutil/workflow/api/routes/workflows.py +3 -3
- ddeutil/workflow/audits.py +547 -176
- ddeutil/workflow/cli.py +19 -1
- ddeutil/workflow/conf.py +10 -20
- ddeutil/workflow/event.py +15 -6
- ddeutil/workflow/job.py +147 -74
- ddeutil/workflow/params.py +172 -58
- ddeutil/workflow/plugins/__init__.py +0 -0
- ddeutil/workflow/plugins/providers/__init__.py +0 -0
- ddeutil/workflow/plugins/providers/aws.py +908 -0
- ddeutil/workflow/plugins/providers/az.py +1003 -0
- ddeutil/workflow/plugins/providers/container.py +703 -0
- ddeutil/workflow/plugins/providers/gcs.py +826 -0
- ddeutil/workflow/result.py +6 -4
- ddeutil/workflow/reusables.py +151 -95
- ddeutil/workflow/stages.py +28 -28
- ddeutil/workflow/traces.py +1697 -541
- ddeutil/workflow/utils.py +109 -67
- ddeutil/workflow/workflow.py +42 -30
- {ddeutil_workflow-0.0.78.dist-info → ddeutil_workflow-0.0.80.dist-info}/METADATA +39 -19
- ddeutil_workflow-0.0.80.dist-info/RECORD +36 -0
- ddeutil_workflow-0.0.78.dist-info/RECORD +0 -30
- {ddeutil_workflow-0.0.78.dist-info → ddeutil_workflow-0.0.80.dist-info}/WHEEL +0 -0
- {ddeutil_workflow-0.0.78.dist-info → ddeutil_workflow-0.0.80.dist-info}/entry_points.txt +0 -0
- {ddeutil_workflow-0.0.78.dist-info → ddeutil_workflow-0.0.80.dist-info}/licenses/LICENSE +0 -0
- {ddeutil_workflow-0.0.78.dist-info → ddeutil_workflow-0.0.80.dist-info}/top_level.txt +0 -0
ddeutil/workflow/audits.py
CHANGED
@@ -9,26 +9,31 @@ This module provides comprehensive audit capabilities for workflow execution
|
|
9
9
|
tracking and monitoring. It supports multiple audit backends for capturing
|
10
10
|
execution metadata, status information, and detailed logging.
|
11
11
|
|
12
|
+
Be noted that, you can set only one audit backend setting for the current
|
13
|
+
run-time because it will conflict audit data if you set more than one audit
|
14
|
+
backend pointer.
|
15
|
+
|
12
16
|
The audit system tracks workflow, job, and stage executions with configurable
|
13
|
-
storage backends including file-based JSON storage
|
17
|
+
storage backends including file-based JSON storage, database persistence, and
|
18
|
+
more (as far as this package has already implemented).
|
19
|
+
|
20
|
+
That means if you release the workflow with the same release date with force mode,
|
21
|
+
it will overwrite the previous release log. By the way, if you do not pass any
|
22
|
+
release mode, it will not overwrite the previous release log and return the skip
|
23
|
+
status to you because it has already been released.
|
14
24
|
|
15
25
|
Classes:
|
16
|
-
|
26
|
+
BaseAudit: Abstract base class for audit implementations
|
17
27
|
FileAudit: File-based audit storage implementation
|
28
|
+
SQLiteAudit: SQLite database audit storage implementation
|
18
29
|
|
19
30
|
Functions:
|
20
31
|
get_audit_model: Factory function for creating audit instances
|
21
32
|
|
22
33
|
Example:
|
23
34
|
|
24
|
-
|
25
|
-
|
26
|
-
|
27
|
-
# NOTE: Create file-based Audit.
|
28
|
-
audit = get_audit_model(run_id="run-123")
|
29
|
-
audit.info("Workflow execution started")
|
30
|
-
audit.success("Workflow completed successfully")
|
31
|
-
```
|
35
|
+
>>> from ddeutil.workflow.audits import get_audit
|
36
|
+
>>> audit = get_audit(run_id="run-123")
|
32
37
|
|
33
38
|
Note:
|
34
39
|
Audit instances are automatically configured based on the workflow
|
@@ -39,35 +44,27 @@ from __future__ import annotations
|
|
39
44
|
import json
|
40
45
|
import logging
|
41
46
|
import os
|
47
|
+
import sqlite3
|
48
|
+
import zlib
|
42
49
|
from abc import ABC, abstractmethod
|
43
50
|
from collections.abc import Iterator
|
44
|
-
from datetime import datetime
|
51
|
+
from datetime import datetime, timedelta
|
45
52
|
from pathlib import Path
|
46
|
-
from typing import ClassVar, Optional, Union
|
47
|
-
from urllib.parse import ParseResult
|
53
|
+
from typing import Annotated, Any, ClassVar, Literal, Optional, Union
|
54
|
+
from urllib.parse import ParseResult, urlparse
|
48
55
|
|
49
|
-
from pydantic import BaseModel, Field
|
50
|
-
from pydantic.
|
51
|
-
from pydantic.functional_validators import model_validator
|
56
|
+
from pydantic import BaseModel, Field, TypeAdapter
|
57
|
+
from pydantic.functional_validators import field_validator, model_validator
|
52
58
|
from typing_extensions import Self
|
53
59
|
|
54
60
|
from .__types import DictData
|
55
61
|
from .conf import dynamic
|
56
|
-
from .traces import
|
62
|
+
from .traces import TraceManager, get_trace, set_logging
|
57
63
|
|
58
64
|
logger = logging.getLogger("ddeutil.workflow")
|
59
65
|
|
60
66
|
|
61
|
-
class
|
62
|
-
"""Base Audit Pydantic Model with abstraction class property that implement
|
63
|
-
only model fields. This model should to use with inherit to logging
|
64
|
-
subclass like file, sqlite, etc.
|
65
|
-
"""
|
66
|
-
|
67
|
-
extras: DictData = Field(
|
68
|
-
default_factory=dict,
|
69
|
-
description="An extras parameter that want to override core config",
|
70
|
-
)
|
67
|
+
class AuditData(BaseModel):
|
71
68
|
name: str = Field(description="A workflow name.")
|
72
69
|
release: datetime = Field(description="A release datetime.")
|
73
70
|
type: str = Field(description="A running type before logging.")
|
@@ -84,11 +81,36 @@ class BaseAudit(BaseModel, ABC):
|
|
84
81
|
description="A runs metadata that will use to tracking this audit log.",
|
85
82
|
)
|
86
83
|
|
84
|
+
|
85
|
+
class BaseAudit(BaseModel, ABC):
|
86
|
+
"""Base Audit Pydantic Model with abstraction class property.
|
87
|
+
|
88
|
+
This model implements only model fields and should be used as a base class
|
89
|
+
for logging subclasses like file, sqlite, etc.
|
90
|
+
"""
|
91
|
+
|
92
|
+
type: str
|
93
|
+
extras: DictData = Field(
|
94
|
+
default_factory=dict,
|
95
|
+
description="An extras parameter that want to override core config",
|
96
|
+
)
|
97
|
+
|
98
|
+
@field_validator("extras", mode="before")
|
99
|
+
def validate_extras(cls, v: Any) -> DictData:
|
100
|
+
"""Validate extras field to ensure it's a dictionary."""
|
101
|
+
if v is None:
|
102
|
+
return {}
|
103
|
+
return v
|
104
|
+
|
87
105
|
@model_validator(mode="after")
|
88
106
|
def __model_action(self) -> Self:
|
89
|
-
"""
|
107
|
+
"""Perform actions before Audit initialization.
|
108
|
+
|
109
|
+
This method checks the WORKFLOW_AUDIT_ENABLE_WRITE environment variable
|
110
|
+
and performs necessary setup actions.
|
90
111
|
|
91
|
-
:
|
112
|
+
Returns:
|
113
|
+
Self: The validated model instance.
|
92
114
|
"""
|
93
115
|
if dynamic("enable_write_audit", extras=self.extras):
|
94
116
|
self.do_before()
|
@@ -97,199 +119,278 @@ class BaseAudit(BaseModel, ABC):
|
|
97
119
|
set_logging("ddeutil.workflow")
|
98
120
|
return self
|
99
121
|
|
100
|
-
@classmethod
|
101
122
|
@abstractmethod
|
102
123
|
def is_pointed(
|
103
|
-
|
104
|
-
|
105
|
-
release: datetime,
|
124
|
+
self,
|
125
|
+
data: AuditData,
|
106
126
|
*,
|
107
127
|
extras: Optional[DictData] = None,
|
108
128
|
) -> bool:
|
129
|
+
"""Check if audit data exists for the given workflow and release.
|
130
|
+
|
131
|
+
Args:
|
132
|
+
data:
|
133
|
+
extras: Optional extra parameters to override core config.
|
134
|
+
|
135
|
+
Returns:
|
136
|
+
bool: True if audit data exists, False otherwise.
|
137
|
+
|
138
|
+
Raises:
|
139
|
+
NotImplementedError: If the method is not implemented by subclass.
|
140
|
+
"""
|
109
141
|
raise NotImplementedError(
|
110
142
|
"Audit should implement `is_pointed` class-method"
|
111
143
|
)
|
112
144
|
|
113
|
-
@classmethod
|
114
145
|
@abstractmethod
|
115
146
|
def find_audits(
|
116
|
-
|
147
|
+
self,
|
117
148
|
name: str,
|
118
149
|
*,
|
119
150
|
extras: Optional[DictData] = None,
|
120
151
|
) -> Iterator[Self]:
|
152
|
+
"""Find all audit data for a given workflow name.
|
153
|
+
|
154
|
+
Args:
|
155
|
+
name: The workflow name to search for.
|
156
|
+
extras: Optional extra parameters to override core config.
|
157
|
+
|
158
|
+
Returns:
|
159
|
+
Iterator[Self]: Iterator of audit instances.
|
160
|
+
|
161
|
+
Raises:
|
162
|
+
NotImplementedError: If the method is not implemented by subclass.
|
163
|
+
"""
|
121
164
|
raise NotImplementedError(
|
122
165
|
"Audit should implement `find_audits` class-method"
|
123
166
|
)
|
124
167
|
|
125
|
-
@classmethod
|
126
168
|
@abstractmethod
|
127
169
|
def find_audit_with_release(
|
128
|
-
|
170
|
+
self,
|
129
171
|
name: str,
|
130
172
|
release: Optional[datetime] = None,
|
131
173
|
*,
|
132
174
|
extras: Optional[DictData] = None,
|
133
175
|
) -> Self:
|
176
|
+
"""Find audit data for a specific workflow and release.
|
177
|
+
|
178
|
+
Args:
|
179
|
+
name: The workflow name to search for.
|
180
|
+
release: Optional release datetime. If None, returns latest release.
|
181
|
+
extras: Optional extra parameters to override core config.
|
182
|
+
|
183
|
+
Returns:
|
184
|
+
Self: The audit instance for the specified workflow and release.
|
185
|
+
|
186
|
+
Raises:
|
187
|
+
NotImplementedError: If the method is not implemented by subclass.
|
188
|
+
"""
|
134
189
|
raise NotImplementedError(
|
135
190
|
"Audit should implement `find_audit_with_release` class-method"
|
136
191
|
)
|
137
192
|
|
138
|
-
def do_before(self) -> None:
|
139
|
-
"""
|
193
|
+
def do_before(self) -> None:
|
194
|
+
"""Perform actions before the end of initial log model setup.
|
195
|
+
|
196
|
+
This method is called during model validation and can be overridden
|
197
|
+
by subclasses to perform custom initialization actions.
|
198
|
+
"""
|
140
199
|
|
141
200
|
@abstractmethod
|
142
|
-
def save(
|
143
|
-
|
201
|
+
def save(
|
202
|
+
self, data: Any, excluded: Optional[list[str]] = None
|
203
|
+
) -> Self: # pragma: no cov
|
204
|
+
"""Save this model logging to target logging store.
|
205
|
+
|
206
|
+
Args:
|
207
|
+
data:
|
208
|
+
excluded: Optional list of field names to exclude from saving.
|
209
|
+
|
210
|
+
Returns:
|
211
|
+
Self: The audit instance after saving.
|
212
|
+
|
213
|
+
Raises:
|
214
|
+
NotImplementedError: If the method is not implemented by subclass.
|
215
|
+
"""
|
144
216
|
raise NotImplementedError("Audit should implement `save` method.")
|
145
217
|
|
146
218
|
|
147
219
|
class FileAudit(BaseAudit):
|
148
|
-
"""File Audit Pydantic Model
|
149
|
-
|
150
|
-
|
220
|
+
"""File Audit Pydantic Model for saving log data from workflow execution.
|
221
|
+
|
222
|
+
This class inherits from BaseAudit and implements file-based storage
|
223
|
+
for audit logs. It saves workflow execution results to JSON files
|
224
|
+
in a structured directory hierarchy.
|
225
|
+
|
226
|
+
Attributes:
|
227
|
+
filename_fmt: Class variable defining the filename format for audit files.
|
151
228
|
"""
|
152
229
|
|
153
230
|
filename_fmt: ClassVar[str] = (
|
154
231
|
"workflow={name}/release={release:%Y%m%d%H%M%S}"
|
155
232
|
)
|
156
233
|
|
157
|
-
|
158
|
-
|
159
|
-
|
160
|
-
|
161
|
-
|
162
|
-
}
|
234
|
+
type: Literal["file"] = "file"
|
235
|
+
path: str = Field(
|
236
|
+
default="./audits",
|
237
|
+
description="A file path that use to manage audit logs.",
|
238
|
+
)
|
163
239
|
|
164
240
|
def do_before(self) -> None:
|
165
|
-
"""Create directory of release before saving log file.
|
166
|
-
|
241
|
+
"""Create directory of release before saving log file.
|
242
|
+
|
243
|
+
This method ensures the target directory exists before attempting
|
244
|
+
to save audit log files.
|
245
|
+
"""
|
246
|
+
Path(self.path).mkdir(parents=True, exist_ok=True)
|
167
247
|
|
168
|
-
@classmethod
|
169
248
|
def find_audits(
|
170
|
-
|
171
|
-
) -> Iterator[
|
172
|
-
"""Generate
|
173
|
-
|
249
|
+
self, name: str, *, extras: Optional[DictData] = None
|
250
|
+
) -> Iterator[AuditData]:
|
251
|
+
"""Generate audit data found from logs path for a specific workflow name.
|
252
|
+
|
253
|
+
Args:
|
254
|
+
name: The workflow name to search for release logging data.
|
255
|
+
extras: Optional extra parameters to override core config.
|
174
256
|
|
175
|
-
:
|
176
|
-
|
257
|
+
Returns:
|
258
|
+
Iterator[Self]: Iterator of audit instances found for the workflow.
|
177
259
|
|
178
|
-
:
|
260
|
+
Raises:
|
261
|
+
FileNotFoundError: If the workflow directory does not exist.
|
179
262
|
"""
|
180
|
-
pointer: Path = (
|
181
|
-
Path(dynamic("audit_url", extras=extras).path) / f"workflow={name}"
|
182
|
-
)
|
263
|
+
pointer: Path = Path(self.path) / f"workflow={name}"
|
183
264
|
if not pointer.exists():
|
184
265
|
raise FileNotFoundError(f"Pointer: {pointer.absolute()}.")
|
185
266
|
|
186
267
|
for file in pointer.glob("./release=*/*.log"):
|
187
268
|
with file.open(mode="r", encoding="utf-8") as f:
|
188
|
-
yield
|
269
|
+
yield AuditData.model_validate(obj=json.load(f))
|
189
270
|
|
190
|
-
@classmethod
|
191
271
|
def find_audit_with_release(
|
192
|
-
|
272
|
+
self,
|
193
273
|
name: str,
|
194
274
|
release: Optional[datetime] = None,
|
195
275
|
*,
|
196
276
|
extras: Optional[DictData] = None,
|
197
|
-
) ->
|
198
|
-
"""Return
|
199
|
-
|
200
|
-
|
277
|
+
) -> AuditData:
|
278
|
+
"""Return audit data found from logs path for specific workflow and release.
|
279
|
+
|
280
|
+
If a release is not provided, it will return the latest release from
|
281
|
+
the current log path.
|
201
282
|
|
202
|
-
:
|
203
|
-
|
204
|
-
|
283
|
+
Args:
|
284
|
+
name: The workflow name to search for.
|
285
|
+
release: Optional release datetime to search for.
|
286
|
+
extras: Optional extra parameters to override core config.
|
205
287
|
|
206
|
-
:
|
207
|
-
|
208
|
-
method. Because this method does not implement latest log.
|
288
|
+
Returns:
|
289
|
+
AuditData: The audit instance for the specified workflow and release.
|
209
290
|
|
210
|
-
:
|
291
|
+
Raises:
|
292
|
+
FileNotFoundError: If the specified workflow/release directory does not exist.
|
293
|
+
ValueError: If no releases found when release is None.
|
211
294
|
"""
|
212
295
|
if release is None:
|
213
|
-
|
296
|
+
pointer: Path = Path(self.path) / f"workflow={name}"
|
297
|
+
if not pointer.exists():
|
298
|
+
raise FileNotFoundError(f"Pointer: {pointer.absolute()}.")
|
299
|
+
|
300
|
+
if not any(pointer.glob("./release=*")):
|
301
|
+
raise FileNotFoundError(
|
302
|
+
f"No releases found for workflow: {name}"
|
303
|
+
)
|
304
|
+
|
305
|
+
# NOTE: Get the latest release directory
|
306
|
+
release_pointer = max(
|
307
|
+
pointer.glob("./release=*"), key=os.path.getctime
|
308
|
+
)
|
309
|
+
else:
|
310
|
+
release_pointer: Path = (
|
311
|
+
Path(self.path)
|
312
|
+
/ f"workflow={name}/release={release:%Y%m%d%H%M%S}"
|
313
|
+
)
|
314
|
+
if not release_pointer.exists():
|
315
|
+
raise FileNotFoundError(
|
316
|
+
f"Pointer: {release_pointer} does not found."
|
317
|
+
)
|
214
318
|
|
215
|
-
|
216
|
-
Path(dynamic("audit_url", extras=extras).path)
|
217
|
-
/ f"workflow={name}/release={release:%Y%m%d%H%M%S}"
|
218
|
-
)
|
219
|
-
if not pointer.exists():
|
319
|
+
if not any(release_pointer.glob("./*.log")):
|
220
320
|
raise FileNotFoundError(
|
221
|
-
f"Pointer:
|
222
|
-
f"release={release:%Y%m%d%H%M%S} does not found."
|
321
|
+
f"Pointer: {release_pointer} does not contain any log."
|
223
322
|
)
|
224
323
|
|
225
|
-
latest_file: Path = max(
|
324
|
+
latest_file: Path = max(
|
325
|
+
release_pointer.glob("./*.log"), key=os.path.getctime
|
326
|
+
)
|
226
327
|
with latest_file.open(mode="r", encoding="utf-8") as f:
|
227
|
-
return
|
328
|
+
return AuditData.model_validate(obj=json.load(f))
|
228
329
|
|
229
|
-
@classmethod
|
230
330
|
def is_pointed(
|
231
|
-
|
232
|
-
name: str,
|
233
|
-
release: datetime,
|
234
|
-
*,
|
235
|
-
extras: Optional[DictData] = None,
|
331
|
+
self, data: AuditData, *, extras: Optional[DictData] = None
|
236
332
|
) -> bool:
|
237
|
-
"""Check the release log already
|
238
|
-
log path.
|
333
|
+
"""Check if the release log already exists at the destination log path.
|
239
334
|
|
240
|
-
:
|
241
|
-
|
242
|
-
|
335
|
+
Args:
|
336
|
+
data: The workflow name.
|
337
|
+
extras: Optional extra parameters to override core config.
|
243
338
|
|
244
|
-
:
|
245
|
-
|
339
|
+
Returns:
|
340
|
+
bool: True if the release log exists, False otherwise.
|
246
341
|
"""
|
247
342
|
# NOTE: Return False if enable writing log flag does not set.
|
248
343
|
if not dynamic("enable_write_audit", extras=extras):
|
249
344
|
return False
|
345
|
+
return self.pointer(data).exists()
|
250
346
|
|
251
|
-
|
252
|
-
|
253
|
-
dynamic("audit_url", extras=extras).path
|
254
|
-
) / cls.filename_fmt.format(name=name, release=release)
|
255
|
-
|
256
|
-
return pointer.exists()
|
347
|
+
def pointer(self, data: AuditData) -> Path:
|
348
|
+
"""Return release directory path generated from model data.
|
257
349
|
|
258
|
-
|
259
|
-
|
260
|
-
|
261
|
-
:rtype: Path
|
350
|
+
Returns:
|
351
|
+
Path: The directory path for the current workflow and release.
|
262
352
|
"""
|
263
|
-
return Path(
|
264
|
-
|
265
|
-
)
|
353
|
+
return Path(self.path) / self.filename_fmt.format(
|
354
|
+
name=data.name, release=data.release
|
355
|
+
)
|
266
356
|
|
267
|
-
def save(self, excluded: Optional[list[str]] = None) -> Self:
|
268
|
-
"""Save logging data
|
269
|
-
execution result.
|
357
|
+
def save(self, data: Any, excluded: Optional[list[str]] = None) -> Self:
|
358
|
+
"""Save logging data received from workflow execution result.
|
270
359
|
|
271
|
-
:
|
272
|
-
|
360
|
+
Args:
|
361
|
+
data:
|
362
|
+
excluded: Optional list of field names to exclude from saving.
|
273
363
|
|
274
|
-
:
|
364
|
+
Returns:
|
365
|
+
Self: The audit instance after saving.
|
275
366
|
"""
|
276
|
-
|
277
|
-
|
278
|
-
|
367
|
+
audit = AuditData.model_validate(data)
|
368
|
+
trace: TraceManager = get_trace(
|
369
|
+
audit.run_id,
|
370
|
+
parent_run_id=audit.parent_run_id,
|
279
371
|
extras=self.extras,
|
280
372
|
)
|
281
373
|
|
282
374
|
# NOTE: Check environ variable was set for real writing.
|
283
375
|
if not dynamic("enable_write_audit", extras=self.extras):
|
284
|
-
trace.debug("[AUDIT]: Skip writing log cause config was set")
|
376
|
+
trace.debug("[AUDIT]: Skip writing audit log cause config was set.")
|
285
377
|
return self
|
286
378
|
|
287
|
-
|
288
|
-
|
379
|
+
pointer: Path = self.pointer(data=audit)
|
380
|
+
if not pointer.exists():
|
381
|
+
pointer.mkdir(parents=True)
|
382
|
+
|
383
|
+
log_file: Path = pointer / f"{audit.parent_run_id or audit.run_id}.log"
|
384
|
+
|
385
|
+
# NOTE: Convert excluded list to set for pydantic compatibility
|
386
|
+
exclude_set = set(excluded) if excluded else None
|
387
|
+
trace.info(
|
388
|
+
f"[AUDIT]: Start writing audit log with "
|
389
|
+
f"release: {audit.release:%Y%m%d%H%M%S}"
|
289
390
|
)
|
290
391
|
log_file.write_text(
|
291
392
|
json.dumps(
|
292
|
-
|
393
|
+
audit.model_dump(exclude=exclude_set),
|
293
394
|
default=str,
|
294
395
|
indent=2,
|
295
396
|
),
|
@@ -297,34 +398,116 @@ class FileAudit(BaseAudit):
|
|
297
398
|
)
|
298
399
|
return self
|
299
400
|
|
401
|
+
def cleanup(self, max_age_days: int = 180) -> int: # pragma: no cov
|
402
|
+
"""Clean up old audit files based on its age.
|
403
|
+
|
404
|
+
Args:
|
405
|
+
max_age_days: Maximum age in days for audit files to keep.
|
406
|
+
|
407
|
+
Returns:
|
408
|
+
int: Number of files cleaned up.
|
409
|
+
"""
|
410
|
+
audit_url = dynamic("audit_url", extras=self.extras)
|
411
|
+
if audit_url is None:
|
412
|
+
return 0
|
413
|
+
|
414
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
415
|
+
base_path = Path(audit_url_parse.path)
|
416
|
+
cutoff_time = datetime.now().timestamp() - (max_age_days * 24 * 3600)
|
417
|
+
cleaned_count: int = 0
|
418
|
+
|
419
|
+
for workflow_dir in base_path.glob("workflow=*"):
|
420
|
+
for release_dir in workflow_dir.glob("release=*"):
|
421
|
+
if release_dir.stat().st_mtime < cutoff_time:
|
422
|
+
import shutil
|
423
|
+
|
424
|
+
shutil.rmtree(release_dir)
|
425
|
+
cleaned_count += 1
|
426
|
+
|
427
|
+
return cleaned_count
|
428
|
+
|
300
429
|
|
301
430
|
class SQLiteAudit(BaseAudit): # pragma: no cov
|
302
|
-
"""SQLite Audit model.
|
431
|
+
"""SQLite Audit model for database-based audit storage.
|
432
|
+
|
433
|
+
This class inherits from BaseAudit and implements SQLite database storage
|
434
|
+
for audit logs with compression support.
|
435
|
+
|
436
|
+
Attributes:
|
437
|
+
table_name: Class variable defining the database table name.
|
438
|
+
schemas: Class variable defining the database schema.
|
439
|
+
"""
|
303
440
|
|
304
441
|
table_name: ClassVar[str] = "audits"
|
305
442
|
schemas: ClassVar[
|
306
443
|
str
|
307
444
|
] = """
|
308
|
-
|
309
|
-
|
310
|
-
|
311
|
-
|
312
|
-
|
313
|
-
|
314
|
-
|
315
|
-
|
316
|
-
|
317
|
-
|
445
|
+
CREATE TABLE IF NOT EXISTS audits (
|
446
|
+
workflow TEXT NOT NULL
|
447
|
+
, release TEXT NOT NULL
|
448
|
+
, type TEXT NOT NULL
|
449
|
+
, context BLOB NOT NULL
|
450
|
+
, parent_run_id TEXT
|
451
|
+
, run_id TEXT NOT NULL
|
452
|
+
, metadata BLOB NOT NULL
|
453
|
+
, created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
|
454
|
+
, updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
|
455
|
+
, PRIMARY KEY ( workflow, release )
|
456
|
+
)
|
318
457
|
"""
|
319
458
|
|
320
|
-
|
459
|
+
type: Literal["sqlite"] = "sqlite"
|
460
|
+
path: str
|
461
|
+
|
462
|
+
def _ensure_table_exists(self) -> None:
|
463
|
+
"""Ensure the audit table exists in the database."""
|
464
|
+
audit_url = dynamic("audit_url", extras=self.extras)
|
465
|
+
if audit_url is None or not audit_url.path:
|
466
|
+
raise ValueError(
|
467
|
+
"SQLite audit_url must specify a database file path"
|
468
|
+
)
|
469
|
+
|
470
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
471
|
+
db_path = Path(audit_url_parse.path)
|
472
|
+
db_path.parent.mkdir(parents=True, exist_ok=True)
|
473
|
+
|
474
|
+
with sqlite3.connect(db_path) as conn:
|
475
|
+
conn.execute(self.schemas)
|
476
|
+
conn.commit()
|
477
|
+
|
321
478
|
def is_pointed(
|
322
|
-
|
323
|
-
|
324
|
-
release: datetime,
|
479
|
+
self,
|
480
|
+
data: AuditData,
|
325
481
|
*,
|
326
482
|
extras: Optional[DictData] = None,
|
327
|
-
) -> bool:
|
483
|
+
) -> bool:
|
484
|
+
"""Check if audit data exists for the given workflow and release.
|
485
|
+
|
486
|
+
Args:
|
487
|
+
data:
|
488
|
+
extras: Optional extra parameters to override core config.
|
489
|
+
|
490
|
+
Returns:
|
491
|
+
bool: True if audit data exists, False otherwise.
|
492
|
+
"""
|
493
|
+
if not dynamic("enable_write_audit", extras=extras):
|
494
|
+
return False
|
495
|
+
|
496
|
+
audit_url = dynamic("audit_url", extras=extras)
|
497
|
+
if audit_url is None or not audit_url.path:
|
498
|
+
return False
|
499
|
+
|
500
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
501
|
+
db_path = Path(audit_url_parse.path)
|
502
|
+
if not db_path.exists():
|
503
|
+
return False
|
504
|
+
|
505
|
+
with sqlite3.connect(db_path) as conn:
|
506
|
+
cursor = conn.execute(
|
507
|
+
"SELECT COUNT(*) FROM audits WHERE workflow = ? AND release = ?",
|
508
|
+
(data.name, data.release.isoformat()),
|
509
|
+
)
|
510
|
+
return cursor.fetchone()[0] > 0
|
328
511
|
|
329
512
|
@classmethod
|
330
513
|
def find_audits(
|
@@ -332,7 +515,44 @@ class SQLiteAudit(BaseAudit): # pragma: no cov
|
|
332
515
|
name: str,
|
333
516
|
*,
|
334
517
|
extras: Optional[DictData] = None,
|
335
|
-
) -> Iterator[Self]:
|
518
|
+
) -> Iterator[Self]:
|
519
|
+
"""Find all audit data for a given workflow name.
|
520
|
+
|
521
|
+
Args:
|
522
|
+
name: The workflow name to search for.
|
523
|
+
extras: Optional extra parameters to override core config.
|
524
|
+
|
525
|
+
Returns:
|
526
|
+
Iterator[Self]: Iterator of audit instances.
|
527
|
+
"""
|
528
|
+
audit_url = dynamic("audit_url", extras=extras)
|
529
|
+
if audit_url is None or not audit_url.path:
|
530
|
+
return
|
531
|
+
|
532
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
533
|
+
db_path = Path(audit_url_parse.path)
|
534
|
+
if not db_path.exists():
|
535
|
+
return
|
536
|
+
|
537
|
+
with sqlite3.connect(db_path) as conn:
|
538
|
+
cursor = conn.execute(
|
539
|
+
"SELECT * FROM audits WHERE workflow = ? ORDER BY release DESC",
|
540
|
+
(name,),
|
541
|
+
)
|
542
|
+
for row in cursor.fetchall():
|
543
|
+
# Decompress context and metadata
|
544
|
+
context = json.loads(cls._decompress_data(row[3]))
|
545
|
+
metadata = json.loads(cls._decompress_data(row[6]))
|
546
|
+
|
547
|
+
yield AuditData(
|
548
|
+
name=row[0],
|
549
|
+
release=datetime.fromisoformat(row[1]),
|
550
|
+
type=row[2],
|
551
|
+
context=context,
|
552
|
+
parent_run_id=row[4],
|
553
|
+
run_id=row[5],
|
554
|
+
runs_metadata=metadata,
|
555
|
+
)
|
336
556
|
|
337
557
|
@classmethod
|
338
558
|
def find_audit_with_release(
|
@@ -341,54 +561,205 @@ class SQLiteAudit(BaseAudit): # pragma: no cov
|
|
341
561
|
release: Optional[datetime] = None,
|
342
562
|
*,
|
343
563
|
extras: Optional[DictData] = None,
|
344
|
-
) ->
|
564
|
+
) -> AuditData:
|
565
|
+
"""Find audit data for a specific workflow and release.
|
566
|
+
|
567
|
+
Args:
|
568
|
+
name: The workflow name to search for.
|
569
|
+
release: Optional release datetime. If None, returns latest release.
|
570
|
+
extras: Optional extra parameters to override core config.
|
571
|
+
|
572
|
+
Returns:
|
573
|
+
Self: The audit instance for the specified workflow and release.
|
574
|
+
|
575
|
+
Raises:
|
576
|
+
FileNotFoundError: If the specified workflow/release is not found.
|
577
|
+
"""
|
578
|
+
audit_url = dynamic("audit_url", extras=extras)
|
579
|
+
if audit_url is None or not audit_url.path:
|
580
|
+
raise FileNotFoundError("SQLite database not configured")
|
581
|
+
|
582
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
583
|
+
db_path = Path(audit_url_parse.path)
|
584
|
+
if not db_path.exists():
|
585
|
+
raise FileNotFoundError(f"Database file not found: {db_path}")
|
586
|
+
|
587
|
+
with sqlite3.connect(db_path) as conn:
|
588
|
+
if release is None:
|
589
|
+
# Get latest release
|
590
|
+
cursor = conn.execute(
|
591
|
+
"SELECT * FROM audits WHERE workflow = ? ORDER BY release DESC LIMIT 1",
|
592
|
+
(name,),
|
593
|
+
)
|
594
|
+
else:
|
595
|
+
cursor = conn.execute(
|
596
|
+
"SELECT * FROM audits WHERE workflow = ? AND release = ?",
|
597
|
+
(name, release.isoformat()),
|
598
|
+
)
|
599
|
+
|
600
|
+
row = cursor.fetchone()
|
601
|
+
if not row:
|
602
|
+
raise FileNotFoundError(
|
603
|
+
f"Audit not found for workflow: {name}, release: {release}"
|
604
|
+
)
|
605
|
+
|
606
|
+
# Decompress context and metadata
|
607
|
+
context = json.loads(cls._decompress_data(row[3]))
|
608
|
+
metadata = json.loads(cls._decompress_data(row[6]))
|
609
|
+
|
610
|
+
return AuditData(
|
611
|
+
name=row[0],
|
612
|
+
release=datetime.fromisoformat(row[1]),
|
613
|
+
type=row[2],
|
614
|
+
context=context,
|
615
|
+
parent_run_id=row[4],
|
616
|
+
run_id=row[5],
|
617
|
+
runs_metadata=metadata,
|
618
|
+
)
|
619
|
+
|
620
|
+
@staticmethod
|
621
|
+
def _compress_data(data: str) -> bytes:
|
622
|
+
"""Compress audit data for storage efficiency.
|
623
|
+
|
624
|
+
Args:
|
625
|
+
data: JSON string data to compress.
|
626
|
+
|
627
|
+
Returns:
|
628
|
+
bytes: Compressed data.
|
629
|
+
"""
|
630
|
+
return zlib.compress(data.encode("utf-8"))
|
631
|
+
|
632
|
+
@staticmethod
|
633
|
+
def _decompress_data(data: bytes) -> str:
|
634
|
+
"""Decompress audit data.
|
635
|
+
|
636
|
+
Args:
|
637
|
+
data: Compressed data to decompress.
|
638
|
+
|
639
|
+
Returns:
|
640
|
+
str: Decompressed JSON string.
|
641
|
+
"""
|
642
|
+
return zlib.decompress(data).decode("utf-8")
|
643
|
+
|
644
|
+
def save(self, data: Any, excluded: Optional[list[str]] = None) -> Self:
|
645
|
+
"""Save logging data received from workflow execution result.
|
646
|
+
|
647
|
+
Args:
|
648
|
+
data: Any
|
649
|
+
excluded: Optional list of field names to exclude from saving.
|
650
|
+
|
651
|
+
Returns:
|
652
|
+
Self: The audit instance after saving.
|
345
653
|
|
346
|
-
|
347
|
-
|
348
|
-
execution result.
|
654
|
+
Raises:
|
655
|
+
ValueError: If SQLite database is not properly configured.
|
349
656
|
"""
|
350
|
-
|
351
|
-
|
352
|
-
|
657
|
+
audit = AuditData.model_validate(data)
|
658
|
+
trace: TraceManager = get_trace(
|
659
|
+
audit.run_id,
|
660
|
+
parent_run_id=audit.parent_run_id,
|
353
661
|
extras=self.extras,
|
354
662
|
)
|
355
663
|
|
356
664
|
# NOTE: Check environ variable was set for real writing.
|
357
665
|
if not dynamic("enable_write_audit", extras=self.extras):
|
358
|
-
trace.debug("[AUDIT]: Skip writing log cause config was set")
|
666
|
+
trace.debug("[AUDIT]: Skip writing audit log cause config was set.")
|
359
667
|
return self
|
360
668
|
|
361
|
-
|
669
|
+
audit_url = dynamic("audit_url", extras=self.extras)
|
670
|
+
if audit_url is None or not audit_url.path:
|
671
|
+
raise ValueError(
|
672
|
+
"SQLite audit_url must specify a database file path"
|
673
|
+
)
|
674
|
+
|
675
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
676
|
+
db_path = Path(audit_url_parse.path)
|
677
|
+
db_path.parent.mkdir(parents=True, exist_ok=True)
|
678
|
+
|
679
|
+
# Prepare data for storage
|
680
|
+
exclude_set = set(excluded) if excluded else None
|
681
|
+
model_data = audit.model_dump(exclude=exclude_set)
|
682
|
+
|
683
|
+
# Compress context and metadata
|
684
|
+
context_blob = self._compress_data(
|
685
|
+
json.dumps(model_data.get("context", {}))
|
686
|
+
)
|
687
|
+
metadata_blob = self._compress_data(
|
688
|
+
json.dumps(model_data.get("runs_metadata", {}))
|
689
|
+
)
|
690
|
+
|
691
|
+
with sqlite3.connect(db_path) as conn:
|
692
|
+
conn.execute(
|
693
|
+
"""
|
694
|
+
INSERT OR REPLACE INTO audits
|
695
|
+
(workflow, release, type, context, parent_run_id, run_id, metadata, updated_at)
|
696
|
+
VALUES (?, ?, ?, ?, ?, ?, ?, CURRENT_TIMESTAMP)
|
697
|
+
""",
|
698
|
+
(
|
699
|
+
audit.name,
|
700
|
+
audit.release.isoformat(),
|
701
|
+
audit.type,
|
702
|
+
context_blob,
|
703
|
+
audit.parent_run_id,
|
704
|
+
audit.run_id,
|
705
|
+
metadata_blob,
|
706
|
+
),
|
707
|
+
)
|
708
|
+
conn.commit()
|
709
|
+
|
710
|
+
return self
|
711
|
+
|
712
|
+
def cleanup(self, max_age_days: int = 180) -> int:
|
713
|
+
"""Clean up old audit records based on age.
|
714
|
+
|
715
|
+
Args:
|
716
|
+
max_age_days: Maximum age in days for audit records to keep.
|
362
717
|
|
718
|
+
Returns:
|
719
|
+
int: Number of records cleaned up.
|
720
|
+
"""
|
721
|
+
audit_url = dynamic("audit_url", extras=self.extras)
|
722
|
+
if audit_url is None or not audit_url.path:
|
723
|
+
return 0
|
724
|
+
|
725
|
+
audit_url_parse: ParseResult = urlparse(audit_url)
|
726
|
+
db_path = Path(audit_url_parse.path)
|
727
|
+
if not db_path.exists():
|
728
|
+
return 0
|
729
|
+
|
730
|
+
cutoff_date = (
|
731
|
+
datetime.now() - timedelta(days=max_age_days)
|
732
|
+
).isoformat()
|
733
|
+
|
734
|
+
with sqlite3.connect(db_path) as conn:
|
735
|
+
cursor = conn.execute(
|
736
|
+
"DELETE FROM audits WHERE release < ?", (cutoff_date,)
|
737
|
+
)
|
738
|
+
conn.commit()
|
739
|
+
return cursor.rowcount
|
363
740
|
|
364
|
-
|
365
|
-
|
366
|
-
|
367
|
-
|
741
|
+
|
742
|
+
Audit = Annotated[
|
743
|
+
Union[
|
744
|
+
FileAudit,
|
745
|
+
SQLiteAudit,
|
746
|
+
],
|
747
|
+
Field(discriminator="type"),
|
368
748
|
]
|
369
749
|
|
370
750
|
|
371
|
-
def
|
751
|
+
def get_audit(
|
752
|
+
*,
|
372
753
|
extras: Optional[DictData] = None,
|
373
|
-
) ->
|
374
|
-
"""Get an audit model
|
754
|
+
) -> Audit: # pragma: no cov
|
755
|
+
"""Get an audit model dynamically based on the config audit path value.
|
375
756
|
|
376
|
-
:
|
757
|
+
Args:
|
758
|
+
extras: Optional extra parameters to override the core config.
|
377
759
|
|
378
|
-
:
|
760
|
+
Returns:
|
761
|
+
Audit: The appropriate audit model class based on configuration.
|
379
762
|
"""
|
380
|
-
|
381
|
-
|
382
|
-
|
383
|
-
)
|
384
|
-
url: ParseResult
|
385
|
-
if (url := dynamic("audit_url", extras=extras)).scheme and (
|
386
|
-
url.scheme == "sqlite"
|
387
|
-
or (url.scheme == "file" and Path(url.path).is_file())
|
388
|
-
):
|
389
|
-
return map_audit_models.get("sqlite", FileAudit)
|
390
|
-
elif url.scheme and url.scheme != "file":
|
391
|
-
raise NotImplementedError(
|
392
|
-
f"Does not implement the audit model support for URL: {url}"
|
393
|
-
)
|
394
|
-
return map_audit_models.get("file", FileAudit)
|
763
|
+
audit_conf = dynamic("audit_conf", extras=extras)
|
764
|
+
model = TypeAdapter(Audit).validate_python(audit_conf | {"extras": extras})
|
765
|
+
return model
|