pointblank 0.18.0__py3-none-any.whl → 0.20.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- pointblank/__init__.py +44 -1
- pointblank/_constants.py +258 -166
- pointblank/_constants_translations.py +378 -0
- pointblank/_interrogation.py +204 -0
- pointblank/_utils_llms_txt.py +20 -0
- pointblank/data/api-docs.txt +793 -1
- pointblank/field.py +1507 -0
- pointblank/generate/__init__.py +17 -0
- pointblank/generate/base.py +49 -0
- pointblank/generate/generators.py +573 -0
- pointblank/generate/regex.py +217 -0
- pointblank/locales/__init__.py +1476 -0
- pointblank/locales/data/AR/address.json +73 -0
- pointblank/locales/data/AR/company.json +60 -0
- pointblank/locales/data/AR/internet.json +19 -0
- pointblank/locales/data/AR/misc.json +7 -0
- pointblank/locales/data/AR/person.json +39 -0
- pointblank/locales/data/AR/text.json +38 -0
- pointblank/locales/data/AT/address.json +84 -0
- pointblank/locales/data/AT/company.json +65 -0
- pointblank/locales/data/AT/internet.json +20 -0
- pointblank/locales/data/AT/misc.json +8 -0
- pointblank/locales/data/AT/person.json +17 -0
- pointblank/locales/data/AT/text.json +35 -0
- pointblank/locales/data/AU/address.json +83 -0
- pointblank/locales/data/AU/company.json +65 -0
- pointblank/locales/data/AU/internet.json +20 -0
- pointblank/locales/data/AU/misc.json +8 -0
- pointblank/locales/data/AU/person.json +17 -0
- pointblank/locales/data/AU/text.json +35 -0
- pointblank/locales/data/BE/address.json +225 -0
- pointblank/locales/data/BE/company.json +129 -0
- pointblank/locales/data/BE/internet.json +36 -0
- pointblank/locales/data/BE/misc.json +6 -0
- pointblank/locales/data/BE/person.json +62 -0
- pointblank/locales/data/BE/text.json +38 -0
- pointblank/locales/data/BG/address.json +75 -0
- pointblank/locales/data/BG/company.json +60 -0
- pointblank/locales/data/BG/internet.json +19 -0
- pointblank/locales/data/BG/misc.json +7 -0
- pointblank/locales/data/BG/person.json +40 -0
- pointblank/locales/data/BG/text.json +38 -0
- pointblank/locales/data/BR/address.json +98 -0
- pointblank/locales/data/BR/company.json +65 -0
- pointblank/locales/data/BR/internet.json +20 -0
- pointblank/locales/data/BR/misc.json +8 -0
- pointblank/locales/data/BR/person.json +17 -0
- pointblank/locales/data/BR/text.json +35 -0
- pointblank/locales/data/CA/address.json +747 -0
- pointblank/locales/data/CA/company.json +120 -0
- pointblank/locales/data/CA/internet.json +24 -0
- pointblank/locales/data/CA/misc.json +11 -0
- pointblank/locales/data/CA/person.json +1033 -0
- pointblank/locales/data/CA/text.json +58 -0
- pointblank/locales/data/CH/address.json +184 -0
- pointblank/locales/data/CH/company.json +112 -0
- pointblank/locales/data/CH/internet.json +20 -0
- pointblank/locales/data/CH/misc.json +10 -0
- pointblank/locales/data/CH/person.json +64 -0
- pointblank/locales/data/CH/text.json +45 -0
- pointblank/locales/data/CL/address.json +71 -0
- pointblank/locales/data/CL/company.json +60 -0
- pointblank/locales/data/CL/internet.json +19 -0
- pointblank/locales/data/CL/misc.json +7 -0
- pointblank/locales/data/CL/person.json +38 -0
- pointblank/locales/data/CL/text.json +38 -0
- pointblank/locales/data/CN/address.json +124 -0
- pointblank/locales/data/CN/company.json +76 -0
- pointblank/locales/data/CN/internet.json +20 -0
- pointblank/locales/data/CN/misc.json +8 -0
- pointblank/locales/data/CN/person.json +50 -0
- pointblank/locales/data/CN/text.json +38 -0
- pointblank/locales/data/CO/address.json +76 -0
- pointblank/locales/data/CO/company.json +60 -0
- pointblank/locales/data/CO/internet.json +19 -0
- pointblank/locales/data/CO/misc.json +7 -0
- pointblank/locales/data/CO/person.json +38 -0
- pointblank/locales/data/CO/text.json +38 -0
- pointblank/locales/data/CY/address.json +62 -0
- pointblank/locales/data/CY/company.json +60 -0
- pointblank/locales/data/CY/internet.json +19 -0
- pointblank/locales/data/CY/misc.json +7 -0
- pointblank/locales/data/CY/person.json +38 -0
- pointblank/locales/data/CY/text.json +38 -0
- pointblank/locales/data/CZ/address.json +70 -0
- pointblank/locales/data/CZ/company.json +61 -0
- pointblank/locales/data/CZ/internet.json +19 -0
- pointblank/locales/data/CZ/misc.json +7 -0
- pointblank/locales/data/CZ/person.json +40 -0
- pointblank/locales/data/CZ/text.json +38 -0
- pointblank/locales/data/DE/address.json +756 -0
- pointblank/locales/data/DE/company.json +101 -0
- pointblank/locales/data/DE/internet.json +22 -0
- pointblank/locales/data/DE/misc.json +11 -0
- pointblank/locales/data/DE/person.json +1026 -0
- pointblank/locales/data/DE/text.json +50 -0
- pointblank/locales/data/DK/address.json +231 -0
- pointblank/locales/data/DK/company.json +65 -0
- pointblank/locales/data/DK/internet.json +20 -0
- pointblank/locales/data/DK/misc.json +7 -0
- pointblank/locales/data/DK/person.json +45 -0
- pointblank/locales/data/DK/text.json +43 -0
- pointblank/locales/data/EE/address.json +69 -0
- pointblank/locales/data/EE/company.json +60 -0
- pointblank/locales/data/EE/internet.json +19 -0
- pointblank/locales/data/EE/misc.json +7 -0
- pointblank/locales/data/EE/person.json +39 -0
- pointblank/locales/data/EE/text.json +38 -0
- pointblank/locales/data/ES/address.json +3086 -0
- pointblank/locales/data/ES/company.json +644 -0
- pointblank/locales/data/ES/internet.json +25 -0
- pointblank/locales/data/ES/misc.json +11 -0
- pointblank/locales/data/ES/person.json +488 -0
- pointblank/locales/data/ES/text.json +49 -0
- pointblank/locales/data/FI/address.json +93 -0
- pointblank/locales/data/FI/company.json +65 -0
- pointblank/locales/data/FI/internet.json +20 -0
- pointblank/locales/data/FI/misc.json +8 -0
- pointblank/locales/data/FI/person.json +17 -0
- pointblank/locales/data/FI/text.json +35 -0
- pointblank/locales/data/FR/address.json +619 -0
- pointblank/locales/data/FR/company.json +111 -0
- pointblank/locales/data/FR/internet.json +22 -0
- pointblank/locales/data/FR/misc.json +11 -0
- pointblank/locales/data/FR/person.json +1066 -0
- pointblank/locales/data/FR/text.json +50 -0
- pointblank/locales/data/GB/address.json +5759 -0
- pointblank/locales/data/GB/company.json +131 -0
- pointblank/locales/data/GB/internet.json +24 -0
- pointblank/locales/data/GB/misc.json +45 -0
- pointblank/locales/data/GB/person.json +578 -0
- pointblank/locales/data/GB/text.json +61 -0
- pointblank/locales/data/GR/address.json +68 -0
- pointblank/locales/data/GR/company.json +61 -0
- pointblank/locales/data/GR/internet.json +19 -0
- pointblank/locales/data/GR/misc.json +7 -0
- pointblank/locales/data/GR/person.json +39 -0
- pointblank/locales/data/GR/text.json +38 -0
- pointblank/locales/data/HK/address.json +79 -0
- pointblank/locales/data/HK/company.json +69 -0
- pointblank/locales/data/HK/internet.json +19 -0
- pointblank/locales/data/HK/misc.json +7 -0
- pointblank/locales/data/HK/person.json +42 -0
- pointblank/locales/data/HK/text.json +38 -0
- pointblank/locales/data/HR/address.json +73 -0
- pointblank/locales/data/HR/company.json +60 -0
- pointblank/locales/data/HR/internet.json +19 -0
- pointblank/locales/data/HR/misc.json +7 -0
- pointblank/locales/data/HR/person.json +38 -0
- pointblank/locales/data/HR/text.json +38 -0
- pointblank/locales/data/HU/address.json +70 -0
- pointblank/locales/data/HU/company.json +61 -0
- pointblank/locales/data/HU/internet.json +19 -0
- pointblank/locales/data/HU/misc.json +7 -0
- pointblank/locales/data/HU/person.json +40 -0
- pointblank/locales/data/HU/text.json +38 -0
- pointblank/locales/data/ID/address.json +68 -0
- pointblank/locales/data/ID/company.json +61 -0
- pointblank/locales/data/ID/internet.json +19 -0
- pointblank/locales/data/ID/misc.json +7 -0
- pointblank/locales/data/ID/person.json +40 -0
- pointblank/locales/data/ID/text.json +38 -0
- pointblank/locales/data/IE/address.json +643 -0
- pointblank/locales/data/IE/company.json +140 -0
- pointblank/locales/data/IE/internet.json +24 -0
- pointblank/locales/data/IE/misc.json +44 -0
- pointblank/locales/data/IE/person.json +55 -0
- pointblank/locales/data/IE/text.json +60 -0
- pointblank/locales/data/IN/address.json +92 -0
- pointblank/locales/data/IN/company.json +65 -0
- pointblank/locales/data/IN/internet.json +20 -0
- pointblank/locales/data/IN/misc.json +8 -0
- pointblank/locales/data/IN/person.json +52 -0
- pointblank/locales/data/IN/text.json +39 -0
- pointblank/locales/data/IS/address.json +63 -0
- pointblank/locales/data/IS/company.json +61 -0
- pointblank/locales/data/IS/internet.json +19 -0
- pointblank/locales/data/IS/misc.json +7 -0
- pointblank/locales/data/IS/person.json +44 -0
- pointblank/locales/data/IS/text.json +38 -0
- pointblank/locales/data/IT/address.json +192 -0
- pointblank/locales/data/IT/company.json +137 -0
- pointblank/locales/data/IT/internet.json +20 -0
- pointblank/locales/data/IT/misc.json +10 -0
- pointblank/locales/data/IT/person.json +70 -0
- pointblank/locales/data/IT/text.json +44 -0
- pointblank/locales/data/JP/address.json +713 -0
- pointblank/locales/data/JP/company.json +113 -0
- pointblank/locales/data/JP/internet.json +22 -0
- pointblank/locales/data/JP/misc.json +10 -0
- pointblank/locales/data/JP/person.json +1057 -0
- pointblank/locales/data/JP/text.json +51 -0
- pointblank/locales/data/KR/address.json +77 -0
- pointblank/locales/data/KR/company.json +68 -0
- pointblank/locales/data/KR/internet.json +19 -0
- pointblank/locales/data/KR/misc.json +7 -0
- pointblank/locales/data/KR/person.json +40 -0
- pointblank/locales/data/KR/text.json +38 -0
- pointblank/locales/data/LT/address.json +66 -0
- pointblank/locales/data/LT/company.json +60 -0
- pointblank/locales/data/LT/internet.json +19 -0
- pointblank/locales/data/LT/misc.json +7 -0
- pointblank/locales/data/LT/person.json +42 -0
- pointblank/locales/data/LT/text.json +38 -0
- pointblank/locales/data/LU/address.json +66 -0
- pointblank/locales/data/LU/company.json +60 -0
- pointblank/locales/data/LU/internet.json +19 -0
- pointblank/locales/data/LU/misc.json +7 -0
- pointblank/locales/data/LU/person.json +38 -0
- pointblank/locales/data/LU/text.json +38 -0
- pointblank/locales/data/LV/address.json +62 -0
- pointblank/locales/data/LV/company.json +60 -0
- pointblank/locales/data/LV/internet.json +19 -0
- pointblank/locales/data/LV/misc.json +7 -0
- pointblank/locales/data/LV/person.json +40 -0
- pointblank/locales/data/LV/text.json +38 -0
- pointblank/locales/data/MT/address.json +61 -0
- pointblank/locales/data/MT/company.json +60 -0
- pointblank/locales/data/MT/internet.json +19 -0
- pointblank/locales/data/MT/misc.json +7 -0
- pointblank/locales/data/MT/person.json +38 -0
- pointblank/locales/data/MT/text.json +38 -0
- pointblank/locales/data/MX/address.json +100 -0
- pointblank/locales/data/MX/company.json +65 -0
- pointblank/locales/data/MX/internet.json +20 -0
- pointblank/locales/data/MX/misc.json +8 -0
- pointblank/locales/data/MX/person.json +18 -0
- pointblank/locales/data/MX/text.json +39 -0
- pointblank/locales/data/NL/address.json +1517 -0
- pointblank/locales/data/NL/company.json +133 -0
- pointblank/locales/data/NL/internet.json +44 -0
- pointblank/locales/data/NL/misc.json +55 -0
- pointblank/locales/data/NL/person.json +365 -0
- pointblank/locales/data/NL/text.json +210 -0
- pointblank/locales/data/NO/address.json +86 -0
- pointblank/locales/data/NO/company.json +66 -0
- pointblank/locales/data/NO/internet.json +20 -0
- pointblank/locales/data/NO/misc.json +8 -0
- pointblank/locales/data/NO/person.json +17 -0
- pointblank/locales/data/NO/text.json +35 -0
- pointblank/locales/data/NZ/address.json +90 -0
- pointblank/locales/data/NZ/company.json +65 -0
- pointblank/locales/data/NZ/internet.json +20 -0
- pointblank/locales/data/NZ/misc.json +8 -0
- pointblank/locales/data/NZ/person.json +17 -0
- pointblank/locales/data/NZ/text.json +39 -0
- pointblank/locales/data/PH/address.json +67 -0
- pointblank/locales/data/PH/company.json +61 -0
- pointblank/locales/data/PH/internet.json +19 -0
- pointblank/locales/data/PH/misc.json +7 -0
- pointblank/locales/data/PH/person.json +40 -0
- pointblank/locales/data/PH/text.json +38 -0
- pointblank/locales/data/PL/address.json +91 -0
- pointblank/locales/data/PL/company.json +65 -0
- pointblank/locales/data/PL/internet.json +20 -0
- pointblank/locales/data/PL/misc.json +8 -0
- pointblank/locales/data/PL/person.json +17 -0
- pointblank/locales/data/PL/text.json +35 -0
- pointblank/locales/data/PT/address.json +90 -0
- pointblank/locales/data/PT/company.json +65 -0
- pointblank/locales/data/PT/internet.json +20 -0
- pointblank/locales/data/PT/misc.json +8 -0
- pointblank/locales/data/PT/person.json +17 -0
- pointblank/locales/data/PT/text.json +35 -0
- pointblank/locales/data/RO/address.json +73 -0
- pointblank/locales/data/RO/company.json +61 -0
- pointblank/locales/data/RO/internet.json +19 -0
- pointblank/locales/data/RO/misc.json +7 -0
- pointblank/locales/data/RO/person.json +40 -0
- pointblank/locales/data/RO/text.json +38 -0
- pointblank/locales/data/RU/address.json +74 -0
- pointblank/locales/data/RU/company.json +60 -0
- pointblank/locales/data/RU/internet.json +19 -0
- pointblank/locales/data/RU/misc.json +7 -0
- pointblank/locales/data/RU/person.json +38 -0
- pointblank/locales/data/RU/text.json +38 -0
- pointblank/locales/data/SE/address.json +247 -0
- pointblank/locales/data/SE/company.json +65 -0
- pointblank/locales/data/SE/internet.json +20 -0
- pointblank/locales/data/SE/misc.json +7 -0
- pointblank/locales/data/SE/person.json +45 -0
- pointblank/locales/data/SE/text.json +43 -0
- pointblank/locales/data/SI/address.json +67 -0
- pointblank/locales/data/SI/company.json +60 -0
- pointblank/locales/data/SI/internet.json +19 -0
- pointblank/locales/data/SI/misc.json +7 -0
- pointblank/locales/data/SI/person.json +38 -0
- pointblank/locales/data/SI/text.json +38 -0
- pointblank/locales/data/SK/address.json +64 -0
- pointblank/locales/data/SK/company.json +60 -0
- pointblank/locales/data/SK/internet.json +19 -0
- pointblank/locales/data/SK/misc.json +7 -0
- pointblank/locales/data/SK/person.json +38 -0
- pointblank/locales/data/SK/text.json +38 -0
- pointblank/locales/data/TR/address.json +105 -0
- pointblank/locales/data/TR/company.json +65 -0
- pointblank/locales/data/TR/internet.json +20 -0
- pointblank/locales/data/TR/misc.json +8 -0
- pointblank/locales/data/TR/person.json +17 -0
- pointblank/locales/data/TR/text.json +35 -0
- pointblank/locales/data/TW/address.json +86 -0
- pointblank/locales/data/TW/company.json +69 -0
- pointblank/locales/data/TW/internet.json +19 -0
- pointblank/locales/data/TW/misc.json +7 -0
- pointblank/locales/data/TW/person.json +42 -0
- pointblank/locales/data/TW/text.json +38 -0
- pointblank/locales/data/US/address.json +996 -0
- pointblank/locales/data/US/company.json +131 -0
- pointblank/locales/data/US/internet.json +22 -0
- pointblank/locales/data/US/misc.json +11 -0
- pointblank/locales/data/US/person.json +1092 -0
- pointblank/locales/data/US/text.json +56 -0
- pointblank/locales/data/_shared/misc.json +42 -0
- pointblank/schema.py +339 -2
- pointblank/validate.py +1263 -11
- {pointblank-0.18.0.dist-info → pointblank-0.20.0.dist-info}/METADATA +45 -1
- pointblank-0.20.0.dist-info/RECORD +366 -0
- {pointblank-0.18.0.dist-info → pointblank-0.20.0.dist-info}/WHEEL +1 -1
- pointblank-0.18.0.dist-info/RECORD +0 -59
- {pointblank-0.18.0.dist-info → pointblank-0.20.0.dist-info}/entry_points.txt +0 -0
- {pointblank-0.18.0.dist-info → pointblank-0.20.0.dist-info}/licenses/LICENSE +0 -0
- {pointblank-0.18.0.dist-info → pointblank-0.20.0.dist-info}/top_level.txt +0 -0
pointblank/validate.py
CHANGED
|
@@ -17,6 +17,7 @@ from importlib.metadata import version
|
|
|
17
17
|
from pathlib import Path
|
|
18
18
|
from typing import TYPE_CHECKING, Any, Callable, Literal, NoReturn, ParamSpec, TypeVar
|
|
19
19
|
from zipfile import ZipFile
|
|
20
|
+
from zoneinfo import ZoneInfo
|
|
20
21
|
|
|
21
22
|
import commonmark
|
|
22
23
|
import narwhals as nw
|
|
@@ -4350,6 +4351,18 @@ class Validate:
|
|
|
4350
4351
|
locale's rules. Examples include `"en-US"` for English (United States) and `"fr-FR"` for
|
|
4351
4352
|
French (France). More simply, this can be a language identifier without a designation of
|
|
4352
4353
|
territory, like `"es"` for Spanish.
|
|
4354
|
+
owner
|
|
4355
|
+
An optional string identifying the owner of the data being validated. This is useful for
|
|
4356
|
+
governance purposes, indicating who is responsible for the quality and maintenance of the
|
|
4357
|
+
data. For example, `"data-platform-team"` or `"analytics-engineering"`.
|
|
4358
|
+
consumers
|
|
4359
|
+
An optional string or list of strings identifying who depends on or consumes this data.
|
|
4360
|
+
This helps document data dependencies and can be useful for impact analysis when data
|
|
4361
|
+
quality issues are detected. For example, `"ml-team"` or `["ml-team", "analytics"]`.
|
|
4362
|
+
version
|
|
4363
|
+
An optional string representing the version of the validation plan or data contract. This
|
|
4364
|
+
supports semantic versioning (e.g., `"1.0.0"`, `"2.1.0"`) and is useful for tracking changes
|
|
4365
|
+
to validation rules over time and for organizational governance.
|
|
4353
4366
|
|
|
4354
4367
|
Returns
|
|
4355
4368
|
-------
|
|
@@ -4836,6 +4849,9 @@ class Validate:
|
|
|
4836
4849
|
brief: str | bool | None = None
|
|
4837
4850
|
lang: str | None = None
|
|
4838
4851
|
locale: str | None = None
|
|
4852
|
+
owner: str | None = None
|
|
4853
|
+
consumers: str | list[str] | None = None
|
|
4854
|
+
version: str | None = None
|
|
4839
4855
|
|
|
4840
4856
|
def __post_init__(self):
|
|
4841
4857
|
# Process data through the centralized data processing pipeline
|
|
@@ -4880,6 +4896,36 @@ class Validate:
|
|
|
4880
4896
|
# Transform any shorthands of `brief` to string representations
|
|
4881
4897
|
self.brief = _transform_auto_brief(brief=self.brief)
|
|
4882
4898
|
|
|
4899
|
+
# Validate and normalize the `owner` parameter
|
|
4900
|
+
if self.owner is not None and not isinstance(self.owner, str):
|
|
4901
|
+
raise TypeError(
|
|
4902
|
+
"The `owner=` parameter must be a string representing the owner of the data. "
|
|
4903
|
+
f"Received type: {type(self.owner).__name__}"
|
|
4904
|
+
)
|
|
4905
|
+
|
|
4906
|
+
# Validate and normalize the `consumers` parameter
|
|
4907
|
+
if self.consumers is not None:
|
|
4908
|
+
if isinstance(self.consumers, str):
|
|
4909
|
+
self.consumers = [self.consumers]
|
|
4910
|
+
elif isinstance(self.consumers, list):
|
|
4911
|
+
if not all(isinstance(c, str) for c in self.consumers):
|
|
4912
|
+
raise TypeError(
|
|
4913
|
+
"The `consumers=` parameter must be a string or a list of strings. "
|
|
4914
|
+
"All elements in the list must be strings."
|
|
4915
|
+
)
|
|
4916
|
+
else:
|
|
4917
|
+
raise TypeError(
|
|
4918
|
+
"The `consumers=` parameter must be a string or a list of strings. "
|
|
4919
|
+
f"Received type: {type(self.consumers).__name__}"
|
|
4920
|
+
)
|
|
4921
|
+
|
|
4922
|
+
# Validate the `version` parameter
|
|
4923
|
+
if self.version is not None and not isinstance(self.version, str):
|
|
4924
|
+
raise TypeError(
|
|
4925
|
+
"The `version=` parameter must be a string representing the version. "
|
|
4926
|
+
f"Received type: {type(self.version).__name__}"
|
|
4927
|
+
)
|
|
4928
|
+
|
|
4883
4929
|
# TODO: Add functionality to obtain the column names and types from the table
|
|
4884
4930
|
self.col_names = None
|
|
4885
4931
|
self.col_types = None
|
|
@@ -11530,6 +11576,369 @@ class Validate:
|
|
|
11530
11576
|
|
|
11531
11577
|
return self
|
|
11532
11578
|
|
|
11579
|
+
def data_freshness(
|
|
11580
|
+
self,
|
|
11581
|
+
column: str,
|
|
11582
|
+
max_age: str | datetime.timedelta,
|
|
11583
|
+
reference_time: datetime.datetime | str | None = None,
|
|
11584
|
+
timezone: str | None = None,
|
|
11585
|
+
allow_tz_mismatch: bool = False,
|
|
11586
|
+
pre: Callable | None = None,
|
|
11587
|
+
thresholds: int | float | bool | tuple | dict | Thresholds | None = None,
|
|
11588
|
+
actions: Actions | None = None,
|
|
11589
|
+
brief: str | bool | None = None,
|
|
11590
|
+
active: bool = True,
|
|
11591
|
+
) -> Validate:
|
|
11592
|
+
"""
|
|
11593
|
+
Validate that data in a datetime column is not older than a specified maximum age.
|
|
11594
|
+
|
|
11595
|
+
The `data_freshness()` validation method checks whether the most recent timestamp in the
|
|
11596
|
+
specified datetime column is within the allowed `max_age=` from the `reference_time=` (which
|
|
11597
|
+
defaults to the current time). This is useful for ensuring data pipelines are delivering
|
|
11598
|
+
fresh data and for enforcing data SLAs.
|
|
11599
|
+
|
|
11600
|
+
This method helps detect stale data by comparing the maximum (most recent) value in a
|
|
11601
|
+
datetime column against an expected freshness threshold.
|
|
11602
|
+
|
|
11603
|
+
Parameters
|
|
11604
|
+
----------
|
|
11605
|
+
column
|
|
11606
|
+
The name of the datetime column to check for freshness. This column should contain
|
|
11607
|
+
date or datetime values.
|
|
11608
|
+
max_age
|
|
11609
|
+
The maximum allowed age of the data. Can be specified as: (1) a string with a
|
|
11610
|
+
human-readable duration like `"24 hours"`, `"1 day"`, `"30 minutes"`, `"2 weeks"`, etc.
|
|
11611
|
+
(supported units: `seconds`, `minutes`, `hours`, `days`, `weeks`), or (2) a
|
|
11612
|
+
`datetime.timedelta` object for precise control.
|
|
11613
|
+
reference_time
|
|
11614
|
+
The reference point in time to compare against. Defaults to `None`, which uses the
|
|
11615
|
+
current time (UTC if `timezone=` is not specified). Can be: (1) a `datetime.datetime`
|
|
11616
|
+
object (timezone-aware recommended), (2) a string in ISO 8601 format (e.g.,
|
|
11617
|
+
`"2024-01-15T10:30:00"` or `"2024-01-15T10:30:00+05:30"`), or (3) `None` to use the
|
|
11618
|
+
current time.
|
|
11619
|
+
timezone
|
|
11620
|
+
The timezone to use for interpreting the data and reference time. Accepts IANA
|
|
11621
|
+
timezone names (e.g., `"America/New_York"`), hour offsets (e.g., `"-7"`), or ISO 8601
|
|
11622
|
+
offsets (e.g., `"-07:00"`). When `None` (default), naive datetimes are treated as UTC.
|
|
11623
|
+
See the *The `timezone=` Parameter* section for details.
|
|
11624
|
+
allow_tz_mismatch
|
|
11625
|
+
Whether to allow timezone mismatches between the column data and reference time.
|
|
11626
|
+
By default (`False`), a warning note is added when comparing timezone-naive with
|
|
11627
|
+
timezone-aware datetimes. Set to `True` to suppress these warnings.
|
|
11628
|
+
pre
|
|
11629
|
+
An optional preprocessing function or lambda to apply to the data table during
|
|
11630
|
+
interrogation. This function should take a table as input and return a modified table.
|
|
11631
|
+
thresholds
|
|
11632
|
+
Set threshold failure levels for reporting and reacting to exceedences of the levels.
|
|
11633
|
+
The thresholds are set at the step level and will override any global thresholds set in
|
|
11634
|
+
`Validate(thresholds=...)`. The default is `None`, which means that no thresholds will
|
|
11635
|
+
be set locally and global thresholds (if any) will take effect.
|
|
11636
|
+
actions
|
|
11637
|
+
Optional actions to take when the validation step meets or exceeds any set threshold
|
|
11638
|
+
levels. If provided, the [`Actions`](`pointblank.Actions`) class should be used to
|
|
11639
|
+
define the actions.
|
|
11640
|
+
brief
|
|
11641
|
+
An optional brief description of the validation step that will be displayed in the
|
|
11642
|
+
reporting table. You can use the templating elements like `"{step}"` to insert
|
|
11643
|
+
the step number, or `"{auto}"` to include an automatically generated brief. If `True`
|
|
11644
|
+
the entire brief will be automatically generated. If `None` (the default) then there
|
|
11645
|
+
won't be a brief.
|
|
11646
|
+
active
|
|
11647
|
+
A boolean value indicating whether the validation step should be active. Using `False`
|
|
11648
|
+
will make the validation step inactive (still reporting its presence and keeping indexes
|
|
11649
|
+
for the steps unchanged).
|
|
11650
|
+
|
|
11651
|
+
Returns
|
|
11652
|
+
-------
|
|
11653
|
+
Validate
|
|
11654
|
+
The `Validate` object with the added validation step.
|
|
11655
|
+
|
|
11656
|
+
How Timezones Affect Freshness Checks
|
|
11657
|
+
-------------------------------------
|
|
11658
|
+
Freshness validation involves comparing two times: the **data time** (the most recent
|
|
11659
|
+
timestamp in your column) and the **execution time** (when and where the validation runs).
|
|
11660
|
+
Timezone confusion typically arises because these two times may originate from different
|
|
11661
|
+
contexts.
|
|
11662
|
+
|
|
11663
|
+
Consider these common scenarios:
|
|
11664
|
+
|
|
11665
|
+
- your data timestamps are stored in UTC (common for databases), but you're running
|
|
11666
|
+
validation on your laptop in New York (Eastern Time)
|
|
11667
|
+
- you develop and test validation locally, then deploy it to a cloud workflow that runs
|
|
11668
|
+
in UTC—suddenly your 'same' validation behaves differently
|
|
11669
|
+
- your data comes from servers in multiple regions, each recording timestamps in their
|
|
11670
|
+
local timezone
|
|
11671
|
+
|
|
11672
|
+
The `timezone=` parameter exists to solve this problem by establishing a single, explicit
|
|
11673
|
+
timezone context for the freshness comparison. When you specify a timezone, Pointblank
|
|
11674
|
+
interprets both the data timestamps (if naive) and the execution time in that timezone,
|
|
11675
|
+
ensuring consistent behavior whether you run validation on your laptop or in a cloud
|
|
11676
|
+
workflow.
|
|
11677
|
+
|
|
11678
|
+
**Scenario 1: Data has timezone-aware datetimes**
|
|
11679
|
+
|
|
11680
|
+
```python
|
|
11681
|
+
# Your data column has values like: 2024-01-15 10:30:00+00:00 (UTC)
|
|
11682
|
+
# Comparison is straightforward as both sides have explicit timezones
|
|
11683
|
+
.data_freshness(column="updated_at", max_age="24 hours")
|
|
11684
|
+
```
|
|
11685
|
+
|
|
11686
|
+
**Scenario 2: Data has naive datetimes (no timezone)**
|
|
11687
|
+
|
|
11688
|
+
```python
|
|
11689
|
+
# Your data column has values like: 2024-01-15 10:30:00 (no timezone)
|
|
11690
|
+
# Specify the timezone the data was recorded in:
|
|
11691
|
+
.data_freshness(column="updated_at", max_age="24 hours", timezone="America/New_York")
|
|
11692
|
+
```
|
|
11693
|
+
|
|
11694
|
+
**Scenario 3: Ensuring consistent behavior across environments**
|
|
11695
|
+
|
|
11696
|
+
```python
|
|
11697
|
+
# Pin the timezone to ensure identical results whether running locally or in the cloud
|
|
11698
|
+
.data_freshness(
|
|
11699
|
+
column="updated_at",
|
|
11700
|
+
max_age="24 hours",
|
|
11701
|
+
timezone="UTC", # Explicit timezone removes environment dependence
|
|
11702
|
+
)
|
|
11703
|
+
```
|
|
11704
|
+
|
|
11705
|
+
The `timezone=` Parameter
|
|
11706
|
+
-------------------------
|
|
11707
|
+
The `timezone=` parameter accepts several convenient formats, making it easy to specify
|
|
11708
|
+
timezones in whatever way is most natural for your use case. The following examples
|
|
11709
|
+
illustrate the three supported input styles.
|
|
11710
|
+
|
|
11711
|
+
**IANA Timezone Names** (recommended for regions with daylight saving time):
|
|
11712
|
+
|
|
11713
|
+
```python
|
|
11714
|
+
timezone="America/New_York" # Eastern Time (handles DST automatically)
|
|
11715
|
+
timezone="Europe/London" # UK time
|
|
11716
|
+
timezone="Asia/Tokyo" # Japan Standard Time
|
|
11717
|
+
timezone="Australia/Sydney" # Australian Eastern Time
|
|
11718
|
+
timezone="UTC" # Coordinated Universal Time
|
|
11719
|
+
```
|
|
11720
|
+
|
|
11721
|
+
**Simple Hour Offsets** (quick and easy):
|
|
11722
|
+
|
|
11723
|
+
```python
|
|
11724
|
+
timezone="-7" # UTC-7 (e.g., Mountain Standard Time)
|
|
11725
|
+
timezone="+5" # UTC+5 (e.g., Pakistan Standard Time)
|
|
11726
|
+
timezone="0" # UTC
|
|
11727
|
+
timezone="-12" # UTC-12
|
|
11728
|
+
```
|
|
11729
|
+
|
|
11730
|
+
**ISO 8601 Offset Format** (precise, including fractional hours):
|
|
11731
|
+
|
|
11732
|
+
```python
|
|
11733
|
+
timezone="-07:00" # UTC-7
|
|
11734
|
+
timezone="+05:30" # UTC+5:30 (e.g., India Standard Time)
|
|
11735
|
+
timezone="+00:00" # UTC
|
|
11736
|
+
timezone="-09:30" # UTC-9:30
|
|
11737
|
+
```
|
|
11738
|
+
|
|
11739
|
+
When a timezone is specified:
|
|
11740
|
+
|
|
11741
|
+
- naive datetime values in the column are assumed to be in this timezone.
|
|
11742
|
+
- the reference time (if naive) is assumed to be in this timezone.
|
|
11743
|
+
- the validation report will show times in this timezone.
|
|
11744
|
+
|
|
11745
|
+
When `None` (default):
|
|
11746
|
+
|
|
11747
|
+
- if your column has timezone-aware datetimes, those timezones are used
|
|
11748
|
+
- if your column has naive datetimes, they're treated as UTC
|
|
11749
|
+
- the current time reference uses UTC
|
|
11750
|
+
|
|
11751
|
+
Note that IANA timezone names are preferred when daylight saving time transitions matter, as
|
|
11752
|
+
they automatically handle the offset changes. Fixed offsets like `"-7"` or `"-07:00"` do not
|
|
11753
|
+
account for DST.
|
|
11754
|
+
|
|
11755
|
+
Recommendations for Working with Timestamps
|
|
11756
|
+
-------------------------------------------
|
|
11757
|
+
When working with datetime data, storing timestamps in UTC in your databases is strongly
|
|
11758
|
+
recommended since it provides a consistent reference point regardless of where your data
|
|
11759
|
+
originates or where it's consumed. Using timezone-aware datetimes whenever possible helps
|
|
11760
|
+
avoid ambiguity—when a datetime has an explicit timezone, there's no guessing about what
|
|
11761
|
+
time it actually represents.
|
|
11762
|
+
|
|
11763
|
+
If you're working with naive datetimes (which lack timezone information), always specify the
|
|
11764
|
+
`timezone=` parameter so Pointblank knows how to interpret those values. When providing
|
|
11765
|
+
`reference_time=` as a string, use ISO 8601 format with the timezone offset included (e.g.,
|
|
11766
|
+
`"2024-01-15T10:30:00+00:00"`) to ensure unambiguous parsing. Finally, prefer IANA timezone
|
|
11767
|
+
names (like `"America/New_York"`) over fixed offsets (like `"-05:00"`) when daylight saving
|
|
11768
|
+
time transitions matter, since IANA names automatically handle the twice-yearly offset
|
|
11769
|
+
changes. To see all available IANA timezone names in Python, use
|
|
11770
|
+
`zoneinfo.available_timezones()` from the standard library's `zoneinfo` module.
|
|
11771
|
+
|
|
11772
|
+
Examples
|
|
11773
|
+
--------
|
|
11774
|
+
```{python}
|
|
11775
|
+
#| echo: false
|
|
11776
|
+
#| output: false
|
|
11777
|
+
import pointblank as pb
|
|
11778
|
+
pb.config(report_incl_header=False, report_incl_footer=False)
|
|
11779
|
+
```
|
|
11780
|
+
|
|
11781
|
+
The simplest use of `data_freshness()` requires just two arguments: the `column=` containing
|
|
11782
|
+
your timestamps and `max_age=` specifying how old the data can be. In this first example,
|
|
11783
|
+
we create sample data with an `"updated_at"` column containing timestamps from 1, 12, and
|
|
11784
|
+
20 hours ago. By setting `max_age="24 hours"`, we're asserting that the most recent
|
|
11785
|
+
timestamp should be within 24 hours of the current time. Since the newest record is only
|
|
11786
|
+
1 hour old, this validation passes.
|
|
11787
|
+
|
|
11788
|
+
```{python}
|
|
11789
|
+
import pointblank as pb
|
|
11790
|
+
import polars as pl
|
|
11791
|
+
from datetime import datetime, timedelta
|
|
11792
|
+
|
|
11793
|
+
# Create sample data with recent timestamps
|
|
11794
|
+
recent_data = pl.DataFrame({
|
|
11795
|
+
"id": [1, 2, 3],
|
|
11796
|
+
"updated_at": [
|
|
11797
|
+
datetime.now() - timedelta(hours=1),
|
|
11798
|
+
datetime.now() - timedelta(hours=12),
|
|
11799
|
+
datetime.now() - timedelta(hours=20),
|
|
11800
|
+
]
|
|
11801
|
+
})
|
|
11802
|
+
|
|
11803
|
+
validation = (
|
|
11804
|
+
pb.Validate(data=recent_data)
|
|
11805
|
+
.data_freshness(column="updated_at", max_age="24 hours")
|
|
11806
|
+
.interrogate()
|
|
11807
|
+
)
|
|
11808
|
+
|
|
11809
|
+
validation
|
|
11810
|
+
```
|
|
11811
|
+
|
|
11812
|
+
The `max_age=` parameter accepts human-readable strings with various time units. You can
|
|
11813
|
+
chain multiple `data_freshness()` calls to check different freshness thresholds
|
|
11814
|
+
simultaneously—useful for tiered SLAs where you might want warnings at 30 minutes but
|
|
11815
|
+
errors at 2 days.
|
|
11816
|
+
|
|
11817
|
+
```{python}
|
|
11818
|
+
# Check data is fresh within different time windows
|
|
11819
|
+
validation = (
|
|
11820
|
+
pb.Validate(data=recent_data)
|
|
11821
|
+
.data_freshness(column="updated_at", max_age="30 minutes") # Very fresh
|
|
11822
|
+
.data_freshness(column="updated_at", max_age="2 days") # Reasonably fresh
|
|
11823
|
+
.data_freshness(column="updated_at", max_age="1 week") # Within a week
|
|
11824
|
+
.interrogate()
|
|
11825
|
+
)
|
|
11826
|
+
|
|
11827
|
+
validation
|
|
11828
|
+
```
|
|
11829
|
+
|
|
11830
|
+
When your data contains naive datetimes (timestamps without timezone information), use the
|
|
11831
|
+
`timezone=` parameter to specify what timezone those values represent. Here we have event
|
|
11832
|
+
data recorded in Eastern Time, so we set `timezone="America/New_York"` to ensure the
|
|
11833
|
+
freshness comparison is done correctly.
|
|
11834
|
+
|
|
11835
|
+
```{python}
|
|
11836
|
+
# Data with naive datetimes (assume they're in Eastern Time)
|
|
11837
|
+
eastern_data = pl.DataFrame({
|
|
11838
|
+
"event_time": [
|
|
11839
|
+
datetime.now() - timedelta(hours=2),
|
|
11840
|
+
datetime.now() - timedelta(hours=5),
|
|
11841
|
+
]
|
|
11842
|
+
})
|
|
11843
|
+
|
|
11844
|
+
validation = (
|
|
11845
|
+
pb.Validate(data=eastern_data)
|
|
11846
|
+
.data_freshness(
|
|
11847
|
+
column="event_time",
|
|
11848
|
+
max_age="12 hours",
|
|
11849
|
+
timezone="America/New_York" # Interpret times as Eastern
|
|
11850
|
+
)
|
|
11851
|
+
.interrogate()
|
|
11852
|
+
)
|
|
11853
|
+
|
|
11854
|
+
validation
|
|
11855
|
+
```
|
|
11856
|
+
|
|
11857
|
+
For reproducible validations or historical checks, you can use `reference_time=` to compare
|
|
11858
|
+
against a specific point in time instead of the current time. This is particularly useful
|
|
11859
|
+
for testing or when validating data snapshots. The reference time should include a timezone
|
|
11860
|
+
offset (like `+00:00` for UTC) to avoid ambiguity.
|
|
11861
|
+
|
|
11862
|
+
```{python}
|
|
11863
|
+
validation = (
|
|
11864
|
+
pb.Validate(data=recent_data)
|
|
11865
|
+
.data_freshness(
|
|
11866
|
+
column="updated_at",
|
|
11867
|
+
max_age="24 hours",
|
|
11868
|
+
reference_time="2024-01-15T12:00:00+00:00"
|
|
11869
|
+
)
|
|
11870
|
+
.interrogate()
|
|
11871
|
+
)
|
|
11872
|
+
|
|
11873
|
+
validation
|
|
11874
|
+
```
|
|
11875
|
+
"""
|
|
11876
|
+
|
|
11877
|
+
assertion_type = _get_fn_name()
|
|
11878
|
+
|
|
11879
|
+
_check_pre(pre=pre)
|
|
11880
|
+
_check_thresholds(thresholds=thresholds)
|
|
11881
|
+
_check_boolean_input(param=active, param_name="active")
|
|
11882
|
+
_check_boolean_input(param=allow_tz_mismatch, param_name="allow_tz_mismatch")
|
|
11883
|
+
|
|
11884
|
+
# Validate and parse the max_age parameter
|
|
11885
|
+
max_age_td = _parse_max_age(max_age)
|
|
11886
|
+
|
|
11887
|
+
# Validate the column parameter
|
|
11888
|
+
if not isinstance(column, str):
|
|
11889
|
+
raise TypeError(
|
|
11890
|
+
f"The `column` parameter must be a string, got {type(column).__name__}."
|
|
11891
|
+
)
|
|
11892
|
+
|
|
11893
|
+
# Validate the timezone parameter if provided
|
|
11894
|
+
if timezone is not None:
|
|
11895
|
+
_validate_timezone(timezone)
|
|
11896
|
+
|
|
11897
|
+
# Parse reference_time if it's a string
|
|
11898
|
+
parsed_reference_time = None
|
|
11899
|
+
if reference_time is not None:
|
|
11900
|
+
if isinstance(reference_time, str):
|
|
11901
|
+
parsed_reference_time = _parse_reference_time(reference_time)
|
|
11902
|
+
elif isinstance(reference_time, datetime.datetime):
|
|
11903
|
+
parsed_reference_time = reference_time
|
|
11904
|
+
else:
|
|
11905
|
+
raise TypeError(
|
|
11906
|
+
f"The `reference_time` parameter must be a string or datetime object, "
|
|
11907
|
+
f"got {type(reference_time).__name__}."
|
|
11908
|
+
)
|
|
11909
|
+
|
|
11910
|
+
# Determine threshold to use (global or local) and normalize a local `thresholds=` value
|
|
11911
|
+
thresholds = (
|
|
11912
|
+
self.thresholds if thresholds is None else _normalize_thresholds_creation(thresholds)
|
|
11913
|
+
)
|
|
11914
|
+
|
|
11915
|
+
# Package up the parameters for later interrogation
|
|
11916
|
+
values = {
|
|
11917
|
+
"max_age": max_age_td,
|
|
11918
|
+
"max_age_str": max_age if isinstance(max_age, str) else str(max_age),
|
|
11919
|
+
"reference_time": parsed_reference_time,
|
|
11920
|
+
"timezone": timezone,
|
|
11921
|
+
"allow_tz_mismatch": allow_tz_mismatch,
|
|
11922
|
+
}
|
|
11923
|
+
|
|
11924
|
+
# Determine brief to use (global or local) and transform any shorthands of `brief=`
|
|
11925
|
+
brief = self.brief if brief is None else _transform_auto_brief(brief=brief)
|
|
11926
|
+
|
|
11927
|
+
val_info = _ValidationInfo(
|
|
11928
|
+
assertion_type=assertion_type,
|
|
11929
|
+
column=column,
|
|
11930
|
+
values=values,
|
|
11931
|
+
pre=pre,
|
|
11932
|
+
thresholds=thresholds,
|
|
11933
|
+
actions=actions,
|
|
11934
|
+
brief=brief,
|
|
11935
|
+
active=active,
|
|
11936
|
+
)
|
|
11937
|
+
|
|
11938
|
+
self._add_validation(validation_info=val_info)
|
|
11939
|
+
|
|
11940
|
+
return self
|
|
11941
|
+
|
|
11533
11942
|
def col_count_match(
|
|
11534
11943
|
self,
|
|
11535
11944
|
count: int | Any,
|
|
@@ -12941,6 +13350,8 @@ class Validate:
|
|
|
12941
13350
|
"col_schema_match",
|
|
12942
13351
|
"row_count_match",
|
|
12943
13352
|
"col_count_match",
|
|
13353
|
+
"data_freshness",
|
|
13354
|
+
"tbl_match",
|
|
12944
13355
|
]
|
|
12945
13356
|
|
|
12946
13357
|
if validation.n == 0 and assertion_type not in table_level_assertions:
|
|
@@ -13201,6 +13612,105 @@ class Validate:
|
|
|
13201
13612
|
|
|
13202
13613
|
results_tbl = None
|
|
13203
13614
|
|
|
13615
|
+
elif assertion_type == "data_freshness":
|
|
13616
|
+
from pointblank._interrogation import data_freshness as data_freshness_check
|
|
13617
|
+
|
|
13618
|
+
freshness_result = data_freshness_check(
|
|
13619
|
+
data_tbl=data_tbl_step,
|
|
13620
|
+
column=column,
|
|
13621
|
+
max_age=value["max_age"],
|
|
13622
|
+
reference_time=value["reference_time"],
|
|
13623
|
+
timezone=value["timezone"],
|
|
13624
|
+
allow_tz_mismatch=value["allow_tz_mismatch"],
|
|
13625
|
+
)
|
|
13626
|
+
|
|
13627
|
+
result_bool = freshness_result["passed"]
|
|
13628
|
+
validation.all_passed = result_bool
|
|
13629
|
+
validation.n = 1
|
|
13630
|
+
validation.n_passed = int(result_bool)
|
|
13631
|
+
validation.n_failed = 1 - int(result_bool)
|
|
13632
|
+
|
|
13633
|
+
# Store the freshness check details for reporting
|
|
13634
|
+
validation.val_info = freshness_result
|
|
13635
|
+
|
|
13636
|
+
# Update the values dict with actual computed values for failure text
|
|
13637
|
+
if freshness_result.get("age") is not None:
|
|
13638
|
+
value["age"] = freshness_result["age"]
|
|
13639
|
+
|
|
13640
|
+
# Add timezone warning note if applicable
|
|
13641
|
+
if freshness_result.get("tz_warning_key"):
|
|
13642
|
+
tz_key = freshness_result["tz_warning_key"]
|
|
13643
|
+
tz_warning_text = NOTES_TEXT.get(tz_key, {}).get(
|
|
13644
|
+
self.locale, NOTES_TEXT.get(tz_key, {}).get("en", "")
|
|
13645
|
+
)
|
|
13646
|
+
validation._add_note(
|
|
13647
|
+
key="tz_warning",
|
|
13648
|
+
markdown=f"⚠️ {tz_warning_text}",
|
|
13649
|
+
text=tz_warning_text,
|
|
13650
|
+
)
|
|
13651
|
+
|
|
13652
|
+
# Add note about column being empty if applicable
|
|
13653
|
+
if freshness_result.get("column_empty"):
|
|
13654
|
+
column_empty_text = NOTES_TEXT.get(
|
|
13655
|
+
"data_freshness_column_empty", {}
|
|
13656
|
+
).get(
|
|
13657
|
+
self.locale,
|
|
13658
|
+
NOTES_TEXT.get("data_freshness_column_empty", {}).get(
|
|
13659
|
+
"en", "The datetime column is empty (no values to check)."
|
|
13660
|
+
),
|
|
13661
|
+
)
|
|
13662
|
+
validation._add_note(
|
|
13663
|
+
key="column_empty",
|
|
13664
|
+
markdown=f"⚠️ {column_empty_text}",
|
|
13665
|
+
text=column_empty_text,
|
|
13666
|
+
)
|
|
13667
|
+
|
|
13668
|
+
# Add informational note about the freshness check
|
|
13669
|
+
if freshness_result.get("max_datetime") and freshness_result.get("age"):
|
|
13670
|
+
max_dt = freshness_result["max_datetime"]
|
|
13671
|
+
# Format datetime without microseconds for cleaner display
|
|
13672
|
+
if hasattr(max_dt, "replace"):
|
|
13673
|
+
max_dt_display = max_dt.replace(microsecond=0)
|
|
13674
|
+
else:
|
|
13675
|
+
max_dt_display = max_dt
|
|
13676
|
+
age = freshness_result["age"]
|
|
13677
|
+
age_str = _format_timedelta(age)
|
|
13678
|
+
max_age_str = _format_timedelta(value["max_age"])
|
|
13679
|
+
|
|
13680
|
+
# Get translated template for pass/fail
|
|
13681
|
+
if result_bool:
|
|
13682
|
+
details_key = "data_freshness_details_pass"
|
|
13683
|
+
prefix = "✓"
|
|
13684
|
+
else:
|
|
13685
|
+
details_key = "data_freshness_details_fail"
|
|
13686
|
+
prefix = "✗"
|
|
13687
|
+
|
|
13688
|
+
details_template = NOTES_TEXT.get(details_key, {}).get(
|
|
13689
|
+
self.locale,
|
|
13690
|
+
NOTES_TEXT.get(details_key, {}).get(
|
|
13691
|
+
"en",
|
|
13692
|
+
"Most recent data: `{max_dt}` (age: {age}, max allowed: {max_age})",
|
|
13693
|
+
),
|
|
13694
|
+
)
|
|
13695
|
+
|
|
13696
|
+
# Format the template with values
|
|
13697
|
+
note_text = details_template.format(
|
|
13698
|
+
max_dt=max_dt_display, age=age_str, max_age=max_age_str
|
|
13699
|
+
)
|
|
13700
|
+
# For markdown, make the age bold
|
|
13701
|
+
note_md_template = details_template.replace(
|
|
13702
|
+
"(age: {age}", "(age: **{age}**"
|
|
13703
|
+
)
|
|
13704
|
+
note_md = f"{prefix} {note_md_template.format(max_dt=max_dt_display, age=age_str, max_age=max_age_str)}"
|
|
13705
|
+
|
|
13706
|
+
validation._add_note(
|
|
13707
|
+
key="freshness_details",
|
|
13708
|
+
markdown=note_md,
|
|
13709
|
+
text=note_text,
|
|
13710
|
+
)
|
|
13711
|
+
|
|
13712
|
+
results_tbl = None
|
|
13713
|
+
|
|
13204
13714
|
elif assertion_type == "tbl_match":
|
|
13205
13715
|
from pointblank._interrogation import tbl_match
|
|
13206
13716
|
|
|
@@ -13265,6 +13775,15 @@ class Validate:
|
|
|
13265
13775
|
validation.n_passed = int(result_bool)
|
|
13266
13776
|
validation.n_failed = 1 - result_bool
|
|
13267
13777
|
|
|
13778
|
+
# Store computed values for step reports
|
|
13779
|
+
validation.val_info = {
|
|
13780
|
+
"actual": real,
|
|
13781
|
+
"target": target,
|
|
13782
|
+
"tol": tol,
|
|
13783
|
+
"lower_bound": lower_bound,
|
|
13784
|
+
"upper_bound": upper_bound,
|
|
13785
|
+
}
|
|
13786
|
+
|
|
13268
13787
|
results_tbl = None
|
|
13269
13788
|
else:
|
|
13270
13789
|
raise ValueError(
|
|
@@ -16045,6 +16564,69 @@ class Validate:
|
|
|
16045
16564
|
tol_value = bound_finder.keywords.get("tol", 0) if bound_finder else 0
|
|
16046
16565
|
values_upd.append(f"p = {p_value}<br/>tol = {tol_value}")
|
|
16047
16566
|
|
|
16567
|
+
elif assertion_type[i] in ["data_freshness"]:
|
|
16568
|
+
# Format max_age nicely for display
|
|
16569
|
+
max_age = value.get("max_age")
|
|
16570
|
+
max_age_str = _format_timedelta(max_age) if max_age else "—"
|
|
16571
|
+
|
|
16572
|
+
# Build additional lines with non-default parameters
|
|
16573
|
+
extra_lines = []
|
|
16574
|
+
|
|
16575
|
+
if value.get("reference_time") is not None:
|
|
16576
|
+
ref_time = value["reference_time"]
|
|
16577
|
+
|
|
16578
|
+
# Format datetime across two lines: date and time+tz
|
|
16579
|
+
if hasattr(ref_time, "strftime"):
|
|
16580
|
+
date_str = ref_time.strftime("@%Y-%m-%d")
|
|
16581
|
+
time_str = " " + ref_time.strftime("%H:%M:%S")
|
|
16582
|
+
|
|
16583
|
+
# Add timezone offset if present
|
|
16584
|
+
if hasattr(ref_time, "tzinfo") and ref_time.tzinfo is not None:
|
|
16585
|
+
tz_offset = ref_time.strftime("%z")
|
|
16586
|
+
if tz_offset:
|
|
16587
|
+
time_str += tz_offset
|
|
16588
|
+
extra_lines.append(date_str)
|
|
16589
|
+
extra_lines.append(time_str)
|
|
16590
|
+
else:
|
|
16591
|
+
extra_lines.append(f"@{ref_time}")
|
|
16592
|
+
|
|
16593
|
+
# Timezone and allow_tz_mismatch on same line
|
|
16594
|
+
tz_line_parts = []
|
|
16595
|
+
if value.get("timezone") is not None:
|
|
16596
|
+
# Convert timezone name to ISO 8601 offset format
|
|
16597
|
+
tz_name = value["timezone"]
|
|
16598
|
+
|
|
16599
|
+
try:
|
|
16600
|
+
tz_obj = ZoneInfo(tz_name)
|
|
16601
|
+
|
|
16602
|
+
# Get the current offset for this timezone
|
|
16603
|
+
now = datetime.datetime.now(tz_obj)
|
|
16604
|
+
offset = now.strftime("%z")
|
|
16605
|
+
|
|
16606
|
+
# Format as ISO 8601 extended: -07:00 (insert colon)
|
|
16607
|
+
if len(offset) == 5:
|
|
16608
|
+
tz_display = f"{offset[:3]}:{offset[3:]}"
|
|
16609
|
+
else:
|
|
16610
|
+
tz_display = offset
|
|
16611
|
+
|
|
16612
|
+
except Exception:
|
|
16613
|
+
tz_display = tz_name
|
|
16614
|
+
tz_line_parts.append(tz_display)
|
|
16615
|
+
|
|
16616
|
+
if value.get("allow_tz_mismatch"):
|
|
16617
|
+
tz_line_parts.append("~tz")
|
|
16618
|
+
|
|
16619
|
+
if tz_line_parts:
|
|
16620
|
+
extra_lines.append(" ".join(tz_line_parts))
|
|
16621
|
+
|
|
16622
|
+
if extra_lines:
|
|
16623
|
+
extra_html = "<br/>".join(extra_lines)
|
|
16624
|
+
values_upd.append(
|
|
16625
|
+
f'{max_age_str}<br/><span style="font-size: 9px;">{extra_html}</span>'
|
|
16626
|
+
)
|
|
16627
|
+
else:
|
|
16628
|
+
values_upd.append(max_age_str)
|
|
16629
|
+
|
|
16048
16630
|
elif assertion_type[i] in ["col_schema_match"]:
|
|
16049
16631
|
values_upd.append("SCHEMA")
|
|
16050
16632
|
|
|
@@ -16550,6 +17132,15 @@ class Validate:
|
|
|
16550
17132
|
if incl_footer_timings:
|
|
16551
17133
|
gt_tbl = gt_tbl.tab_source_note(source_note=html(table_time))
|
|
16552
17134
|
|
|
17135
|
+
# Add governance metadata as source note if any metadata is present
|
|
17136
|
+
governance_html = _create_governance_metadata_html(
|
|
17137
|
+
owner=self.owner,
|
|
17138
|
+
consumers=self.consumers,
|
|
17139
|
+
version=self.version,
|
|
17140
|
+
)
|
|
17141
|
+
if governance_html:
|
|
17142
|
+
gt_tbl = gt_tbl.tab_source_note(source_note=html(governance_html))
|
|
17143
|
+
|
|
16553
17144
|
# Create notes markdown from validation steps and add as separate source note if enabled
|
|
16554
17145
|
if incl_footer_notes:
|
|
16555
17146
|
notes_markdown = _create_notes_html(self.validation_info)
|
|
@@ -16898,6 +17489,18 @@ class Validate:
|
|
|
16898
17489
|
debug_return_df=debug_return_df,
|
|
16899
17490
|
)
|
|
16900
17491
|
|
|
17492
|
+
elif is_valid_agg(assertion_type):
|
|
17493
|
+
step_report = _step_report_aggregate(
|
|
17494
|
+
assertion_type=assertion_type,
|
|
17495
|
+
i=i,
|
|
17496
|
+
column=column,
|
|
17497
|
+
values=values,
|
|
17498
|
+
all_passed=all_passed,
|
|
17499
|
+
val_info=val_info,
|
|
17500
|
+
header=header,
|
|
17501
|
+
lang=lang,
|
|
17502
|
+
)
|
|
17503
|
+
|
|
16901
17504
|
else:
|
|
16902
17505
|
step_report = None # pragma: no cover
|
|
16903
17506
|
|
|
@@ -17494,19 +18097,278 @@ def _process_brief(
|
|
|
17494
18097
|
return brief
|
|
17495
18098
|
|
|
17496
18099
|
|
|
17497
|
-
def
|
|
17498
|
-
|
|
17499
|
-
|
|
17500
|
-
return "{auto}"
|
|
17501
|
-
else:
|
|
17502
|
-
return None
|
|
17503
|
-
else:
|
|
17504
|
-
return brief
|
|
18100
|
+
def _parse_max_age(max_age: str | datetime.timedelta) -> datetime.timedelta:
|
|
18101
|
+
"""
|
|
18102
|
+
Parse a max_age specification into a timedelta.
|
|
17505
18103
|
|
|
18104
|
+
Parameters
|
|
18105
|
+
----------
|
|
18106
|
+
max_age
|
|
18107
|
+
Either a timedelta object or a string like "24 hours", "1 day", "30 minutes",
|
|
18108
|
+
or compound expressions like "2 hours 15 minutes", "1 day 6 hours", etc.
|
|
17506
18109
|
|
|
17507
|
-
|
|
17508
|
-
|
|
17509
|
-
|
|
18110
|
+
Returns
|
|
18111
|
+
-------
|
|
18112
|
+
datetime.timedelta
|
|
18113
|
+
The parsed timedelta.
|
|
18114
|
+
|
|
18115
|
+
Raises
|
|
18116
|
+
------
|
|
18117
|
+
ValueError
|
|
18118
|
+
If the string format is invalid or the unit is not recognized.
|
|
18119
|
+
"""
|
|
18120
|
+
if isinstance(max_age, datetime.timedelta):
|
|
18121
|
+
return max_age
|
|
18122
|
+
|
|
18123
|
+
if not isinstance(max_age, str):
|
|
18124
|
+
raise TypeError(
|
|
18125
|
+
f"The `max_age` parameter must be a string or timedelta, got {type(max_age).__name__}."
|
|
18126
|
+
)
|
|
18127
|
+
|
|
18128
|
+
# Parse string format like "24 hours", "1 day", "30 minutes", etc.
|
|
18129
|
+
max_age_str = max_age.strip().lower()
|
|
18130
|
+
|
|
18131
|
+
# Define unit mappings (singular and plural forms)
|
|
18132
|
+
unit_mappings = {
|
|
18133
|
+
"second": "seconds",
|
|
18134
|
+
"seconds": "seconds",
|
|
18135
|
+
"sec": "seconds",
|
|
18136
|
+
"secs": "seconds",
|
|
18137
|
+
"s": "seconds",
|
|
18138
|
+
"minute": "minutes",
|
|
18139
|
+
"minutes": "minutes",
|
|
18140
|
+
"min": "minutes",
|
|
18141
|
+
"mins": "minutes",
|
|
18142
|
+
"m": "minutes",
|
|
18143
|
+
"hour": "hours",
|
|
18144
|
+
"hours": "hours",
|
|
18145
|
+
"hr": "hours",
|
|
18146
|
+
"hrs": "hours",
|
|
18147
|
+
"h": "hours",
|
|
18148
|
+
"day": "days",
|
|
18149
|
+
"days": "days",
|
|
18150
|
+
"d": "days",
|
|
18151
|
+
"week": "weeks",
|
|
18152
|
+
"weeks": "weeks",
|
|
18153
|
+
"wk": "weeks",
|
|
18154
|
+
"wks": "weeks",
|
|
18155
|
+
"w": "weeks",
|
|
18156
|
+
}
|
|
18157
|
+
|
|
18158
|
+
import re
|
|
18159
|
+
|
|
18160
|
+
# Pattern to find all number+unit pairs (supports compound expressions)
|
|
18161
|
+
# Matches: "2 hours 15 minutes", "1day6h", "30 min", etc.
|
|
18162
|
+
compound_pattern = r"(\d+(?:\.\d+)?)\s*([a-zA-Z]+)"
|
|
18163
|
+
matches = re.findall(compound_pattern, max_age_str)
|
|
18164
|
+
|
|
18165
|
+
if not matches:
|
|
18166
|
+
raise ValueError(
|
|
18167
|
+
f"Invalid max_age format: '{max_age}'. Expected format like '24 hours', "
|
|
18168
|
+
f"'1 day', '30 minutes', '2 hours 15 minutes', etc."
|
|
18169
|
+
)
|
|
18170
|
+
|
|
18171
|
+
# Accumulate timedelta from all matched components
|
|
18172
|
+
total_td = datetime.timedelta()
|
|
18173
|
+
valid_units = ["seconds", "minutes", "hours", "days", "weeks"]
|
|
18174
|
+
|
|
18175
|
+
for value_str, unit in matches:
|
|
18176
|
+
value = float(value_str)
|
|
18177
|
+
|
|
18178
|
+
# Normalize the unit
|
|
18179
|
+
unit_lower = unit.lower()
|
|
18180
|
+
if unit_lower not in unit_mappings:
|
|
18181
|
+
raise ValueError(
|
|
18182
|
+
f"Unknown time unit '{unit}' in max_age '{max_age}'. "
|
|
18183
|
+
f"Valid units are: {', '.join(valid_units)} (or their abbreviations)."
|
|
18184
|
+
)
|
|
18185
|
+
|
|
18186
|
+
normalized_unit = unit_mappings[unit_lower]
|
|
18187
|
+
|
|
18188
|
+
# Add to total timedelta
|
|
18189
|
+
if normalized_unit == "seconds":
|
|
18190
|
+
total_td += datetime.timedelta(seconds=value)
|
|
18191
|
+
elif normalized_unit == "minutes":
|
|
18192
|
+
total_td += datetime.timedelta(minutes=value)
|
|
18193
|
+
elif normalized_unit == "hours":
|
|
18194
|
+
total_td += datetime.timedelta(hours=value)
|
|
18195
|
+
elif normalized_unit == "days":
|
|
18196
|
+
total_td += datetime.timedelta(days=value)
|
|
18197
|
+
elif normalized_unit == "weeks":
|
|
18198
|
+
total_td += datetime.timedelta(weeks=value)
|
|
18199
|
+
|
|
18200
|
+
return total_td
|
|
18201
|
+
|
|
18202
|
+
|
|
18203
|
+
def _parse_timezone(timezone: str) -> datetime.tzinfo:
|
|
18204
|
+
"""
|
|
18205
|
+
Parse a timezone string into a tzinfo object.
|
|
18206
|
+
|
|
18207
|
+
Supports:
|
|
18208
|
+
- IANA timezone names: "America/New_York", "Europe/London", "UTC"
|
|
18209
|
+
- Offset strings: "-7", "+5", "-07:00", "+05:30"
|
|
18210
|
+
|
|
18211
|
+
Parameters
|
|
18212
|
+
----------
|
|
18213
|
+
timezone
|
|
18214
|
+
The timezone string to parse.
|
|
18215
|
+
|
|
18216
|
+
Returns
|
|
18217
|
+
-------
|
|
18218
|
+
datetime.tzinfo
|
|
18219
|
+
The parsed timezone object.
|
|
18220
|
+
|
|
18221
|
+
Raises
|
|
18222
|
+
------
|
|
18223
|
+
ValueError
|
|
18224
|
+
If the timezone is not valid.
|
|
18225
|
+
"""
|
|
18226
|
+
import re
|
|
18227
|
+
|
|
18228
|
+
# Check for offset formats: "-7", "+5", "-07:00", "+05:30", etc.
|
|
18229
|
+
# Match: optional sign, 1-2 digits, optional colon and 2 more digits
|
|
18230
|
+
offset_pattern = r"^([+-]?)(\d{1,2})(?::(\d{2}))?$"
|
|
18231
|
+
match = re.match(offset_pattern, timezone.strip())
|
|
18232
|
+
|
|
18233
|
+
if match:
|
|
18234
|
+
sign_str, hours_str, minutes_str = match.groups()
|
|
18235
|
+
hours = int(hours_str)
|
|
18236
|
+
minutes = int(minutes_str) if minutes_str else 0
|
|
18237
|
+
|
|
18238
|
+
# Apply sign (default positive if not specified)
|
|
18239
|
+
total_minutes = hours * 60 + minutes
|
|
18240
|
+
if sign_str == "-":
|
|
18241
|
+
total_minutes = -total_minutes
|
|
18242
|
+
|
|
18243
|
+
return datetime.timezone(datetime.timedelta(minutes=total_minutes))
|
|
18244
|
+
|
|
18245
|
+
# Try IANA timezone names (zoneinfo is standard in Python 3.9+)
|
|
18246
|
+
try:
|
|
18247
|
+
return ZoneInfo(timezone)
|
|
18248
|
+
except KeyError:
|
|
18249
|
+
pass
|
|
18250
|
+
|
|
18251
|
+
raise ValueError(
|
|
18252
|
+
f"Invalid timezone: '{timezone}'. Use an IANA timezone name "
|
|
18253
|
+
f"(e.g., 'America/New_York', 'UTC') or an offset (e.g., '-7', '+05:30')."
|
|
18254
|
+
)
|
|
18255
|
+
|
|
18256
|
+
|
|
18257
|
+
def _validate_timezone(timezone: str) -> None:
|
|
18258
|
+
"""
|
|
18259
|
+
Validate that a timezone string is valid.
|
|
18260
|
+
|
|
18261
|
+
Parameters
|
|
18262
|
+
----------
|
|
18263
|
+
timezone
|
|
18264
|
+
The timezone string to validate.
|
|
18265
|
+
|
|
18266
|
+
Raises
|
|
18267
|
+
------
|
|
18268
|
+
ValueError
|
|
18269
|
+
If the timezone is not valid.
|
|
18270
|
+
"""
|
|
18271
|
+
# Use _parse_timezone to validate - it will raise ValueError if invalid
|
|
18272
|
+
_parse_timezone(timezone)
|
|
18273
|
+
|
|
18274
|
+
|
|
18275
|
+
def _parse_reference_time(reference_time: str) -> datetime.datetime:
|
|
18276
|
+
"""
|
|
18277
|
+
Parse a reference time string into a datetime object.
|
|
18278
|
+
|
|
18279
|
+
Parameters
|
|
18280
|
+
----------
|
|
18281
|
+
reference_time
|
|
18282
|
+
An ISO 8601 formatted datetime string.
|
|
18283
|
+
|
|
18284
|
+
Returns
|
|
18285
|
+
-------
|
|
18286
|
+
datetime.datetime
|
|
18287
|
+
The parsed datetime object.
|
|
18288
|
+
|
|
18289
|
+
Raises
|
|
18290
|
+
------
|
|
18291
|
+
ValueError
|
|
18292
|
+
If the string cannot be parsed.
|
|
18293
|
+
"""
|
|
18294
|
+
# Try parsing with fromisoformat (handles most ISO 8601 formats)
|
|
18295
|
+
try:
|
|
18296
|
+
return datetime.datetime.fromisoformat(reference_time)
|
|
18297
|
+
except ValueError:
|
|
18298
|
+
pass
|
|
18299
|
+
|
|
18300
|
+
# Try parsing common formats
|
|
18301
|
+
formats = [
|
|
18302
|
+
"%Y-%m-%d %H:%M:%S",
|
|
18303
|
+
"%Y-%m-%d %H:%M:%S%z",
|
|
18304
|
+
"%Y-%m-%dT%H:%M:%S",
|
|
18305
|
+
"%Y-%m-%dT%H:%M:%S%z",
|
|
18306
|
+
"%Y-%m-%d",
|
|
18307
|
+
]
|
|
18308
|
+
|
|
18309
|
+
for fmt in formats:
|
|
18310
|
+
try:
|
|
18311
|
+
return datetime.datetime.strptime(reference_time, fmt)
|
|
18312
|
+
except ValueError:
|
|
18313
|
+
continue
|
|
18314
|
+
|
|
18315
|
+
raise ValueError(
|
|
18316
|
+
f"Could not parse reference_time '{reference_time}'. "
|
|
18317
|
+
f"Please use ISO 8601 format like '2024-01-15T10:30:00' or '2024-01-15T10:30:00+00:00'."
|
|
18318
|
+
)
|
|
18319
|
+
|
|
18320
|
+
|
|
18321
|
+
def _format_timedelta(td: datetime.timedelta) -> str:
|
|
18322
|
+
"""
|
|
18323
|
+
Format a timedelta into a human-readable string.
|
|
18324
|
+
|
|
18325
|
+
Parameters
|
|
18326
|
+
----------
|
|
18327
|
+
td
|
|
18328
|
+
The timedelta to format.
|
|
18329
|
+
|
|
18330
|
+
Returns
|
|
18331
|
+
-------
|
|
18332
|
+
str
|
|
18333
|
+
A human-readable string like "24 hours", "2 days 5 hours", etc.
|
|
18334
|
+
"""
|
|
18335
|
+
total_seconds = td.total_seconds()
|
|
18336
|
+
|
|
18337
|
+
if total_seconds < 60:
|
|
18338
|
+
val = round(total_seconds, 1)
|
|
18339
|
+
return f"{val}s"
|
|
18340
|
+
elif total_seconds < 3600:
|
|
18341
|
+
val = round(total_seconds / 60, 1)
|
|
18342
|
+
return f"{val}m"
|
|
18343
|
+
elif total_seconds < 86400:
|
|
18344
|
+
val = round(total_seconds / 3600, 1)
|
|
18345
|
+
return f"{val}h"
|
|
18346
|
+
elif total_seconds < 604800:
|
|
18347
|
+
# For days, show "xd yh" format for better readability
|
|
18348
|
+
days = int(total_seconds // 86400)
|
|
18349
|
+
remaining_hours = round((total_seconds % 86400) / 3600, 1)
|
|
18350
|
+
if remaining_hours == 0:
|
|
18351
|
+
return f"{days}d"
|
|
18352
|
+
else:
|
|
18353
|
+
return f"{days}d {remaining_hours}h"
|
|
18354
|
+
else:
|
|
18355
|
+
val = round(total_seconds / 604800)
|
|
18356
|
+
return f"{val}w"
|
|
18357
|
+
|
|
18358
|
+
|
|
18359
|
+
def _transform_auto_brief(brief: str | bool | None) -> str | None:
|
|
18360
|
+
if isinstance(brief, bool):
|
|
18361
|
+
if brief:
|
|
18362
|
+
return "{auto}"
|
|
18363
|
+
else:
|
|
18364
|
+
return None
|
|
18365
|
+
else:
|
|
18366
|
+
return brief
|
|
18367
|
+
|
|
18368
|
+
|
|
18369
|
+
def _process_action_str(
|
|
18370
|
+
action_str: str,
|
|
18371
|
+
step: int,
|
|
17510
18372
|
col: str | None,
|
|
17511
18373
|
value: Any,
|
|
17512
18374
|
type: str,
|
|
@@ -17688,6 +18550,14 @@ def _create_autobrief_or_failure_text(
|
|
|
17688
18550
|
for_failure=for_failure,
|
|
17689
18551
|
)
|
|
17690
18552
|
|
|
18553
|
+
if assertion_type == "data_freshness":
|
|
18554
|
+
return _create_text_data_freshness(
|
|
18555
|
+
lang=lang,
|
|
18556
|
+
column=column,
|
|
18557
|
+
value=values,
|
|
18558
|
+
for_failure=for_failure,
|
|
18559
|
+
)
|
|
18560
|
+
|
|
17691
18561
|
if assertion_type == "col_pct_null":
|
|
17692
18562
|
return _create_text_col_pct_null(
|
|
17693
18563
|
lang=lang,
|
|
@@ -17916,6 +18786,33 @@ def _create_text_col_count_match(lang: str, value: dict, for_failure: bool = Fal
|
|
|
17916
18786
|
return EXPECT_FAIL_TEXT[f"col_count_match_n_{type_}_text"][lang].format(values_text=values_text)
|
|
17917
18787
|
|
|
17918
18788
|
|
|
18789
|
+
def _create_text_data_freshness(
|
|
18790
|
+
lang: str,
|
|
18791
|
+
column: str | None,
|
|
18792
|
+
value: dict,
|
|
18793
|
+
for_failure: bool = False,
|
|
18794
|
+
) -> str:
|
|
18795
|
+
"""Create text for data_freshness validation."""
|
|
18796
|
+
type_ = _expect_failure_type(for_failure=for_failure)
|
|
18797
|
+
|
|
18798
|
+
column_text = _prep_column_text(column=column)
|
|
18799
|
+
max_age_text = _format_timedelta(value.get("max_age"))
|
|
18800
|
+
|
|
18801
|
+
if for_failure:
|
|
18802
|
+
age = value.get("age")
|
|
18803
|
+
age_text = _format_timedelta(age) if age else "unknown"
|
|
18804
|
+
return EXPECT_FAIL_TEXT[f"data_freshness_{type_}_text"][lang].format(
|
|
18805
|
+
column_text=column_text,
|
|
18806
|
+
max_age_text=max_age_text,
|
|
18807
|
+
age_text=age_text,
|
|
18808
|
+
)
|
|
18809
|
+
else:
|
|
18810
|
+
return EXPECT_FAIL_TEXT[f"data_freshness_{type_}_text"][lang].format(
|
|
18811
|
+
column_text=column_text,
|
|
18812
|
+
max_age_text=max_age_text,
|
|
18813
|
+
)
|
|
18814
|
+
|
|
18815
|
+
|
|
17919
18816
|
def _create_text_col_pct_null(
|
|
17920
18817
|
lang: str,
|
|
17921
18818
|
column: str | None,
|
|
@@ -18850,6 +19747,71 @@ def _extract_pre_argument(source: str) -> str:
|
|
|
18850
19747
|
return pre_arg
|
|
18851
19748
|
|
|
18852
19749
|
|
|
19750
|
+
def _create_governance_metadata_html(
|
|
19751
|
+
owner: str | None,
|
|
19752
|
+
consumers: list[str] | None,
|
|
19753
|
+
version: str | None,
|
|
19754
|
+
) -> str:
|
|
19755
|
+
"""
|
|
19756
|
+
Create HTML for governance metadata display in the report footer.
|
|
19757
|
+
|
|
19758
|
+
Parameters
|
|
19759
|
+
----------
|
|
19760
|
+
owner
|
|
19761
|
+
The owner of the data being validated.
|
|
19762
|
+
consumers
|
|
19763
|
+
List of consumers who depend on the data.
|
|
19764
|
+
version
|
|
19765
|
+
The version of the validation plan.
|
|
19766
|
+
|
|
19767
|
+
Returns
|
|
19768
|
+
-------
|
|
19769
|
+
str
|
|
19770
|
+
HTML string containing formatted governance metadata, or empty string if no metadata.
|
|
19771
|
+
"""
|
|
19772
|
+
if owner is None and consumers is None and version is None:
|
|
19773
|
+
return ""
|
|
19774
|
+
|
|
19775
|
+
metadata_parts = []
|
|
19776
|
+
|
|
19777
|
+
# Common style for the metadata badges (similar to timing style but slightly smaller font)
|
|
19778
|
+
badge_style = (
|
|
19779
|
+
"background-color: #FFF; color: #444; padding: 0.5em 0.5em; position: inherit; "
|
|
19780
|
+
"margin-right: 5px; border: solid 1px #999999; font-variant-numeric: tabular-nums; "
|
|
19781
|
+
"border-radius: 0; padding: 2px 10px 2px 10px; font-size: 11px;"
|
|
19782
|
+
)
|
|
19783
|
+
label_style = (
|
|
19784
|
+
"color: #777; font-weight: bold; font-size: 9px; text-transform: uppercase; "
|
|
19785
|
+
"margin-right: 3px;"
|
|
19786
|
+
)
|
|
19787
|
+
|
|
19788
|
+
if owner is not None:
|
|
19789
|
+
metadata_parts.append(
|
|
19790
|
+
f"<span style='{badge_style}'><span style='{label_style}'>Owner:</span> {owner}</span>"
|
|
19791
|
+
)
|
|
19792
|
+
|
|
19793
|
+
if consumers is not None and len(consumers) > 0:
|
|
19794
|
+
consumers_str = ", ".join(consumers)
|
|
19795
|
+
metadata_parts.append(
|
|
19796
|
+
f"<span style='{badge_style}'>"
|
|
19797
|
+
f"<span style='{label_style}'>Consumers:</span> {consumers_str}"
|
|
19798
|
+
f"</span>"
|
|
19799
|
+
)
|
|
19800
|
+
|
|
19801
|
+
if version is not None:
|
|
19802
|
+
metadata_parts.append(
|
|
19803
|
+
f"<span style='{badge_style}'>"
|
|
19804
|
+
f"<span style='{label_style}'>Version:</span> {version}"
|
|
19805
|
+
f"</span>"
|
|
19806
|
+
)
|
|
19807
|
+
|
|
19808
|
+
return (
|
|
19809
|
+
f"<div style='margin-top: 5px; margin-bottom: 5px; margin-left: 10px;'>"
|
|
19810
|
+
f"{''.join(metadata_parts)}"
|
|
19811
|
+
f"</div>"
|
|
19812
|
+
)
|
|
19813
|
+
|
|
19814
|
+
|
|
18853
19815
|
def _create_table_time_html(
|
|
18854
19816
|
time_start: datetime.datetime | None, time_end: datetime.datetime | None
|
|
18855
19817
|
) -> str:
|
|
@@ -20356,6 +21318,296 @@ def _step_report_rows_distinct(
|
|
|
20356
21318
|
return step_report
|
|
20357
21319
|
|
|
20358
21320
|
|
|
def _step_report_aggregate(
    assertion_type: str,
    i: int,
    column: str | list[str],
    values: dict,
    all_passed: bool,
    val_info: dict | None,
    header: str | None,
    lang: str,
) -> GT:
    """
    Generate a step report for aggregate validation methods (col_sum_*, col_avg_*, col_sd_*).

    This creates a 1-row table showing the computed aggregate value vs. the target value,
    along with tolerance and pass/fail status.

    Parameters
    ----------
    assertion_type
        The validation method name in the form `col_{agg}_{comp}` (e.g., `col_sum_eq`).
    i
        The 1-based step number, used in the report title.
    column
        The column (or single-element list of columns) the aggregate was computed over.
    values
        The step's stored values dict; used as a fallback source for `value`/`tol` when
        `val_info` is unavailable.
    all_passed
        Whether the aggregate assertion passed.
    val_info
        Dict with `actual`, `target`, `tol`, `lower_bound`, and `upper_bound` recorded
        during interrogation; may be `None`.
    header
        Header template for the report; `None` for no header, `":default:"` for the
        standard `{title}{details}` template, or custom Markdown text.
    lang
        Two-letter language code used to look up localized report text.

    Returns
    -------
    GT
        A Great Tables object representing the step report.

    Raises
    ------
    ImportError
        If neither Polars nor Pandas is installed.
    """

    # Determine whether the `lang` value represents a right-to-left language
    is_rtl_lang = lang in RTL_LANGUAGES
    direction_rtl = " direction: rtl;" if is_rtl_lang else ""

    # Parse assertion type to get aggregate function and comparison operator
    # Format: col_{agg}_{comp} (e.g., col_sum_eq, col_avg_gt, col_sd_le)
    parts = assertion_type.split("_")
    agg_type = parts[1]  # sum, avg, sd
    comp_type = parts[2]  # eq, gt, ge, lt, le

    # Map aggregate type to display name
    agg_display = {"sum": "SUM", "avg": "AVG", "sd": "SD"}.get(agg_type, agg_type.upper())

    # Map comparison type to symbol
    comp_symbols = {
        "eq": "=",
        "gt": ">",
        "ge": "≥",
        "lt": "<",
        "le": "≤",
    }
    comp_symbol = comp_symbols.get(comp_type, comp_type)

    # Get computed values from val_info (stored during interrogation)
    if val_info is not None:
        actual = val_info.get("actual", None)
        target = val_info.get("target", None)
        tol = val_info.get("tol", 0)
        lower_bound = val_info.get("lower_bound", target)
        upper_bound = val_info.get("upper_bound", target)
    else:
        # Fallback if val_info is not available
        actual = None
        target = values.get("value", None)
        tol = values.get("tol", 0)
        lower_bound = target
        upper_bound = target

    # Format column name for display (handle list vs string)
    if isinstance(column, list):
        column_display = column[0] if len(column) == 1 else ", ".join(column)
    else:
        column_display = str(column)

    # Generate assertion text for header
    if target is not None:
        target_display = f"{target:,.6g}" if isinstance(target, float) else f"{target:,}"
        assertion_text = f"{agg_display}({column_display}) {comp_symbol} {target_display}"
    else:
        assertion_text = f"{agg_display}({column_display}) {comp_symbol} ?"

    # Calculate difference from boundary
    if actual is not None and target is not None:
        if comp_type == "eq":
            # For equality, show distance from target (considering tolerance)
            if lower_bound == upper_bound:
                difference = actual - target
            else:
                # With tolerance, show distance from nearest bound
                if actual < lower_bound:
                    difference = actual - lower_bound
                elif actual > upper_bound:
                    difference = actual - upper_bound
                else:
                    difference = 0  # Within bounds
        elif comp_type in ["gt", "ge"]:
            # Distance from lower bound (positive if passing)
            difference = actual - lower_bound
        elif comp_type in ["lt", "le"]:
            # Distance from upper bound (negative if passing)
            difference = actual - upper_bound
        else:
            difference = actual - target
    else:
        difference = None

    # Format values for display
    def format_value(v):
        if v is None:
            return "—"
        if isinstance(v, float):
            return f"{v:,.6g}"
        return f"{v:,}"

    # Format tolerance for display: check the tuple form first so that an
    # all-zero tuple tolerance `(0, 0)` renders as the "no tolerance" dash
    # rather than "(-0, +0)"
    if isinstance(tol, tuple):
        tol_display = "—" if tol == (0, 0) else f"(-{tol[0]}, +{tol[1]})"
    elif tol == 0:
        tol_display = "—"
    else:
        tol_display = f"±{tol}"

    # Format difference with sign
    if difference is not None:
        if difference == 0:
            diff_display = "0"
        elif difference > 0:
            diff_display = (
                f"+{difference:,.6g}" if isinstance(difference, float) else f"+{difference:,}"
            )
        else:
            diff_display = (
                f"{difference:,.6g}" if isinstance(difference, float) else f"{difference:,}"
            )
    else:
        diff_display = "—"

    # Create pass/fail indicator
    if all_passed:
        status_html = CHECK_MARK_SPAN
        status_color = "#4CA64C"
    else:
        status_html = CROSS_MARK_SPAN
        status_color = "#CF142B"

    # Select DataFrame library (prefer Polars, fall back to Pandas)
    if _is_lib_present("polars"):
        import polars as pl

        df_lib = pl
    elif _is_lib_present("pandas"):  # pragma: no cover
        import pandas as pd  # pragma: no cover

        df_lib = pd  # pragma: no cover
    else:  # pragma: no cover
        raise ImportError(
            "Neither Polars nor Pandas is available for step report generation"
        )  # pragma: no cover

    # Create the data for the 1-row table
    report_data = df_lib.DataFrame(
        {
            "actual": [format_value(actual)],
            "target": [format_value(target)],
            "tolerance": [tol_display],
            "difference": [diff_display],
            "status": [status_html],
        }
    )

    # Create GT table with styling matching preview() and other step reports
    step_report = (
        GT(report_data, id="pb_step_tbl")
        .opt_table_font(font=google_font(name="IBM Plex Sans"))
        .opt_align_table_header(align="left")
        .cols_label(
            actual="ACTUAL",
            target="EXPECTED",
            tolerance="TOL",
            difference="DIFFERENCE",
            status="",
        )
        .cols_align(align="center")
        .fmt_markdown(columns=["actual", "target", "tolerance", "difference", "status"])
        .tab_style(
            style=style.text(color="black", font=google_font(name="IBM Plex Mono"), size="13px"),
            locations=loc.body(columns=["actual", "target", "tolerance", "difference"]),
        )
        .tab_style(
            style=style.text(size="13px"),
            locations=loc.body(columns="status"),
        )
        .tab_style(
            style=style.text(color="gray20", font=google_font(name="IBM Plex Mono"), size="12px"),
            locations=loc.column_labels(),
        )
        .tab_style(
            style=style.borders(
                sides=["top", "bottom"], color="#E9E9E9", style="solid", weight="1px"
            ),
            locations=loc.body(),
        )
        .tab_options(
            table_body_vlines_style="solid",
            table_body_vlines_width="1px",
            table_body_vlines_color="#E9E9E9",
            column_labels_vlines_style="solid",
            column_labels_vlines_width="1px",
            column_labels_vlines_color="#F2F2F2",
        )
        .cols_width(
            cases={
                "actual": "200px",
                "target": "200px",
                "tolerance": "150px",
                "difference": "200px",
                "status": "50px",
            }
        )
    )

    # Apply styling based on pass/fail
    if all_passed:
        step_report = step_report.tab_style(
            style=[
                style.text(color="#006400"),
                style.fill(color="#4CA64C33"),
            ],
            locations=loc.body(columns="status"),
        )
    else:
        step_report = step_report.tab_style(
            style=[
                style.text(color="#B22222"),
                style.fill(color="#FFC1C159"),
            ],
            locations=loc.body(columns="status"),
        )

    # If the version of `great_tables` is `>=0.17.0` then disable Quarto table processing.
    # Compare numeric version tuples: a plain string comparison is lexicographic and
    # misorders versions (e.g. "0.9.0" >= "0.17.0" is True as strings).
    raw_version_parts = version("great_tables").split(".")
    try:
        gt_version_tuple = tuple(int(p) for p in (raw_version_parts + ["0", "0"])[:3])
        quarto_disable = gt_version_tuple >= (0, 17, 0)
    except ValueError:  # pragma: no cover
        # Pre-release/dev version strings (e.g. "0.17.0rc1") are assumed recent enough
        quarto_disable = True
    if quarto_disable:
        step_report = step_report.tab_options(quarto_disable_processing=True)

    # If no header requested, return the table as-is
    if header is None:
        return step_report

    # Create header content
    assertion_header_text = STEP_REPORT_TEXT["assertion_header_text"][lang]

    # Wrap assertion text in styled code tag
    assertion_code = (
        f"<code style='color: #303030; font-family: monospace; font-size: smaller;'>"
        f"{assertion_text}</code>"
    )

    if all_passed:
        title = STEP_REPORT_TEXT["report_for_step_i"][lang].format(i=i) + " " + CHECK_MARK_SPAN
        result_stmt = STEP_REPORT_TEXT.get("agg_success_statement", {}).get(
            lang,
            f"The aggregate value for column <code>{column_display}</code> satisfies the condition.",
        )
        if isinstance(result_stmt, str) and "{column}" in result_stmt:
            result_stmt = result_stmt.format(column=column_display)
    else:
        title = STEP_REPORT_TEXT["report_for_step_i"][lang].format(i=i) + " " + CROSS_MARK_SPAN
        result_stmt = STEP_REPORT_TEXT.get("agg_failure_statement", {}).get(
            lang,
            f"The aggregate value for column <code>{column_display}</code> does not satisfy the condition.",
        )
        if isinstance(result_stmt, str) and "{column}" in result_stmt:
            result_stmt = result_stmt.format(column=column_display)

    details = (
        f"<div style='font-size: 13.6px; {direction_rtl}'>"
        "<div style='padding-top: 7px;'>"
        f"{assertion_header_text} <span style='border-style: solid; border-width: thin; "
        "border-color: lightblue; padding-left: 2px; padding-right: 2px;'>"
        "<code style='color: #303030; background-color: transparent; "
        f"position: relative; bottom: 1px;'>{assertion_code}</code></span>"
        "</div>"
        "<div style='padding-top: 7px;'>"
        f"{result_stmt}"
        "</div>"
        "</div>"
    )

    # Generate the default template text for the header when `":default:"` is used
    if header == ":default:":
        header = "{title}{details}"

    # Use commonmark to convert the header text to HTML
    header = commonmark.commonmark(header)

    # Place any templated text in the header
    header = header.format(title=title, details=details)

    # Create the header with `header` string
    step_report = step_report.tab_header(title=md(header))

    return step_report
|
20359
21611
|
def _step_report_schema_in_order(
|
|
20360
21612
|
step: int, schema_info: dict, header: str | None, lang: str, debug_return_df: bool = False
|
|
20361
21613
|
) -> GT | Any:
|