PyPI - truthound-dashboard - Versions diffs - 1.4.4__py3-none-any.whl → 1.5.1__py3-none-any.whl - Mend

truthound-dashboard 1.4.4__py3-none-any.whl → 1.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (205) hide show

truthound_dashboard/api/alerts.py +75 -86
truthound_dashboard/api/anomaly.py +7 -13
truthound_dashboard/api/cross_alerts.py +38 -52
truthound_dashboard/api/drift.py +49 -59
truthound_dashboard/api/drift_monitor.py +234 -79
truthound_dashboard/api/enterprise_sampling.py +498 -0
truthound_dashboard/api/history.py +57 -5
truthound_dashboard/api/lineage.py +3 -48
truthound_dashboard/api/maintenance.py +104 -49
truthound_dashboard/api/mask.py +1 -2
truthound_dashboard/api/middleware.py +2 -1
truthound_dashboard/api/model_monitoring.py +435 -311
truthound_dashboard/api/notifications.py +227 -191
truthound_dashboard/api/notifications_advanced.py +21 -20
truthound_dashboard/api/observability.py +586 -0
truthound_dashboard/api/plugins.py +2 -433
truthound_dashboard/api/profile.py +199 -37
truthound_dashboard/api/quality_reporter.py +701 -0
truthound_dashboard/api/reports.py +7 -16
truthound_dashboard/api/router.py +66 -0
truthound_dashboard/api/rule_suggestions.py +5 -5
truthound_dashboard/api/scan.py +17 -19
truthound_dashboard/api/schedules.py +85 -50
truthound_dashboard/api/schema_evolution.py +6 -6
truthound_dashboard/api/schema_watcher.py +667 -0
truthound_dashboard/api/sources.py +98 -27
truthound_dashboard/api/tiering.py +1323 -0
truthound_dashboard/api/triggers.py +14 -11
truthound_dashboard/api/validations.py +12 -11
truthound_dashboard/api/versioning.py +1 -6
truthound_dashboard/core/__init__.py +129 -3
truthound_dashboard/core/actions/__init__.py +62 -0
truthound_dashboard/core/actions/custom.py +426 -0
truthound_dashboard/core/actions/notifications.py +910 -0
truthound_dashboard/core/actions/storage.py +472 -0
truthound_dashboard/core/actions/webhook.py +281 -0
truthound_dashboard/core/anomaly.py +262 -67
truthound_dashboard/core/anomaly_explainer.py +4 -3
truthound_dashboard/core/backends/__init__.py +67 -0
truthound_dashboard/core/backends/base.py +299 -0
truthound_dashboard/core/backends/errors.py +191 -0
truthound_dashboard/core/backends/factory.py +423 -0
truthound_dashboard/core/backends/mock_backend.py +451 -0
truthound_dashboard/core/backends/truthound_backend.py +718 -0
truthound_dashboard/core/checkpoint/__init__.py +87 -0
truthound_dashboard/core/checkpoint/adapters.py +814 -0
truthound_dashboard/core/checkpoint/checkpoint.py +491 -0
truthound_dashboard/core/checkpoint/runner.py +270 -0
truthound_dashboard/core/connections.py +645 -23
truthound_dashboard/core/converters/__init__.py +14 -0
truthound_dashboard/core/converters/truthound.py +620 -0
truthound_dashboard/core/cross_alerts.py +540 -320
truthound_dashboard/core/datasource_factory.py +1672 -0
truthound_dashboard/core/drift_monitor.py +216 -20
truthound_dashboard/core/enterprise_sampling.py +1291 -0
truthound_dashboard/core/interfaces/__init__.py +225 -0
truthound_dashboard/core/interfaces/actions.py +652 -0
truthound_dashboard/core/interfaces/base.py +247 -0
truthound_dashboard/core/interfaces/checkpoint.py +676 -0
truthound_dashboard/core/interfaces/protocols.py +664 -0
truthound_dashboard/core/interfaces/reporters.py +650 -0
truthound_dashboard/core/interfaces/routing.py +646 -0
truthound_dashboard/core/interfaces/triggers.py +619 -0
truthound_dashboard/core/lineage.py +407 -71
truthound_dashboard/core/model_monitoring.py +431 -3
truthound_dashboard/core/notifications/base.py +4 -0
truthound_dashboard/core/notifications/channels.py +501 -1203
truthound_dashboard/core/notifications/deduplication/__init__.py +81 -115
truthound_dashboard/core/notifications/deduplication/service.py +131 -348
truthound_dashboard/core/notifications/dispatcher.py +202 -11
truthound_dashboard/core/notifications/escalation/__init__.py +119 -106
truthound_dashboard/core/notifications/escalation/engine.py +168 -358
truthound_dashboard/core/notifications/routing/__init__.py +88 -128
truthound_dashboard/core/notifications/routing/engine.py +90 -317
truthound_dashboard/core/notifications/stats_aggregator.py +246 -1
truthound_dashboard/core/notifications/throttling/__init__.py +67 -50
truthound_dashboard/core/notifications/throttling/builder.py +117 -255
truthound_dashboard/core/notifications/truthound_adapter.py +842 -0
truthound_dashboard/core/phase5/collaboration.py +1 -1
truthound_dashboard/core/plugins/lifecycle/__init__.py +0 -13
truthound_dashboard/core/quality_reporter.py +1359 -0
truthound_dashboard/core/report_history.py +0 -6
truthound_dashboard/core/reporters/__init__.py +175 -14
truthound_dashboard/core/reporters/adapters.py +943 -0
truthound_dashboard/core/reporters/base.py +0 -3
truthound_dashboard/core/reporters/builtin/__init__.py +18 -0
truthound_dashboard/core/reporters/builtin/csv_reporter.py +111 -0
truthound_dashboard/core/reporters/builtin/html_reporter.py +270 -0
truthound_dashboard/core/reporters/builtin/json_reporter.py +127 -0
truthound_dashboard/core/reporters/compat.py +266 -0
truthound_dashboard/core/reporters/csv_reporter.py +2 -35
truthound_dashboard/core/reporters/factory.py +526 -0
truthound_dashboard/core/reporters/interfaces.py +745 -0
truthound_dashboard/core/reporters/registry.py +1 -10
truthound_dashboard/core/scheduler.py +165 -0
truthound_dashboard/core/schema_evolution.py +3 -3
truthound_dashboard/core/schema_watcher.py +1528 -0
truthound_dashboard/core/services.py +595 -76
truthound_dashboard/core/store_manager.py +810 -0
truthound_dashboard/core/streaming_anomaly.py +169 -4
truthound_dashboard/core/tiering.py +1309 -0
truthound_dashboard/core/triggers/evaluators.py +178 -8
truthound_dashboard/core/truthound_adapter.py +2620 -197
truthound_dashboard/core/unified_alerts.py +23 -20
truthound_dashboard/db/__init__.py +8 -0
truthound_dashboard/db/database.py +8 -2
truthound_dashboard/db/models.py +944 -25
truthound_dashboard/db/repository.py +2 -0
truthound_dashboard/main.py +15 -0
truthound_dashboard/schemas/__init__.py +177 -16
truthound_dashboard/schemas/base.py +44 -23
truthound_dashboard/schemas/collaboration.py +19 -6
truthound_dashboard/schemas/cross_alerts.py +19 -3
truthound_dashboard/schemas/drift.py +61 -55
truthound_dashboard/schemas/drift_monitor.py +67 -23
truthound_dashboard/schemas/enterprise_sampling.py +653 -0
truthound_dashboard/schemas/lineage.py +0 -33
truthound_dashboard/schemas/mask.py +10 -8
truthound_dashboard/schemas/model_monitoring.py +89 -10
truthound_dashboard/schemas/notifications_advanced.py +13 -0
truthound_dashboard/schemas/observability.py +453 -0
truthound_dashboard/schemas/plugins.py +0 -280
truthound_dashboard/schemas/profile.py +154 -247
truthound_dashboard/schemas/quality_reporter.py +403 -0
truthound_dashboard/schemas/reports.py +2 -2
truthound_dashboard/schemas/rule_suggestion.py +8 -1
truthound_dashboard/schemas/scan.py +4 -24
truthound_dashboard/schemas/schedule.py +11 -3
truthound_dashboard/schemas/schema_watcher.py +727 -0
truthound_dashboard/schemas/source.py +17 -2
truthound_dashboard/schemas/tiering.py +822 -0
truthound_dashboard/schemas/triggers.py +16 -0
truthound_dashboard/schemas/unified_alerts.py +7 -0
truthound_dashboard/schemas/validation.py +0 -13
truthound_dashboard/schemas/validators/base.py +41 -21
truthound_dashboard/schemas/validators/business_rule_validators.py +244 -0
truthound_dashboard/schemas/validators/localization_validators.py +273 -0
truthound_dashboard/schemas/validators/ml_feature_validators.py +308 -0
truthound_dashboard/schemas/validators/profiling_validators.py +275 -0
truthound_dashboard/schemas/validators/referential_validators.py +312 -0
truthound_dashboard/schemas/validators/registry.py +93 -8
truthound_dashboard/schemas/validators/timeseries_validators.py +389 -0
truthound_dashboard/schemas/versioning.py +1 -6
truthound_dashboard/static/index.html +2 -2
truthound_dashboard-1.5.1.dist-info/METADATA +312 -0
{truthound_dashboard-1.4.4.dist-info → truthound_dashboard-1.5.1.dist-info}/RECORD +149 -148
truthound_dashboard/core/plugins/hooks/__init__.py +0 -63
truthound_dashboard/core/plugins/hooks/decorators.py +0 -367
truthound_dashboard/core/plugins/hooks/manager.py +0 -403
truthound_dashboard/core/plugins/hooks/protocols.py +0 -265
truthound_dashboard/core/plugins/lifecycle/hot_reload.py +0 -584
truthound_dashboard/core/reporters/junit_reporter.py +0 -233
truthound_dashboard/core/reporters/markdown_reporter.py +0 -207
truthound_dashboard/core/reporters/pdf_reporter.py +0 -209
truthound_dashboard/static/assets/_baseUniq-BcrSP13d.js +0 -1
truthound_dashboard/static/assets/arc-DlYjKwIL.js +0 -1
truthound_dashboard/static/assets/architectureDiagram-VXUJARFQ-Bb2drbQM.js +0 -36
truthound_dashboard/static/assets/blockDiagram-VD42YOAC-BlsPG1CH.js +0 -122
truthound_dashboard/static/assets/c4Diagram-YG6GDRKO-B9JdUoaC.js +0 -10
truthound_dashboard/static/assets/channel-Q6mHF1Hd.js +0 -1
truthound_dashboard/static/assets/chunk-4BX2VUAB-DmyoPVuJ.js +0 -1
truthound_dashboard/static/assets/chunk-55IACEB6-Bcz6Siv8.js +0 -1
truthound_dashboard/static/assets/chunk-B4BG7PRW-Br3G5Rum.js +0 -165
truthound_dashboard/static/assets/chunk-DI55MBZ5-DuM9c23u.js +0 -220
truthound_dashboard/static/assets/chunk-FMBD7UC4-DNU-5mvT.js +0 -15
truthound_dashboard/static/assets/chunk-QN33PNHL-Im2yNcmS.js +0 -1
truthound_dashboard/static/assets/chunk-QZHKN3VN-kZr8XFm1.js +0 -1
truthound_dashboard/static/assets/chunk-TZMSLE5B-Q__360q_.js +0 -1
truthound_dashboard/static/assets/classDiagram-2ON5EDUG-vtixxUyK.js +0 -1
truthound_dashboard/static/assets/classDiagram-v2-WZHVMYZB-vtixxUyK.js +0 -1
truthound_dashboard/static/assets/clone-BOt2LwD0.js +0 -1
truthound_dashboard/static/assets/cose-bilkent-S5V4N54A-CBDw6iac.js +0 -1
truthound_dashboard/static/assets/dagre-6UL2VRFP-XdKqmmY9.js +0 -4
truthound_dashboard/static/assets/diagram-PSM6KHXK-DAZ8nx9V.js +0 -24
truthound_dashboard/static/assets/diagram-QEK2KX5R-BRvDTbGD.js +0 -43
truthound_dashboard/static/assets/diagram-S2PKOQOG-bQcczUkl.js +0 -24
truthound_dashboard/static/assets/erDiagram-Q2GNP2WA-DPje7VMN.js +0 -60
truthound_dashboard/static/assets/flowDiagram-NV44I4VS-B7BVtFVS.js +0 -162
truthound_dashboard/static/assets/ganttDiagram-JELNMOA3-D6WKSS7U.js +0 -267
truthound_dashboard/static/assets/gitGraphDiagram-NY62KEGX-D3vtVd3y.js +0 -65
truthound_dashboard/static/assets/graph-BKgNKZVp.js +0 -1
truthound_dashboard/static/assets/index-C6JSrkHo.css +0 -1
truthound_dashboard/static/assets/index-DkU82VsU.js +0 -1800
truthound_dashboard/static/assets/infoDiagram-WHAUD3N6-DnNCT429.js +0 -2
truthound_dashboard/static/assets/journeyDiagram-XKPGCS4Q-DGiMozqS.js +0 -139
truthound_dashboard/static/assets/kanban-definition-3W4ZIXB7-BV2gUgli.js +0 -89
truthound_dashboard/static/assets/katex-Cu_Erd72.js +0 -261
truthound_dashboard/static/assets/layout-DI2MfQ5G.js +0 -1
truthound_dashboard/static/assets/min-DYdgXVcT.js +0 -1
truthound_dashboard/static/assets/mindmap-definition-VGOIOE7T-C7x4ruxz.js +0 -68
truthound_dashboard/static/assets/pieDiagram-ADFJNKIX-CAJaAB9f.js +0 -30
truthound_dashboard/static/assets/quadrantDiagram-AYHSOK5B-DeqwDI46.js +0 -7
truthound_dashboard/static/assets/requirementDiagram-UZGBJVZJ-e3XDpZIM.js +0 -64
truthound_dashboard/static/assets/sankeyDiagram-TZEHDZUN-CNnAv5Ux.js +0 -10
truthound_dashboard/static/assets/sequenceDiagram-WL72ISMW-Dsne-Of3.js +0 -145
truthound_dashboard/static/assets/stateDiagram-FKZM4ZOC-Ee0sQXyb.js +0 -1
truthound_dashboard/static/assets/stateDiagram-v2-4FDKWEC3-B26KqW_W.js +0 -1
truthound_dashboard/static/assets/timeline-definition-IT6M3QCI-DZYi2yl3.js +0 -61
truthound_dashboard/static/assets/treemap-KMMF4GRG-CY3f8In2.js +0 -128
truthound_dashboard/static/assets/unmerged_dictionaries-Dd7xcPWG.js +0 -1
truthound_dashboard/static/assets/xychartDiagram-PRI3JC2R-CS7fydZZ.js +0 -7
truthound_dashboard-1.4.4.dist-info/METADATA +0 -507
{truthound_dashboard-1.4.4.dist-info → truthound_dashboard-1.5.1.dist-info}/WHEEL +0 -0
{truthound_dashboard-1.4.4.dist-info → truthound_dashboard-1.5.1.dist-info}/entry_points.txt +0 -0
{truthound_dashboard-1.4.4.dist-info → truthound_dashboard-1.5.1.dist-info}/licenses/LICENSE +0 -0

truthound_dashboard/core/converters/__init__.py ADDED Viewed

@@ -0,0 +1,14 @@
+"""Result converters for data quality backends.
+This module provides converters that transform backend-specific result
+objects into dashboard-standard result models.
+The converter pattern isolates backend-specific code and makes it easy
+to support multiple backends or handle API changes.
+"""
+from .truthound import TruthoundResultConverter
+__all__ = [
+    "TruthoundResultConverter",
+]

truthound_dashboard/core/converters/truthound.py ADDED Viewed

@@ -0,0 +1,620 @@
+"""Truthound result converters.
+This module isolates all truthound-specific result object conversions.
+It handles converting truthound's Report, Schema, TableProfile, etc.
+into dashboard-standard result dataclasses.
+By isolating conversions here, we can:
+- Handle truthound API changes in one place
+- Support multiple truthound versions
+- Provide graceful fallbacks for missing attributes
+"""
+from __future__ import annotations
+import logging
+from datetime import datetime
+from pathlib import Path
+from typing import Any
+import yaml
+logger = logging.getLogger(__name__)
+class TruthoundResultConverter:
+    """Converter for truthound result objects.
+    This class provides static methods to convert truthound-specific
+    objects into dashboard result dataclasses.
+    All conversions use defensive attribute access (getattr with defaults)
+    to handle different truthound versions gracefully.
+    """
+    @staticmethod
+    def convert_severity(severity: Any) -> str:
+        """Safely convert severity enum or value to lowercase string.
+        Args:
+            severity: Severity value (enum with .value or string).
+        Returns:
+            Lowercase severity string.
+        """
+        if hasattr(severity, "value"):
+            return str(severity.value).lower()
+        return str(severity).lower()
+    @staticmethod
+    def convert_check_result(result: Any) -> dict[str, Any]:
+        """Convert truthound Report to CheckResult dict.
+        The truthound Report contains:
+        - issues: list[ValidationIssue]
+        - source: str
+        - row_count: int
+        - column_count: int
+        - has_issues: bool
+        - has_critical: bool
+        - has_high: bool
+        Args:
+            result: Truthound Report object.
+        Returns:
+            Dictionary with CheckResult fields.
+        """
+        issues = getattr(result, "issues", [])
+        severity_counts = {"critical": 0, "high": 0, "medium": 0, "low": 0}
+        converted_issues = []
+        for issue in issues:
+            severity = TruthoundResultConverter.convert_severity(issue.severity)
+            if severity in severity_counts:
+                severity_counts[severity] += 1
+            converted_issues.append({
+                "column": getattr(issue, "column", ""),
+                "issue_type": getattr(issue, "issue_type", "unknown"),
+                "count": getattr(issue, "count", 0),
+                "severity": severity,
+                "details": getattr(issue, "details", None),
+                "expected": getattr(issue, "expected", None),
+                "actual": getattr(issue, "actual", None),
+                "sample_values": getattr(issue, "sample_values", None),
+            })
+        return {
+            "passed": not getattr(result, "has_issues", len(issues) > 0),
+            "has_critical": getattr(result, "has_critical", severity_counts["critical"] > 0),
+            "has_high": getattr(result, "has_high", severity_counts["high"] > 0),
+            "total_issues": len(issues),
+            "critical_issues": severity_counts["critical"],
+            "high_issues": severity_counts["high"],
+            "medium_issues": severity_counts["medium"],
+            "low_issues": severity_counts["low"],
+            "source": getattr(result, "source", ""),
+            "row_count": getattr(result, "row_count", 0),
+            "column_count": getattr(result, "column_count", 0),
+            "issues": converted_issues,
+        }
+    @staticmethod
+    def convert_learn_result(result: Any) -> dict[str, Any]:
+        """Convert truthound Schema to LearnResult dict.
+        The truthound Schema contains:
+        - columns: dict[str, ColumnSchema]
+        - row_count: int | None
+        - version: str
+        - to_dict(): Convert to dictionary
+        Args:
+            result: Truthound Schema object.
+        Returns:
+            Dictionary with LearnResult fields.
+        """
+        schema_dict = result.to_dict() if hasattr(result, "to_dict") else {}
+        schema_yaml = yaml.dump(
+            schema_dict,
+            default_flow_style=False,
+            sort_keys=False,
+            allow_unicode=True,
+        )
+        columns = getattr(result, "columns", {})
+        column_list = list(columns.keys()) if isinstance(columns, dict) else []
+        return {
+            "schema": schema_dict,
+            "schema_yaml": schema_yaml,
+            "row_count": getattr(result, "row_count", None),
+            "column_count": len(column_list),
+            "columns": column_list,
+        }
+    @staticmethod
+    def convert_profile_result(result: Any) -> dict[str, Any]:
+        """Convert truthound TableProfile or ProfileReport to ProfileResult dict.
+        Supports both new TableProfile and legacy ProfileReport formats.
+        Args:
+            result: Truthound profile result object.
+        Returns:
+            Dictionary with ProfileResult fields.
+        """
+        # Check if this is the new TableProfile or legacy ProfileReport
+        if hasattr(result, "estimated_memory_bytes"):
+            return TruthoundResultConverter._convert_table_profile(result)
+        else:
+            return TruthoundResultConverter._convert_legacy_profile(result)
+    @staticmethod
+    def _convert_table_profile(result: Any) -> dict[str, Any]:
+        """Convert new truthound TableProfile to ProfileResult dict."""
+        columns = []
+        for col in getattr(result, "columns", []):
+            col_data = TruthoundResultConverter._convert_column_profile(col)
+            columns.append(col_data)
+        # Convert correlations
+        correlations = None
+        raw_correlations = getattr(result, "correlations", None)
+        if raw_correlations:
+            correlations = [(c[0], c[1], c[2]) for c in raw_correlations]
+        # Get profiled_at as ISO string
+        profiled_at = None
+        raw_profiled_at = getattr(result, "profiled_at", None)
+        if raw_profiled_at:
+            profiled_at = (
+                raw_profiled_at.isoformat()
+                if isinstance(raw_profiled_at, datetime)
+                else str(raw_profiled_at)
+            )
+        estimated_memory = getattr(result, "estimated_memory_bytes", 0)
+        return {
+            "name": getattr(result, "name", ""),
+            "source": getattr(result, "source", ""),
+            "row_count": getattr(result, "row_count", 0),
+            "column_count": getattr(result, "column_count", 0),
+            "estimated_memory_bytes": estimated_memory,
+            "columns": columns,
+            "duplicate_row_count": getattr(result, "duplicate_row_count", 0),
+            "duplicate_row_ratio": getattr(result, "duplicate_row_ratio", 0.0),
+            "correlations": correlations,
+            "profiled_at": profiled_at,
+            "profile_duration_ms": getattr(result, "profile_duration_ms", 0.0),
+            "size_bytes": estimated_memory,
+        }
+    @staticmethod
+    def _convert_column_profile(col: Any) -> dict[str, Any]:
+        """Convert a single column profile."""
+        # Extract distribution stats if present
+        distribution = None
+        raw_distribution = getattr(col, "distribution", None)
+        if raw_distribution:
+            distribution = {
+                "mean": getattr(raw_distribution, "mean", None),
+                "std": getattr(raw_distribution, "std", None),
+                "min": getattr(raw_distribution, "min", None),
+                "max": getattr(raw_distribution, "max", None),
+                "median": getattr(raw_distribution, "median", None),
+                "q1": getattr(raw_distribution, "q1", None),
+                "q3": getattr(raw_distribution, "q3", None),
+                "skewness": getattr(raw_distribution, "skewness", None),
+                "kurtosis": getattr(raw_distribution, "kurtosis", None),
+            }
+        # Convert top_values
+        top_values = None
+        raw_top_values = getattr(col, "top_values", None)
+        if raw_top_values:
+            top_values = [
+                {
+                    "value": str(v.value) if getattr(v, "value", None) is not None else None,
+                    "count": getattr(v, "count", 0),
+                    "ratio": getattr(v, "ratio", 0.0),
+                }
+                for v in raw_top_values
+            ]
+        # Convert bottom_values
+        bottom_values = None
+        raw_bottom_values = getattr(col, "bottom_values", None)
+        if raw_bottom_values:
+            bottom_values = [
+                {
+                    "value": str(v.value) if getattr(v, "value", None) is not None else None,
+                    "count": getattr(v, "count", 0),
+                    "ratio": getattr(v, "ratio", 0.0),
+                }
+                for v in raw_bottom_values
+            ]
+        # Convert detected_patterns
+        detected_patterns = None
+        raw_patterns = getattr(col, "detected_patterns", None)
+        if raw_patterns:
+            detected_patterns = [
+                {
+                    "pattern": getattr(p, "pattern", None),
+                    "regex": getattr(p, "regex", None),
+                    "match_ratio": getattr(p, "match_ratio", 0.0),
+                    "sample_matches": list(getattr(p, "sample_matches", [])),
+                }
+                for p in raw_patterns
+            ]
+        # Get inferred type value
+        inferred_type = "unknown"
+        raw_inferred_type = getattr(col, "inferred_type", None)
+        if raw_inferred_type:
+            inferred_type = (
+                raw_inferred_type.value
+                if hasattr(raw_inferred_type, "value")
+                else str(raw_inferred_type)
+            )
+        # Convert datetime fields
+        min_date = None
+        max_date = None
+        raw_min_date = getattr(col, "min_date", None)
+        raw_max_date = getattr(col, "max_date", None)
+        if raw_min_date:
+            min_date = (
+                raw_min_date.isoformat()
+                if isinstance(raw_min_date, datetime)
+                else str(raw_min_date)
+            )
+        if raw_max_date:
+            max_date = (
+                raw_max_date.isoformat()
+                if isinstance(raw_max_date, datetime)
+                else str(raw_max_date)
+            )
+        # Get suggested validators
+        suggested_validators = None
+        raw_validators = getattr(col, "suggested_validators", None)
+        if raw_validators:
+            suggested_validators = list(raw_validators)
+        return {
+            "name": getattr(col, "name", ""),
+            "physical_type": getattr(col, "physical_type", "unknown"),
+            "inferred_type": inferred_type,
+            "row_count": getattr(col, "row_count", 0),
+            "null_count": getattr(col, "null_count", 0),
+            "null_ratio": getattr(col, "null_ratio", 0.0),
+            "empty_string_count": getattr(col, "empty_string_count", 0),
+            "distinct_count": getattr(col, "distinct_count", 0),
+            "unique_ratio": getattr(col, "unique_ratio", 0.0),
+            "is_unique": getattr(col, "is_unique", False),
+            "is_constant": getattr(col, "is_constant", False),
+            "distribution": distribution,
+            "top_values": top_values,
+            "bottom_values": bottom_values,
+            "min_length": getattr(col, "min_length", None),
+            "max_length": getattr(col, "max_length", None),
+            "avg_length": getattr(col, "avg_length", None),
+            "detected_patterns": detected_patterns,
+            "min_date": min_date,
+            "max_date": max_date,
+            "date_gaps": getattr(col, "date_gaps", 0),
+            "suggested_validators": suggested_validators,
+            "profile_duration_ms": getattr(col, "profile_duration_ms", 0.0),
+        }
+    @staticmethod
+    def _convert_legacy_profile(result: Any) -> dict[str, Any]:
+        """Convert legacy truthound ProfileReport to ProfileResult dict."""
+        row_count = getattr(result, "row_count", 0)
+        columns = []
+        for col in getattr(result, "columns", []):
+            if isinstance(col, dict):
+                col_data = TruthoundResultConverter._convert_legacy_column(col, row_count)
+            else:
+                col_data = TruthoundResultConverter._convert_column_profile(col)
+            columns.append(col_data)
+        size_bytes = getattr(result, "size_bytes", 0)
+        return {
+            "name": getattr(result, "source", ""),
+            "source": getattr(result, "source", ""),
+            "row_count": row_count,
+            "column_count": getattr(result, "column_count", len(columns)),
+            "estimated_memory_bytes": size_bytes,
+            "columns": columns,
+            "duplicate_row_count": 0,
+            "duplicate_row_ratio": 0.0,
+            "correlations": None,
+            "profiled_at": None,
+            "profile_duration_ms": 0.0,
+            "size_bytes": size_bytes,
+        }
+    @staticmethod
+    def _convert_legacy_column(col: dict, row_count: int) -> dict[str, Any]:
+        """Convert legacy column dict to column profile dict."""
+        # Parse null_pct and unique_pct
+        null_ratio = 0.0
+        unique_ratio = 0.0
+        null_pct = col.get("null_pct")
+        if isinstance(null_pct, str):
+            null_ratio = float(null_pct.rstrip("%")) / 100.0
+        elif isinstance(null_pct, (int, float)):
+            null_ratio = float(null_pct)
+        unique_pct = col.get("unique_pct")
+        if isinstance(unique_pct, str):
+            unique_ratio = float(unique_pct.rstrip("%")) / 100.0
+        elif isinstance(unique_pct, (int, float)):
+            unique_ratio = float(unique_pct)
+        # Build distribution if numeric stats present
+        distribution = None
+        if col.get("min") is not None or col.get("mean") is not None:
+            distribution = {
+                "min": col.get("min"),
+                "max": col.get("max"),
+                "mean": col.get("mean"),
+                "std": col.get("std"),
+            }
+        return {
+            "name": col.get("name", ""),
+            "physical_type": col.get("dtype", "unknown"),
+            "inferred_type": col.get("dtype", "unknown"),
+            "row_count": row_count,
+            "null_count": 0,
+            "null_ratio": null_ratio,
+            "empty_string_count": 0,
+            "distinct_count": 0,
+            "unique_ratio": unique_ratio,
+            "is_unique": False,
+            "is_constant": False,
+            "distribution": distribution,
+            "top_values": None,
+            "bottom_values": None,
+            "min_length": None,
+            "max_length": None,
+            "avg_length": None,
+            "detected_patterns": None,
+            "min_date": None,
+            "max_date": None,
+            "date_gaps": 0,
+            "suggested_validators": None,
+            "profile_duration_ms": 0.0,
+        }
+    @staticmethod
+    def convert_compare_result(result: Any) -> dict[str, Any]:
+        """Convert truthound DriftReport to CompareResult dict.
+        The truthound DriftReport contains:
+        - baseline_source: str
+        - current_source: str
+        - baseline_rows: int
+        - current_rows: int
+        - columns: list[ColumnDrift]
+        - has_drift: bool
+        - has_high_drift: bool
+        - get_drifted_columns(): list[str]
+        Args:
+            result: Truthound DriftReport object.
+        Returns:
+            Dictionary with CompareResult fields.
+        """
+        columns = []
+        for col in getattr(result, "columns", []):
+            col_result = getattr(col, "result", None)
+            if col_result:
+                level = getattr(col_result, "level", "none")
+                level_str = (
+                    level.value if hasattr(level, "value") else str(level)
+                )
+                columns.append({
+                    "column": getattr(col, "column", ""),
+                    "dtype": getattr(col, "dtype", "unknown"),
+                    "drifted": getattr(col_result, "drifted", False),
+                    "level": level_str,
+                    "method": getattr(col_result, "method", "unknown"),
+                    "statistic": getattr(col_result, "statistic", 0.0),
+                    "p_value": getattr(col_result, "p_value", 1.0),
+                    "baseline_stats": getattr(col, "baseline_stats", {}),
+                    "current_stats": getattr(col, "current_stats", {}),
+                })
+        # Get drifted columns
+        drifted_columns = []
+        if hasattr(result, "get_drifted_columns"):
+            drifted_columns = result.get_drifted_columns()
+        else:
+            drifted_columns = [c["column"] for c in columns if c.get("drifted")]
+        return {
+            "baseline_source": getattr(result, "baseline_source", ""),
+            "current_source": getattr(result, "current_source", ""),
+            "baseline_rows": getattr(result, "baseline_rows", 0),
+            "current_rows": getattr(result, "current_rows", 0),
+            "has_drift": getattr(result, "has_drift", False),
+            "has_high_drift": getattr(result, "has_high_drift", False),
+            "total_columns": len(columns),
+            "drifted_columns": drifted_columns,
+            "columns": columns,
+        }
+    @staticmethod
+    def convert_scan_result(result: Any) -> dict[str, Any]:
+        """Convert truthound PIIReport to ScanResult dict.
+        Args:
+            result: Truthound PIIReport object.
+        Returns:
+            Dictionary with ScanResult fields.
+        """
+        # Convert findings
+        findings = []
+        columns_with_pii = set()
+        for finding in getattr(result, "findings", []):
+            col = getattr(finding, "column", "")
+            columns_with_pii.add(col)
+            findings.append({
+                "column": col,
+                "pii_type": getattr(finding, "pii_type", "unknown"),
+                "confidence": getattr(finding, "confidence", 0.0),
+                "sample_count": getattr(finding, "sample_count", 0),
+                "sample_values": getattr(finding, "sample_values", None),
+            })
+        # Convert violations
+        violations = []
+        for violation in getattr(result, "violations", []):
+            violations.append({
+                "regulation": getattr(violation, "regulation", "unknown"),
+                "column": getattr(violation, "column", ""),
+                "pii_type": getattr(violation, "pii_type", "unknown"),
+                "message": getattr(violation, "message", ""),
+                "severity": getattr(violation, "severity", "high"),
+            })
+        return {
+            "source": getattr(result, "source", ""),
+            "row_count": getattr(result, "row_count", 0),
+            "column_count": getattr(result, "column_count", 0),
+            "total_columns_scanned": getattr(result, "column_count", 0),
+            "columns_with_pii": len(columns_with_pii),
+            "total_findings": len(findings),
+            "has_violations": getattr(result, "has_violations", len(violations) > 0),
+            "total_violations": len(violations),
+            "findings": findings,
+            "violations": violations,
+        }
+    @staticmethod
+    def convert_mask_result(
+        source: Any,
+        output: str,
+        masked_df: Any,
+        strategy: str,
+        columns: list[str] | None,
+    ) -> dict[str, Any]:
+        """Convert truthound mask result to MaskResult dict.
+        Args:
+            source: Original data source.
+            output: Output file path.
+            masked_df: Polars DataFrame with masked data.
+            strategy: Masking strategy used.
+            columns: Columns that were masked.
+        Returns:
+            Dictionary with MaskResult fields.
+        """
+        # Get column information from the DataFrame
+        all_columns = list(masked_df.columns) if hasattr(masked_df, "columns") else []
+        row_count = len(masked_df) if hasattr(masked_df, "__len__") else 0
+        # Get source name
+        if isinstance(source, str):
+            source_name = source
+        else:
+            source_name = getattr(source, "name", str(type(source).__name__))
+        # Write the masked data to output file
+        output_path = Path(output)
+        suffix = output_path.suffix.lower()
+        if hasattr(masked_df, "write_csv"):
+            if suffix == ".csv":
+                masked_df.write_csv(output)
+            elif suffix == ".parquet" and hasattr(masked_df, "write_parquet"):
+                masked_df.write_parquet(output)
+            elif suffix == ".json" and hasattr(masked_df, "write_json"):
+                masked_df.write_json(output)
+            else:
+                # Default to CSV
+                masked_df.write_csv(output)
+        return {
+            "source": source_name,
+            "output_path": str(output_path.absolute()),
+            "row_count": row_count,
+            "column_count": len(all_columns),
+            "columns_masked": columns if columns else [],
+            "strategy": strategy,
+            "original_columns": all_columns,
+        }
+    @staticmethod
+    def convert_suite_result(
+        suite: Any,
+        strictness: str,
+        output_format: str = "yaml",
+    ) -> dict[str, Any]:
+        """Convert truthound ValidationSuite to GenerateSuiteResult dict.
+        Args:
+            suite: ValidationSuite from generate_suite().
+            strictness: Strictness level used.
+            output_format: Requested output format.
+        Returns:
+            Dictionary with GenerateSuiteResult fields.
+        """
+        rules = []
+        categories = set()
+        if hasattr(suite, "rules"):
+            for rule in suite.rules:
+                rule_dict = {
+                    "name": getattr(rule, "name", ""),
+                    "validator": getattr(rule, "validator", ""),
+                    "column": getattr(rule, "column", None),
+                    "params": getattr(rule, "params", {}),
+                    "severity": getattr(rule, "severity", "medium"),
+                    "category": getattr(rule, "category", "unknown"),
+                }
+                rules.append(rule_dict)
+                if rule_dict["category"]:
+                    categories.add(rule_dict["category"])
+        # Generate YAML content
+        yaml_content = ""
+        if hasattr(suite, "to_yaml"):
+            yaml_content = suite.to_yaml()
+        else:
+            yaml_content = yaml.dump(
+                {"rules": rules},
+                default_flow_style=False,
+                sort_keys=False,
+                allow_unicode=True,
+            )
+        # Generate JSON content
+        json_content = {"rules": rules}
+        if hasattr(suite, "to_dict"):
+            json_content = suite.to_dict()
+        return {
+            "rules": rules,
+            "rule_count": len(rules),
+            "categories": sorted(categories),
+            "strictness": strictness,
+            "yaml_content": yaml_content,
+            "json_content": json_content,
+        }

truthound-dashboard 1.4.4__py3-none-any.whl → 1.5.1__py3-none-any.whl

truthound-dashboard 1.4.4__py3-none-any.whl → 1.5.1__py3-none-any.whl