PyPI - truthound - Versions diffs - 1.0.8__py3-none-any.whl - Mend

truthound 1.0.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (877) hide show

truthound/__init__.py +162 -0
truthound/adapters.py +100 -0
truthound/api.py +365 -0
truthound/audit/__init__.py +248 -0
truthound/audit/core.py +967 -0
truthound/audit/filters.py +620 -0
truthound/audit/formatters.py +707 -0
truthound/audit/logger.py +902 -0
truthound/audit/middleware.py +571 -0
truthound/audit/storage.py +1083 -0
truthound/benchmark/__init__.py +123 -0
truthound/benchmark/base.py +757 -0
truthound/benchmark/comparison.py +635 -0
truthound/benchmark/generators.py +706 -0
truthound/benchmark/reporters.py +718 -0
truthound/benchmark/runner.py +635 -0
truthound/benchmark/scenarios.py +712 -0
truthound/cache.py +252 -0
truthound/checkpoint/__init__.py +136 -0
truthound/checkpoint/actions/__init__.py +164 -0
truthound/checkpoint/actions/base.py +324 -0
truthound/checkpoint/actions/custom.py +234 -0
truthound/checkpoint/actions/discord_notify.py +290 -0
truthound/checkpoint/actions/email_notify.py +405 -0
truthound/checkpoint/actions/github_action.py +406 -0
truthound/checkpoint/actions/opsgenie.py +1499 -0
truthound/checkpoint/actions/pagerduty.py +226 -0
truthound/checkpoint/actions/slack_notify.py +233 -0
truthound/checkpoint/actions/store_result.py +249 -0
truthound/checkpoint/actions/teams_notify.py +1570 -0
truthound/checkpoint/actions/telegram_notify.py +419 -0
truthound/checkpoint/actions/update_docs.py +552 -0
truthound/checkpoint/actions/webhook.py +293 -0
truthound/checkpoint/analytics/__init__.py +147 -0
truthound/checkpoint/analytics/aggregations/__init__.py +23 -0
truthound/checkpoint/analytics/aggregations/rollup.py +481 -0
truthound/checkpoint/analytics/aggregations/time_bucket.py +306 -0
truthound/checkpoint/analytics/analyzers/__init__.py +17 -0
truthound/checkpoint/analytics/analyzers/anomaly.py +386 -0
truthound/checkpoint/analytics/analyzers/base.py +270 -0
truthound/checkpoint/analytics/analyzers/forecast.py +421 -0
truthound/checkpoint/analytics/analyzers/trend.py +314 -0
truthound/checkpoint/analytics/models.py +292 -0
truthound/checkpoint/analytics/protocols.py +549 -0
truthound/checkpoint/analytics/service.py +718 -0
truthound/checkpoint/analytics/stores/__init__.py +16 -0
truthound/checkpoint/analytics/stores/base.py +306 -0
truthound/checkpoint/analytics/stores/memory_store.py +353 -0
truthound/checkpoint/analytics/stores/sqlite_store.py +557 -0
truthound/checkpoint/analytics/stores/timescale_store.py +501 -0
truthound/checkpoint/async_actions.py +794 -0
truthound/checkpoint/async_base.py +708 -0
truthound/checkpoint/async_checkpoint.py +617 -0
truthound/checkpoint/async_runner.py +639 -0
truthound/checkpoint/checkpoint.py +527 -0
truthound/checkpoint/ci/__init__.py +61 -0
truthound/checkpoint/ci/detector.py +355 -0
truthound/checkpoint/ci/reporter.py +436 -0
truthound/checkpoint/ci/templates.py +454 -0
truthound/checkpoint/circuitbreaker/__init__.py +133 -0
truthound/checkpoint/circuitbreaker/breaker.py +542 -0
truthound/checkpoint/circuitbreaker/core.py +252 -0
truthound/checkpoint/circuitbreaker/detection.py +459 -0
truthound/checkpoint/circuitbreaker/middleware.py +389 -0
truthound/checkpoint/circuitbreaker/registry.py +357 -0
truthound/checkpoint/distributed/__init__.py +139 -0
truthound/checkpoint/distributed/backends/__init__.py +35 -0
truthound/checkpoint/distributed/backends/celery_backend.py +503 -0
truthound/checkpoint/distributed/backends/kubernetes_backend.py +696 -0
truthound/checkpoint/distributed/backends/local_backend.py +397 -0
truthound/checkpoint/distributed/backends/ray_backend.py +625 -0
truthound/checkpoint/distributed/base.py +774 -0
truthound/checkpoint/distributed/orchestrator.py +765 -0
truthound/checkpoint/distributed/protocols.py +842 -0
truthound/checkpoint/distributed/registry.py +449 -0
truthound/checkpoint/idempotency/__init__.py +120 -0
truthound/checkpoint/idempotency/core.py +295 -0
truthound/checkpoint/idempotency/fingerprint.py +454 -0
truthound/checkpoint/idempotency/locking.py +604 -0
truthound/checkpoint/idempotency/service.py +592 -0
truthound/checkpoint/idempotency/stores.py +653 -0
truthound/checkpoint/monitoring/__init__.py +134 -0
truthound/checkpoint/monitoring/aggregators/__init__.py +15 -0
truthound/checkpoint/monitoring/aggregators/base.py +372 -0
truthound/checkpoint/monitoring/aggregators/realtime.py +300 -0
truthound/checkpoint/monitoring/aggregators/window.py +493 -0
truthound/checkpoint/monitoring/collectors/__init__.py +17 -0
truthound/checkpoint/monitoring/collectors/base.py +257 -0
truthound/checkpoint/monitoring/collectors/memory_collector.py +617 -0
truthound/checkpoint/monitoring/collectors/prometheus_collector.py +451 -0
truthound/checkpoint/monitoring/collectors/redis_collector.py +518 -0
truthound/checkpoint/monitoring/events.py +410 -0
truthound/checkpoint/monitoring/protocols.py +636 -0
truthound/checkpoint/monitoring/service.py +578 -0
truthound/checkpoint/monitoring/views/__init__.py +17 -0
truthound/checkpoint/monitoring/views/base.py +172 -0
truthound/checkpoint/monitoring/views/queue_view.py +220 -0
truthound/checkpoint/monitoring/views/task_view.py +240 -0
truthound/checkpoint/monitoring/views/worker_view.py +263 -0
truthound/checkpoint/registry.py +337 -0
truthound/checkpoint/runner.py +356 -0
truthound/checkpoint/transaction/__init__.py +133 -0
truthound/checkpoint/transaction/base.py +389 -0
truthound/checkpoint/transaction/compensatable.py +537 -0
truthound/checkpoint/transaction/coordinator.py +576 -0
truthound/checkpoint/transaction/executor.py +622 -0
truthound/checkpoint/transaction/idempotency.py +534 -0
truthound/checkpoint/transaction/saga/__init__.py +143 -0
truthound/checkpoint/transaction/saga/builder.py +584 -0
truthound/checkpoint/transaction/saga/definition.py +515 -0
truthound/checkpoint/transaction/saga/event_store.py +542 -0
truthound/checkpoint/transaction/saga/patterns.py +833 -0
truthound/checkpoint/transaction/saga/runner.py +718 -0
truthound/checkpoint/transaction/saga/state_machine.py +793 -0
truthound/checkpoint/transaction/saga/strategies.py +780 -0
truthound/checkpoint/transaction/saga/testing.py +886 -0
truthound/checkpoint/triggers/__init__.py +58 -0
truthound/checkpoint/triggers/base.py +237 -0
truthound/checkpoint/triggers/event.py +385 -0
truthound/checkpoint/triggers/schedule.py +355 -0
truthound/cli.py +2358 -0
truthound/cli_modules/__init__.py +124 -0
truthound/cli_modules/advanced/__init__.py +45 -0
truthound/cli_modules/advanced/benchmark.py +343 -0
truthound/cli_modules/advanced/docs.py +225 -0
truthound/cli_modules/advanced/lineage.py +209 -0
truthound/cli_modules/advanced/ml.py +320 -0
truthound/cli_modules/advanced/realtime.py +196 -0
truthound/cli_modules/checkpoint/__init__.py +46 -0
truthound/cli_modules/checkpoint/init.py +114 -0
truthound/cli_modules/checkpoint/list.py +71 -0
truthound/cli_modules/checkpoint/run.py +159 -0
truthound/cli_modules/checkpoint/validate.py +67 -0
truthound/cli_modules/common/__init__.py +71 -0
truthound/cli_modules/common/errors.py +414 -0
truthound/cli_modules/common/options.py +419 -0
truthound/cli_modules/common/output.py +507 -0
truthound/cli_modules/common/protocol.py +552 -0
truthound/cli_modules/core/__init__.py +48 -0
truthound/cli_modules/core/check.py +123 -0
truthound/cli_modules/core/compare.py +104 -0
truthound/cli_modules/core/learn.py +57 -0
truthound/cli_modules/core/mask.py +77 -0
truthound/cli_modules/core/profile.py +65 -0
truthound/cli_modules/core/scan.py +61 -0
truthound/cli_modules/profiler/__init__.py +51 -0
truthound/cli_modules/profiler/auto_profile.py +175 -0
truthound/cli_modules/profiler/metadata.py +107 -0
truthound/cli_modules/profiler/suite.py +283 -0
truthound/cli_modules/registry.py +431 -0
truthound/cli_modules/scaffolding/__init__.py +89 -0
truthound/cli_modules/scaffolding/base.py +631 -0
truthound/cli_modules/scaffolding/commands.py +545 -0
truthound/cli_modules/scaffolding/plugins.py +1072 -0
truthound/cli_modules/scaffolding/reporters.py +594 -0
truthound/cli_modules/scaffolding/validators.py +1127 -0
truthound/common/__init__.py +18 -0
truthound/common/resilience/__init__.py +130 -0
truthound/common/resilience/bulkhead.py +266 -0
truthound/common/resilience/circuit_breaker.py +516 -0
truthound/common/resilience/composite.py +332 -0
truthound/common/resilience/config.py +292 -0
truthound/common/resilience/protocols.py +217 -0
truthound/common/resilience/rate_limiter.py +404 -0
truthound/common/resilience/retry.py +341 -0
truthound/datadocs/__init__.py +260 -0
truthound/datadocs/base.py +571 -0
truthound/datadocs/builder.py +761 -0
truthound/datadocs/charts.py +764 -0
truthound/datadocs/dashboard/__init__.py +63 -0
truthound/datadocs/dashboard/app.py +576 -0
truthound/datadocs/dashboard/components.py +584 -0
truthound/datadocs/dashboard/state.py +240 -0
truthound/datadocs/engine/__init__.py +46 -0
truthound/datadocs/engine/context.py +376 -0
truthound/datadocs/engine/pipeline.py +618 -0
truthound/datadocs/engine/registry.py +469 -0
truthound/datadocs/exporters/__init__.py +49 -0
truthound/datadocs/exporters/base.py +198 -0
truthound/datadocs/exporters/html.py +178 -0
truthound/datadocs/exporters/json_exporter.py +253 -0
truthound/datadocs/exporters/markdown.py +284 -0
truthound/datadocs/exporters/pdf.py +392 -0
truthound/datadocs/i18n/__init__.py +86 -0
truthound/datadocs/i18n/catalog.py +960 -0
truthound/datadocs/i18n/formatting.py +505 -0
truthound/datadocs/i18n/loader.py +256 -0
truthound/datadocs/i18n/plurals.py +378 -0
truthound/datadocs/renderers/__init__.py +42 -0
truthound/datadocs/renderers/base.py +401 -0
truthound/datadocs/renderers/custom.py +342 -0
truthound/datadocs/renderers/jinja.py +697 -0
truthound/datadocs/sections.py +736 -0
truthound/datadocs/styles.py +931 -0
truthound/datadocs/themes/__init__.py +101 -0
truthound/datadocs/themes/base.py +336 -0
truthound/datadocs/themes/default.py +417 -0
truthound/datadocs/themes/enterprise.py +419 -0
truthound/datadocs/themes/loader.py +336 -0
truthound/datadocs/themes.py +301 -0
truthound/datadocs/transformers/__init__.py +57 -0
truthound/datadocs/transformers/base.py +268 -0
truthound/datadocs/transformers/enrichers.py +544 -0
truthound/datadocs/transformers/filters.py +447 -0
truthound/datadocs/transformers/i18n.py +468 -0
truthound/datadocs/versioning/__init__.py +62 -0
truthound/datadocs/versioning/diff.py +639 -0
truthound/datadocs/versioning/storage.py +497 -0
truthound/datadocs/versioning/version.py +358 -0
truthound/datasources/__init__.py +223 -0
truthound/datasources/_async_protocols.py +222 -0
truthound/datasources/_protocols.py +159 -0
truthound/datasources/adapters.py +428 -0
truthound/datasources/async_base.py +599 -0
truthound/datasources/async_factory.py +511 -0
truthound/datasources/base.py +516 -0
truthound/datasources/factory.py +433 -0
truthound/datasources/nosql/__init__.py +47 -0
truthound/datasources/nosql/base.py +487 -0
truthound/datasources/nosql/elasticsearch.py +801 -0
truthound/datasources/nosql/mongodb.py +636 -0
truthound/datasources/pandas_optimized.py +582 -0
truthound/datasources/pandas_source.py +216 -0
truthound/datasources/polars_source.py +395 -0
truthound/datasources/spark_source.py +479 -0
truthound/datasources/sql/__init__.py +154 -0
truthound/datasources/sql/base.py +710 -0
truthound/datasources/sql/bigquery.py +410 -0
truthound/datasources/sql/cloud_base.py +199 -0
truthound/datasources/sql/databricks.py +471 -0
truthound/datasources/sql/mysql.py +316 -0
truthound/datasources/sql/oracle.py +427 -0
truthound/datasources/sql/postgresql.py +321 -0
truthound/datasources/sql/redshift.py +479 -0
truthound/datasources/sql/snowflake.py +439 -0
truthound/datasources/sql/sqlite.py +286 -0
truthound/datasources/sql/sqlserver.py +437 -0
truthound/datasources/streaming/__init__.py +47 -0
truthound/datasources/streaming/base.py +350 -0
truthound/datasources/streaming/kafka.py +670 -0
truthound/decorators.py +98 -0
truthound/docs/__init__.py +69 -0
truthound/docs/extractor.py +971 -0
truthound/docs/generator.py +601 -0
truthound/docs/parser.py +1037 -0
truthound/docs/renderer.py +999 -0
truthound/drift/__init__.py +22 -0
truthound/drift/compare.py +189 -0
truthound/drift/detectors.py +464 -0
truthound/drift/report.py +160 -0
truthound/execution/__init__.py +65 -0
truthound/execution/_protocols.py +324 -0
truthound/execution/base.py +576 -0
truthound/execution/distributed/__init__.py +179 -0
truthound/execution/distributed/aggregations.py +731 -0
truthound/execution/distributed/arrow_bridge.py +817 -0
truthound/execution/distributed/base.py +550 -0
truthound/execution/distributed/dask_engine.py +976 -0
truthound/execution/distributed/mixins.py +766 -0
truthound/execution/distributed/protocols.py +756 -0
truthound/execution/distributed/ray_engine.py +1127 -0
truthound/execution/distributed/registry.py +446 -0
truthound/execution/distributed/spark_engine.py +1011 -0
truthound/execution/distributed/validator_adapter.py +682 -0
truthound/execution/pandas_engine.py +401 -0
truthound/execution/polars_engine.py +497 -0
truthound/execution/pushdown/__init__.py +230 -0
truthound/execution/pushdown/ast.py +1550 -0
truthound/execution/pushdown/builder.py +1550 -0
truthound/execution/pushdown/dialects.py +1072 -0
truthound/execution/pushdown/executor.py +829 -0
truthound/execution/pushdown/optimizer.py +1041 -0
truthound/execution/sql_engine.py +518 -0
truthound/infrastructure/__init__.py +189 -0
truthound/infrastructure/audit.py +1515 -0
truthound/infrastructure/config.py +1133 -0
truthound/infrastructure/encryption.py +1132 -0
truthound/infrastructure/logging.py +1503 -0
truthound/infrastructure/metrics.py +1220 -0
truthound/lineage/__init__.py +89 -0
truthound/lineage/base.py +746 -0
truthound/lineage/impact_analysis.py +474 -0
truthound/lineage/integrations/__init__.py +22 -0
truthound/lineage/integrations/openlineage.py +548 -0
truthound/lineage/tracker.py +512 -0
truthound/lineage/visualization/__init__.py +33 -0
truthound/lineage/visualization/protocols.py +145 -0
truthound/lineage/visualization/renderers/__init__.py +20 -0
truthound/lineage/visualization/renderers/cytoscape.py +329 -0
truthound/lineage/visualization/renderers/d3.py +331 -0
truthound/lineage/visualization/renderers/graphviz.py +276 -0
truthound/lineage/visualization/renderers/mermaid.py +308 -0
truthound/maskers.py +113 -0
truthound/ml/__init__.py +124 -0
truthound/ml/anomaly_models/__init__.py +31 -0
truthound/ml/anomaly_models/ensemble.py +362 -0
truthound/ml/anomaly_models/isolation_forest.py +444 -0
truthound/ml/anomaly_models/statistical.py +392 -0
truthound/ml/base.py +1178 -0
truthound/ml/drift_detection/__init__.py +26 -0
truthound/ml/drift_detection/concept.py +381 -0
truthound/ml/drift_detection/distribution.py +361 -0
truthound/ml/drift_detection/feature.py +442 -0
truthound/ml/drift_detection/multivariate.py +495 -0
truthound/ml/monitoring/__init__.py +88 -0
truthound/ml/monitoring/alerting/__init__.py +33 -0
truthound/ml/monitoring/alerting/handlers.py +427 -0
truthound/ml/monitoring/alerting/rules.py +508 -0
truthound/ml/monitoring/collectors/__init__.py +19 -0
truthound/ml/monitoring/collectors/composite.py +105 -0
truthound/ml/monitoring/collectors/drift.py +324 -0
truthound/ml/monitoring/collectors/performance.py +179 -0
truthound/ml/monitoring/collectors/quality.py +369 -0
truthound/ml/monitoring/monitor.py +536 -0
truthound/ml/monitoring/protocols.py +451 -0
truthound/ml/monitoring/stores/__init__.py +15 -0
truthound/ml/monitoring/stores/memory.py +201 -0
truthound/ml/monitoring/stores/prometheus.py +296 -0
truthound/ml/rule_learning/__init__.py +25 -0
truthound/ml/rule_learning/constraint_miner.py +443 -0
truthound/ml/rule_learning/pattern_learner.py +499 -0
truthound/ml/rule_learning/profile_learner.py +462 -0
truthound/multitenancy/__init__.py +326 -0
truthound/multitenancy/core.py +852 -0
truthound/multitenancy/integration.py +597 -0
truthound/multitenancy/isolation.py +630 -0
truthound/multitenancy/manager.py +770 -0
truthound/multitenancy/middleware.py +765 -0
truthound/multitenancy/quota.py +537 -0
truthound/multitenancy/resolvers.py +603 -0
truthound/multitenancy/storage.py +703 -0
truthound/observability/__init__.py +307 -0
truthound/observability/context.py +531 -0
truthound/observability/instrumentation.py +611 -0
truthound/observability/logging.py +887 -0
truthound/observability/metrics.py +1157 -0
truthound/observability/tracing/__init__.py +178 -0
truthound/observability/tracing/baggage.py +310 -0
truthound/observability/tracing/config.py +426 -0
truthound/observability/tracing/exporter.py +787 -0
truthound/observability/tracing/integration.py +1018 -0
truthound/observability/tracing/otel/__init__.py +146 -0
truthound/observability/tracing/otel/adapter.py +982 -0
truthound/observability/tracing/otel/bridge.py +1177 -0
truthound/observability/tracing/otel/compat.py +681 -0
truthound/observability/tracing/otel/config.py +691 -0
truthound/observability/tracing/otel/detection.py +327 -0
truthound/observability/tracing/otel/protocols.py +426 -0
truthound/observability/tracing/processor.py +561 -0
truthound/observability/tracing/propagator.py +757 -0
truthound/observability/tracing/provider.py +569 -0
truthound/observability/tracing/resource.py +515 -0
truthound/observability/tracing/sampler.py +487 -0
truthound/observability/tracing/span.py +676 -0
truthound/plugins/__init__.py +198 -0
truthound/plugins/base.py +599 -0
truthound/plugins/cli.py +680 -0
truthound/plugins/dependencies/__init__.py +42 -0
truthound/plugins/dependencies/graph.py +422 -0
truthound/plugins/dependencies/resolver.py +417 -0
truthound/plugins/discovery.py +379 -0
truthound/plugins/docs/__init__.py +46 -0
truthound/plugins/docs/extractor.py +444 -0
truthound/plugins/docs/renderer.py +499 -0
truthound/plugins/enterprise_manager.py +877 -0
truthound/plugins/examples/__init__.py +19 -0
truthound/plugins/examples/custom_validators.py +317 -0
truthound/plugins/examples/slack_notifier.py +312 -0
truthound/plugins/examples/xml_reporter.py +254 -0
truthound/plugins/hooks.py +558 -0
truthound/plugins/lifecycle/__init__.py +43 -0
truthound/plugins/lifecycle/hot_reload.py +402 -0
truthound/plugins/lifecycle/manager.py +371 -0
truthound/plugins/manager.py +736 -0
truthound/plugins/registry.py +338 -0
truthound/plugins/security/__init__.py +93 -0
truthound/plugins/security/exceptions.py +332 -0
truthound/plugins/security/policies.py +348 -0
truthound/plugins/security/protocols.py +643 -0
truthound/plugins/security/sandbox/__init__.py +45 -0
truthound/plugins/security/sandbox/context.py +158 -0
truthound/plugins/security/sandbox/engines/__init__.py +19 -0
truthound/plugins/security/sandbox/engines/container.py +379 -0
truthound/plugins/security/sandbox/engines/noop.py +144 -0
truthound/plugins/security/sandbox/engines/process.py +336 -0
truthound/plugins/security/sandbox/factory.py +211 -0
truthound/plugins/security/signing/__init__.py +57 -0
truthound/plugins/security/signing/service.py +330 -0
truthound/plugins/security/signing/trust_store.py +368 -0
truthound/plugins/security/signing/verifier.py +459 -0
truthound/plugins/versioning/__init__.py +41 -0
truthound/plugins/versioning/constraints.py +297 -0
truthound/plugins/versioning/resolver.py +329 -0
truthound/profiler/__init__.py +1729 -0
truthound/profiler/_lazy.py +452 -0
truthound/profiler/ab_testing/__init__.py +80 -0
truthound/profiler/ab_testing/analysis.py +449 -0
truthound/profiler/ab_testing/base.py +257 -0
truthound/profiler/ab_testing/experiment.py +395 -0
truthound/profiler/ab_testing/tracking.py +368 -0
truthound/profiler/auto_threshold.py +1170 -0
truthound/profiler/base.py +579 -0
truthound/profiler/cache_patterns.py +911 -0
truthound/profiler/caching.py +1303 -0
truthound/profiler/column_profiler.py +712 -0
truthound/profiler/comparison.py +1007 -0
truthound/profiler/custom_patterns.py +1170 -0
truthound/profiler/dashboard/__init__.py +50 -0
truthound/profiler/dashboard/app.py +476 -0
truthound/profiler/dashboard/components.py +457 -0
truthound/profiler/dashboard/config.py +72 -0
truthound/profiler/distributed/__init__.py +83 -0
truthound/profiler/distributed/base.py +281 -0
truthound/profiler/distributed/dask_backend.py +498 -0
truthound/profiler/distributed/local_backend.py +293 -0
truthound/profiler/distributed/profiler.py +304 -0
truthound/profiler/distributed/ray_backend.py +374 -0
truthound/profiler/distributed/spark_backend.py +375 -0
truthound/profiler/distributed.py +1366 -0
truthound/profiler/enterprise_sampling.py +1065 -0
truthound/profiler/errors.py +488 -0
truthound/profiler/evolution/__init__.py +91 -0
truthound/profiler/evolution/alerts.py +426 -0
truthound/profiler/evolution/changes.py +206 -0
truthound/profiler/evolution/compatibility.py +365 -0
truthound/profiler/evolution/detector.py +372 -0
truthound/profiler/evolution/protocols.py +121 -0
truthound/profiler/generators/__init__.py +48 -0
truthound/profiler/generators/base.py +384 -0
truthound/profiler/generators/ml_rules.py +375 -0
truthound/profiler/generators/pattern_rules.py +384 -0
truthound/profiler/generators/schema_rules.py +267 -0
truthound/profiler/generators/stats_rules.py +324 -0
truthound/profiler/generators/suite_generator.py +857 -0
truthound/profiler/i18n.py +1542 -0
truthound/profiler/incremental.py +554 -0
truthound/profiler/incremental_validation.py +1710 -0
truthound/profiler/integration/__init__.py +73 -0
truthound/profiler/integration/adapters.py +345 -0
truthound/profiler/integration/context.py +371 -0
truthound/profiler/integration/executor.py +527 -0
truthound/profiler/integration/naming.py +75 -0
truthound/profiler/integration/protocols.py +243 -0
truthound/profiler/memory.py +1185 -0
truthound/profiler/migration/__init__.py +60 -0
truthound/profiler/migration/base.py +345 -0
truthound/profiler/migration/manager.py +444 -0
truthound/profiler/migration/v1_0_to_v1_1.py +484 -0
truthound/profiler/ml/__init__.py +73 -0
truthound/profiler/ml/base.py +244 -0
truthound/profiler/ml/classifier.py +507 -0
truthound/profiler/ml/feature_extraction.py +604 -0
truthound/profiler/ml/pretrained.py +448 -0
truthound/profiler/ml_inference.py +1276 -0
truthound/profiler/native_patterns.py +815 -0
truthound/profiler/observability.py +1184 -0
truthound/profiler/process_timeout.py +1566 -0
truthound/profiler/progress.py +568 -0
truthound/profiler/progress_callbacks.py +1734 -0
truthound/profiler/quality.py +1345 -0
truthound/profiler/resilience.py +1180 -0
truthound/profiler/sampled_matcher.py +794 -0
truthound/profiler/sampling.py +1288 -0
truthound/profiler/scheduling/__init__.py +82 -0
truthound/profiler/scheduling/protocols.py +214 -0
truthound/profiler/scheduling/scheduler.py +474 -0
truthound/profiler/scheduling/storage.py +457 -0
truthound/profiler/scheduling/triggers.py +449 -0
truthound/profiler/schema.py +603 -0
truthound/profiler/streaming.py +685 -0
truthound/profiler/streaming_patterns.py +1354 -0
truthound/profiler/suite_cli.py +625 -0
truthound/profiler/suite_config.py +789 -0
truthound/profiler/suite_export.py +1268 -0
truthound/profiler/table_profiler.py +547 -0
truthound/profiler/timeout.py +565 -0
truthound/profiler/validation.py +1532 -0
truthound/profiler/visualization/__init__.py +118 -0
truthound/profiler/visualization/base.py +346 -0
truthound/profiler/visualization/generator.py +1259 -0
truthound/profiler/visualization/plotly_renderer.py +811 -0
truthound/profiler/visualization/renderers.py +669 -0
truthound/profiler/visualization/sections.py +540 -0
truthound/profiler/visualization.py +2122 -0
truthound/profiler/yaml_validation.py +1151 -0
truthound/py.typed +0 -0
truthound/ratelimit/__init__.py +248 -0
truthound/ratelimit/algorithms.py +1108 -0
truthound/ratelimit/core.py +573 -0
truthound/ratelimit/integration.py +532 -0
truthound/ratelimit/limiter.py +663 -0
truthound/ratelimit/middleware.py +700 -0
truthound/ratelimit/policy.py +792 -0
truthound/ratelimit/storage.py +763 -0
truthound/rbac/__init__.py +340 -0
truthound/rbac/core.py +976 -0
truthound/rbac/integration.py +760 -0
truthound/rbac/manager.py +1052 -0
truthound/rbac/middleware.py +842 -0
truthound/rbac/policy.py +954 -0
truthound/rbac/storage.py +878 -0
truthound/realtime/__init__.py +141 -0
truthound/realtime/adapters/__init__.py +43 -0
truthound/realtime/adapters/base.py +533 -0
truthound/realtime/adapters/kafka.py +487 -0
truthound/realtime/adapters/kinesis.py +479 -0
truthound/realtime/adapters/mock.py +243 -0
truthound/realtime/base.py +553 -0
truthound/realtime/factory.py +382 -0
truthound/realtime/incremental.py +660 -0
truthound/realtime/processing/__init__.py +67 -0
truthound/realtime/processing/exactly_once.py +575 -0
truthound/realtime/processing/state.py +547 -0
truthound/realtime/processing/windows.py +647 -0
truthound/realtime/protocols.py +569 -0
truthound/realtime/streaming.py +605 -0
truthound/realtime/testing/__init__.py +32 -0
truthound/realtime/testing/containers.py +615 -0
truthound/realtime/testing/fixtures.py +484 -0
truthound/report.py +280 -0
truthound/reporters/__init__.py +46 -0
truthound/reporters/_protocols.py +30 -0
truthound/reporters/base.py +324 -0
truthound/reporters/ci/__init__.py +66 -0
truthound/reporters/ci/azure.py +436 -0
truthound/reporters/ci/base.py +509 -0
truthound/reporters/ci/bitbucket.py +567 -0
truthound/reporters/ci/circleci.py +547 -0
truthound/reporters/ci/detection.py +364 -0
truthound/reporters/ci/factory.py +182 -0
truthound/reporters/ci/github.py +388 -0
truthound/reporters/ci/gitlab.py +471 -0
truthound/reporters/ci/jenkins.py +525 -0
truthound/reporters/console_reporter.py +299 -0
truthound/reporters/factory.py +211 -0
truthound/reporters/html_reporter.py +524 -0
truthound/reporters/json_reporter.py +256 -0
truthound/reporters/markdown_reporter.py +280 -0
truthound/reporters/sdk/__init__.py +174 -0
truthound/reporters/sdk/builder.py +558 -0
truthound/reporters/sdk/mixins.py +1150 -0
truthound/reporters/sdk/schema.py +1493 -0
truthound/reporters/sdk/templates.py +666 -0
truthound/reporters/sdk/testing.py +968 -0
truthound/scanners.py +170 -0
truthound/scheduling/__init__.py +122 -0
truthound/scheduling/cron.py +1136 -0
truthound/scheduling/presets.py +212 -0
truthound/schema.py +275 -0
truthound/secrets/__init__.py +173 -0
truthound/secrets/base.py +618 -0
truthound/secrets/cloud.py +682 -0
truthound/secrets/integration.py +507 -0
truthound/secrets/manager.py +633 -0
truthound/secrets/oidc/__init__.py +172 -0
truthound/secrets/oidc/base.py +902 -0
truthound/secrets/oidc/credential_provider.py +623 -0
truthound/secrets/oidc/exchangers.py +1001 -0
truthound/secrets/oidc/github/__init__.py +110 -0
truthound/secrets/oidc/github/claims.py +718 -0
truthound/secrets/oidc/github/enhanced_provider.py +693 -0
truthound/secrets/oidc/github/trust_policy.py +742 -0
truthound/secrets/oidc/github/verification.py +723 -0
truthound/secrets/oidc/github/workflow.py +691 -0
truthound/secrets/oidc/providers.py +825 -0
truthound/secrets/providers.py +506 -0
truthound/secrets/resolver.py +495 -0
truthound/stores/__init__.py +177 -0
truthound/stores/backends/__init__.py +18 -0
truthound/stores/backends/_protocols.py +340 -0
truthound/stores/backends/azure_blob.py +530 -0
truthound/stores/backends/concurrent_filesystem.py +915 -0
truthound/stores/backends/connection_pool.py +1365 -0
truthound/stores/backends/database.py +743 -0
truthound/stores/backends/filesystem.py +538 -0
truthound/stores/backends/gcs.py +399 -0
truthound/stores/backends/memory.py +354 -0
truthound/stores/backends/s3.py +434 -0
truthound/stores/backpressure/__init__.py +84 -0
truthound/stores/backpressure/base.py +375 -0
truthound/stores/backpressure/circuit_breaker.py +434 -0
truthound/stores/backpressure/monitor.py +376 -0
truthound/stores/backpressure/strategies.py +677 -0
truthound/stores/base.py +551 -0
truthound/stores/batching/__init__.py +65 -0
truthound/stores/batching/base.py +305 -0
truthound/stores/batching/buffer.py +370 -0
truthound/stores/batching/store.py +248 -0
truthound/stores/batching/writer.py +521 -0
truthound/stores/caching/__init__.py +60 -0
truthound/stores/caching/backends.py +684 -0
truthound/stores/caching/base.py +356 -0
truthound/stores/caching/store.py +305 -0
truthound/stores/compression/__init__.py +193 -0
truthound/stores/compression/adaptive.py +694 -0
truthound/stores/compression/base.py +514 -0
truthound/stores/compression/pipeline.py +868 -0
truthound/stores/compression/providers.py +672 -0
truthound/stores/compression/streaming.py +832 -0
truthound/stores/concurrency/__init__.py +81 -0
truthound/stores/concurrency/atomic.py +556 -0
truthound/stores/concurrency/index.py +775 -0
truthound/stores/concurrency/locks.py +576 -0
truthound/stores/concurrency/manager.py +482 -0
truthound/stores/encryption/__init__.py +297 -0
truthound/stores/encryption/base.py +952 -0
truthound/stores/encryption/keys.py +1191 -0
truthound/stores/encryption/pipeline.py +903 -0
truthound/stores/encryption/providers.py +953 -0
truthound/stores/encryption/streaming.py +950 -0
truthound/stores/expectations.py +227 -0
truthound/stores/factory.py +246 -0
truthound/stores/migration/__init__.py +75 -0
truthound/stores/migration/base.py +480 -0
truthound/stores/migration/manager.py +347 -0
truthound/stores/migration/registry.py +382 -0
truthound/stores/migration/store.py +559 -0
truthound/stores/observability/__init__.py +106 -0
truthound/stores/observability/audit.py +718 -0
truthound/stores/observability/config.py +270 -0
truthound/stores/observability/factory.py +208 -0
truthound/stores/observability/metrics.py +636 -0
truthound/stores/observability/protocols.py +410 -0
truthound/stores/observability/store.py +570 -0
truthound/stores/observability/tracing.py +784 -0
truthound/stores/replication/__init__.py +76 -0
truthound/stores/replication/base.py +260 -0
truthound/stores/replication/monitor.py +269 -0
truthound/stores/replication/store.py +439 -0
truthound/stores/replication/syncer.py +391 -0
truthound/stores/results.py +359 -0
truthound/stores/retention/__init__.py +77 -0
truthound/stores/retention/base.py +378 -0
truthound/stores/retention/policies.py +621 -0
truthound/stores/retention/scheduler.py +279 -0
truthound/stores/retention/store.py +526 -0
truthound/stores/streaming/__init__.py +138 -0
truthound/stores/streaming/base.py +801 -0
truthound/stores/streaming/database.py +984 -0
truthound/stores/streaming/filesystem.py +719 -0
truthound/stores/streaming/reader.py +629 -0
truthound/stores/streaming/s3.py +843 -0
truthound/stores/streaming/writer.py +790 -0
truthound/stores/tiering/__init__.py +108 -0
truthound/stores/tiering/base.py +462 -0
truthound/stores/tiering/manager.py +249 -0
truthound/stores/tiering/policies.py +692 -0
truthound/stores/tiering/store.py +526 -0
truthound/stores/versioning/__init__.py +56 -0
truthound/stores/versioning/base.py +376 -0
truthound/stores/versioning/store.py +660 -0
truthound/stores/versioning/strategies.py +353 -0
truthound/types.py +56 -0
truthound/validators/__init__.py +774 -0
truthound/validators/aggregate/__init__.py +27 -0
truthound/validators/aggregate/central.py +116 -0
truthound/validators/aggregate/extremes.py +116 -0
truthound/validators/aggregate/spread.py +118 -0
truthound/validators/aggregate/sum.py +64 -0
truthound/validators/aggregate/type.py +78 -0
truthound/validators/anomaly/__init__.py +93 -0
truthound/validators/anomaly/base.py +431 -0
truthound/validators/anomaly/ml_based.py +1190 -0
truthound/validators/anomaly/multivariate.py +647 -0
truthound/validators/anomaly/statistical.py +599 -0
truthound/validators/base.py +1089 -0
truthound/validators/business_rule/__init__.py +46 -0
truthound/validators/business_rule/base.py +147 -0
truthound/validators/business_rule/checksum.py +509 -0
truthound/validators/business_rule/financial.py +526 -0
truthound/validators/cache.py +733 -0
truthound/validators/completeness/__init__.py +39 -0
truthound/validators/completeness/conditional.py +73 -0
truthound/validators/completeness/default.py +98 -0
truthound/validators/completeness/empty.py +103 -0
truthound/validators/completeness/nan.py +337 -0
truthound/validators/completeness/null.py +152 -0
truthound/validators/cross_table/__init__.py +17 -0
truthound/validators/cross_table/aggregate.py +333 -0
truthound/validators/cross_table/row_count.py +122 -0
truthound/validators/datetime/__init__.py +29 -0
truthound/validators/datetime/format.py +78 -0
truthound/validators/datetime/freshness.py +269 -0
truthound/validators/datetime/order.py +73 -0
truthound/validators/datetime/parseable.py +185 -0
truthound/validators/datetime/range.py +202 -0
truthound/validators/datetime/timezone.py +69 -0
truthound/validators/distribution/__init__.py +49 -0
truthound/validators/distribution/distribution.py +128 -0
truthound/validators/distribution/monotonic.py +119 -0
truthound/validators/distribution/outlier.py +178 -0
truthound/validators/distribution/quantile.py +80 -0
truthound/validators/distribution/range.py +254 -0
truthound/validators/distribution/set.py +125 -0
truthound/validators/distribution/statistical.py +459 -0
truthound/validators/drift/__init__.py +79 -0
truthound/validators/drift/base.py +427 -0
truthound/validators/drift/multi_feature.py +401 -0
truthound/validators/drift/numeric.py +395 -0
truthound/validators/drift/psi.py +446 -0
truthound/validators/drift/statistical.py +510 -0
truthound/validators/enterprise.py +1658 -0
truthound/validators/geospatial/__init__.py +80 -0
truthound/validators/geospatial/base.py +97 -0
truthound/validators/geospatial/boundary.py +238 -0
truthound/validators/geospatial/coordinate.py +351 -0
truthound/validators/geospatial/distance.py +399 -0
truthound/validators/geospatial/polygon.py +665 -0
truthound/validators/i18n/__init__.py +308 -0
truthound/validators/i18n/bidi.py +571 -0
truthound/validators/i18n/catalogs.py +570 -0
truthound/validators/i18n/dialects.py +763 -0
truthound/validators/i18n/extended_catalogs.py +549 -0
truthound/validators/i18n/formatting.py +1434 -0
truthound/validators/i18n/loader.py +1020 -0
truthound/validators/i18n/messages.py +521 -0
truthound/validators/i18n/plural.py +683 -0
truthound/validators/i18n/protocols.py +855 -0
truthound/validators/i18n/tms.py +1162 -0
truthound/validators/localization/__init__.py +53 -0
truthound/validators/localization/base.py +122 -0
truthound/validators/localization/chinese.py +362 -0
truthound/validators/localization/japanese.py +275 -0
truthound/validators/localization/korean.py +524 -0
truthound/validators/memory/__init__.py +94 -0
truthound/validators/memory/approximate_knn.py +506 -0
truthound/validators/memory/base.py +547 -0
truthound/validators/memory/sgd_online.py +719 -0
truthound/validators/memory/streaming_ecdf.py +753 -0
truthound/validators/ml_feature/__init__.py +54 -0
truthound/validators/ml_feature/base.py +249 -0
truthound/validators/ml_feature/correlation.py +299 -0
truthound/validators/ml_feature/leakage.py +344 -0
truthound/validators/ml_feature/null_impact.py +270 -0
truthound/validators/ml_feature/scale.py +264 -0
truthound/validators/multi_column/__init__.py +89 -0
truthound/validators/multi_column/arithmetic.py +284 -0
truthound/validators/multi_column/base.py +231 -0
truthound/validators/multi_column/comparison.py +273 -0
truthound/validators/multi_column/consistency.py +312 -0
truthound/validators/multi_column/statistical.py +299 -0
truthound/validators/optimization/__init__.py +164 -0
truthound/validators/optimization/aggregation.py +563 -0
truthound/validators/optimization/covariance.py +556 -0
truthound/validators/optimization/geo.py +626 -0
truthound/validators/optimization/graph.py +587 -0
truthound/validators/optimization/orchestrator.py +970 -0
truthound/validators/optimization/profiling.py +1312 -0
truthound/validators/privacy/__init__.py +223 -0
truthound/validators/privacy/base.py +635 -0
truthound/validators/privacy/ccpa.py +670 -0
truthound/validators/privacy/gdpr.py +728 -0
truthound/validators/privacy/global_patterns.py +604 -0
truthound/validators/privacy/plugins.py +867 -0
truthound/validators/profiling/__init__.py +52 -0
truthound/validators/profiling/base.py +175 -0
truthound/validators/profiling/cardinality.py +312 -0
truthound/validators/profiling/entropy.py +391 -0
truthound/validators/profiling/frequency.py +455 -0
truthound/validators/pushdown_support.py +660 -0
truthound/validators/query/__init__.py +91 -0
truthound/validators/query/aggregate.py +346 -0
truthound/validators/query/base.py +246 -0
truthound/validators/query/column.py +249 -0
truthound/validators/query/expression.py +274 -0
truthound/validators/query/result.py +323 -0
truthound/validators/query/row_count.py +264 -0
truthound/validators/referential/__init__.py +80 -0
truthound/validators/referential/base.py +395 -0
truthound/validators/referential/cascade.py +391 -0
truthound/validators/referential/circular.py +563 -0
truthound/validators/referential/foreign_key.py +624 -0
truthound/validators/referential/orphan.py +485 -0
truthound/validators/registry.py +112 -0
truthound/validators/schema/__init__.py +41 -0
truthound/validators/schema/column_count.py +142 -0
truthound/validators/schema/column_exists.py +80 -0
truthound/validators/schema/column_order.py +82 -0
truthound/validators/schema/column_pair.py +85 -0
truthound/validators/schema/column_pair_set.py +195 -0
truthound/validators/schema/column_type.py +94 -0
truthound/validators/schema/multi_column.py +53 -0
truthound/validators/schema/multi_column_aggregate.py +175 -0
truthound/validators/schema/referential.py +274 -0
truthound/validators/schema/table_schema.py +91 -0
truthound/validators/schema_validator.py +219 -0
truthound/validators/sdk/__init__.py +250 -0
truthound/validators/sdk/builder.py +680 -0
truthound/validators/sdk/decorators.py +474 -0
truthound/validators/sdk/enterprise/__init__.py +211 -0
truthound/validators/sdk/enterprise/docs.py +725 -0
truthound/validators/sdk/enterprise/fuzzing.py +659 -0
truthound/validators/sdk/enterprise/licensing.py +709 -0
truthound/validators/sdk/enterprise/manager.py +543 -0
truthound/validators/sdk/enterprise/resources.py +628 -0
truthound/validators/sdk/enterprise/sandbox.py +766 -0
truthound/validators/sdk/enterprise/signing.py +603 -0
truthound/validators/sdk/enterprise/templates.py +865 -0
truthound/validators/sdk/enterprise/versioning.py +659 -0
truthound/validators/sdk/templates.py +757 -0
truthound/validators/sdk/testing.py +807 -0
truthound/validators/security/__init__.py +181 -0
truthound/validators/security/redos/__init__.py +182 -0
truthound/validators/security/redos/core.py +861 -0
truthound/validators/security/redos/cpu_monitor.py +593 -0
truthound/validators/security/redos/cve_database.py +791 -0
truthound/validators/security/redos/ml/__init__.py +155 -0
truthound/validators/security/redos/ml/base.py +785 -0
truthound/validators/security/redos/ml/datasets.py +618 -0
truthound/validators/security/redos/ml/features.py +359 -0
truthound/validators/security/redos/ml/models.py +1000 -0
truthound/validators/security/redos/ml/predictor.py +507 -0
truthound/validators/security/redos/ml/storage.py +632 -0
truthound/validators/security/redos/ml/training.py +571 -0
truthound/validators/security/redos/ml_analyzer.py +937 -0
truthound/validators/security/redos/optimizer.py +674 -0
truthound/validators/security/redos/profiler.py +682 -0
truthound/validators/security/redos/re2_engine.py +709 -0
truthound/validators/security/redos.py +886 -0
truthound/validators/security/sql_security.py +1247 -0
truthound/validators/streaming/__init__.py +126 -0
truthound/validators/streaming/base.py +292 -0
truthound/validators/streaming/completeness.py +210 -0
truthound/validators/streaming/mixin.py +575 -0
truthound/validators/streaming/range.py +308 -0
truthound/validators/streaming/sources.py +846 -0
truthound/validators/string/__init__.py +57 -0
truthound/validators/string/casing.py +158 -0
truthound/validators/string/charset.py +96 -0
truthound/validators/string/format.py +501 -0
truthound/validators/string/json.py +77 -0
truthound/validators/string/json_schema.py +184 -0
truthound/validators/string/length.py +104 -0
truthound/validators/string/like_pattern.py +237 -0
truthound/validators/string/regex.py +202 -0
truthound/validators/string/regex_extended.py +435 -0
truthound/validators/table/__init__.py +88 -0
truthound/validators/table/base.py +78 -0
truthound/validators/table/column_count.py +198 -0
truthound/validators/table/freshness.py +362 -0
truthound/validators/table/row_count.py +251 -0
truthound/validators/table/schema.py +333 -0
truthound/validators/table/size.py +285 -0
truthound/validators/timeout/__init__.py +102 -0
truthound/validators/timeout/advanced/__init__.py +247 -0
truthound/validators/timeout/advanced/circuit_breaker.py +675 -0
truthound/validators/timeout/advanced/prediction.py +773 -0
truthound/validators/timeout/advanced/priority.py +618 -0
truthound/validators/timeout/advanced/redis_backend.py +770 -0
truthound/validators/timeout/advanced/retry.py +721 -0
truthound/validators/timeout/advanced/sampling.py +788 -0
truthound/validators/timeout/advanced/sla.py +661 -0
truthound/validators/timeout/advanced/telemetry.py +804 -0
truthound/validators/timeout/cascade.py +477 -0
truthound/validators/timeout/deadline.py +657 -0
truthound/validators/timeout/degradation.py +525 -0
truthound/validators/timeout/distributed.py +597 -0
truthound/validators/timeseries/__init__.py +89 -0
truthound/validators/timeseries/base.py +326 -0
truthound/validators/timeseries/completeness.py +617 -0
truthound/validators/timeseries/gap.py +485 -0
truthound/validators/timeseries/monotonic.py +310 -0
truthound/validators/timeseries/seasonality.py +422 -0
truthound/validators/timeseries/trend.py +510 -0
truthound/validators/uniqueness/__init__.py +59 -0
truthound/validators/uniqueness/approximate.py +475 -0
truthound/validators/uniqueness/distinct_values.py +253 -0
truthound/validators/uniqueness/duplicate.py +118 -0
truthound/validators/uniqueness/primary_key.py +140 -0
truthound/validators/uniqueness/unique.py +191 -0
truthound/validators/uniqueness/within_record.py +599 -0
truthound/validators/utils.py +756 -0
truthound-1.0.8.dist-info/METADATA +474 -0
truthound-1.0.8.dist-info/RECORD +877 -0
truthound-1.0.8.dist-info/WHEEL +4 -0
truthound-1.0.8.dist-info/entry_points.txt +2 -0
truthound-1.0.8.dist-info/licenses/LICENSE +190 -0

truthound/profiler/validation.py ADDED Viewed

@@ -0,0 +1,1532 @@
+"""Rule quality validation with labeled data support.
+This module provides comprehensive quality validation using labeled datasets:
+- Ground truth dataset management
+- Statistical validation with confidence intervals
+- Cross-validation and bootstrap methods
+- A/B testing for rule comparison
+- Labeled data collection and annotation
+Key features:
+- Pluggable validation strategy architecture
+- Support for partial labeling (not all rows need labels)
+- Integration with existing quality scoring
+- Detailed validation reports with actionable insights
+Example:
+    from truthound.profiler.validation import (
+        LabeledDataValidator,
+        ValidationDataset,
+        create_validation_suite,
+    )
+    # Create labeled dataset
+    dataset = ValidationDataset.from_csv(
+        "validation_data.csv",
+        label_column="is_valid",
+    )
+    # Validate rule quality
+    validator = LabeledDataValidator()
+    result = validator.validate(rule, dataset)
+    print(f"Precision: {result.precision:.2%}")
+    print(f"Recall: {result.recall:.2%}")
+    print(f"Confidence: {result.confidence:.2%}")
+"""
+from __future__ import annotations
+import hashlib
+import json
+import math
+import random
+import statistics
+import threading
+from abc import ABC, abstractmethod
+from collections import defaultdict
+from dataclasses import dataclass, field
+from datetime import datetime
+from enum import Enum
+from pathlib import Path
+from typing import Any, Callable, Generic, Iterator, Protocol, TypeVar
+import polars as pl
+from truthound.profiler.quality import (
+    ConfusionMatrix,
+    QualityLevel,
+    QualityMetrics,
+    RuleProtocol,
+    RuleType,
+    ValidationRule,
+)
+# =============================================================================
+# Types and Enums
+# =============================================================================
+class LabelType(str, Enum):
+    """Types of labels for validation data.
+    Members subclass ``str``, so each one compares equal to its string value
+    and can be rebuilt from that value, e.g. ``LabelType("binary")``.
+    """
+    BINARY = "binary"  # True/False for valid/invalid
+    CATEGORICAL = "categorical"  # Multiple categories
+    ORDINAL = "ordinal"  # Ordered categories (e.g., quality scores)
+    CONFIDENCE = "confidence"  # Probability/confidence scores
+class ValidationMethod(str, Enum):
+    """Validation methods available.
+    Members subclass ``str``; the string value is what gets written out when
+    a result is serialized via ``.value``.
+    """
+    HOLDOUT = "holdout"  # Simple train/test split
+    CROSS_VALIDATION = "cross_validation"  # K-fold cross-validation
+    BOOTSTRAP = "bootstrap"  # Bootstrap resampling
+    TEMPORAL = "temporal"  # Time-based validation
+    STRATIFIED = "stratified"  # Stratified sampling
+class ValidationStatus(str, Enum):
+    """Status of validation result.
+    Members subclass ``str``; the string value is what gets written out when
+    a result or report is serialized via ``.value``.
+    """
+    PASSED = "passed"  # Rule meets quality threshold
+    FAILED = "failed"  # Rule below quality threshold
+    INCONCLUSIVE = "inconclusive"  # Not enough data/confidence
+    DEGRADED = "degraded"  # Quality dropped from previous
+# =============================================================================
+# Labeled Data Management
+# =============================================================================
+@dataclass
+class LabeledRow:
+    """A single labeled data point.
+    Pairs one row of column values with its ground-truth label and the
+    annotation details recorded alongside that label.
+    """
+    row_id: str | int  # Identifier of the row within its dataset
+    data: dict[str, Any]  # Column name -> value for this row
+    label: bool | str | float  # Ground-truth label value
+    label_type: LabelType = LabelType.BINARY  # How `label` is to be interpreted
+    confidence: float = 1.0  # Confidence in the label
+    source: str = ""  # Where the label came from
+    annotated_at: datetime = field(default_factory=datetime.now)  # Defaults to construction time (naive datetime.now())
+    annotated_by: str = ""  # Presumably the annotator's identity; not interpreted here
+    notes: str = ""  # Free-form notes attached to the label
+@dataclass
+class ValidationDataset:
+    """Dataset with labeled ground truth.
+    Manages labeled data for validating rule quality.
+    Attributes:
+        name: Dataset name
+        rows: Labeled data rows
+        label_type: Type of labels
+        label_column: Name of label column
+        metadata: Additional metadata
+    """
+    name: str
+    rows: list[LabeledRow] = field(default_factory=list)
+    label_type: LabelType = LabelType.BINARY
+    label_column: str = "is_valid"
+    metadata: dict[str, Any] = field(default_factory=dict)
+    created_at: datetime = field(default_factory=datetime.now)
+    version: str = "1.0"
+    def __len__(self) -> int:
+        return len(self.rows)
+    def __iter__(self) -> Iterator[LabeledRow]:
+        return iter(self.rows)
+    @classmethod
+    def from_dataframe(
+        cls,
+        df: pl.DataFrame,
+        label_column: str,
+        name: str = "validation_set",
+        id_column: str | None = None,
+        label_type: LabelType = LabelType.BINARY,
+    ) -> "ValidationDataset":
+        """Create dataset from a Polars DataFrame.
+        Args:
+            df: DataFrame with data and labels
+            label_column: Column containing labels
+            name: Dataset name
+            id_column: Column to use as row ID (uses index if None)
+            label_type: Type of labels
+        Returns:
+            ValidationDataset instance
+        """
+        rows = []
+        for i, row in enumerate(df.iter_rows(named=True)):
+            label = row.pop(label_column) if label_column in row else None
+            row_id = row.get(id_column, i) if id_column else i
+            rows.append(LabeledRow(
+                row_id=row_id,
+                data=row,
+                label=label,
+                label_type=label_type,
+            ))
+        return cls(
+            name=name,
+            rows=rows,
+            label_type=label_type,
+            label_column=label_column,
+        )
+    @classmethod
+    def from_csv(
+        cls,
+        path: str | Path,
+        label_column: str,
+        name: str | None = None,
+        **kwargs: Any,
+    ) -> "ValidationDataset":
+        """Load dataset from CSV file.
+        Args:
+            path: Path to CSV file
+            label_column: Column containing labels
+            name: Dataset name (uses filename if None)
+            **kwargs: Additional arguments for from_dataframe
+        Returns:
+            ValidationDataset instance
+        """
+        path = Path(path)
+        df = pl.read_csv(path)
+        return cls.from_dataframe(
+            df,
+            label_column=label_column,
+            name=name or path.stem,
+            **kwargs,
+        )
+    @classmethod
+    def from_json(
+        cls,
+        path: str | Path,
+    ) -> "ValidationDataset":
+        """Load dataset from JSON file.
+        Args:
+            path: Path to JSON file
+        Returns:
+            ValidationDataset instance
+        """
+        path = Path(path)
+        with open(path) as f:
+            data = json.load(f)
+        rows = [
+            LabeledRow(
+                row_id=r["row_id"],
+                data=r["data"],
+                label=r["label"],
+                label_type=LabelType(r.get("label_type", "binary")),
+                confidence=r.get("confidence", 1.0),
+                source=r.get("source", ""),
+                annotated_at=datetime.fromisoformat(r["annotated_at"])
+                if "annotated_at" in r else datetime.now(),
+                annotated_by=r.get("annotated_by", ""),
+                notes=r.get("notes", ""),
+            )
+            for r in data.get("rows", [])
+        ]
+        return cls(
+            name=data.get("name", path.stem),
+            rows=rows,
+            label_type=LabelType(data.get("label_type", "binary")),
+            label_column=data.get("label_column", "is_valid"),
+            metadata=data.get("metadata", {}),
+            created_at=datetime.fromisoformat(data["created_at"])
+            if "created_at" in data else datetime.now(),
+            version=data.get("version", "1.0"),
+        )
+    def to_dataframe(self) -> pl.DataFrame:
+        """Convert to Polars DataFrame with labels.
+        Returns:
+            DataFrame with data and label column
+        """
+        if not self.rows:
+            return pl.DataFrame()
+        # Collect all data
+        data_dicts = [row.data for row in self.rows]
+        labels = [row.label for row in self.rows]
+        # Create DataFrame
+        df = pl.DataFrame(data_dicts)
+        df = df.with_columns(pl.Series(self.label_column, labels))
+        return df
+    def to_json(self, path: str | Path) -> None:
+        """Save dataset to JSON file.
+        Args:
+            path: Output path
+        """
+        data = {
+            "name": self.name,
+            "label_type": self.label_type.value,
+            "label_column": self.label_column,
+            "metadata": self.metadata,
+            "created_at": self.created_at.isoformat(),
+            "version": self.version,
+            "rows": [
+                {
+                    "row_id": r.row_id,
+                    "data": r.data,
+                    "label": r.label,
+                    "label_type": r.label_type.value,
+                    "confidence": r.confidence,
+                    "source": r.source,
+                    "annotated_at": r.annotated_at.isoformat(),
+                    "annotated_by": r.annotated_by,
+                    "notes": r.notes,
+                }
+                for r in self.rows
+            ],
+        }
+        path = Path(path)
+        path.parent.mkdir(parents=True, exist_ok=True)
+        with open(path, "w") as f:
+            json.dump(data, f, indent=2)
+    def split(
+        self,
+        test_ratio: float = 0.2,
+        random_seed: int | None = None,
+        stratify: bool = True,
+    ) -> tuple["ValidationDataset", "ValidationDataset"]:
+        """Split dataset into training and test sets.
+        Args:
+            test_ratio: Ratio of data for test set
+            random_seed: Random seed for reproducibility
+            stratify: Whether to stratify by label
+        Returns:
+            Tuple of (train_dataset, test_dataset)
+        """
+        if random_seed is not None:
+            random.seed(random_seed)
+        if stratify and self.label_type == LabelType.BINARY:
+            # Stratified split
+            positive = [r for r in self.rows if r.label]
+            negative = [r for r in self.rows if not r.label]
+            random.shuffle(positive)
+            random.shuffle(negative)
+            n_pos_test = max(1, int(len(positive) * test_ratio))
+            n_neg_test = max(1, int(len(negative) * test_ratio))
+            test_rows = positive[:n_pos_test] + negative[:n_neg_test]
+            train_rows = positive[n_pos_test:] + negative[n_neg_test:]
+        else:
+            # Random split
+            rows = list(self.rows)
+            random.shuffle(rows)
+            n_test = max(1, int(len(rows) * test_ratio))
+            test_rows = rows[:n_test]
+            train_rows = rows[n_test:]
+        train_ds = ValidationDataset(
+            name=f"{self.name}_train",
+            rows=train_rows,
+            label_type=self.label_type,
+            label_column=self.label_column,
+            metadata={**self.metadata, "split": "train"},
+        )
+        test_ds = ValidationDataset(
+            name=f"{self.name}_test",
+            rows=test_rows,
+            label_type=self.label_type,
+            label_column=self.label_column,
+            metadata={**self.metadata, "split": "test"},
+        )
+        return train_ds, test_ds
+    def get_folds(
+        self,
+        n_folds: int = 5,
+        random_seed: int | None = None,
+    ) -> Iterator[tuple["ValidationDataset", "ValidationDataset"]]:
+        """Generate k-fold cross-validation splits.
+        Args:
+            n_folds: Number of folds
+            random_seed: Random seed for reproducibility
+        Yields:
+            Tuples of (train_fold, test_fold)
+        """
+        if random_seed is not None:
+            random.seed(random_seed)
+        rows = list(self.rows)
+        random.shuffle(rows)
+        fold_size = len(rows) // n_folds
+        for i in range(n_folds):
+            start = i * fold_size
+            end = start + fold_size if i < n_folds - 1 else len(rows)
+            test_rows = rows[start:end]
+            train_rows = rows[:start] + rows[end:]
+            train_ds = ValidationDataset(
+                name=f"{self.name}_fold{i}_train",
+                rows=train_rows,
+                label_type=self.label_type,
+                label_column=self.label_column,
+            )
+            test_ds = ValidationDataset(
+                name=f"{self.name}_fold{i}_test",
+                rows=test_rows,
+                label_type=self.label_type,
+                label_column=self.label_column,
+            )
+            yield train_ds, test_ds
+    def filter_by_confidence(
+        self,
+        min_confidence: float = 0.8,
+    ) -> "ValidationDataset":
+        """Filter to high-confidence labels only.
+        Args:
+            min_confidence: Minimum label confidence
+        Returns:
+            Filtered dataset
+        """
+        filtered_rows = [r for r in self.rows if r.confidence >= min_confidence]
+        return ValidationDataset(
+            name=f"{self.name}_high_confidence",
+            rows=filtered_rows,
+            label_type=self.label_type,
+            label_column=self.label_column,
+            metadata={**self.metadata, "min_confidence": min_confidence},
+        )
+    def get_label_distribution(self) -> dict[Any, int]:
+        """Get distribution of labels.
+        Returns:
+            Dictionary mapping labels to counts
+        """
+        distribution: dict[Any, int] = defaultdict(int)
+        for row in self.rows:
+            distribution[row.label] += 1
+        return dict(distribution)
+# =============================================================================
+# Validation Results
+# =============================================================================
+@dataclass
+class ValidationResult:
+    """Comprehensive validation result.
+    Contains detailed metrics, confidence intervals, and recommendations.
+    """
+    # Core metrics
+    precision: float = 0.0
+    recall: float = 0.0
+    f1_score: float = 0.0
+    accuracy: float = 0.0
+    # Confidence intervals (95%)
+    precision_ci: tuple[float, float] = (0.0, 1.0)
+    recall_ci: tuple[float, float] = (0.0, 1.0)
+    f1_ci: tuple[float, float] = (0.0, 1.0)
+    # Validation metadata
+    n_samples: int = 0
+    n_positive: int = 0
+    n_negative: int = 0
+    confidence: float = 0.0
+    # Confusion matrix
+    true_positives: int = 0
+    true_negatives: int = 0
+    false_positives: int = 0
+    false_negatives: int = 0
+    # Status and recommendations
+    status: ValidationStatus = ValidationStatus.INCONCLUSIVE
+    quality_level: QualityLevel = QualityLevel.UNACCEPTABLE
+    recommendation: str = ""
+    warnings: list[str] = field(default_factory=list)
+    # Method details
+    validation_method: ValidationMethod = ValidationMethod.HOLDOUT
+    method_details: dict[str, Any] = field(default_factory=dict)
+    # Timing
+    validated_at: datetime = field(default_factory=datetime.now)
+    duration_ms: float = 0.0
+    @property
+    def confusion_matrix(self) -> ConfusionMatrix:
+        """Get confusion matrix."""
+        return ConfusionMatrix(
+            true_positives=self.true_positives,
+            true_negatives=self.true_negatives,
+            false_positives=self.false_positives,
+            false_negatives=self.false_negatives,
+        )
+    @property
+    def specificity(self) -> float:
+        """Calculate specificity."""
+        if self.true_negatives + self.false_positives == 0:
+            return 0.0
+        return self.true_negatives / (self.true_negatives + self.false_positives)
+    @property
+    def mcc(self) -> float:
+        """Calculate Matthews Correlation Coefficient."""
+        return self.confusion_matrix.mcc
+    def to_dict(self) -> dict[str, Any]:
+        """Convert to dictionary."""
+        return {
+            "precision": self.precision,
+            "recall": self.recall,
+            "f1_score": self.f1_score,
+            "accuracy": self.accuracy,
+            "precision_ci": self.precision_ci,
+            "recall_ci": self.recall_ci,
+            "f1_ci": self.f1_ci,
+            "n_samples": self.n_samples,
+            "n_positive": self.n_positive,
+            "n_negative": self.n_negative,
+            "confidence": self.confidence,
+            "confusion_matrix": {
+                "true_positives": self.true_positives,
+                "true_negatives": self.true_negatives,
+                "false_positives": self.false_positives,
+                "false_negatives": self.false_negatives,
+            },
+            "status": self.status.value,
+            "quality_level": self.quality_level.value,
+            "recommendation": self.recommendation,
+            "warnings": self.warnings,
+            "validation_method": self.validation_method.value,
+            "method_details": self.method_details,
+            "validated_at": self.validated_at.isoformat(),
+            "duration_ms": self.duration_ms,
+        }
+    def to_quality_metrics(self) -> QualityMetrics:
+        """Convert to QualityMetrics for compatibility."""
+        return QualityMetrics.from_confusion_matrix(
+            self.confusion_matrix,
+            sample_size=self.n_samples,
+            population_size=self.n_samples,
+        )
+@dataclass
+class ValidationReport:
+    """Complete validation report for multiple rules."""
+    rule_results: dict[str, ValidationResult] = field(default_factory=dict)
+    overall_status: ValidationStatus = ValidationStatus.INCONCLUSIVE
+    summary: str = ""
+    recommendations: list[str] = field(default_factory=list)
+    dataset_info: dict[str, Any] = field(default_factory=dict)
+    generated_at: datetime = field(default_factory=datetime.now)
+    def add_result(self, rule_name: str, result: ValidationResult) -> None:
+        """Add a rule validation result."""
+        self.rule_results[rule_name] = result
+        self._update_overall_status()
+    def _update_overall_status(self) -> None:
+        """Update overall status based on individual results."""
+        if not self.rule_results:
+            self.overall_status = ValidationStatus.INCONCLUSIVE
+            return
+        statuses = [r.status for r in self.rule_results.values()]
+        if all(s == ValidationStatus.PASSED for s in statuses):
+            self.overall_status = ValidationStatus.PASSED
+        elif any(s == ValidationStatus.FAILED for s in statuses):
+            self.overall_status = ValidationStatus.FAILED
+        elif any(s == ValidationStatus.DEGRADED for s in statuses):
+            self.overall_status = ValidationStatus.DEGRADED
+        else:
+            self.overall_status = ValidationStatus.INCONCLUSIVE
+    def to_dict(self) -> dict[str, Any]:
+        """Convert to dictionary."""
+        return {
+            "rule_results": {
+                name: result.to_dict()
+                for name, result in self.rule_results.items()
+            },
+            "overall_status": self.overall_status.value,
+            "summary": self.summary,
+            "recommendations": self.recommendations,
+            "dataset_info": self.dataset_info,
+            "generated_at": self.generated_at.isoformat(),
+        }
+# =============================================================================
+# Validation Strategies
+# =============================================================================
+class ValidationStrategy(ABC):
+    """Abstract base class for validation strategies."""
+    name: str = "base"
+    @abstractmethod
+    def validate(
+        self,
+        rule: RuleProtocol | ValidationRule,
+        dataset: ValidationDataset,
+        column: str,
+    ) -> ValidationResult:
+        """Validate a rule against labeled data.
+        Args:
+            rule: Rule to validate
+            dataset: Labeled validation dataset
+            column: Column to validate
+        Returns:
+            Validation result
+        """
+        pass
class HoldoutValidation(ValidationStrategy):
    """Single-pass strategy: score the rule once on the whole dataset.

    The rule's predictions for a column are compared with the dataset's
    label column, and the rule passes when its F1 score reaches
    ``quality_threshold``.
    """

    name = "holdout"

    def __init__(
        self,
        quality_threshold: float = 0.70,
        min_samples: int = 30,
    ):
        """Remember the F1 pass mark and the smallest usable dataset size."""
        self.min_samples = min_samples
        self.quality_threshold = quality_threshold

    def validate(
        self,
        rule: RuleProtocol | ValidationRule,
        dataset: ValidationDataset,
        column: str,
    ) -> ValidationResult:
        """Run the rule over the full dataset and grade it.

        Args:
            rule: Rule to validate.
            dataset: Labeled validation dataset.
            column: Column the rule is applied to.

        Returns:
            An INCONCLUSIVE result when the dataset holds fewer than
            ``min_samples`` rows; otherwise a PASSED/FAILED result carrying
            the computed metrics.
        """
        started = datetime.now()
        sample_count = len(dataset)
        if sample_count < self.min_samples:
            return ValidationResult(
                status=ValidationStatus.INCONCLUSIVE,
                recommendation=f"Need at least {self.min_samples} samples, got {sample_count}",
                n_samples=sample_count,
            )

        frame = dataset.to_dataframe()
        predicted = rule.validate_column(frame, column)
        labels = frame.get_column(dataset.label_column)
        outcome = self._calculate_metrics(predicted.to_list(), labels.to_list())

        score = outcome.f1_score
        threshold = self.quality_threshold
        if score >= threshold:
            outcome.status = ValidationStatus.PASSED
            outcome.recommendation = (
                f"Rule meets quality threshold (F1={score:.2%} >= {threshold:.0%})"
            )
        else:
            outcome.status = ValidationStatus.FAILED
            outcome.recommendation = (
                f"Rule below quality threshold (F1={score:.2%} < {threshold:.0%})"
            )

        outcome.quality_level = QualityLevel.from_f1(score)
        outcome.validation_method = ValidationMethod.HOLDOUT
        outcome.duration_ms = (datetime.now() - started).total_seconds() * 1000
        return outcome

    def _calculate_metrics(
        self,
        predictions: list[bool],
        ground_truth: list[bool],
    ) -> ValidationResult:
        """Build a result from paired predictions and labels.

        Values are judged by truthiness. Pairs are formed with ``zip``, so
        surplus entries in the longer list are not counted in the confusion
        matrix.
        """
        # table[predicted][actual]; False indexes 0 and True indexes 1.
        table = [[0, 0], [0, 0]]
        for pred, truth in zip(predictions, ground_truth):
            table[bool(pred)][bool(truth)] += 1
        (tn, fn), (fp, tp) = table

        n = len(predictions)
        n_pos = len([t for t in ground_truth if t])
        n_neg = n - n_pos

        flagged = tp + fp
        actual_pos = tp + fn
        precision = tp / flagged if flagged > 0 else 0.0
        recall = tp / actual_pos if actual_pos > 0 else 0.0
        pr_sum = precision + recall
        f1 = 2 * precision * recall / pr_sum if pr_sum > 0 else 0.0
        accuracy = (tp + tn) / n if n > 0 else 0.0

        return ValidationResult(
            precision=precision,
            recall=recall,
            f1_score=f1,
            accuracy=accuracy,
            # Wilson score intervals for the two proportions.
            precision_ci=self._wilson_ci(tp, flagged),
            recall_ci=self._wilson_ci(tp, actual_pos),
            n_samples=n,
            n_positive=n_pos,
            n_negative=n_neg,
            true_positives=tp,
            true_negatives=tn,
            false_positives=fp,
            false_negatives=fn,
            # Grows linearly with the sample count and saturates at 100 rows.
            confidence=min(1.0, n / 100),
        )

    @staticmethod
    def _wilson_ci(
        successes: int,
        trials: int,
        z: float = 1.96,
    ) -> tuple[float, float]:
        """Return the Wilson score interval for ``successes`` out of ``trials``.

        With zero trials nothing is known, so the full ``(0.0, 1.0)`` range
        is returned. Bounds are clamped to ``[0, 1]``.
        """
        if trials == 0:
            return (0.0, 1.0)

        z_sq = z * z
        p = successes / trials
        denominator = 1 + z_sq / trials
        centre = p + z_sq / (2 * trials)
        margin = z * math.sqrt((p * (1 - p) + z_sq / (4 * trials)) / trials)
        return (
            max(0.0, (centre - margin) / denominator),
            min(1.0, (centre + margin) / denominator),
        )
class CrossValidationStrategy(ValidationStrategy):
    """K-fold cross-validation strategy.

    The rule is scored on the test split of every fold returned by
    ``dataset.get_folds``; per-fold precision, recall and F1 are averaged and
    the confusion-matrix counts are summed across folds.
    """

    name = "cross_validation"

    def __init__(
        self,
        n_folds: int = 5,
        quality_threshold: float = 0.70,
        random_seed: int | None = None,
    ):
        """Configure the strategy.

        Args:
            n_folds: Number of folds requested from the dataset.
            quality_threshold: Minimum mean F1 for a PASSED status.
            random_seed: Seed forwarded to ``dataset.get_folds``.
        """
        self.n_folds = n_folds
        self.quality_threshold = quality_threshold
        self.random_seed = random_seed

    def validate(
        self,
        rule: RuleProtocol | ValidationRule,
        dataset: ValidationDataset,
        column: str,
    ) -> ValidationResult:
        """Validate using k-fold cross-validation.

        Args:
            rule: Rule to validate.
            dataset: Labeled validation dataset.
            column: Column the rule is applied to.

        Returns:
            A PASSED/FAILED result with aggregated metrics, or an
            INCONCLUSIVE result when the dataset yields no folds.
        """
        start_time = datetime.now()
        fold_metrics: list[dict[str, float]] = []
        # Only the test split is scored; the training split is unused here.
        for _train_ds, test_ds in dataset.get_folds(
            n_folds=self.n_folds,
            random_seed=self.random_seed,
        ):
            df = test_ds.to_dataframe()
            predictions = rule.validate_column(df, column)
            ground_truth = df.get_column(dataset.label_column)
            fold_metrics.append(
                self._calculate_fold_metrics(
                    predictions.to_list(),
                    ground_truth.to_list(),
                )
            )

        if not fold_metrics:
            # Nothing was evaluated, so neither PASSED nor FAILED is justified.
            return ValidationResult(
                status=ValidationStatus.INCONCLUSIVE,
                recommendation="Cross-validation produced no folds to evaluate",
                n_samples=len(dataset),
                validation_method=ValidationMethod.CROSS_VALIDATION,
            )

        result = self._aggregate_folds(fold_metrics, len(dataset))
        if result.f1_score >= self.quality_threshold:
            result.status = ValidationStatus.PASSED
        else:
            result.status = ValidationStatus.FAILED
        result.quality_level = QualityLevel.from_f1(result.f1_score)
        result.validation_method = ValidationMethod.CROSS_VALIDATION
        result.method_details = {
            "n_folds": self.n_folds,
            "fold_f1_scores": [m["f1"] for m in fold_metrics],
        }
        result.duration_ms = (datetime.now() - start_time).total_seconds() * 1000
        return result

    def _calculate_fold_metrics(
        self,
        predictions: list[bool],
        ground_truth: list[bool],
    ) -> dict[str, float]:
        """Calculate metrics for a single fold.

        Returns:
            Dict with ``precision``, ``recall``, ``f1`` and the raw
            confusion-matrix counts ``tp``, ``tn``, ``fp``, ``fn``.
        """
        tp = tn = fp = fn = 0
        for pred, truth in zip(predictions, ground_truth):
            if pred and truth:
                tp += 1
            elif not pred and not truth:
                tn += 1
            elif pred and not truth:
                fp += 1
            else:
                fn += 1
        precision = tp / (tp + fp) if (tp + fp) > 0 else 0.0
        recall = tp / (tp + fn) if (tp + fn) > 0 else 0.0
        f1 = 2 * precision * recall / (precision + recall) if (precision + recall) > 0 else 0.0
        return {
            "precision": precision,
            "recall": recall,
            "f1": f1,
            "tp": tp,
            "tn": tn,
            "fp": fp,
            "fn": fn,
        }

    @staticmethod
    def _mean_std_margin(
        values: list[float],
        z: float = 1.96,
    ) -> tuple[float, float, float]:
        """Return ``(mean, sample std, z * std / sqrt(n))`` for ``values``.

        An empty list yields zeros; a single value has a standard deviation
        (and therefore a margin) of zero.
        """
        if not values:
            return 0.0, 0.0, 0.0
        mean = statistics.mean(values)
        std = statistics.stdev(values) if len(values) > 1 else 0.0
        return mean, std, z * std / math.sqrt(len(values))

    def _aggregate_folds(
        self,
        fold_metrics: list[dict[str, float]],
        total_samples: int,
    ) -> ValidationResult:
        """Aggregate metrics across folds.

        Args:
            fold_metrics: Per-fold dicts from ``_calculate_fold_metrics``.
            total_samples: Size of the full dataset, reported as ``n_samples``.

        Returns:
            Result holding mean precision/recall/F1, intervals of
            ``mean +/- 1.96 * std / sqrt(n_folds)`` clamped to ``[0, 1]``,
            and confusion-matrix counts summed over the folds.
        """
        mean_precision, _, margin_precision = self._mean_std_margin(
            [m["precision"] for m in fold_metrics]
        )
        mean_recall, _, margin_recall = self._mean_std_margin(
            [m["recall"] for m in fold_metrics]
        )
        mean_f1, std_f1, margin_f1 = self._mean_std_margin(
            [m["f1"] for m in fold_metrics]
        )

        total_tp = sum(int(m["tp"]) for m in fold_metrics)
        total_tn = sum(int(m["tn"]) for m in fold_metrics)
        total_fp = sum(int(m["fp"]) for m in fold_metrics)
        total_fn = sum(int(m["fn"]) for m in fold_metrics)
        total_scored = total_tp + total_tn + total_fp + total_fn

        # Consistency-based confidence: one minus the coefficient of variation
        # of the fold F1 scores, floored at zero.
        f1_cv = std_f1 / mean_f1 if mean_f1 > 0 else 1.0
        confidence = max(0.0, 1.0 - f1_cv)

        return ValidationResult(
            precision=mean_precision,
            recall=mean_recall,
            f1_score=mean_f1,
            accuracy=(total_tp + total_tn) / total_scored if total_scored > 0 else 0.0,
            precision_ci=(
                max(0.0, mean_precision - margin_precision),
                min(1.0, mean_precision + margin_precision),
            ),
            recall_ci=(
                max(0.0, mean_recall - margin_recall),
                min(1.0, mean_recall + margin_recall),
            ),
            f1_ci=(
                max(0.0, mean_f1 - margin_f1),
                min(1.0, mean_f1 + margin_f1),
            ),
            n_samples=total_samples,
            # Report the label balance of the scored rows, as the holdout
            # strategy does, so code reading n_positive / n_negative sees the
            # real class counts rather than the result's defaults.
            n_positive=total_tp + total_fn,
            n_negative=total_tn + total_fp,
            true_positives=total_tp,
            true_negatives=total_tn,
            false_positives=total_fp,
            false_negatives=total_fn,
            confidence=confidence,
            recommendation=f"Cross-validated F1: {mean_f1:.2%} (±{margin_f1:.2%})",
        )
class BootstrapValidation(ValidationStrategy):
    """Bootstrap resampling validation strategy.

    Rows are repeatedly drawn with replacement, the rule is scored on each
    resample, and percentile intervals are read from the sorted scores.
    """

    name = "bootstrap"

    def __init__(
        self,
        n_iterations: int = 1000,
        sample_ratio: float = 0.8,
        quality_threshold: float = 0.70,
        random_seed: int | None = None,
    ):
        """Configure the strategy.

        Args:
            n_iterations: Number of bootstrap resamples.
            sample_ratio: Resample size as a fraction of the dataset size.
            quality_threshold: Minimum mean F1 for a PASSED status.
            random_seed: Seed for reproducible resampling.
        """
        self.n_iterations = n_iterations
        self.sample_ratio = sample_ratio
        self.quality_threshold = quality_threshold
        self.random_seed = random_seed

    def validate(
        self,
        rule: RuleProtocol | ValidationRule,
        dataset: ValidationDataset,
        column: str,
    ) -> ValidationResult:
        """Validate using bootstrap resampling.

        Args:
            rule: Rule to validate.
            dataset: Labeled validation dataset.
            column: Column the rule is applied to.

        Returns:
            A PASSED/FAILED result with mean metrics and 95% percentile
            intervals, or an INCONCLUSIVE result when the dataset is empty
            or no iterations were requested.
        """
        start_time = datetime.now()
        # A private generator yields the same sequence for a given seed as
        # seeding the module-level RNG would, without disturbing the random
        # state of the rest of the process.
        rng = random.Random(self.random_seed)

        df = dataset.to_dataframe()
        n = len(df)
        if n == 0 or self.n_iterations <= 0:
            return ValidationResult(
                status=ValidationStatus.INCONCLUSIVE,
                recommendation=(
                    "Bootstrap validation needs a non-empty dataset "
                    "and at least one iteration"
                ),
                n_samples=n,
                validation_method=ValidationMethod.BOOTSTRAP,
            )

        # Never draw an empty resample, even for tiny datasets or ratios.
        sample_size = max(1, int(n * self.sample_ratio))

        # Label balance of the full dataset, reported on the result.
        labels = df.get_column(dataset.label_column).to_list()
        n_positive = sum(1 for label in labels if label)

        f1_scores: list[float] = []
        precisions: list[float] = []
        recalls: list[float] = []
        for _ in range(self.n_iterations):
            # Sample row positions with replacement.
            indices = [rng.randint(0, n - 1) for _ in range(sample_size)]
            sample_df = df[indices]
            predictions = rule.validate_column(sample_df, column)
            ground_truth = sample_df.get_column(dataset.label_column)
            metrics = self._calculate_metrics(
                predictions.to_list(),
                ground_truth.to_list(),
            )
            f1_scores.append(metrics["f1"])
            precisions.append(metrics["precision"])
            recalls.append(metrics["recall"])

        # Percentile intervals are read from the sorted score lists.
        f1_scores.sort()
        precisions.sort()
        recalls.sort()
        lower_idx = int(0.025 * self.n_iterations)
        upper_idx = min(int(0.975 * self.n_iterations), self.n_iterations - 1)

        result = ValidationResult(
            precision=statistics.mean(precisions),
            recall=statistics.mean(recalls),
            f1_score=statistics.mean(f1_scores),
            precision_ci=(precisions[lower_idx], precisions[upper_idx]),
            recall_ci=(recalls[lower_idx], recalls[upper_idx]),
            f1_ci=(f1_scores[lower_idx], f1_scores[upper_idx]),
            n_samples=n,
            n_positive=n_positive,
            n_negative=n - n_positive,
            # stdev needs at least two scores; fall back to a neutral 0.5.
            confidence=1.0 - statistics.stdev(f1_scores) if len(f1_scores) > 1 else 0.5,
            validation_method=ValidationMethod.BOOTSTRAP,
            method_details={
                "n_iterations": self.n_iterations,
                "sample_ratio": self.sample_ratio,
            },
        )
        if result.f1_score >= self.quality_threshold:
            result.status = ValidationStatus.PASSED
        else:
            result.status = ValidationStatus.FAILED
        result.quality_level = QualityLevel.from_f1(result.f1_score)
        result.recommendation = (
            f"Bootstrap F1: {result.f1_score:.2%} "
            f"(95% CI: [{result.f1_ci[0]:.2%}, {result.f1_ci[1]:.2%}])"
        )
        result.duration_ms = (datetime.now() - start_time).total_seconds() * 1000
        return result

    def _calculate_metrics(
        self,
        predictions: list[bool],
        ground_truth: list[bool],
    ) -> dict[str, float]:
        """Calculate precision, recall and F1 for one bootstrap sample.

        A ratio whose denominator is zero is reported as ``0.0``.
        """
        tp = fp = fn = 0
        for pred, truth in zip(predictions, ground_truth):
            if pred and truth:
                tp += 1
            elif pred:
                fp += 1
            elif truth:
                fn += 1
        precision = tp / (tp + fp) if (tp + fp) > 0 else 0.0
        recall = tp / (tp + fn) if (tp + fn) > 0 else 0.0
        f1 = 2 * precision * recall / (precision + recall) if (precision + recall) > 0 else 0.0
        return {"precision": precision, "recall": recall, "f1": f1}
+# =============================================================================
+# Strategy Registry
+# =============================================================================
class ValidationStrategyRegistry:
    """Name-to-class lookup table for validation strategies."""

    def __init__(self) -> None:
        self._strategies: dict[str, type[ValidationStrategy]] = {}

    def register(
        self,
        name: str,
        strategy_class: type[ValidationStrategy],
    ) -> None:
        """Bind ``name`` to ``strategy_class``, replacing any earlier binding."""
        self._strategies[name] = strategy_class

    def create(self, name: str, **kwargs: Any) -> ValidationStrategy:
        """Instantiate the strategy registered under ``name``.

        Args:
            name: Registered strategy name.
            **kwargs: Passed straight to the strategy constructor.

        Raises:
            KeyError: If no strategy is registered under ``name``.
        """
        try:
            strategy_class = self._strategies[name]
        except KeyError:
            known = list(self._strategies.keys())
            raise KeyError(
                f"Unknown strategy: {name}. "
                f"Available: {known}"
            ) from None
        return strategy_class(**kwargs)

    def list_strategies(self) -> list[str]:
        """Return the registered names in registration order."""
        return [*self._strategies]
# Module-wide registry, pre-populated with the built-in strategies.
validation_strategy_registry = ValidationStrategyRegistry()
for _strategy_name, _strategy_class in (
    ("holdout", HoldoutValidation),
    ("cross_validation", CrossValidationStrategy),
    ("bootstrap", BootstrapValidation),
):
    validation_strategy_registry.register(_strategy_name, _strategy_class)
# Drop the loop variables so no extra names are left in the module namespace.
del _strategy_name, _strategy_class
+# =============================================================================
+# Main Validator
+# =============================================================================
class LabeledDataValidator:
    """Main validator using labeled ground truth data.

    Wraps a validation strategy and adds a minimum-sample check, reliability
    warnings and a lock-protected, per-instance result cache.

    Example:
        validator = LabeledDataValidator(strategy="cross_validation")
        # Validate single rule
        result = validator.validate(rule, dataset, "email_column")
        print(f"F1: {result.f1_score:.2%}")
        # Validate multiple rules
        report = validator.validate_all(rules, dataset)
        print(report.overall_status)
    """

    def __init__(
        self,
        strategy: str | ValidationStrategy = "cross_validation",
        strategy_options: dict[str, Any] | None = None,
        quality_threshold: float = 0.70,
        min_samples: int = 30,
    ):
        """Initialize validator.

        Args:
            strategy: Validation strategy name or instance.
            strategy_options: Options for strategy construction; only used
                when ``strategy`` is a name. The dict is not modified.
            quality_threshold: Minimum F1 for passing.
            min_samples: Minimum samples required.

        Raises:
            KeyError: If ``strategy`` is a name that is not registered.
        """
        self.quality_threshold = quality_threshold
        self.min_samples = min_samples
        self._cache: dict[str, ValidationResult] = {}
        self._lock = threading.Lock()
        if isinstance(strategy, ValidationStrategy):
            self._strategy = strategy
        else:
            # Copy before filling in defaults so the caller's dict is never
            # mutated (it may be shared or reused for other validators).
            options = dict(strategy_options or {})
            options.setdefault("quality_threshold", quality_threshold)
            self._strategy = validation_strategy_registry.create(strategy, **options)

    def validate(
        self,
        rule: RuleProtocol | ValidationRule,
        dataset: ValidationDataset,
        column: str | None = None,
        use_cache: bool = True,
    ) -> ValidationResult:
        """Validate a rule against labeled data.

        Args:
            rule: Rule to validate.
            dataset: Labeled validation dataset.
            column: Column to validate; falls back to the rule's ``column``
                attribute when not given.
            use_cache: Whether to read from and write to the result cache.

        Returns:
            Validation result. INCONCLUSIVE when no column can be determined
            or the dataset has fewer than ``min_samples`` rows.
        """
        # A rule without a ``column`` attribute is treated like one whose
        # column is unset instead of raising AttributeError.
        column = column or getattr(rule, "column", None)
        if column is None:
            return ValidationResult(
                status=ValidationStatus.INCONCLUSIVE,
                recommendation="No column specified for validation",
            )

        cache_key = self._make_cache_key(rule, dataset, column)
        if use_cache:
            with self._lock:
                if cache_key in self._cache:
                    return self._cache[cache_key]

        sample_count = len(dataset)
        if sample_count < self.min_samples:
            return ValidationResult(
                status=ValidationStatus.INCONCLUSIVE,
                recommendation=f"Need at least {self.min_samples} samples",
                n_samples=sample_count,
                warnings=[f"Only {sample_count} samples available"],
            )

        result = self._strategy.validate(rule, dataset, column)

        # Flag results that rest on few examples of either class.
        if result.n_positive < 10 or result.n_negative < 10:
            result.warnings.append(
                "Imbalanced labels may affect reliability"
            )
        if result.confidence < 0.7:
            result.warnings.append(
                "Low confidence - consider collecting more labels"
            )

        if use_cache:
            with self._lock:
                self._cache[cache_key] = result
        return result

    def validate_all(
        self,
        rules: list[RuleProtocol | ValidationRule],
        dataset: ValidationDataset,
    ) -> ValidationReport:
        """Validate multiple rules.

        Each rule is validated against its own ``column``.

        Args:
            rules: Rules to validate.
            dataset: Labeled validation dataset.

        Returns:
            Report with one result per rule, a summary line and
            recommendations.
        """
        report = ValidationReport(
            dataset_info={
                "name": dataset.name,
                "size": len(dataset),
                "label_distribution": dataset.get_label_distribution(),
            },
        )
        passed = 0
        failed = 0
        for rule in rules:
            result = self.validate(rule, dataset)
            report.add_result(rule.name, result)
            if result.status == ValidationStatus.PASSED:
                passed += 1
            elif result.status == ValidationStatus.FAILED:
                failed += 1

        # Anything that neither passed nor failed is counted as inconclusive.
        report.summary = (
            f"Validated {len(rules)} rules: "
            f"{passed} passed, {failed} failed, "
            f"{len(rules) - passed - failed} inconclusive"
        )

        if failed > 0:
            report.recommendations.append(
                f"{failed} rules failed validation - review and adjust thresholds or rule logic"
            )
        low_confidence = [
            name for name, result in report.rule_results.items()
            if result.confidence < 0.7
        ]
        if low_confidence:
            report.recommendations.append(
                f"Low confidence for rules: {', '.join(low_confidence)} - collect more labels"
            )
        return report

    def compare_rules(
        self,
        rules: list[RuleProtocol | ValidationRule],
        dataset: ValidationDataset,
        column: str,
    ) -> list[tuple[str, ValidationResult]]:
        """Compare multiple rules for the same column.

        Args:
            rules: Rules to compare.
            dataset: Labeled validation dataset.
            column: Column to validate.

        Returns:
            ``(rule name, result)`` pairs sorted by F1 score, best first.
        """
        results = [
            (rule.name, self.validate(rule, dataset, column))
            for rule in rules
        ]
        return sorted(results, key=lambda pair: pair[1].f1_score, reverse=True)

    def _make_cache_key(
        self,
        rule: RuleProtocol | ValidationRule,
        dataset: ValidationDataset,
        column: str,
    ) -> str:
        """Create cache key.

        The key joins the rule's name and type, the column, and a 16-character
        SHA-256 prefix of the dataset's name, length and version.
        """
        rule_str = f"{rule.name}:{rule.rule_type}"
        dataset_hash = hashlib.sha256(
            f"{dataset.name}:{len(dataset)}:{dataset.version}".encode()
        ).hexdigest()[:16]
        return f"{rule_str}:{column}:{dataset_hash}"

    def clear_cache(self) -> None:
        """Clear validation cache."""
        with self._lock:
            self._cache.clear()
+# =============================================================================
+# A/B Testing
+# =============================================================================
@dataclass
class ABTestResult:
    """Outcome of comparing two rules on the same labeled data."""

    rule_a_name: str
    rule_b_name: str
    rule_a_f1: float
    rule_b_f1: float
    difference: float
    p_value: float
    significant: bool
    winner: str | None
    confidence_level: float = 0.95
    recommendation: str = ""

    def to_dict(self) -> dict[str, Any]:
        """Return the fields as a plain dict, in declaration order."""
        exported = (
            "rule_a_name",
            "rule_b_name",
            "rule_a_f1",
            "rule_b_f1",
            "difference",
            "p_value",
            "significant",
            "winner",
            "confidence_level",
            "recommendation",
        )
        return {key: getattr(self, key) for key in exported}
class RuleABTester:
    """A/B testing for comparing rule quality.

    Performs a bootstrap test on the F1 difference to determine if one rule
    is significantly better than another.

    Example:
        tester = RuleABTester()
        result = tester.test(rule_a, rule_b, dataset, "column")
        if result.significant:
            print(f"Winner: {result.winner}")
        else:
            print("No significant difference")
    """

    def __init__(
        self,
        n_iterations: int = 1000,
        confidence_level: float = 0.95,
        random_seed: int | None = None,
    ):
        """Initialize A/B tester.

        Args:
            n_iterations: Number of bootstrap iterations.
            confidence_level: Confidence level for significance.
            random_seed: Random seed for reproducibility.
        """
        self.n_iterations = n_iterations
        self.confidence_level = confidence_level
        self.random_seed = random_seed

    def test(
        self,
        rule_a: RuleProtocol | ValidationRule,
        rule_b: RuleProtocol | ValidationRule,
        dataset: ValidationDataset,
        column: str,
    ) -> ABTestResult:
        """Perform A/B test between two rules.

        Args:
            rule_a: First rule.
            rule_b: Second rule.
            dataset: Labeled validation dataset.
            column: Column to validate.

        Returns:
            A/B test result. ``winner`` is ``None`` unless the difference is
            significant at ``1 - confidence_level``.

        Raises:
            ValueError: If the dataset has no rows.
        """
        # A private generator yields the same sequence for a given seed as
        # seeding the module-level RNG would, without disturbing the random
        # state of the rest of the process.
        rng = random.Random(self.random_seed)

        df = dataset.to_dataframe()
        n = len(df)
        if n == 0:
            raise ValueError("Cannot run an A/B test on an empty dataset")

        label_column = dataset.label_column
        truth = df.get_column(label_column).to_list()
        f1_a = self._calculate_f1(rule_a.validate_column(df, column).to_list(), truth)
        f1_b = self._calculate_f1(rule_b.validate_column(df, column).to_list(), truth)
        observed_diff = f1_a - f1_b

        # Bootstrap distribution of the F1 difference.
        diff_samples: list[float] = []
        for _ in range(self.n_iterations):
            indices = [rng.randint(0, n - 1) for _ in range(n)]
            sample_df = df[indices]
            sample_truth = sample_df.get_column(label_column).to_list()
            sample_f1_a = self._calculate_f1(
                rule_a.validate_column(sample_df, column).to_list(), sample_truth
            )
            sample_f1_b = self._calculate_f1(
                rule_b.validate_column(sample_df, column).to_list(), sample_truth
            )
            diff_samples.append(sample_f1_a - sample_f1_b)

        p_value = self._bootstrap_p_value(diff_samples, observed_diff)
        alpha = 1 - self.confidence_level
        significant = p_value < alpha

        if significant:
            winner = rule_a.name if observed_diff > 0 else rule_b.name
            recommendation = (
                f"{winner} is significantly better (p={p_value:.4f})"
            )
        else:
            winner = None
            recommendation = (
                f"No significant difference (p={p_value:.4f})"
            )
        return ABTestResult(
            rule_a_name=rule_a.name,
            rule_b_name=rule_b.name,
            rule_a_f1=f1_a,
            rule_b_f1=f1_b,
            difference=observed_diff,
            p_value=p_value,
            significant=significant,
            winner=winner,
            confidence_level=self.confidence_level,
            recommendation=recommendation,
        )

    @staticmethod
    def _bootstrap_p_value(
        diff_samples: list[float],
        observed_diff: float,
    ) -> float:
        """Return the two-tailed p-value for ``observed_diff``.

        The bootstrap differences are shifted so they centre on zero (the
        null hypothesis); the p-value is the share of shifted differences at
        least as extreme as the observed one. With no samples there is no
        evidence against the null, so ``1.0`` is returned.
        """
        if not diff_samples:
            return 1.0
        threshold = abs(observed_diff)
        extreme_count = sum(
            1 for diff in diff_samples if abs(diff - observed_diff) >= threshold
        )
        return extreme_count / len(diff_samples)

    def _calculate_f1(
        self,
        predictions: list[bool],
        ground_truth: list[bool],
    ) -> float:
        """Calculate F1 score in a single pass over the paired values.

        Returns ``0.0`` when precision and recall are both zero.
        """
        tp = fp = fn = 0
        for predicted, actual in zip(predictions, ground_truth):
            if predicted and actual:
                tp += 1
            elif predicted:
                fp += 1
            elif actual:
                fn += 1
        precision = tp / (tp + fp) if (tp + fp) > 0 else 0.0
        recall = tp / (tp + fn) if (tp + fn) > 0 else 0.0
        return 2 * precision * recall / (precision + recall) if (precision + recall) > 0 else 0.0
+# =============================================================================
+# Convenience Functions
+# =============================================================================
def validate_rule(
    rule: RuleProtocol | ValidationRule,
    dataset: ValidationDataset,
    column: str | None = None,
    strategy: str = "cross_validation",
    **kwargs: Any,
) -> ValidationResult:
    """One-shot helper: build a validator and validate a single rule.

    Args:
        rule: Rule to validate.
        dataset: Labeled validation dataset.
        column: Column to validate.
        strategy: Name of the validation strategy.
        **kwargs: Extra keyword arguments for ``LabeledDataValidator``.

    Returns:
        Validation result for the rule.
    """
    return LabeledDataValidator(strategy=strategy, **kwargs).validate(
        rule,
        dataset,
        column,
    )
def create_validation_suite(
    rules: list[RuleProtocol | ValidationRule],
    dataset: ValidationDataset,
    strategy: str = "cross_validation",
) -> ValidationReport:
    """One-shot helper: validate every rule and return the report.

    Args:
        rules: Rules to validate.
        dataset: Labeled validation dataset.
        strategy: Name of the validation strategy.

    Returns:
        Validation report covering all rules.
    """
    return LabeledDataValidator(strategy=strategy).validate_all(rules, dataset)
def compare_rule_quality(
    rule_a: RuleProtocol | ValidationRule,
    rule_b: RuleProtocol | ValidationRule,
    dataset: ValidationDataset,
    column: str,
) -> ABTestResult:
    """One-shot helper: A/B test two rules with a default ``RuleABTester``.

    Args:
        rule_a: First rule.
        rule_b: Second rule.
        dataset: Labeled validation dataset.
        column: Column to validate.

    Returns:
        A/B test result.
    """
    return RuleABTester().test(rule_a, rule_b, dataset, column)