etlplus 0.15.0__py3-none-any.whl → 0.16.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- etlplus/README.md +25 -3
- etlplus/__init__.py +2 -0
- etlplus/api/README.md +31 -0
- etlplus/api/__init__.py +14 -14
- etlplus/api/auth.py +10 -7
- etlplus/api/config.py +8 -13
- etlplus/api/endpoint_client.py +20 -20
- etlplus/api/errors.py +4 -4
- etlplus/api/pagination/__init__.py +6 -6
- etlplus/api/pagination/config.py +12 -10
- etlplus/api/pagination/paginator.py +6 -7
- etlplus/api/rate_limiting/__init__.py +2 -2
- etlplus/api/rate_limiting/config.py +14 -14
- etlplus/api/rate_limiting/rate_limiter.py +3 -3
- etlplus/api/request_manager.py +4 -4
- etlplus/api/retry_manager.py +8 -8
- etlplus/api/transport.py +11 -11
- etlplus/api/types.py +131 -11
- etlplus/api/utils.py +50 -50
- etlplus/cli/commands.py +93 -60
- etlplus/cli/constants.py +1 -1
- etlplus/cli/handlers.py +43 -26
- etlplus/cli/io.py +2 -2
- etlplus/cli/main.py +2 -2
- etlplus/cli/state.py +4 -7
- etlplus/{workflow/pipeline.py → config.py} +62 -99
- etlplus/connector/__init__.py +43 -0
- etlplus/connector/api.py +161 -0
- etlplus/connector/connector.py +26 -0
- etlplus/connector/core.py +132 -0
- etlplus/connector/database.py +122 -0
- etlplus/connector/enums.py +52 -0
- etlplus/connector/file.py +120 -0
- etlplus/connector/types.py +40 -0
- etlplus/connector/utils.py +122 -0
- etlplus/database/ddl.py +2 -2
- etlplus/database/engine.py +19 -3
- etlplus/database/orm.py +2 -0
- etlplus/enums.py +36 -200
- etlplus/file/_imports.py +1 -0
- etlplus/file/_io.py +52 -4
- etlplus/file/accdb.py +3 -2
- etlplus/file/arrow.py +3 -2
- etlplus/file/avro.py +3 -2
- etlplus/file/bson.py +3 -2
- etlplus/file/cbor.py +3 -2
- etlplus/file/cfg.py +3 -2
- etlplus/file/conf.py +3 -2
- etlplus/file/core.py +11 -8
- etlplus/file/csv.py +3 -2
- etlplus/file/dat.py +3 -2
- etlplus/file/dta.py +3 -2
- etlplus/file/duckdb.py +3 -2
- etlplus/file/enums.py +1 -1
- etlplus/file/feather.py +3 -2
- etlplus/file/fwf.py +3 -2
- etlplus/file/gz.py +3 -2
- etlplus/file/hbs.py +3 -2
- etlplus/file/hdf5.py +3 -2
- etlplus/file/ini.py +3 -2
- etlplus/file/ion.py +3 -2
- etlplus/file/jinja2.py +3 -2
- etlplus/file/json.py +5 -16
- etlplus/file/log.py +3 -2
- etlplus/file/mat.py +3 -2
- etlplus/file/mdb.py +3 -2
- etlplus/file/msgpack.py +3 -2
- etlplus/file/mustache.py +3 -2
- etlplus/file/nc.py +3 -2
- etlplus/file/ndjson.py +3 -2
- etlplus/file/numbers.py +3 -2
- etlplus/file/ods.py +3 -2
- etlplus/file/orc.py +3 -2
- etlplus/file/parquet.py +3 -2
- etlplus/file/pb.py +3 -2
- etlplus/file/pbf.py +3 -2
- etlplus/file/properties.py +3 -2
- etlplus/file/proto.py +3 -2
- etlplus/file/psv.py +3 -2
- etlplus/file/rda.py +3 -2
- etlplus/file/rds.py +3 -2
- etlplus/file/sas7bdat.py +3 -2
- etlplus/file/sav.py +3 -2
- etlplus/file/sqlite.py +3 -2
- etlplus/file/stub.py +1 -0
- etlplus/file/sylk.py +3 -2
- etlplus/file/tab.py +3 -2
- etlplus/file/toml.py +3 -2
- etlplus/file/tsv.py +3 -2
- etlplus/file/txt.py +4 -3
- etlplus/file/vm.py +3 -2
- etlplus/file/wks.py +3 -2
- etlplus/file/xls.py +3 -2
- etlplus/file/xlsm.py +3 -2
- etlplus/file/xlsx.py +3 -2
- etlplus/file/xml.py +9 -3
- etlplus/file/xpt.py +3 -2
- etlplus/file/yaml.py +5 -16
- etlplus/file/zip.py +3 -2
- etlplus/file/zsav.py +3 -2
- etlplus/ops/__init__.py +1 -0
- etlplus/ops/enums.py +173 -0
- etlplus/ops/extract.py +222 -23
- etlplus/ops/load.py +155 -36
- etlplus/ops/run.py +92 -107
- etlplus/ops/transform.py +48 -29
- etlplus/ops/types.py +147 -0
- etlplus/ops/utils.py +11 -40
- etlplus/ops/validate.py +16 -16
- etlplus/types.py +6 -102
- etlplus/utils.py +163 -29
- etlplus/workflow/README.md +0 -24
- etlplus/workflow/__init__.py +2 -15
- etlplus/workflow/dag.py +23 -1
- etlplus/workflow/jobs.py +83 -39
- etlplus/workflow/profile.py +4 -2
- {etlplus-0.15.0.dist-info → etlplus-0.16.6.dist-info}/METADATA +4 -4
- etlplus-0.16.6.dist-info/RECORD +143 -0
- {etlplus-0.15.0.dist-info → etlplus-0.16.6.dist-info}/WHEEL +1 -1
- etlplus/config/README.md +0 -50
- etlplus/config/__init__.py +0 -33
- etlplus/config/types.py +0 -140
- etlplus/dag.py +0 -103
- etlplus/workflow/connector.py +0 -373
- etlplus/workflow/types.py +0 -115
- etlplus/workflow/utils.py +0 -120
- etlplus-0.15.0.dist-info/RECORD +0 -139
- {etlplus-0.15.0.dist-info → etlplus-0.16.6.dist-info}/entry_points.txt +0 -0
- {etlplus-0.15.0.dist-info → etlplus-0.16.6.dist-info}/licenses/LICENSE +0 -0
- {etlplus-0.15.0.dist-info → etlplus-0.16.6.dist-info}/top_level.txt +0 -0
etlplus/ops/run.py
CHANGED

```diff
@@ -6,31 +6,23 @@ A module for running ETL jobs defined in YAML configurations.
 
 from __future__ import annotations
 
-from collections.abc import Mapping
 from typing import Any
 from typing import Final
 from typing import cast
-from urllib.parse import urlsplit
-from urllib.parse import urlunsplit
 
-from ..api import EndpointClient  # noqa: F401 (re-exported for tests)
 from ..api import HttpMethod
-from ..api import PaginationConfigMap
-from ..api import RequestOptions
-from ..api import compose_api_request_env
-from ..api import compose_api_target_env
-from ..api import paginate_with_client
-from ..enums import DataConnectorType
+from ..config import Config
+from ..connector import DataConnectorType
 from ..file import FileFormat
+from ..ops.types import PipelineConfig
 from ..types import JSONData
 from ..types import JSONDict
-from ..types import PipelineConfig
 from ..types import StrPath
-from ..types import Timeout
 from ..utils import print_json
-from ..workflow import load_pipeline_config
 from .extract import extract
+from .extract import extract_from_api_source
 from .load import load
+from .load import load_to_api_target
 from .transform import transform
 from .utils import maybe_validate
 from .validate import validate
@@ -54,6 +46,75 @@ DEFAULT_CONFIG_PATH: Final[str] = 'in/pipeline.yml'
 # SECTION: INTERNAL FUNCTIONS =============================================== #
 
 
+def _index_connectors(
+    connectors: list[Any],
+    *,
+    label: str,
+) -> dict[str, Any]:
+    """
+    Index connectors by name with a helpful error on duplicates.
+
+    Parameters
+    ----------
+    connectors : list[Any]
+        Connector objects to index.
+    label : str
+        Label used in error messages (e.g., ``"source"``).
+
+    Returns
+    -------
+    dict[str, Any]
+        Mapping of connector names to connector objects.
+
+    Raises
+    ------
+    ValueError
+        If duplicate connector names are found.
+    """
+    indexed: dict[str, Any] = {}
+    for connector in connectors:
+        name = getattr(connector, 'name', None)
+        if not isinstance(name, str) or not name:
+            continue
+        if name in indexed:
+            raise ValueError(f'Duplicate {label} connector name: {name}')
+        indexed[name] = connector
+    return indexed
+
+
+def _require_named_connector(
+    connectors: dict[str, Any],
+    name: str,
+    *,
+    label: str,
+) -> Any:
+    """
+    Return a connector by name or raise a helpful error.
+
+    Parameters
+    ----------
+    connectors : dict[str, Any]
+        Mapping of connector names to connector objects.
+    name : str
+        Connector name to retrieve.
+    label : str
+        Label used in error messages (e.g., ``"source"``).
+
+    Returns
+    -------
+    Any
+        Connector object.
+
+    Raises
+    ------
+    ValueError
+        If the connector name is not found.
+    """
+    if name not in connectors:
+        raise ValueError(f'Unknown {label}: {name}')
+    return connectors[name]
+
+
 def _resolve_validation_config(
     job_obj: Any,
     cfg: Any,
@@ -94,7 +155,7 @@ def run(
     Run a pipeline job defined in a YAML configuration.
 
     By default it reads the configuration from ``in/pipeline.yml``, but callers
-    can provide an explicit
+    can provide an explicit *config_path* to override this.
 
     Parameters
     ----------
@@ -115,23 +176,25 @@ def run(
         If the job is not found or if there are configuration issues.
     """
     cfg_path = config_path or DEFAULT_CONFIG_PATH
-    cfg = load_pipeline_config(cfg_path)
+    cfg = Config.from_yaml(cfg_path, substitute=True)
 
     # Lookup job by name
     if not (job_obj := next((j for j in cfg.jobs if j.name == job), None)):
         raise ValueError(f'Job not found: {job}')
 
     # Index sources/targets by name
-    sources_by_name =
-    targets_by_name =
+    sources_by_name = _index_connectors(cfg.sources, label='source')
+    targets_by_name = _index_connectors(cfg.targets, label='target')
 
     # Extract.
     if not job_obj.extract:
         raise ValueError('Job missing "extract" section')
     source_name = job_obj.extract.source
-
-
-
+    source_obj = _require_named_connector(
+        sources_by_name,
+        source_name,
+        label='source',
+    )
     ex_opts: dict[str, Any] = job_obj.extract.options or {}
 
     data: Any
@@ -151,68 +214,7 @@ def run(
             conn = getattr(source_obj, 'connection_string', '')
             data = extract('database', conn)
         case DataConnectorType.API:
-
-            if (
-                env.get('use_endpoints')
-                and env.get('base_url')
-                and env.get('endpoints_map')
-                and env.get('endpoint_key')
-            ):
-                # Construct client using module-level EndpointClient so tests
-                # can monkeypatch this class on etlplus.ops.run.
-                ClientClass = EndpointClient  # noqa: N806
-                client = ClientClass(
-                    base_url=cast(str, env.get('base_url')),
-                    base_path=cast(str | None, env.get('base_path')),
-                    endpoints=cast(
-                        dict[str, str],
-                        env.get('endpoints_map', {}),
-                    ),
-                    retry=env.get('retry'),
-                    retry_network_errors=bool(
-                        env.get('retry_network_errors', False),
-                    ),
-                    session=env.get('session'),
-                )
-                data = paginate_with_client(
-                    client,
-                    cast(str, env.get('endpoint_key')),
-                    env.get('params'),
-                    env.get('headers'),
-                    env.get('timeout'),
-                    env.get('pagination'),
-                    cast(float | None, env.get('sleep_seconds')),
-                )
-            else:
-                url = env.get('url')
-                if not url:
-                    raise ValueError('API source missing URL')
-                parts = urlsplit(cast(str, url))
-                base = urlunsplit((parts.scheme, parts.netloc, '', '', ''))
-                ClientClass = EndpointClient  # noqa: N806
-                client = ClientClass(
-                    base_url=base,
-                    base_path=None,
-                    endpoints={},
-                    retry=env.get('retry'),
-                    retry_network_errors=bool(
-                        env.get('retry_network_errors', False),
-                    ),
-                    session=env.get('session'),
-                )
-
-                request_options = RequestOptions(
-                    params=cast(Mapping[str, Any] | None, env.get('params')),
-                    headers=cast(Mapping[str, str] | None, env.get('headers')),
-                    timeout=cast(Timeout | None, env.get('timeout')),
-                )
-
-                data = client.paginate_url(
-                    cast(str, url),
-                    cast(PaginationConfigMap | None, env.get('pagination')),
-                    request=request_options,
-                    sleep_seconds=cast(float, env.get('sleep_seconds', 0.0)),
-                )
+            data = extract_from_api_source(cfg, source_obj, ex_opts)
         case _:
             # :meth:`coerce` already raises for invalid connector types, but
             # keep explicit guard for defensive programming.
@@ -256,9 +258,11 @@ def run(
     if not job_obj.load:
         raise ValueError('Job missing "load" section')
     target_name = job_obj.load.target
-
-
-
+    target_obj = _require_named_connector(
+        targets_by_name,
+        target_name,
+        label='target',
+    )
     overrides = job_obj.load.overrides or {}
 
     ttype_raw = getattr(target_obj, 'type', None)
@@ -274,26 +278,7 @@ def run(
                 raise ValueError('File target missing "path"')
             result = load(data, 'file', path, file_format=fmt)
         case DataConnectorType.API:
-
-            url_t = env_t.get('url')
-            if not url_t:
-                raise ValueError('API target missing "url"')
-            kwargs_t: dict[str, Any] = {}
-            headers = env_t.get('headers')
-            if headers:
-                kwargs_t['headers'] = cast(dict[str, str], headers)
-            if env_t.get('timeout') is not None:
-                kwargs_t['timeout'] = env_t.get('timeout')
-            session = env_t.get('session')
-            if session is not None:
-                kwargs_t['session'] = session
-            result = load(
-                data,
-                'api',
-                cast(str, url_t),
-                method=cast(str | Any, env_t.get('method') or 'post'),
-                **kwargs_t,
-            )
+            result = load_to_api_target(cfg, target_obj, overrides, data)
         case DataConnectorType.DATABASE:
             conn = overrides.get('connection_string') or getattr(
                 target_obj,
@@ -328,11 +313,11 @@ def run_pipeline(
     Parameters
     ----------
     source_type : DataConnectorType | str | None, optional
-        Connector type for extraction. When ``None``,
+        Connector type for extraction. When ``None``, *source* is assumed
        to be pre-loaded data and extraction is skipped.
     source : StrPath | JSONData | None, optional
         Data source for extraction or the pre-loaded payload when
-
+        *source_type* is ``None``.
     operations : PipelineConfig | None, optional
         Transform configuration passed to :func:`etlplus.ops.transform`.
     target_type : DataConnectorType | str | None, optional
```
etlplus/ops/transform.py
CHANGED

```diff
@@ -44,28 +44,28 @@ from collections.abc import Sequence
 from typing import Any
 from typing import cast
 
-from ..enums import AggregateName
-from ..enums import OperatorName
-from ..enums import PipelineStep
-from ..types import AggregateFunc
-from ..types import AggregateSpec
-from ..types import FieldName
-from ..types import Fields
-from ..types import FilterSpec
+from ..ops.types import PipelineConfig
 from ..types import JSONData
 from ..types import JSONDict
 from ..types import JSONList
-from ..types import MapSpec
-from ..types import OperatorFunc
-from ..types import PipelineConfig
-from ..types import PipelineStepName
-from ..types import SortKey
-from ..types import StepApplier
-from ..types import StepOrSteps
-from ..types import StepSpec
 from ..types import StrPath
 from ..utils import to_number
+from .enums import AggregateName
+from .enums import OperatorName
+from .enums import PipelineStep
 from .load import load_data
+from .types import AggregateFunc
+from .types import AggregateSpec
+from .types import FieldName
+from .types import Fields
+from .types import FilterSpec
+from .types import MapSpec
+from .types import OperatorFunc
+from .types import PipelineStepName
+from .types import SortKey
+from .types import StepApplier
+from .types import StepOrSteps
+from .types import StepSpec
 
 # SECTION: EXPORTS ========================================================== #
 
@@ -110,7 +110,7 @@ def _agg_count(
     present: int,
 ) -> int:
     """
-    Return the provided presence count
+    Return the provided presence count *present*.
 
     Parameters
     ----------
@@ -120,7 +120,7 @@ def _agg_count(
     Returns
     -------
     int
-        The provided presence count
+        The provided presence count *present*.
     """
     return present
 
@@ -206,15 +206,12 @@ def _normalize_specs(
     """
     if config is None:
         return []
-    if isinstance(config, Sequence) and not isinstance(
-        config,
-        (str, bytes, bytearray),
-    ):
+    if _is_sequence_not_text(config):
         # Already a sequence of step specs; normalize to a list.
-        return list(config)
+        return list(cast(Sequence[StepSpec], config))
 
     # Single spec
-    return [config]
+    return [cast(StepSpec, config)]
 
 
 def _normalize_operation_keys(ops: Mapping[Any, Any]) -> dict[str, Any]:
@@ -702,7 +699,31 @@ def _apply_sort_step(
 # -- Helpers -- #
 
 
-def _is_plain_fields_list(obj: Any) -> bool:
+def _is_sequence_not_text(
+    obj: Any,
+) -> bool:
+    """
+    Return ``True`` for non-text sequences.
+
+    Parameters
+    ----------
+    obj : Any
+        The object to check.
+
+    Returns
+    -------
+    bool
+        ``True`` when *obj* is a non-text sequence.
+    """
+    return isinstance(obj, Sequence) and not isinstance(
+        obj,
+        (str, bytes, bytearray),
+    )
+
+
+def _is_plain_fields_list(
+    obj: Any,
+) -> bool:
     """
     Return True if obj is a non-text sequence of non-mapping items.
 
@@ -719,10 +740,8 @@ def _is_plain_fields_list(obj: Any) -> bool:
         True if obj is a non-text sequence of non-mapping items, False
         otherwise.
     """
-    return (
-        isinstance(obj, Sequence)
-        and not isinstance(obj, (str, bytes, bytearray))
-        and not any(isinstance(x, Mapping) for x in obj)
+    return _is_sequence_not_text(obj) and not any(
+        isinstance(x, Mapping) for x in obj
     )
 
 
```
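
The new `_is_sequence_not_text` helper deduplicates the text-vs-sequence check that `_normalize_specs` and `_is_plain_fields_list` previously spelled out inline. A quick illustration of its semantics; the helper is private to `etlplus.ops.transform`, so this snippet inlines its body for demonstration:

```python
from collections.abc import Sequence

def _is_sequence_not_text(obj) -> bool:
    # Body mirrors the helper added in this release.
    return isinstance(obj, Sequence) and not isinstance(
        obj,
        (str, bytes, bytearray),
    )

# Lists and tuples of step specs count as sequences of specs...
assert _is_sequence_not_text([{'field': 'x', 'op': 'eq', 'value': 1}])
assert _is_sequence_not_text(('a', 'b'))
# ...while text types (which are also Sequence) and mappings do not.
assert not _is_sequence_not_text('field')
assert not _is_sequence_not_text(b'bytes')
assert not _is_sequence_not_text({'field': 'x'})  # a single spec, not a list
```
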
etlplus/ops/types.py
ADDED

```diff
@@ -0,0 +1,147 @@
+"""
+:mod:`etlplus.ops.types` module.
+
+Shared type aliases leveraged across :mod:`etlplus.ops` modules.
+
+Notes
+-----
+- Centralizes ops-focused aliases (functions, specs, and pipeline helpers).
+- Relies on Python 3.13 ``type`` statements for readability and IDE support.
+
+Examples
+--------
+>>> from etlplus.ops.types import AggregateFunc, OperatorFunc
+>>> def total(xs: list[float], _: int) -> float:
+...     return sum(xs)
+>>> agg: AggregateFunc = total
+>>> op: OperatorFunc = lambda a, b: a == b
+"""
+
+from __future__ import annotations
+
+from collections.abc import Callable
+from collections.abc import Mapping
+from collections.abc import Sequence
+from typing import Any
+from typing import Literal
+
+from ..types import JSONList
+from ..types import StrAnyMap
+from ..types import StrSeqMap
+from ..types import StrStrMap
+
+# SECTION: EXPORTS ========================================================== #
+
+
+__all__ = [
+    # Type Aliases (Functions)
+    'AggregateFunc',
+    'OperatorFunc',
+    # Type Aliases (Records & Fields)
+    'FieldName',
+    'Fields',
+    # Type Aliases (Transform Specs)
+    'AggregateSpec',
+    'FilterSpec',
+    'MapSpec',
+    'SelectSpec',
+    'SortSpec',
+    # Type Aliases (Pipelines)
+    'StepOrSteps',
+    'StepSeq',
+    'StepSpec',
+    'PipelineConfig',
+    'PipelineStepName',
+    # Type Aliases (Helpers)
+    'StepApplier',
+    'SortKey',
+]
+
+
+# SECTION: TYPE ALIASES ===================================================== #
+
+
+# -- Functions -- #
+
+
+# TODO: Consider redefining to use `functools.reduce` signature.
+# TODO: Consider adding `**kwargs` to support richer aggregation functions.
+# TODO: Consider constraining first argument to `Sequence[float]`.
+# TODO: Consider constraining return type to `float | int | None`.
+# Callable reducing numeric collections into a summary value.
+type AggregateFunc = Callable[[list[float], int], Any]
+
+# Binary predicate consumed by filter operations.
+type OperatorFunc = Callable[[Any, Any], bool]
+
+# -- Records & Fields -- #
+
+# Individual field identifier referenced inside specs.
+type FieldName = str
+
+# Ordered list of :data:`FieldName` entries preserving projection order.
+type Fields = list[FieldName]
+
+# -- Transform Specs -- #
+
+# Filtering spec expecting ``field``, ``op``, and ``value`` keys.
+type FilterSpec = StrAnyMap
+
+# Field renaming instructions mapping old keys to new ones.
+type MapSpec = StrStrMap
+
+# Projection spec as a field list or mapping with metadata.
+#
+# Examples
+# --------
+# >>> from etlplus.ops.types import SelectSpec
+# >>> spec1: SelectSpec = ['a','b']
+# >>> spec2: SelectSpec = {'fields': [...]}
+type SelectSpec = Fields | StrSeqMap
+
+# Sort directive expressed as a field string or mapping with flags.
+#
+# Examples
+# --------
+# >>> from etlplus.ops.types import SortSpec
+# >>> spec1: SortSpec = 'field'
+# >>> spec2: SortSpec = {'field': 'x', 'reverse': True}
type SortSpec = str | StrAnyMap
+
+# Aggregate instruction covering ``field``, ``func``, and optional alias.
+#
+# Supported functions: ``avg``, ``count``, ``max``, ``min``, and ``sum``.
+# Examples
+# --------
+# >>> from etlplus.ops.types import AggregateSpec
+# >>> spec: AggregateSpec = \
+# ...     {'field': 'x', 'func': 'sum' | 'avg' | ..., 'alias'?: '...'}
+type AggregateSpec = StrAnyMap
+
+# -- Pipelines-- #
+
+# Unified pipeline step spec consumed by :mod:`etlplus.ops.transform`.
+type StepSpec = AggregateSpec | FilterSpec | MapSpec | SelectSpec | SortSpec
+
+# Collections of steps
+
+# Ordered collection of :data:`StepSpec` entries.
+type StepSeq = Sequence[StepSpec]
+
+# Accepts either a single :data:`StepSpec` or a sequence of them.
+type StepOrSteps = StepSpec | StepSeq
+
+# Canonical literal names for supported transform stages.
+type PipelineStepName = Literal['aggregate', 'filter', 'map', 'select', 'sort']
+
+# Mapping from step name to its associated specification payload.
+# TODO: Consider replacing with etlplus.workflow.types.PipelineConfig.
+type PipelineConfig = Mapping[PipelineStepName, StepOrSteps]
+
+# -- Helpers -- #
+
+# Callable that applies step configuration to a batch of records.
+type StepApplier = Callable[[JSONList, Any], JSONList]
+
+# Tuple combining stable sort index and computed sort value.
+type SortKey = tuple[int, Any]
```
etlplus/ops/utils.py
CHANGED

```diff
@@ -7,13 +7,11 @@ The helpers defined here embrace a "high cohesion, low coupling" design by
 isolating normalization, configuration, and logging responsibilities. The
 resulting surface keeps ``maybe_validate`` focused on orchestration while
 offloading ancillary concerns to composable helpers.
-
 """
 
 from __future__ import annotations
 
 from collections.abc import Callable
-from collections.abc import Mapping
 from dataclasses import dataclass
 from types import MappingProxyType
 from typing import Any
@@ -23,12 +21,12 @@ from typing import TypedDict
 from typing import cast
 
 from ..types import StrAnyMap
-from ..utils import normalized_str
+from ..utils import normalize_choice
 
 # SECTION: TYPED DICTIONARIES =============================================== #
 
 
-class
+class ValidationResultDict(TypedDict, total=False):
     """Shape returned by ``validate_fn`` callables."""
 
     valid: bool
@@ -46,7 +44,7 @@ type ValidationPhase = Literal['before_transform', 'after_transform']
 type ValidationWindow = Literal['before_transform', 'after_transform', 'both']
 type ValidationSeverity = Literal['warn', 'error']
 
-type ValidateFn = Callable[[Any, Ruleset],
+type ValidateFn = Callable[[Any, Ruleset], ValidationResultDict]
 type PrintFn = Callable[[Any], None]
 
 
@@ -200,21 +198,21 @@ def maybe_validate(
         Failure severity (``"warn"`` or ``"error"``).
     validate_fn : ValidateFn
         Engine that performs validation and returns a
-        :class:`
+        :class:`ValidationResultDict` instance.
     print_json_fn : PrintFn
         Structured logger invoked when validation fails.
 
     Returns
     -------
     Any
-
+        *payload* when validation is skipped or when severity is ``"warn"``
         and the validation fails. Returns the validator ``data`` payload when
         validation succeeds.
 
     Raises
     ------
     ValueError
-        Raised when validation fails and
+        Raised when validation fails and *severity* is ``"error"``.
 
     Examples
     --------
@@ -272,7 +270,7 @@ def _log_failure(
     phase: ValidationPhase,
     window: ValidationWindow,
     ruleset_name: str | None,
-    result:
+    result: ValidationResultDict,
 ) -> None:
     """
     Emit a structured message describing the failed validation.
@@ -287,7 +285,7 @@ def _log_failure(
         Configured validation window.
     ruleset_name : str | None
         Name of the validation ruleset.
-    result :
+    result : ValidationResultDict
         Result of the failed validation.
     """
     printer(
@@ -320,7 +318,7 @@ def _normalize_phase(
     """
     return cast(
         ValidationPhase,
-        _normalize_choice(
+        normalize_choice(
            value,
            mapping=_PHASE_CHOICES,
            default='before_transform',
@@ -346,7 +344,7 @@ def _normalize_severity(
     """
     return cast(
         ValidationSeverity,
-        _normalize_choice(
+        normalize_choice(
            value,
            mapping=_SEVERITY_CHOICES,
            default='error',
@@ -372,7 +370,7 @@ def _normalize_window(
     """
     return cast(
         ValidationWindow,
-        _normalize_choice(
+        normalize_choice(
            value,
            mapping=_WINDOW_CHOICES,
            default='both',
@@ -380,33 +378,6 @@ def _normalize_window(
     )
 
 
-def _normalize_choice(
-    value: str | None,
-    *,
-    mapping: Mapping[str, str],
-    default: str,
-) -> str:
-    """
-    Normalize a text value against a mapping with a default fallback.
-
-    Parameters
-    ----------
-    value : str | None
-        Input text to normalize.
-    mapping : Mapping[str, str]
-        Mapping of accepted values to normalized outputs.
-    default : str
-        Default to return when input is missing or unrecognized.
-
-    Returns
-    -------
-    str
-        Normalized value.
-    """
-    normalized = normalized_str(value)
-    return mapping.get(normalized, default)
-
-
 def _rule_name(
     rules: Ruleset,
 ) -> str | None:
```