PyPI - alpha-engine-lib - Version diff - 0.35.1 (tar.gz) → 0.36.0 (tar.gz) - Mend

alpha-engine-lib 0.35.1 (tar.gz) → 0.36.0 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (75)

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: alpha-engine-lib
-Version: 0.35.1
+Version: 0.36.0
 Summary: Shared utilities for the Alpha Engine modules: preflight, structured logging with secret-redaction, ArcticDB universe access, NYSE-calendar dates + freshness predicates, decision capture, cost telemetry, RAG, agent output schemas, SSM-backed secrets, Telegram alerts + SNS fan-out, EC2 spot-launch resilience, SSM log-capture chokepoint, SSM send-command + poll chokepoint, and Step-Functions execution-state projection. Full surface documented in README.
 Author: Brian McMahon
 License: Proprietary

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "alpha-engine-lib"
-version = "0.35.1"
+version = "0.36.0"
 description = "Shared utilities for the Alpha Engine modules: preflight, structured logging with secret-redaction, ArcticDB universe access, NYSE-calendar dates + freshness predicates, decision capture, cost telemetry, RAG, agent output schemas, SSM-backed secrets, Telegram alerts + SNS fan-out, EC2 spot-launch resilience, SSM log-capture chokepoint, SSM send-command + poll chokepoint, and Step-Functions execution-state projection. Full surface documented in README."
 readme = "README.md"
 # EC2 still runs Python 3.9 on the always-on micro instance (boto3 drops

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/src/alpha_engine_lib/__init__.py RENAMED Viewed

@@ -1,3 +1,3 @@
 """alpha-engine-lib — shared utilities for Alpha Engine modules."""
-__version__ = "0.35.1"
+__version__ = "0.36.0"

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/src/alpha_engine_lib/pipeline_status/__init__.py RENAMED Viewed

@@ -31,6 +31,7 @@ on first build, not after the second consumer arrives.
 from __future__ import annotations
 from .read import (
+    PipelineExecutionSummary,
     PipelineRun,
     RunStatus,
     SFNAccessDenied,
@@ -38,6 +39,7 @@ from .read import (
     SFNThrottled,
     TaskRow,
     TaskStatus,
+    list_recent_pipeline_runs,
     read_pipeline_state,
 )
 from .registry import (
@@ -54,6 +56,7 @@ __all__ = [
     "ArchivePageRef",
     "ArtifactReason",
     "PIPELINE_LABELS",
+    "PipelineExecutionSummary",
     "PipelineRun",
     "RunStatus",
     "SFNAccessDenied",
@@ -66,5 +69,6 @@ __all__ = [
     "WAIT_GROUPING",
     "format_failure_message",
     "format_success_message",
+    "list_recent_pipeline_runs",
     "read_pipeline_state",
 ]

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/src/alpha_engine_lib/pipeline_status/read.py RENAMED Viewed

@@ -31,6 +31,7 @@ red banner always names a specific cause.
 from __future__ import annotations
+import json
 import logging
 from dataclasses import dataclass
 from datetime import datetime, timezone
@@ -194,6 +195,39 @@ class PipelineRun(BaseModel):
     tasks: list[TaskRow] = Field(default_factory=list)
     failing_state: Optional[str] = None  # populated only when status == FAILED
     failure_cause: Optional[str] = None  # populated only when status == FAILED
+    # The ``pipeline_role`` carried on this execution's input JSON
+    # (e.g. "weekly" / "daily" / "eod" / "smoke" / "recovery" /
+    # "shell-run" / "backfill" / "operator-replay"). None when the input
+    # JSON doesn't carry the field — typical of pre-Option-D executions
+    # and ad-hoc operator launches that haven't adopted the convention.
+    # The dashboard exposes this in the section header so the operator
+    # always knows whether they're looking at the canonical cadence run
+    # or a smoke / recovery overlay.
+    pipeline_role: Optional[str] = None
+class PipelineExecutionSummary(BaseModel):
+    """Lightweight per-execution summary for the operator dropdown.
+    Returned by :func:`list_recent_pipeline_runs`. Does NOT carry the
+    full per-state task table (that lives on :class:`PipelineRun`) — the
+    dropdown's job is to let the operator pick one execution to inspect
+    in detail, at which point :func:`read_pipeline_state` returns the
+    full run for the chosen ARN.
+    ``pipeline_role`` is parsed from the execution's input JSON via the
+    DescribeExecution call; None when the input lacks the field.
+    """
+    model_config = _STRICT_CONFIG
+    execution_arn: str
+    name: str
+    status: RunStatus
+    start_utc: datetime
+    end_utc: Optional[datetime] = None
+    duration_sec: Optional[float] = None
+    pipeline_role: Optional[str] = None
 # ── Helpers ───────────────────────────────────────────────────────────────
@@ -418,80 +452,79 @@ def _failing_state_from_history(history_events: list[dict]) -> Optional[str]:
     return None
-# ── Public entry point ────────────────────────────────────────────────────
+# ── Role-filter helpers (Option-D execution-picker substrate) ─────────────
-def read_pipeline_state(
-    state_machine_arn: str,
-    *,
-    client: Optional["SFNClient"] = None,
-) -> PipelineRun:
-    """Project the most-recent execution of ``state_machine_arn`` onto a
-    typed :class:`PipelineRun`.
+# Bounds the ListExecutions walk when a role filter is set — we page
+# backwards through history looking for the first execution whose
+# input.pipeline_role matches the filter. 50 is enough to span ~6 months
+# of weekly cadence even if every intervening execution is a smoke /
+# recovery overlay; raise it only if smoke-density is genuinely that high.
+_DEFAULT_ROLE_SEARCH_LIMIT = 50
-    Calls (in order):
-    1. ``states:ListExecutions(stateMachineArn=..., maxResults=1)`` — finds
-       the latest execution arn. If the SF has zero executions, raises
-       :class:`SFNNoExecutions`.
-    2. ``states:DescribeExecution(executionArn=...)`` — top-level status +
-       start/stop + failure cause.
-    3. ``states:GetExecutionHistory(executionArn=..., maxResults=1000)`` —
-       per-state events for the Task row table.
-    Parameters
-    ----------
-    state_machine_arn:
-        Full SF ARN, e.g. ``arn:aws:states:us-east-1:711398986525:stateMachine:alpha-engine-saturday-pipeline``.
-    client:
-        Optional boto3 ``stepfunctions`` client. Tests pass a mock here;
-        production passes None and gets a fresh client per call (cheap;
-        boto3 caches under the hood).
+# ListExecutions page size — boto3 caps at 1000 but we keep pages small
+# so a typical "find the most-recent weekly within the last 50" walk only
+# hits the API once or twice.
+_LIST_EXECUTIONS_PAGE_SIZE = 25
-    Returns
-    -------
-    PipelineRun
-        Fully populated except when ``status == NOT_RUN`` (only
-        ``state_machine_arn`` + ``pretty_label`` + ``status`` set).
-    Raises
-    ------
-    SFNAccessDenied
-        IAM denial on any of the three required actions.
-    SFNThrottled
-        Rate-limit on any of the three.
-    SFNNoExecutions
-        SF exists but has zero executions ever.
-    PipelineStatusError
-        Any other unexpected error path — the caller renders a red banner.
-    """
-    if client is None:  # pragma: no cover — production path
-        import boto3
+def _extract_pipeline_role(describe_resp: dict) -> Optional[str]:
+    """Parse ``input.pipeline_role`` from a DescribeExecution response.
-        client = boto3.client("stepfunctions", region_name=_region_from_arn(state_machine_arn))
+    DescribeExecution returns ``input`` as a JSON-encoded string. The
+    Option-D convention is that all cron-triggered executions carry a
+    ``pipeline_role`` field at top level (``{"pipeline_role": "weekly",
+    ...}``) and ad-hoc operator launches set it explicitly (smoke /
+    recovery / operator-replay / etc).
-    label = _label_for_arn(state_machine_arn)
+    Returns None on:
+    - missing ``input`` field
+    - malformed JSON (logged at WARN; the page renders "role: unknown")
+    - JSON parses but ``pipeline_role`` is absent
-    # 1. ListExecutions
+    Permissive on parse failures (warn + return None rather than raise)
+    because input-shape is operator-controlled and we'd rather show the
+    execution with role=None than blackhole the whole page on a malformed
+    input JSON. Per ``feedback_no_silent_fails`` the WARN log is the
+    recording surface.
+    """
+    raw_input = describe_resp.get("input")
+    if not raw_input or not isinstance(raw_input, str):
+        return None
     try:
-        list_resp = client.list_executions(
-            stateMachineArn=state_machine_arn,
-            maxResults=1,
+        parsed = json.loads(raw_input)
+    except (ValueError, TypeError) as exc:
+        logger.warning(
+            "Could not parse SF execution input JSON; pipeline_role=None: %s", exc
         )
-    except Exception as exc:  # noqa: BLE001 — narrow + re-raise
-        _raise_for_boto_error(exc, "ListExecutions")
+        return None
+    if not isinstance(parsed, dict):
+        return None
+    role = parsed.get("pipeline_role")
+    return role if isinstance(role, str) and role else None
-    executions = list_resp.get("executions") or []
-    if not executions:
-        raise SFNNoExecutions(
-            f"State machine {state_machine_arn} has no executions yet."
-        )
-    latest = executions[0]
-    execution_arn = latest.get("executionArn")
-    execution_name = latest.get("name")
+def _build_pipeline_run_from_execution_arn(
+    execution_arn: str,
+    state_machine_arn: str,
+    *,
+    client: "SFNClient",
+) -> PipelineRun:
+    """Project a known execution ARN onto a typed :class:`PipelineRun`.
+    Helper that holds the DescribeExecution + GetExecutionHistory +
+    materialize-tasks pipeline. Callers responsible for the execution
+    name (passed in via the ARN — derived if not supplied separately).
+    Used by :func:`read_pipeline_state` after the role-filter walk picks
+    the target execution, AND directly when an operator clicks a specific
+    execution in the dropdown.
+    """
+    label = _label_for_arn(state_machine_arn)
+    # Derive execution_name from ARN — the ARN tail is
+    # ``execution:<sm-name>:<execution-name>``.
+    execution_name = execution_arn.rsplit(":", 1)[-1] if execution_arn else None
-    # 2. DescribeExecution
     try:
         describe_resp = client.describe_execution(executionArn=execution_arn)
     except Exception as exc:  # noqa: BLE001 — narrow + re-raise
@@ -501,8 +534,6 @@ def read_pipeline_state(
     try:
         run_status = RunStatus(status_str)
     except ValueError:
-        # Unknown status string from boto3 (forward-compatibility) — fail
-        # loud rather than silently mis-render.
         raise PipelineStatusError(
             f"Unknown SF execution status {status_str!r} from boto3 for {execution_arn}"
         )
@@ -516,8 +547,8 @@ def read_pipeline_state(
     failure_cause = (
         _failure_cause_from(describe_resp) if run_status == RunStatus.FAILED else None
     )
+    pipeline_role = _extract_pipeline_role(describe_resp)
-    # 3. GetExecutionHistory
     try:
         history_resp = client.get_execution_history(
             executionArn=execution_arn,
@@ -545,9 +576,288 @@ def read_pipeline_state(
         tasks=tasks,
         failing_state=failing_state,
         failure_cause=failure_cause,
+        pipeline_role=pipeline_role,
+    )
+def _find_execution_matching_role(
+    state_machine_arn: str,
+    role_filter: set[str],
+    *,
+    client: "SFNClient",
+    search_limit: int,
+) -> Optional[tuple[str, Optional[str]]]:
+    """Walk ListExecutions pages until finding an execution whose
+    ``input.pipeline_role`` ∈ ``role_filter``, or until ``search_limit``
+    executions have been inspected.
+    Returns ``(execution_arn, role)`` on hit, ``None`` on exhaustion.
+    The N+1 DescribeExecution calls are the cost of the role filter;
+    typical cron-cadence SFs find a match within the first 1-3 executions
+    so the cost is bounded in practice. Smoke-heavy windows pay more but
+    the ``search_limit`` cap bounds worst case.
+    Caller is responsible for translating None into the right outcome —
+    either SFNNoExecutions (when ListExecutions was empty in the first
+    page) or a "no execution matches filter" fallback signal.
+    """
+    inspected = 0
+    next_token: Optional[str] = None
+    while inspected < search_limit:
+        kwargs: dict[str, Any] = {
+            "stateMachineArn": state_machine_arn,
+            "maxResults": min(_LIST_EXECUTIONS_PAGE_SIZE, search_limit - inspected),
+        }
+        if next_token:
+            kwargs["nextToken"] = next_token
+        try:
+            list_resp = client.list_executions(**kwargs)
+        except Exception as exc:  # noqa: BLE001 — narrow + re-raise
+            _raise_for_boto_error(exc, "ListExecutions")
+        executions = list_resp.get("executions") or []
+        if not executions:
+            return None
+        for ex in executions:
+            inspected += 1
+            execution_arn = ex.get("executionArn")
+            if not execution_arn:
+                continue
+            try:
+                describe_resp = client.describe_execution(executionArn=execution_arn)
+            except Exception as exc:  # noqa: BLE001 — narrow + re-raise
+                _raise_for_boto_error(exc, "DescribeExecution")
+            role = _extract_pipeline_role(describe_resp)
+            if role is not None and role in role_filter:
+                return execution_arn, role
+        next_token = list_resp.get("nextToken")
+        if not next_token:
+            return None
+    return None
+# ── Public entry point ────────────────────────────────────────────────────
+def read_pipeline_state(
+    state_machine_arn: str,
+    *,
+    role_filter: Optional[set[str]] = None,
+    search_limit: int = _DEFAULT_ROLE_SEARCH_LIMIT,
+    execution_arn: Optional[str] = None,
+    client: Optional["SFNClient"] = None,
+) -> PipelineRun:
+    """Project the chosen execution of ``state_machine_arn`` onto a typed
+    :class:`PipelineRun`.
+    Default behavior (no ``role_filter``, no ``execution_arn``) is
+    backwards-compatible: returns the most-recent execution per
+    ``ListExecutions maxResults=1``, same as pre-Option-D.
+    Option-D execution-picker semantics:
+    - When ``execution_arn`` is set, fetches that specific execution
+      directly (bypasses ListExecutions). Used by the dashboard's
+      dropdown "click a row to inspect this execution" path.
+    - When ``role_filter`` is set, walks ListExecutions pages until
+      finding the most-recent execution whose ``input.pipeline_role``
+      is in the filter set. If none match within ``search_limit``
+      executions, raises :class:`SFNNoExecutions` with a message naming
+      the filter — the caller (page 25) renders a banner like "No
+      'weekly' execution in the last 50 runs; click 'View other recent
+      executions' to inspect what's actually been running."
+    Parameters
+    ----------
+    state_machine_arn:
+        Full SF ARN.
+    role_filter:
+        Optional set of ``pipeline_role`` values to filter executions by
+        (e.g. ``{"weekly"}`` for the Saturday-SF cadence run, ``{"daily"}``
+        for the Weekday-SF cadence run). ``None`` = no filter (most-recent
+        regardless of role — current behavior).
+    search_limit:
+        Bounds the role-filter walk. Default 50 — see
+        :data:`_DEFAULT_ROLE_SEARCH_LIMIT`. Ignored when ``role_filter``
+        is None.
+    execution_arn:
+        Optional specific execution ARN to fetch. When set, both
+        ``role_filter`` and ``search_limit`` are ignored.
+    client:
+        Optional boto3 ``stepfunctions`` client. Tests pass a mock here;
+        production passes None.
+    Raises
+    ------
+    SFNAccessDenied
+        IAM denial on any of the three required actions.
+    SFNThrottled
+        Rate-limit on any of the three.
+    SFNNoExecutions
+        SF has zero executions, OR ``role_filter`` is set and no
+        execution within the search window matches.
+    PipelineStatusError
+        Any other unexpected error path.
+    """
+    if client is None:  # pragma: no cover — production path
+        import boto3
+        client = boto3.client("stepfunctions", region_name=_region_from_arn(state_machine_arn))
+    # Path 1: explicit execution_arn — fetch directly.
+    if execution_arn is not None:
+        return _build_pipeline_run_from_execution_arn(
+            execution_arn, state_machine_arn, client=client
+        )
+    # Path 2: role_filter — walk ListExecutions until match.
+    if role_filter:
+        match = _find_execution_matching_role(
+            state_machine_arn, role_filter, client=client, search_limit=search_limit
+        )
+        if match is None:
+            raise SFNNoExecutions(
+                f"No execution with pipeline_role in {sorted(role_filter)!r} "
+                f"found within last {search_limit} executions of {state_machine_arn}."
+            )
+        matched_arn, _matched_role = match
+        return _build_pipeline_run_from_execution_arn(
+            matched_arn, state_machine_arn, client=client
+        )
+    # Path 3 (default): most-recent execution regardless of role —
+    # backwards-compatible with pre-Option-D callers.
+    try:
+        list_resp = client.list_executions(
+            stateMachineArn=state_machine_arn,
+            maxResults=1,
+        )
+    except Exception as exc:  # noqa: BLE001 — narrow + re-raise
+        _raise_for_boto_error(exc, "ListExecutions")
+    executions = list_resp.get("executions") or []
+    if not executions:
+        raise SFNNoExecutions(
+            f"State machine {state_machine_arn} has no executions yet."
+        )
+    latest = executions[0]
+    return _build_pipeline_run_from_execution_arn(
+        latest.get("executionArn"), state_machine_arn, client=client
     )
+def list_recent_pipeline_runs(
+    state_machine_arn: str,
+    *,
+    limit: int = 10,
+    role_filter: Optional[set[str]] = None,
+    client: Optional["SFNClient"] = None,
+) -> list[PipelineExecutionSummary]:
+    """Return lightweight summaries of the most-recent N executions.
+    Backs the page-25 "View other recent executions" disclosure: shows
+    the operator what's been running on this SF, ranked most-recent
+    first, with the ``pipeline_role`` of each so smoke vs. weekly vs.
+    recovery is visible at a glance.
+    Each summary requires one ``DescribeExecution`` call (to extract
+    ``pipeline_role`` from the input JSON) on top of one
+    ``ListExecutions`` call, so this is O(limit) API calls. Default
+    ``limit=10`` puts the dashboard's "show me last N" view at ~11
+    SF API calls per page render — well within the 25-TPS soft limit
+    states:DescribeExecution applies.
+    Parameters
+    ----------
+    state_machine_arn:
+        Full SF ARN.
+    limit:
+        Max number of executions to return. Default 10.
+    role_filter:
+        Optional pre-filter (returns only executions whose
+        ``pipeline_role`` ∈ ``role_filter``). When set, the API call
+        budget grows because we may have to walk past role-mismatched
+        executions; bounded by an internal walk cap of ``limit * 5``.
+    client:
+        Optional boto3 ``stepfunctions`` client.
+    """
+    if client is None:  # pragma: no cover — production path
+        import boto3
+        client = boto3.client("stepfunctions", region_name=_region_from_arn(state_machine_arn))
+    walk_cap = limit if role_filter is None else min(limit * 5, _DEFAULT_ROLE_SEARCH_LIMIT)
+    summaries: list[PipelineExecutionSummary] = []
+    inspected = 0
+    next_token: Optional[str] = None
+    while len(summaries) < limit and inspected < walk_cap:
+        kwargs: dict[str, Any] = {
+            "stateMachineArn": state_machine_arn,
+            "maxResults": min(_LIST_EXECUTIONS_PAGE_SIZE, walk_cap - inspected),
+        }
+        if next_token:
+            kwargs["nextToken"] = next_token
+        try:
+            list_resp = client.list_executions(**kwargs)
+        except Exception as exc:  # noqa: BLE001 — narrow + re-raise
+            _raise_for_boto_error(exc, "ListExecutions")
+        executions = list_resp.get("executions") or []
+        if not executions:
+            break
+        for ex in executions:
+            inspected += 1
+            execution_arn = ex.get("executionArn")
+            if not execution_arn:
+                continue
+            try:
+                describe_resp = client.describe_execution(executionArn=execution_arn)
+            except Exception as exc:  # noqa: BLE001 — narrow + re-raise
+                _raise_for_boto_error(exc, "DescribeExecution")
+            role = _extract_pipeline_role(describe_resp)
+            if role_filter is not None and role not in role_filter:
+                continue
+            status_str = describe_resp.get("status", "RUNNING")
+            try:
+                status = RunStatus(status_str)
+            except ValueError:
+                raise PipelineStatusError(
+                    f"Unknown SF execution status {status_str!r} from boto3 for {execution_arn}"
+                )
+            start_utc = _parse_ts(describe_resp.get("startDate"))
+            end_utc = _parse_ts(describe_resp.get("stopDate"))
+            duration: Optional[float] = None
+            if start_utc is not None and end_utc is not None:
+                duration = (end_utc - start_utc).total_seconds()
+            if start_utc is None:
+                # An execution without a start time is degenerate; skip
+                # rather than fail the whole list.
+                continue
+            summaries.append(
+                PipelineExecutionSummary(
+                    execution_arn=execution_arn,
+                    name=ex.get("name") or execution_arn.rsplit(":", 1)[-1],
+                    status=status,
+                    start_utc=start_utc,
+                    end_utc=end_utc,
+                    duration_sec=duration,
+                    pipeline_role=role,
+                )
+            )
+            if len(summaries) >= limit:
+                break
+        next_token = list_resp.get("nextToken")
+        if not next_token:
+            break
+    return summaries
 def _raise_for_boto_error(exc: Exception, action: str) -> None:
     """Translate a boto3 exception into a typed PipelineStatusError.

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/src/alpha_engine_lib.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: alpha-engine-lib
-Version: 0.35.1
+Version: 0.36.0
 Summary: Shared utilities for the Alpha Engine modules: preflight, structured logging with secret-redaction, ArcticDB universe access, NYSE-calendar dates + freshness predicates, decision capture, cost telemetry, RAG, agent output schemas, SSM-backed secrets, Telegram alerts + SNS fan-out, EC2 spot-launch resilience, SSM log-capture chokepoint, SSM send-command + poll chokepoint, and Step-Functions execution-state projection. Full surface documented in README.
 Author: Brian McMahon
 License: Proprietary

{alpha_engine_lib-0.35.1 → alpha_engine_lib-0.36.0}/tests/test_pipeline_status_read.py RENAMED Viewed

@@ -23,6 +23,7 @@ from unittest.mock import MagicMock
 import pytest
 from alpha_engine_lib.pipeline_status import (
+    PipelineExecutionSummary,
     PipelineRun,
     RunStatus,
     SFNAccessDenied,
@@ -30,10 +31,12 @@ from alpha_engine_lib.pipeline_status import (
     SFNThrottled,
     TaskRow,
     TaskStatus,
+    list_recent_pipeline_runs,
     read_pipeline_state,
 )
 from alpha_engine_lib.pipeline_status.read import (
     PipelineStatusError,
+    _extract_pipeline_role,
     _failure_cause_from,
     _materialize_tasks,
     _parse_ts,
@@ -535,3 +538,248 @@ def test_task_row_archive_round_trips_through_json_for_artifact_reason():
         "round-trip — same regression class as the ArchivePageRef test."
     )
     assert "Terminal success" in round_tripped_task.archive.reason
+# ── pipeline_role extraction (Option-D substrate) ─────────────────────────
+def test_extract_pipeline_role_happy_path():
+    """Standard EventBridge cron payload with pipeline_role set."""
+    describe = {
+        "input": '{"pipeline_role": "weekly", "run_date": "2026-05-30"}',
+    }
+    assert _extract_pipeline_role(describe) == "weekly"
+def test_extract_pipeline_role_missing_field():
+    """Pre-Option-D execution input (no pipeline_role key) returns None."""
+    describe = {"input": '{"run_date": "2026-05-30"}'}
+    assert _extract_pipeline_role(describe) is None
+def test_extract_pipeline_role_missing_input_field():
+    """DescribeExecution may omit the input field entirely on terminal
+    states (rare but possible) — degrade to None, not crash."""
+    assert _extract_pipeline_role({}) is None
+    assert _extract_pipeline_role({"input": None}) is None
+    assert _extract_pipeline_role({"input": ""}) is None
+def test_extract_pipeline_role_malformed_json():
+    """Malformed input JSON — WARN-and-return-None per the lib's
+    permissive parse policy. Recording surface is the WARN log."""
+    describe = {"input": "{not valid json"}
+    assert _extract_pipeline_role(describe) is None
+def test_extract_pipeline_role_input_is_array_not_object():
+    """SF allows array-shaped input; defensively handle it (return None
+    rather than raise) — pipeline_role is a top-level field on object
+    inputs only."""
+    describe = {"input": '["weekly"]'}
+    assert _extract_pipeline_role(describe) is None
+def test_extract_pipeline_role_empty_string_returns_none():
+    """An explicit empty string in pipeline_role is treated as 'not set'
+    so the dashboard renders 'role: unknown' instead of '': empty cells
+    are operator-noise."""
+    describe = {"input": '{"pipeline_role": ""}'}
+    assert _extract_pipeline_role(describe) is None
+# ── Role filter + execution_arn paths in read_pipeline_state ──────────────
+def _make_describe_response(*, status="SUCCEEDED", role: Optional[str] = None) -> dict:
+    """Build a DescribeExecution response carrying an optional
+    pipeline_role on the input JSON. Default times preserved."""
+    body: dict = {
+        "status": status,
+        "startDate": datetime(2026, 5, 24, 9, 0, tzinfo=timezone.utc),
+        "stopDate": datetime(2026, 5, 24, 11, 30, tzinfo=timezone.utc),
+    }
+    if role is not None:
+        body["input"] = f'{{"pipeline_role": "{role}", "run_date": "2026-05-24"}}'
+    else:
+        body["input"] = '{"run_date": "2026-05-24"}'
+    return body
+def _make_multi_execution_mock(
+    *,
+    executions: list[dict],
+    describe_by_arn: dict[str, dict],
+) -> MagicMock:
+    """Build an SFN mock where ListExecutions returns a list and
+    DescribeExecution dispatches by executionArn to the right response."""
+    client = MagicMock()
+    client.list_executions.return_value = {"executions": executions}
+    def _dispatch(executionArn: str, **_kwargs):
+        return describe_by_arn[executionArn]
+    client.describe_execution.side_effect = _dispatch
+    client.get_execution_history.return_value = {"events": []}
+    return client
+def test_read_pipeline_state_default_returns_most_recent_unchanged():
+    """No role_filter, no execution_arn — same as pre-Option-D: most-recent
+    execution per ListExecutions maxResults=1."""
+    client = _make_sfn_mock()
+    run = read_pipeline_state(SATURDAY_ARN, client=client)
+    assert run.status == RunStatus.SUCCEEDED
+    # ListExecutions was called with maxResults=1 (default path).
+    client.list_executions.assert_called_once()
+    call_kwargs = client.list_executions.call_args.kwargs
+    assert call_kwargs.get("maxResults") == 1
+def test_read_pipeline_state_with_role_filter_finds_first_match():
+    """Three executions in history: smoke / weekly / smoke. Filter to
+    'weekly' — picks the middle one."""
+    smoke1_arn = EXECUTION_ARN + "-smoke1"
+    weekly_arn = EXECUTION_ARN + "-weekly"
+    smoke2_arn = EXECUTION_ARN + "-smoke2"
+    client = _make_multi_execution_mock(
+        executions=[
+            {"executionArn": smoke1_arn, "name": "smoke-l1995"},
+            {"executionArn": weekly_arn, "name": "weekly-20260524T090000"},
+            {"executionArn": smoke2_arn, "name": "smoke-debug"},
+        ],
+        describe_by_arn={
+            smoke1_arn: _make_describe_response(role="smoke"),
+            weekly_arn: _make_describe_response(role="weekly"),
+            smoke2_arn: _make_describe_response(role="smoke"),
+        },
+    )
+    run = read_pipeline_state(SATURDAY_ARN, role_filter={"weekly"}, client=client)
+    assert run.execution_arn == weekly_arn
+    assert run.pipeline_role == "weekly"
+def test_read_pipeline_state_with_role_filter_no_match_raises():
+    """Three smoke executions, filter to 'weekly' — raises
+    SFNNoExecutions naming the filter so the caller can render an
+    operator-actionable banner."""
+    client = _make_multi_execution_mock(
+        executions=[
+            {"executionArn": EXECUTION_ARN + f"-{i}", "name": f"smoke-{i}"}
+            for i in range(3)
+        ],
+        describe_by_arn={
+            EXECUTION_ARN + f"-{i}": _make_describe_response(role="smoke")
+            for i in range(3)
+        },
+    )
+    with pytest.raises(SFNNoExecutions) as exc_info:
+        read_pipeline_state(
+            SATURDAY_ARN, role_filter={"weekly"}, search_limit=10, client=client
+        )
+    assert "weekly" in str(exc_info.value)
+def test_read_pipeline_state_with_role_filter_treats_missing_role_as_no_match():
+    """Pre-Option-D executions lack pipeline_role; role_filter must NOT
+    match those (otherwise the filter is no filter at all). The walk
+    keeps going until an explicitly-tagged execution turns up."""
+    untagged_arn = EXECUTION_ARN + "-untagged"
+    weekly_arn = EXECUTION_ARN + "-weekly"
+    client = _make_multi_execution_mock(
+        executions=[
+            {"executionArn": untagged_arn, "name": "old-pre-option-d"},
+            {"executionArn": weekly_arn, "name": "weekly-20260524T090000"},
+        ],
+        describe_by_arn={
+            untagged_arn: _make_describe_response(role=None),
+            weekly_arn: _make_describe_response(role="weekly"),
+        },
+    )
+    run = read_pipeline_state(SATURDAY_ARN, role_filter={"weekly"}, client=client)
+    assert run.execution_arn == weekly_arn
+def test_read_pipeline_state_with_execution_arn_fetches_specific_execution():
+    """Dropdown-click path: when execution_arn is set, the function fetches
+    that specific execution directly (bypasses ListExecutions). role_filter
+    and search_limit are ignored on this path."""
+    target_arn = EXECUTION_ARN + "-specific"
+    client = _make_multi_execution_mock(
+        executions=[],  # ListExecutions intentionally empty — proves it's not called
+        describe_by_arn={target_arn: _make_describe_response(role="smoke")},
+    )
+    run = read_pipeline_state(SATURDAY_ARN, execution_arn=target_arn, client=client)
+    assert run.execution_arn == target_arn
+    assert run.pipeline_role == "smoke"
+    # ListExecutions must NOT have been called on the execution_arn path.
+    client.list_executions.assert_not_called()
+def test_read_pipeline_state_carries_pipeline_role_to_returned_run():
+    """The pipeline_role field on PipelineRun is populated from input JSON
+    even when no role_filter is applied (default path) — the dashboard's
+    section header shows it regardless of how the execution was picked."""
+    client = _make_sfn_mock(
+        describe_response=_make_describe_response(role="weekly"),
+    )
+    run = read_pipeline_state(SATURDAY_ARN, client=client)
+    assert run.pipeline_role == "weekly"
+def test_read_pipeline_state_pipeline_role_none_when_input_lacks_role():
+    """No pipeline_role in input → PipelineRun.pipeline_role is None
+    (rendered as 'role: unknown' on the dashboard)."""
+    client = _make_sfn_mock(
+        describe_response=_make_describe_response(role=None),
+    )
+    run = read_pipeline_state(SATURDAY_ARN, client=client)
+    assert run.pipeline_role is None
+# ── list_recent_pipeline_runs ─────────────────────────────────────────────
+def test_list_recent_pipeline_runs_returns_summaries_with_roles():
+    """Returns last N executions, each carrying its pipeline_role for the
+    operator dropdown's at-a-glance smoke-vs-weekly distinction."""
+    arns = [EXECUTION_ARN + f"-{i}" for i in range(5)]
+    roles = ["smoke", "weekly", "smoke", "weekly", "recovery"]
+    client = _make_multi_execution_mock(
+        executions=[
+            {"executionArn": a, "name": f"exec-{i}"} for i, a in enumerate(arns)
+        ],
+        describe_by_arn={a: _make_describe_response(role=r) for a, r in zip(arns, roles)},
+    )
+    summaries = list_recent_pipeline_runs(SATURDAY_ARN, limit=5, client=client)
+    assert len(summaries) == 5
+    assert all(isinstance(s, PipelineExecutionSummary) for s in summaries)
+    assert [s.pipeline_role for s in summaries] == roles
+def test_list_recent_pipeline_runs_role_filter_pre_filters():
+    """When role_filter is set, only matching executions are returned —
+    the operator's "show me weekly runs only" view."""
+    arns = [EXECUTION_ARN + f"-{i}" for i in range(6)]
+    roles = ["smoke", "weekly", "smoke", "weekly", "recovery", "weekly"]
+    client = _make_multi_execution_mock(
+        executions=[
+            {"executionArn": a, "name": f"exec-{i}"} for i, a in enumerate(arns)
+        ],
+        describe_by_arn={a: _make_describe_response(role=r) for a, r in zip(arns, roles)},
+    )
+    summaries = list_recent_pipeline_runs(
+        SATURDAY_ARN, limit=10, role_filter={"weekly"}, client=client
+    )
+    assert len(summaries) == 3
+    assert all(s.pipeline_role == "weekly" for s in summaries)
+def test_list_recent_pipeline_runs_empty_returns_empty_list():
+    """Zero executions → empty list (NOT SFNNoExecutions). The dropdown
+    just renders 'no executions yet' inline; the page-25 section banner
+    is the load-bearing error surface, not this lighter-weight API."""
+    client = MagicMock()
+    client.list_executions.return_value = {"executions": []}
+    summaries = list_recent_pipeline_runs(SATURDAY_ARN, limit=5, client=client)
+    assert summaries == []