PyPI - spanforge - Versions diffs - 1.0.0__py3-none-any.whl - Mend

spanforge 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (174) hide show

spanforge/__init__.py +815 -0
spanforge/_ansi.py +93 -0
spanforge/_batch_exporter.py +409 -0
spanforge/_cli.py +2094 -0
spanforge/_cli_audit.py +639 -0
spanforge/_cli_compliance.py +711 -0
spanforge/_cli_cost.py +243 -0
spanforge/_cli_ops.py +791 -0
spanforge/_cli_phase11.py +356 -0
spanforge/_hooks.py +337 -0
spanforge/_server.py +1708 -0
spanforge/_span.py +1036 -0
spanforge/_store.py +288 -0
spanforge/_stream.py +664 -0
spanforge/_trace.py +335 -0
spanforge/_tracer.py +254 -0
spanforge/actor.py +141 -0
spanforge/alerts.py +469 -0
spanforge/auto.py +464 -0
spanforge/baseline.py +335 -0
spanforge/cache.py +635 -0
spanforge/compliance.py +325 -0
spanforge/config.py +532 -0
spanforge/consent.py +228 -0
spanforge/consumer.py +377 -0
spanforge/core/__init__.py +5 -0
spanforge/core/compliance_mapping.py +1254 -0
spanforge/cost.py +600 -0
spanforge/debug.py +548 -0
spanforge/deprecations.py +205 -0
spanforge/drift.py +482 -0
spanforge/egress.py +58 -0
spanforge/eval.py +648 -0
spanforge/event.py +1064 -0
spanforge/exceptions.py +240 -0
spanforge/explain.py +178 -0
spanforge/export/__init__.py +69 -0
spanforge/export/append_only.py +337 -0
spanforge/export/cloud.py +357 -0
spanforge/export/datadog.py +497 -0
spanforge/export/grafana.py +320 -0
spanforge/export/jsonl.py +195 -0
spanforge/export/openinference.py +158 -0
spanforge/export/otel_bridge.py +294 -0
spanforge/export/otlp.py +811 -0
spanforge/export/otlp_bridge.py +233 -0
spanforge/export/redis_backend.py +282 -0
spanforge/export/siem_schema.py +98 -0
spanforge/export/siem_splunk.py +264 -0
spanforge/export/siem_syslog.py +212 -0
spanforge/export/webhook.py +299 -0
spanforge/exporters/__init__.py +30 -0
spanforge/exporters/console.py +271 -0
spanforge/exporters/jsonl.py +144 -0
spanforge/exporters/sqlite.py +142 -0
spanforge/gate.py +1150 -0
spanforge/governance.py +181 -0
spanforge/hitl.py +295 -0
spanforge/http.py +187 -0
spanforge/inspect.py +427 -0
spanforge/integrations/__init__.py +45 -0
spanforge/integrations/_pricing.py +280 -0
spanforge/integrations/anthropic.py +388 -0
spanforge/integrations/azure_openai.py +133 -0
spanforge/integrations/bedrock.py +292 -0
spanforge/integrations/crewai.py +251 -0
spanforge/integrations/gemini.py +351 -0
spanforge/integrations/groq.py +442 -0
spanforge/integrations/langchain.py +349 -0
spanforge/integrations/langgraph.py +306 -0
spanforge/integrations/llamaindex.py +373 -0
spanforge/integrations/ollama.py +287 -0
spanforge/integrations/openai.py +368 -0
spanforge/integrations/together.py +483 -0
spanforge/io.py +214 -0
spanforge/lint.py +322 -0
spanforge/metrics.py +417 -0
spanforge/metrics_export.py +343 -0
spanforge/migrate.py +402 -0
spanforge/model_registry.py +278 -0
spanforge/models.py +389 -0
spanforge/namespaces/__init__.py +254 -0
spanforge/namespaces/audit.py +256 -0
spanforge/namespaces/cache.py +237 -0
spanforge/namespaces/chain.py +77 -0
spanforge/namespaces/confidence.py +72 -0
spanforge/namespaces/consent.py +92 -0
spanforge/namespaces/cost.py +179 -0
spanforge/namespaces/decision.py +143 -0
spanforge/namespaces/diff.py +157 -0
spanforge/namespaces/drift.py +80 -0
spanforge/namespaces/eval_.py +251 -0
spanforge/namespaces/feedback.py +241 -0
spanforge/namespaces/fence.py +193 -0
spanforge/namespaces/guard.py +105 -0
spanforge/namespaces/hitl.py +91 -0
spanforge/namespaces/latency.py +72 -0
spanforge/namespaces/prompt.py +190 -0
spanforge/namespaces/redact.py +173 -0
spanforge/namespaces/retrieval.py +379 -0
spanforge/namespaces/runtime_governance.py +494 -0
spanforge/namespaces/template.py +208 -0
spanforge/namespaces/tool_call.py +77 -0
spanforge/namespaces/trace.py +1029 -0
spanforge/normalizer.py +171 -0
spanforge/plugins.py +82 -0
spanforge/presidio_backend.py +349 -0
spanforge/processor.py +258 -0
spanforge/prompt_registry.py +418 -0
spanforge/py.typed +0 -0
spanforge/redact.py +914 -0
spanforge/regression.py +192 -0
spanforge/runtime_policy.py +159 -0
spanforge/sampling.py +511 -0
spanforge/schema.py +183 -0
spanforge/schemas/v1.0/schema.json +170 -0
spanforge/schemas/v2.0/schema.json +536 -0
spanforge/sdk/__init__.py +625 -0
spanforge/sdk/_base.py +584 -0
spanforge/sdk/_base.pyi +71 -0
spanforge/sdk/_exceptions.py +1096 -0
spanforge/sdk/_types.py +2184 -0
spanforge/sdk/alert.py +1514 -0
spanforge/sdk/alert.pyi +56 -0
spanforge/sdk/audit.py +1196 -0
spanforge/sdk/audit.pyi +67 -0
spanforge/sdk/cec.py +1215 -0
spanforge/sdk/cec.pyi +37 -0
spanforge/sdk/config.py +641 -0
spanforge/sdk/config.pyi +55 -0
spanforge/sdk/enterprise.py +714 -0
spanforge/sdk/enterprise.pyi +79 -0
spanforge/sdk/explain.py +170 -0
spanforge/sdk/fallback.py +432 -0
spanforge/sdk/feedback.py +351 -0
spanforge/sdk/gate.py +874 -0
spanforge/sdk/gate.pyi +51 -0
spanforge/sdk/identity.py +2114 -0
spanforge/sdk/identity.pyi +47 -0
spanforge/sdk/lineage.py +175 -0
spanforge/sdk/observe.py +1065 -0
spanforge/sdk/observe.pyi +50 -0
spanforge/sdk/operator.py +338 -0
spanforge/sdk/pii.py +1473 -0
spanforge/sdk/pii.pyi +119 -0
spanforge/sdk/pipelines.py +458 -0
spanforge/sdk/pipelines.pyi +39 -0
spanforge/sdk/policy.py +930 -0
spanforge/sdk/rag.py +594 -0
spanforge/sdk/rbac.py +280 -0
spanforge/sdk/registry.py +430 -0
spanforge/sdk/registry.pyi +46 -0
spanforge/sdk/scope.py +279 -0
spanforge/sdk/secrets.py +293 -0
spanforge/sdk/secrets.pyi +25 -0
spanforge/sdk/security.py +560 -0
spanforge/sdk/security.pyi +57 -0
spanforge/sdk/trust.py +472 -0
spanforge/sdk/trust.pyi +41 -0
spanforge/secrets.py +799 -0
spanforge/signing.py +1179 -0
spanforge/stats.py +100 -0
spanforge/stream.py +560 -0
spanforge/testing.py +378 -0
spanforge/testing_mocks.py +1052 -0
spanforge/trace.py +199 -0
spanforge/types.py +696 -0
spanforge/ulid.py +300 -0
spanforge/validate.py +379 -0
spanforge-1.0.0.dist-info/METADATA +1509 -0
spanforge-1.0.0.dist-info/RECORD +174 -0
spanforge-1.0.0.dist-info/WHEEL +4 -0
spanforge-1.0.0.dist-info/entry_points.txt +5 -0
spanforge-1.0.0.dist-info/licenses/LICENSE +128 -0

spanforge/sampling.py ADDED Viewed

@@ -0,0 +1,511 @@
+"""spanforge.sampling — Sampling strategies for span/event emission.
+Samplers decide **at observation time** whether a span or event should be
+exported.  They are composable: a :class:`ParentBasedSampler` delegates to a
+root sampler for new traces and honours the parent's decision for child spans.
+Configure via :func:`spanforge.configure`::
+    from spanforge import configure
+    from spanforge.sampling import RatioSampler, ParentBasedSampler
+    configure(sampler=ParentBasedSampler(root_sampler=RatioSampler(0.1)))
+Built-in samplers
+-----------------
+=========================================  =====================================
+Class                                      Description
+=========================================  =====================================
+:class:`AlwaysOnSampler`                   Export every span (default).
+:class:`AlwaysOffSampler`                  Drop every span.
+:class:`RatioSampler`                      Probabilistic head-based sampling.
+:class:`ParentBasedSampler`                Honour parent trace flags; use
+                                           ``root_sampler`` for new traces.
+:class:`RuleBasedSampler`                  Per-operation / per-model rules.
+:class:`TailBasedSampler`                  Decide from the finished span state
+                                           (e.g. always keep errors).
+:class:`ComplianceSampler`                 Always keep compliance-critical
+                                           event types; ratio-sample the rest.
+=========================================  =====================================
+:func:`bypass_sampling` is a context manager that sets a thread-local flag
+which :class:`ComplianceSampler` checks before applying any other rule.
+Custom samplers
+---------------
+Implement the :class:`Sampler` protocol::
+    class MySampler:
+        def should_sample(self, span_or_event, cfg) -> bool:
+            return True  # or False
+"""
+from __future__ import annotations
+import contextlib
+import hashlib
+import logging
+import secrets
+import threading
+from typing import TYPE_CHECKING, Any, Protocol, runtime_checkable
+if TYPE_CHECKING:
+    from collections.abc import Generator
+__all__ = [
+    "AlwaysOffSampler",
+    "AlwaysOnSampler",
+    "ComplianceSampler",
+    "ParentBasedSampler",
+    "RatioSampler",
+    "RuleBasedSampler",
+    "Sampler",
+    "TailBasedSampler",
+    "bypass_sampling",
+]
+_log = logging.getLogger("spanforge.sampling")
+# ---------------------------------------------------------------------------
+# Protocol
+# ---------------------------------------------------------------------------
+@runtime_checkable
+class Sampler(Protocol):
+    """Structural interface satisfied by every sampler.
+    Any object exposing a ``should_sample`` method conforms; because the
+    protocol is ``@runtime_checkable`` this can be verified with
+    ``isinstance(obj, Sampler)``.
+    """
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Decide whether *span_or_event* is exported.
+        Args:
+            span_or_event: The :class:`~spanforge._span.Span` or
+                :class:`~spanforge.event.Event` being considered.
+            cfg: The active :class:`~spanforge.config.SpanForgeConfig`.
+        Returns:
+            ``True`` to export the span/event, ``False`` to drop it.
+        """
+        ...
+# ---------------------------------------------------------------------------
+# Always-on / Always-off
+# ---------------------------------------------------------------------------
+class AlwaysOnSampler:
+    """Export every span.  This is the SDK default when no sampler is set.
+    The sampler keeps no state and ignores both arguments.
+    """
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Return ``True`` unconditionally — every span is sampled.
+        Args:
+            span_or_event: The span or event being considered (ignored).
+            cfg: The active configuration (ignored).
+        Returns:
+            Always ``True``.
+        """
+        return True
+    def __repr__(self) -> str:
+        # Matches the other samplers in this module, so that a default
+        # AlwaysOnSampler embedded in another sampler's repr (for example
+        # ParentBasedSampler's root_sampler) reads as a constructor call
+        # instead of "<... object at 0x...>".
+        return "AlwaysOnSampler()"
+class AlwaysOffSampler:
+    """Sampler that rejects everything.
+    Handy when instrumentation output must be silenced completely, e.g. in
+    test code.  Both arguments of :meth:`should_sample` are ignored.
+    """
+    def __repr__(self) -> str:
+        return "AlwaysOffSampler()"
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Return ``False`` unconditionally — every span is dropped."""
+        return False
+# ---------------------------------------------------------------------------
+# Ratio / probabilistic
+# ---------------------------------------------------------------------------
+class RatioSampler:
+    """Head-based sampler that keeps a fixed fraction of traces.
+    The keep/drop decision is derived from a hash of the ``trace_id``, so it
+    is deterministic and identical for every span that shares a trace.
+    Args:
+        rate: Fraction of traces to export.  ``1.0`` exports all,
+              ``0.0`` exports none, ``0.1`` exports roughly one-in-ten.
+    Raises:
+        ValueError: If *rate* is not in ``[0.0, 1.0]``.
+    """
+    def __init__(self, rate: float) -> None:
+        in_range = 0.0 <= rate <= 1.0
+        if not in_range:
+            raise ValueError(f"RatioSampler.rate must be in [0.0, 1.0], got {rate!r}")
+        # Project the fraction onto the 64-bit hash space: a trace is kept
+        # when its 64-bit hash value is strictly below this cut-off.
+        self._threshold = int(rate * (2**64))
+        self._rate = rate
+    def __repr__(self) -> str:
+        return f"RatioSampler(rate={self._rate!r})"
+    @property
+    def rate(self) -> float:
+        """Sampling fraction supplied at construction, in [0.0, 1.0]."""
+        return self._rate
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Keep the span when the hash of its trace_id falls under the cut-off.
+        Rates of ``1.0`` and ``0.0`` short-circuit without hashing.  A span or
+        event without a usable trace_id is always exported.
+        """
+        fraction = self._rate
+        if fraction >= 1.0:
+            return True
+        if fraction <= 0.0:
+            return False
+        trace_id = _get_trace_id(span_or_event)
+        if trace_id is None:
+            # No trace context to hash — export rather than drop.
+            return True
+        # Hashing gives a uniform spread whatever the id format is (UUID,
+        # ULID, 32-hex string, ...); the leading 8 bytes of the SHA-256
+        # digest are read as a big-endian unsigned 64-bit integer.
+        hashed = hashlib.sha256(trace_id.encode())
+        bucket = int.from_bytes(hashed.digest()[:8], "big")
+        return bucket < self._threshold
+# ---------------------------------------------------------------------------
+# Parent-based
+# ---------------------------------------------------------------------------
+class ParentBasedSampler:
+    """Honour the parent span's sampling decision; use ``root_sampler`` for roots.
+    This mirrors the OpenTelemetry ``ParentBased`` sampler spec so that the
+    entire trace follows a single consistent decision.
+    Decision order, as implemented by :meth:`should_sample`:
+    1. A non-``None`` ``traceparent`` attribute marks a remote parent: the
+       sampled bit of its trailing trace-flags field selects between
+       ``remote_parent_sampled`` and ``remote_parent_not_sampled``.
+    2. Otherwise a non-``None`` ``parent_span_id`` marks a local parent and
+       the span is kept.
+    3. Otherwise the span is a root and ``root_sampler`` decides.
+    Args:
+        root_sampler: The sampler to use for root spans (no parent).
+            Defaults to :class:`AlwaysOnSampler`.
+        remote_parent_sampled: Decision for remote-parent spans where the
+            parent *was* sampled.  Defaults to ``True`` (always export).
+        remote_parent_not_sampled: Decision for remote-parent spans where the
+            parent was *not* sampled.  Defaults to ``False`` (always drop).
+    """
+    def __init__(
+        self,
+        root_sampler: Any | None = None,
+        *,
+        remote_parent_sampled: bool = True,
+        remote_parent_not_sampled: bool = False,
+    ) -> None:
+        self._root = root_sampler if root_sampler is not None else AlwaysOnSampler()
+        self._remote_sampled = remote_parent_sampled
+        self._remote_not_sampled = remote_parent_not_sampled
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Delegate to root_sampler for roots; honour parent decision for child spans.
+        Args:
+            span_or_event: Object whose ``traceparent`` and ``parent_span_id``
+                attributes (both optional) are inspected.
+            cfg: Passed through unchanged to ``root_sampler``.
+        Returns:
+            The export decision described in the class docstring.  A
+            ``traceparent`` whose flags cannot be parsed — including a value
+            that is not a string at all — counts as "parent not sampled".
+        """
+        # Check if there's an incoming traceparent (remote parent).
+        traceparent = getattr(span_or_event, "traceparent", None)
+        if traceparent is not None:
+            # Parse the trace-flags byte (last field of W3C traceparent).
+            # Format: 00-{trace_id}-{parent_id}-{flags}
+            try:
+                flags = int(traceparent.rsplit("-", 1)[-1], 16)
+            except (AttributeError, IndexError, TypeError, ValueError):
+                # Conservative: corrupt flags → don't sample.  AttributeError
+                # and TypeError cover non-string values (e.g. an int or
+                # bytes), which would otherwise escape as a crash.
+                sampled_flag = False
+            else:
+                sampled_flag = bool(flags & 0x01)
+            return self._remote_sampled if sampled_flag else self._remote_not_sampled
+        # Check if there's a local parent span via spanforge's context stack.
+        parent_id = getattr(span_or_event, "parent_span_id", None)
+        if parent_id is not None:
+            # Local parent — honour the parent decision (keep the span since
+            # the parent was already sampled to get to this point).
+            return True
+        # Root span — delegate to root_sampler.
+        return self._root.should_sample(span_or_event, cfg)
+    def __repr__(self) -> str:
+        return (
+            f"ParentBasedSampler(root_sampler={self._root!r}, "
+            f"remote_parent_sampled={self._remote_sampled!r}, "
+            f"remote_parent_not_sampled={self._remote_not_sampled!r})"
+        )
+# ---------------------------------------------------------------------------
+# Rule-based
+# ---------------------------------------------------------------------------
+class RuleBasedSampler:
+    """Sample based on user-defined attribute rules.
+    Each rule is a ``dict`` mapping span attribute names to match values.
+    A rule matches when *all* specified attributes equal their target values
+    on the span.  The first matching rule wins.
+    Rules list entries are dicts with keys:
+    * ``match``: ``dict[str, Any]`` — attribute → expected-value pairs.  A key
+      may be a dotted path of any depth (``"model.name"``,
+      ``"model.meta.tier"``); each segment is resolved with ``getattr``.  A
+      rule without ``match`` (or with an empty one) matches every span.
+    * ``sample``: ``bool`` — whether to export when matched.  Falls back to
+      ``default`` when omitted.
+    A default decision (``default``) applies when no rule matches.
+    Args:
+        rules: Ordered list of rule dicts.  The list is copied.
+        default: Sampling decision when no rule matches.  Defaults to
+            ``True`` (export everything by default).
+    Example::
+        sampler = RuleBasedSampler(
+            rules=[
+                {"match": {"span_name": "health_check"}, "sample": False},
+                {"match": {"operation": "chat", "model.name": "gpt-4o"}, "sample": True},
+            ],
+            default=True,
+        )
+    """
+    def __init__(
+        self,
+        rules: list[dict[str, Any]] | None = None,
+        *,
+        default: bool = True,
+    ) -> None:
+        self._rules: list[dict[str, Any]] = list(rules or [])
+        self._default = default
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Return the first matching rule's decision, or the default.
+        Args:
+            span_or_event: Object whose attributes are compared to each rule.
+            cfg: Unused by this sampler.
+        """
+        for rule in self._rules:
+            if self._matches(span_or_event, rule.get("match", {})):
+                # Only read the decision once the rule is known to apply.
+                return bool(rule.get("sample", self._default))
+        return self._default
+    @staticmethod
+    def _matches(obj: Any, match: dict[str, Any]) -> bool:
+        """Return ``True`` when every ``key → expected`` pair holds on *obj*."""
+        for key, expected in match.items():
+            # Walk dotted attribute paths segment by segment, e.g.
+            # "model.name" → obj.model.name.  A missing attribute anywhere on
+            # the path resolves to None, so the comparison below only
+            # succeeds when the rule itself expects None.
+            val = obj
+            for part in key.split("."):
+                val = getattr(val, part, None)
+                if val is None:
+                    break
+            if val != expected:
+                return False
+        return True
+    def __repr__(self) -> str:
+        return f"RuleBasedSampler(rules={self._rules!r}, default={self._default!r})"
+# ---------------------------------------------------------------------------
+# Tail-based
+# ---------------------------------------------------------------------------
+class TailBasedSampler:
+    """Decide whether to export a span from its final state.
+    Tail sampling inspects the *final* span state (e.g. error status, latency)
+    before making an export decision.  This enables use cases like:
+    * Always export error spans.
+    * Always export spans with ``duration_ms > threshold``.
+    * Sample only the slow-path at a given rate.
+    The decision is made at the moment :meth:`should_sample` is called —
+    intended to be just before export, once the span has ended.  The checks
+    run in this order: error status, slow duration, then the fallback sampler.
+    Args:
+        always_sample_errors: If ``True``, spans with ``status == "error"``
+            are always exported regardless of other rules.  (Default: ``True``)
+        always_sample_slow_ms: If set, spans with ``duration_ms >=`` this
+            value are always exported.  (Default: ``None``)
+        fallback_sampler: Sampler used for spans that don't match the above
+            conditions.  Defaults to :class:`AlwaysOnSampler`.
+        buffer_size: Accepted so the constructor matches its documented
+            signature (passing it used to raise ``TypeError``).  The value is
+            stored but not used by the decision logic in this class, which
+            keeps no per-span state.  (Default: 1 000)
+    """
+    def __init__(
+        self,
+        *,
+        always_sample_errors: bool = True,
+        always_sample_slow_ms: float | None = None,
+        fallback_sampler: Any | None = None,
+        buffer_size: int = 1_000,
+    ) -> None:
+        self._always_errors = always_sample_errors
+        self._slow_ms = always_sample_slow_ms
+        self._fallback = fallback_sampler if fallback_sampler is not None else AlwaysOnSampler()
+        self._buffer_size = buffer_size
+        # Kept from the original implementation; no method of this class
+        # acquires it.
+        self._lock = threading.Lock()
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Return True if the span should be exported based on error/latency rules.
+        Args:
+            span_or_event: Object whose ``status`` and ``duration_ms``
+                attributes (both optional) are inspected.
+            cfg: Passed through unchanged to the fallback sampler.
+        """
+        # Error spans — always sample.
+        if self._always_errors:
+            status = getattr(span_or_event, "status", None)
+            if isinstance(status, str) and status == "error":
+                return True
+        # Slow spans — always sample.
+        if self._slow_ms is not None:
+            duration = getattr(span_or_event, "duration_ms", None)
+            if isinstance(duration, (int, float)) and duration >= self._slow_ms:
+                return True
+        # Fallback sampler for normal spans.
+        return self._fallback.should_sample(span_or_event, cfg)
+    def __repr__(self) -> str:
+        return (
+            f"TailBasedSampler("
+            f"always_sample_errors={self._always_errors!r}, "
+            f"always_sample_slow_ms={self._slow_ms!r}, "
+            f"fallback_sampler={self._fallback!r})"
+        )
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+def _get_trace_id(obj: Any) -> str | None:
+    """Return the trace id carried by *obj*, or ``None`` if there is none.
+    Two locations are tried in order: the ``trace_id`` attribute (as on a
+    Span), then the ``"trace_id"`` key of a dict-valued ``payload`` attribute
+    (as on an Event).  Only non-empty strings are accepted.
+    """
+    direct = getattr(obj, "trace_id", None)
+    if isinstance(direct, str) and direct != "":
+        return direct
+    payload = getattr(obj, "payload", None)
+    if not isinstance(payload, dict):
+        return None
+    nested = payload.get("trace_id")
+    return nested if isinstance(nested, str) and nested != "" else None
+def _get_event_type(obj: Any) -> str | None:
+    """Return ``str(obj.event_type)``, or ``None`` when the attribute is absent or ``None``."""
+    raw = getattr(obj, "event_type", None)
+    return None if raw is None else str(raw)
+# ---------------------------------------------------------------------------
+# Compliance-aware sampler (SF-16)
+# ---------------------------------------------------------------------------
+# Event-type prefixes that ComplianceSampler records unconditionally unless
+# the caller supplies its own set.
+_DEFAULT_ALWAYS_RECORD: frozenset[str] = frozenset(
+    ("llm.redact.", "llm.audit.", "llm.guard.", "llm.cost.")
+)
+class ComplianceSampler:
+    """Sampler that never drops compliance-critical event types.
+    An event whose ``event_type`` begins with one of the *always_record*
+    prefixes is exported every time.  Anything else is kept at *base_rate*,
+    decided by hashing the trace id so that a whole trace is kept or dropped
+    together.
+    Args:
+        base_rate: Fraction of non-compliance events to export (0.0-1.0).
+        always_record: Frozenset of event-type prefixes that bypass sampling.
+            Defaults to ``llm.redact.``, ``llm.audit.``, ``llm.guard.``,
+            ``llm.cost.``.
+    Raises:
+        ValueError: If *base_rate* is not in ``[0.0, 1.0]``.
+    Example::
+        sampler = ComplianceSampler(base_rate=0.1)
+        # llm.audit.* events → always recorded
+        # llm.trace.* events → ~10% recorded
+    """
+    def __init__(
+        self,
+        base_rate: float = 0.1,
+        always_record: frozenset[str] | None = None,
+    ) -> None:
+        in_range = 0.0 <= base_rate <= 1.0
+        if not in_range:
+            raise ValueError(
+                f"ComplianceSampler.base_rate must be in [0.0, 1.0], got {base_rate!r}"
+            )
+        if always_record is None:
+            always_record = _DEFAULT_ALWAYS_RECORD
+        self._base_rate = base_rate
+        self._always_record = always_record
+        # Cut-off in the 64-bit hash space; hashes strictly below it are kept.
+        self._threshold = int(base_rate * (2**64))
+    def __repr__(self) -> str:
+        return f"ComplianceSampler(base_rate={self._base_rate!r})"
+    @property
+    def base_rate(self) -> float:
+        """Sampling fraction applied to events outside *always_record*."""
+        return self._base_rate
+    @property
+    def always_record(self) -> frozenset[str]:
+        """Event-type prefixes that are exported unconditionally."""
+        return self._always_record
+    def should_sample(self, span_or_event: Any, cfg: Any) -> bool:
+        """Return True for compliance-critical events; sample others at base_rate.
+        Checks run in this order: the thread-local bypass flag, the
+        always-record prefixes, the trivial rates (1.0 / 0.0), the trace-id
+        hash, and finally a random draw when no trace id is available.
+        """
+        # An active bypass overrides every other rule.
+        if getattr(_bypass_active, "value", False):
+            return True
+        # Compliance-critical event types are never dropped.
+        event_type = _get_event_type(span_or_event)
+        if event_type is not None and any(
+            event_type.startswith(prefix) for prefix in self._always_record
+        ):
+            return True
+        rate = self._base_rate
+        if rate >= 1.0:
+            return True
+        if rate <= 0.0:
+            return False
+        trace_id = _get_trace_id(span_or_event)
+        if trace_id is None:
+            # Nothing to hash — fall back to a random draw.
+            return (secrets.randbits(32) / 0xFFFF_FFFF) < rate
+        # Leading 8 bytes of SHA-256(trace_id) as a big-endian uint64.
+        hashed = hashlib.sha256(trace_id.encode())
+        bucket = int.from_bytes(hashed.digest()[:8], "big")
+        return bucket < self._threshold
+# ---------------------------------------------------------------------------
+# Sampling bypass context manager (SF-16-D)
+# ---------------------------------------------------------------------------
+# Per-thread bypass flag; the ``value`` attribute is absent until first set,
+# so readers use ``getattr(_bypass_active, "value", False)``.
+_bypass_active: threading.local = threading.local()
+@contextlib.contextmanager
+def bypass_sampling() -> Generator[None, None, None]:
+    """Context manager that switches on the thread-local sampling bypass.
+    While the block is active, samplers that consult the bypass flag return
+    ``True`` for every decision; in this module that is
+    :meth:`ComplianceSampler.should_sample`.  The flag is per-thread, and the
+    value found on entry is put back on exit (also when the block raises), so
+    nested uses behave correctly.
+    Used by compliance report generation to ensure reports reflect the
+    complete audit trail, not the sampled subset::
+        with bypass_sampling():
+            package = engine.generate_evidence_package(...)
+    """
+    previous = getattr(_bypass_active, "value", False)
+    _bypass_active.value = True
+    try:
+        yield
+    finally:
+        # Restore rather than reset, so an enclosing bypass stays in effect.
+        _bypass_active.value = previous

spanforge/schema.py ADDED Viewed

@@ -0,0 +1,183 @@
+"""spanforge.schema — Lightweight JSON Schema validator.
+Provides :func:`validate`, a zero-dependency validator that supports the most
+commonly needed JSON Schema keywords: ``type``, ``required``, ``properties``,
+``items``, ``enum``, ``minimum``, ``maximum``, ``minLength``, and
+``maxLength``.  It returns a list of human-readable error strings (empty list
+= valid), making it easy to surface schema violations in log messages or
+CI output without throwing exceptions.  :func:`validate_strict` runs the same
+checks but raises :class:`SchemaValidationError` when any error is found.
+Intended for validating structured LLM output (e.g. function-calling
+responses, JSON-mode completions) anywhere in the spanforge ecosystem.
+Usage::
+    from spanforge.schema import validate
+    schema = {
+        "type": "object",
+        "required": ["answer", "confidence"],
+        "properties": {
+            "answer": {"type": "string"},
+            "confidence": {"type": "number", "minimum": 0.0, "maximum": 1.0},
+        },
+    }
+    errors = validate({"answer": "Paris", "confidence": 0.95}, schema)
+    assert errors == []
+    errors = validate({"answer": 42}, schema)
+    # Missing-property errors are reported before per-property errors:
+    # errors == ["$: missing required property 'confidence'",
+    #            "$.answer: expected type string, got int"]
+"""
+from __future__ import annotations
+from typing import Any
+# Public names for ``from spanforge.schema import *``.  validate_strict is the
+# raising counterpart of validate defined in this module, so it is exported
+# alongside it.
+__all__ = ["SchemaValidationError", "validate", "validate_strict"]
+class SchemaValidationError(ValueError):
+    """Error raised by :func:`validate_strict` when validation fails.
+    The exception message is the individual error strings joined with
+    ``"; "``.
+    Attributes:
+        errors:  The list of error strings from :func:`validate`.
+    """
+    def __init__(self, errors: list[str]) -> None:
+        message = "; ".join(errors)
+        super().__init__(message)
+        # Keep the caller's list itself so each error stays individually
+        # accessible.
+        self.errors = errors
+# JSON Schema "type" → Python type(s) mapping
+_TYPE_MAP: dict[str, type | tuple[type, ...]] = {
+    "string": str,
+    "number": (int, float),
+    "integer": int,
+    "boolean": bool,
+    "array": list,
+    "object": dict,
+    "null": type(None),
+}
+def _matches_type(instance: Any, type_name: Any) -> bool:
+    """Return ``True`` when *instance* satisfies the JSON Schema type *type_name*."""
+    expected = _TYPE_MAP.get(type_name) if isinstance(type_name, str) else None
+    if expected is None:
+        # Unrecognised type names are not enforced.
+        return True
+    # bool is a subclass of int in Python, but JSON Schema treats booleans and
+    # numbers as distinct types, so reject bool explicitly for numeric names
+    # (isinstance(True, int) is True).
+    if isinstance(instance, bool) and type_name in ("integer", "number"):
+        return False
+    return isinstance(instance, expected)
+def validate(
+    instance: Any,
+    schema: dict[str, Any],
+    path: str = "$",
+) -> list[str]:
+    """Validate *instance* against a JSON Schema subset.
+    Supported keywords
+    ------------------
+    * ``type`` — ``"string"``, ``"number"``, ``"integer"``, ``"boolean"``,
+      ``"array"``, ``"object"``, ``"null"``, or a list of those names (the
+      instance must match at least one, e.g. ``["string", "null"]``)
+    * ``enum`` — list of allowed values
+    * ``required`` — list of required property names (objects only)
+    * ``properties`` — sub-schema per property name (objects only)
+    * ``items`` — sub-schema for every array element (arrays only)
+    * ``minimum`` / ``maximum`` — inclusive bounds (numbers only)
+    * ``minLength`` / ``maxLength`` — length bounds (strings only)
+    The object, array, numeric and string keywords are only applied when the
+    schema declares the corresponding ``type``.  A type mismatch ends
+    validation of that value immediately, since further checks on it would be
+    meaningless.
+    Args:
+        instance:  The Python value to validate.
+        schema:    A JSON Schema dict (subset supported as described above).
+        path:      JSONPath-style prefix used in error messages.  Defaults to
+                   ``"$"`` (document root).  Recursive calls set sub-paths
+                   automatically; callers usually leave this as default.
+    Returns:
+        A list of error strings.  An empty list means the instance is valid.
+    Example::
+        errors = validate("hello", {"type": "string", "minLength": 3})
+        assert errors == []
+        errors = validate(2, {"type": "string"})
+        assert errors == ["$: expected type string, got int"]
+        errors = validate(None, {"type": ["string", "null"]})
+        assert errors == []
+    """
+    errors: list[str] = []
+    schema_type = schema.get("type")
+    # Normalise ``type`` to a tuple of declared names.  JSON Schema allows a
+    # single name or a list of names; passing a list straight to the dict
+    # lookup would raise TypeError (lists are unhashable).
+    if schema_type is None:
+        declared: tuple[Any, ...] = ()
+    elif isinstance(schema_type, (list, tuple)):
+        declared = tuple(schema_type)
+    else:
+        declared = (schema_type,)
+    # --- type check ---
+    if declared and not any(_matches_type(instance, name) for name in declared):
+        label = " or ".join(str(name) for name in declared)
+        errors.append(f"{path}: expected type {label}, got {type(instance).__name__}")
+        return errors  # type mismatch; sub-checks are meaningless
+    # --- enum check ---
+    if "enum" in schema and instance not in schema["enum"]:
+        errors.append(f"{path}: value {instance!r} not in enum {schema['enum']!r}")
+    # --- object checks ---
+    if "object" in declared and isinstance(instance, dict):
+        errors.extend(
+            f"{path}: missing required property {key!r}"
+            for key in schema.get("required", [])
+            if key not in instance
+        )
+        for key, sub_schema in schema.get("properties", {}).items():
+            if key in instance:
+                errors.extend(validate(instance[key], sub_schema, f"{path}.{key}"))
+    # --- array checks ---
+    if "array" in declared and isinstance(instance, list):
+        items_schema = schema.get("items")
+        if items_schema is not None:
+            for i, item in enumerate(instance):
+                errors.extend(validate(item, items_schema, f"{path}[{i}]"))
+    # --- numeric bounds ---
+    if (
+        ("number" in declared or "integer" in declared)
+        and isinstance(instance, (int, float))
+        and not isinstance(instance, bool)
+    ):
+        if "minimum" in schema and instance < schema["minimum"]:
+            errors.append(f"{path}: {instance} is less than minimum {schema['minimum']}")
+        if "maximum" in schema and instance > schema["maximum"]:
+            errors.append(f"{path}: {instance} is greater than maximum {schema['maximum']}")
+    # --- string length ---
+    if "string" in declared and isinstance(instance, str):
+        if "minLength" in schema and len(instance) < schema["minLength"]:
+            errors.append(
+                f"{path}: string length {len(instance)} is less than "
+                f"minLength {schema['minLength']}"
+            )
+        if "maxLength" in schema and len(instance) > schema["maxLength"]:
+            errors.append(
+                f"{path}: string length {len(instance)} exceeds maxLength {schema['maxLength']}"
+            )
+    return errors
+def validate_strict(
+    instance: Any,
+    schema: dict[str, Any],
+    path: str = "$",
+) -> None:
+    """Raising variant of :func:`validate`.
+    Runs :func:`validate` with the same arguments and converts a non-empty
+    error list into an exception; a valid instance returns ``None``.
+    Args:
+        instance:  The value to validate.
+        schema:    JSON Schema dict.
+        path:      Starting path prefix (default ``"$"``).
+    Raises:
+        SchemaValidationError: When :func:`validate` returns any errors; the
+            exception's ``errors`` attribute carries the full list.
+    """
+    problems = validate(instance, schema, path)
+    if not problems:
+        return
+    raise SchemaValidationError(problems)