invarlock 0.3.1__py3-none-any.whl → 0.3.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (40)
  1. invarlock/__init__.py +1 -1
  2. invarlock/_data/runtime/tiers.yaml +61 -0
  3. invarlock/adapters/hf_loading.py +97 -0
  4. invarlock/calibration/__init__.py +6 -0
  5. invarlock/calibration/spectral_null.py +301 -0
  6. invarlock/calibration/variance_ve.py +154 -0
  7. invarlock/cli/app.py +15 -0
  8. invarlock/cli/commands/calibrate.py +576 -0
  9. invarlock/cli/commands/doctor.py +9 -3
  10. invarlock/cli/commands/explain_gates.py +53 -9
  11. invarlock/cli/commands/plugins.py +12 -2
  12. invarlock/cli/commands/run.py +181 -79
  13. invarlock/cli/commands/verify.py +40 -0
  14. invarlock/cli/config.py +11 -1
  15. invarlock/cli/determinism.py +252 -0
  16. invarlock/core/auto_tuning.py +215 -17
  17. invarlock/core/bootstrap.py +137 -5
  18. invarlock/core/registry.py +9 -4
  19. invarlock/core/runner.py +305 -35
  20. invarlock/eval/bench.py +467 -141
  21. invarlock/eval/bench_regression.py +12 -0
  22. invarlock/eval/bootstrap.py +3 -1
  23. invarlock/eval/data.py +29 -7
  24. invarlock/eval/primary_metric.py +20 -5
  25. invarlock/guards/rmt.py +536 -46
  26. invarlock/guards/spectral.py +217 -10
  27. invarlock/guards/variance.py +124 -42
  28. invarlock/reporting/certificate.py +476 -45
  29. invarlock/reporting/certificate_schema.py +4 -1
  30. invarlock/reporting/guards_analysis.py +108 -10
  31. invarlock/reporting/normalizer.py +24 -1
  32. invarlock/reporting/policy_utils.py +97 -15
  33. invarlock/reporting/primary_metric_utils.py +17 -0
  34. invarlock/reporting/validate.py +10 -10
  35. {invarlock-0.3.1.dist-info → invarlock-0.3.3.dist-info}/METADATA +12 -10
  36. {invarlock-0.3.1.dist-info → invarlock-0.3.3.dist-info}/RECORD +40 -33
  37. {invarlock-0.3.1.dist-info → invarlock-0.3.3.dist-info}/WHEEL +0 -0
  38. {invarlock-0.3.1.dist-info → invarlock-0.3.3.dist-info}/entry_points.txt +0 -0
  39. {invarlock-0.3.1.dist-info → invarlock-0.3.3.dist-info}/licenses/LICENSE +0 -0
  40. {invarlock-0.3.1.dist-info → invarlock-0.3.3.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,252 @@
1
+ """Determinism presets for CI/release runs.
2
+
3
+ Centralizes:
4
+ - Seeds (python/numpy/torch)
5
+ - Thread caps (OMP/MKL/etc + torch threads)
6
+ - TF32 policy
7
+ - torch deterministic algorithms
8
+ - A structured "determinism level" for certificate provenance
9
+ """
10
+
11
+ from __future__ import annotations
12
+
13
+ import os
14
+ import random
15
+ from typing import Any
16
+
17
+ import numpy as np
18
+
19
+ from invarlock.model_utils import set_seed
20
+
21
+ try: # optional torch
22
+ import torch
23
+ except Exception: # pragma: no cover
24
+ torch = None # type: ignore[assignment]
25
+
26
+
27
+ _THREAD_ENV_VARS: tuple[str, ...] = (
28
+ "OMP_NUM_THREADS",
29
+ "MKL_NUM_THREADS",
30
+ "OPENBLAS_NUM_THREADS",
31
+ "NUMEXPR_NUM_THREADS",
32
+ "VECLIB_MAXIMUM_THREADS",
33
+ )
34
+
35
+
36
+ def _coerce_int(value: Any, default: int) -> int:
37
+ try:
38
+ return int(value)
39
+ except Exception:
40
+ return int(default)
41
+
42
+
43
+ def _coerce_profile(profile: str | None) -> str:
44
+ try:
45
+ return (profile or "").strip().lower()
46
+ except Exception:
47
+ return ""
48
+
49
+
50
+ def _coerce_device(device: str | None) -> str:
51
+ try:
52
+ return (device or "").strip().lower()
53
+ except Exception:
54
+ return "cpu"
55
+
56
+
57
def apply_determinism_preset(
    *,
    profile: str | None,
    device: str | None,
    seed: int,
    threads: int = 1,
) -> dict[str, Any]:
    """Apply a determinism preset and return a provenance payload.

    Args:
        profile: Run profile name; ``"ci"`` and ``"release"`` request strict
            determinism, any other value leaves determinism off.
        device: Target device string (e.g. ``"cpu"``, ``"cuda:0"``); only used
            to decide whether CUDA-specific knobs apply.
        seed: Seed applied to the python/numpy/torch RNGs via ``set_seed``.
        threads: Thread cap used in strict mode (clamped to >= 1).

    Returns:
        A dict with the requested/effective determinism level, seed bundle,
        environment variables set, and torch flags applied. Empty sections
        are pruned so emitted artifacts stay stable across runs.
    """

    prof = _coerce_profile(profile)
    dev = _coerce_device(device)
    # Clamp to at least one thread so env vars / torch caps are always valid.
    threads_i = max(1, _coerce_int(threads, 1))

    requested = "off"
    if prof in {"ci", "release"}:
        requested = "strict"

    env_set: dict[str, Any] = {}
    torch_flags: dict[str, Any] = {}
    notes: list[str] = []

    # Thread caps (best-effort): make CPU determinism explicit and reduce drift.
    # NOTE(review): these BLAS env vars are only honored by libraries loaded
    # *after* this point — presumably this runs before model import; confirm.
    if requested == "strict":
        for var in _THREAD_ENV_VARS:
            os.environ[var] = str(threads_i)
            env_set[var] = os.environ.get(var)

    # CUDA determinism: cuBLAS workspace config. An existing value in the
    # environment is respected (setdefault-style), but always recorded.
    if requested == "strict" and dev.startswith("cuda"):
        preferred = ":4096:8"
        fallback = ":16:8"
        if "CUBLAS_WORKSPACE_CONFIG" not in os.environ:
            selected = preferred
            if torch is not None:
                try:
                    # Use the smaller workspace on GPUs with < 8 GiB memory.
                    mem_bytes = int(torch.cuda.get_device_properties(0).total_memory)
                    if mem_bytes and mem_bytes < 8 * 1024**3:
                        selected = fallback
                except Exception:
                    selected = preferred
            os.environ["CUBLAS_WORKSPACE_CONFIG"] = selected
        env_set["CUBLAS_WORKSPACE_CONFIG"] = os.environ.get("CUBLAS_WORKSPACE_CONFIG")

    if requested == "strict":
        # Avoid tokenizer thread fan-out; keep a pre-existing value if set.
        os.environ.setdefault("TOKENIZERS_PARALLELISM", "false")
        env_set["TOKENIZERS_PARALLELISM"] = os.environ.get("TOKENIZERS_PARALLELISM")

    # Seed all RNGs (python/numpy/torch) using the existing helper for parity.
    set_seed(int(seed))

    # Derive a stable seed bundle for provenance.
    seed_bundle = {
        "python": int(seed),
        "numpy": int(seed),
        "torch": None,
    }
    try:
        # Read back the seed numpy actually holds (legacy RandomState only).
        numpy_seed = int(np.random.get_state()[1][0])
        seed_bundle["numpy"] = int(numpy_seed)
    except Exception:
        pass
    if torch is not None:
        try:
            seed_bundle["torch"] = int(torch.initial_seed())
        except Exception:
            seed_bundle["torch"] = int(seed)

    # Torch-specific controls. Any partial failure downgrades the effective
    # level from "strict" to "tolerance" instead of raising.
    level = "off" if requested == "off" else "strict"
    if requested == "strict":
        if torch is None:
            level = "tolerance"
            notes.append("torch_unavailable")
        else:
            # Thread caps.
            try:
                if hasattr(torch, "set_num_threads"):
                    torch.set_num_threads(threads_i)
                if hasattr(torch, "set_num_interop_threads"):
                    torch.set_num_interop_threads(threads_i)
                torch_flags["torch_threads"] = threads_i
            except Exception:
                level = "tolerance"
                notes.append("torch_thread_caps_failed")

            # Disable TF32 for determinism.
            try:
                matmul = getattr(
                    getattr(torch.backends, "cuda", object()), "matmul", None
                )
                if matmul is not None and hasattr(matmul, "allow_tf32"):
                    matmul.allow_tf32 = False
                cudnn_mod = getattr(torch.backends, "cudnn", None)
                if cudnn_mod is not None and hasattr(cudnn_mod, "allow_tf32"):
                    cudnn_mod.allow_tf32 = False
            except Exception:
                level = "tolerance"
                notes.append("tf32_policy_failed")

            # Deterministic algorithms.
            try:
                if hasattr(torch, "use_deterministic_algorithms"):
                    torch.use_deterministic_algorithms(True, warn_only=False)
            except Exception:
                # Downgrade to tolerance-based determinism rather than crashing.
                level = "tolerance"
                notes.append("deterministic_algorithms_unavailable")
                try:
                    # Second attempt with warn_only so ops merely warn.
                    if hasattr(torch, "use_deterministic_algorithms"):
                        torch.use_deterministic_algorithms(True, warn_only=True)
                except Exception:
                    pass

            # cuDNN knobs.
            try:
                cudnn_mod = getattr(torch.backends, "cudnn", None)
                if cudnn_mod is not None:
                    cudnn_mod.benchmark = False
                    if hasattr(cudnn_mod, "deterministic"):
                        cudnn_mod.deterministic = True
            except Exception:
                level = "tolerance"
                notes.append("cudnn_determinism_failed")

            # Snapshot applied flags for provenance.
            try:
                det_enabled = getattr(
                    torch, "are_deterministic_algorithms_enabled", None
                )
                if callable(det_enabled):
                    torch_flags["deterministic_algorithms"] = bool(det_enabled())
            except Exception:
                pass
            try:
                cudnn_mod = getattr(torch.backends, "cudnn", None)
                if cudnn_mod is not None:
                    torch_flags["cudnn_deterministic"] = bool(
                        getattr(cudnn_mod, "deterministic", False)
                    )
                    torch_flags["cudnn_benchmark"] = bool(
                        getattr(cudnn_mod, "benchmark", False)
                    )
                    if hasattr(cudnn_mod, "allow_tf32"):
                        torch_flags["cudnn_allow_tf32"] = bool(
                            getattr(cudnn_mod, "allow_tf32", False)
                        )
            except Exception:
                pass
            try:
                matmul = getattr(
                    getattr(torch.backends, "cuda", object()), "matmul", None
                )
                if matmul is not None and hasattr(matmul, "allow_tf32"):
                    torch_flags["cuda_matmul_allow_tf32"] = bool(matmul.allow_tf32)
            except Exception:
                pass

    # Normalized level is always one of these.
    if level not in {"off", "strict", "tolerance"}:
        level = "tolerance" if requested == "strict" else "off"

    # Extra breadcrumb: random module state is not easily serializable; include a coarse marker.
    # NOTE(review): this consumes one draw from the Python RNG right after
    # seeding — deterministic across runs, but it does advance the state.
    try:
        torch_flags["python_random"] = isinstance(random.random(), float)
    except Exception:
        pass

    payload = {
        "requested": requested,
        "level": level,
        "profile": prof or None,
        "device": dev,
        "threads": threads_i if requested == "strict" else None,
        "seed": int(seed),
        "seeds": seed_bundle,
        "env": env_set,
        "torch": torch_flags,
        "notes": notes,
    }

    # Remove empty sections for stable artifacts.
    if not payload["env"]:
        payload.pop("env", None)
    if not payload["torch"]:
        payload.pop("torch", None)
    if not payload["notes"]:
        payload.pop("notes", None)
    if payload.get("threads") is None:
        payload.pop("threads", None)
    if payload.get("profile") is None:
        payload.pop("profile", None)

    return payload
250
+
251
+
252
+ __all__ = ["apply_determinism_preset"]
@@ -7,9 +7,21 @@ Maps tier settings (conservative/balanced/aggressive) to specific guard paramete
7
7
  """
8
8
 
9
9
  import copy
10
+ import os
11
+ from functools import lru_cache
12
+ from importlib import resources as _ires
13
+ from pathlib import Path
10
14
  from typing import Any
11
15
 
12
- __all__ = ["resolve_tier_policies", "TIER_POLICIES", "EDIT_ADJUSTMENTS"]
16
+ import yaml
17
+
18
+ __all__ = [
19
+ "clear_tier_policies_cache",
20
+ "get_tier_policies",
21
+ "resolve_tier_policies",
22
+ "TIER_POLICIES",
23
+ "EDIT_ADJUSTMENTS",
24
+ ]
13
25
 
14
26
 
15
27
  # Base tier policy mappings
@@ -198,10 +210,183 @@ EDIT_ADJUSTMENTS: dict[str, dict[str, dict[str, Any]]] = {
198
210
  }
199
211
 
200
212
 
213
+ def _deep_merge(base: dict[str, Any], override: dict[str, Any]) -> dict[str, Any]:
214
+ out = copy.deepcopy(base)
215
+ for key, value in override.items():
216
+ if isinstance(value, dict) and isinstance(out.get(key), dict):
217
+ out[key] = _deep_merge(out[key], value)
218
+ else:
219
+ out[key] = copy.deepcopy(value)
220
+ return out
221
+
222
+
223
def _load_runtime_yaml(
    config_root: str | None, *rel_parts: str
) -> dict[str, Any] | None:
    """Load YAML from runtime config locations.

    Search order:
      1) $INVARLOCK_CONFIG_ROOT/runtime/...
      2) invarlock._data.runtime package resources

    Returns the parsed mapping, or ``None`` when no file is found.
    Raises ``ValueError`` when a file under *config_root* parses to a
    non-mapping; the same error from the packaged-resource path is swallowed
    by the broad ``except`` below and surfaces as ``None`` instead.
    """
    if config_root:
        p = Path(config_root) / "runtime"
        for part in rel_parts:
            p = p / part
        if p.exists():
            # Empty files parse to None; normalize to an empty mapping.
            data = yaml.safe_load(p.read_text(encoding="utf-8")) or {}
            if not isinstance(data, dict):
                raise ValueError("Runtime YAML must be a mapping")
            return data

    # Fall back to data bundled inside the installed package.
    try:
        base = _ires.files("invarlock._data.runtime")
        res = base
        for part in rel_parts:
            res = res.joinpath(part)
        if getattr(res, "is_file", None) and res.is_file():  # type: ignore[attr-defined]
            text = res.read_text(encoding="utf-8")  # type: ignore[assignment]
            data = yaml.safe_load(text) or {}
            if not isinstance(data, dict):
                raise ValueError("Runtime YAML must be a mapping")
            return data
    except Exception:
        # Best-effort: missing package data or a traversal error means "not found".
        return None

    return None
257
+
258
+
259
+ def _normalize_family_caps(caps: Any) -> dict[str, dict[str, float]]:
260
+ normalized: dict[str, dict[str, float]] = {}
261
+ if not isinstance(caps, dict):
262
+ return normalized
263
+ for family, value in caps.items():
264
+ family_key = str(family)
265
+ if isinstance(value, dict):
266
+ kappa = value.get("kappa")
267
+ if isinstance(kappa, int | float):
268
+ normalized[family_key] = {"kappa": float(kappa)}
269
+ elif isinstance(value, int | float):
270
+ normalized[family_key] = {"kappa": float(value)}
271
+ return normalized
272
+
273
+
274
+ def _normalize_multiple_testing(mt: Any) -> dict[str, Any]:
275
+ if not isinstance(mt, dict):
276
+ return {}
277
+ out: dict[str, Any] = {}
278
+ method = mt.get("method")
279
+ if method is not None:
280
+ out["method"] = str(method).lower()
281
+ alpha = mt.get("alpha")
282
+ try:
283
+ if alpha is not None:
284
+ out["alpha"] = float(alpha)
285
+ except Exception:
286
+ pass
287
+ m_val = mt.get("m")
288
+ try:
289
+ if m_val is not None:
290
+ out["m"] = int(m_val)
291
+ except Exception:
292
+ pass
293
+ return out
294
+
295
+
296
def _tier_entry_to_policy(tier_entry: dict[str, Any]) -> dict[str, dict[str, Any]]:
    """Map a tiers.yaml entry to the canonical policy shape.

    Recognizes the sections ``metrics``, ``spectral``/``spectral_guard``,
    ``rmt``/``rmt_guard`` and ``variance``/``variance_guard`` (the ``*_guard``
    names are aliases; the unsuffixed key wins when both are present).
    Unknown sections are ignored. All copied values are deep-copied so the
    YAML-derived input is never aliased.
    """
    out: dict[str, dict[str, Any]] = {}

    metrics = tier_entry.get("metrics")
    if isinstance(metrics, dict):
        out["metrics"] = copy.deepcopy(metrics)

    spectral_src = tier_entry.get("spectral") or tier_entry.get("spectral_guard")
    if isinstance(spectral_src, dict):
        spectral = copy.deepcopy(spectral_src)
        # Normalize nested sub-structures into their canonical shapes.
        if "family_caps" in spectral:
            spectral["family_caps"] = _normalize_family_caps(
                spectral.get("family_caps")
            )
        if "multiple_testing" in spectral:
            spectral["multiple_testing"] = _normalize_multiple_testing(
                spectral.get("multiple_testing")
            )
        out["spectral"] = spectral

    rmt_src = tier_entry.get("rmt") or tier_entry.get("rmt_guard")
    if isinstance(rmt_src, dict):
        rmt = copy.deepcopy(rmt_src)
        eps = rmt.get("epsilon_by_family")
        if isinstance(eps, dict):
            # Keep only numeric epsilons, with stringified family keys.
            rmt["epsilon_by_family"] = {
                str(k): float(v) for k, v in eps.items() if isinstance(v, int | float)
            }
            # Backward-compat: keep epsilon alias
            rmt["epsilon"] = dict(rmt["epsilon_by_family"])
        out["rmt"] = rmt

    variance_src = tier_entry.get("variance") or tier_entry.get("variance_guard")
    if isinstance(variance_src, dict):
        out["variance"] = copy.deepcopy(variance_src)

    return out
334
+
335
+
336
@lru_cache(maxsize=8)
def _load_tier_policies_cached(config_root: str | None) -> dict[str, dict[str, Any]]:
    """Build the effective tier→policy mapping, cached per config root.

    Starts from the in-code ``TIER_POLICIES`` defaults and deep-merges any
    per-tier overrides found in the runtime ``tiers.yaml``. Tier names are
    lowercased on both sides so lookups are case-insensitive.
    """
    tiers = _load_runtime_yaml(config_root, "tiers.yaml") or {}
    merged: dict[str, dict[str, Any]] = {}

    # Start from defaults, then overlay tiers.yaml per-tier.
    for tier_name, defaults in TIER_POLICIES.items():
        merged[str(tier_name).lower()] = copy.deepcopy(defaults)

    for tier_name, entry in tiers.items():
        # Skip malformed (non-mapping) tier entries.
        if not isinstance(entry, dict):
            continue
        tier_key = str(tier_name).lower()
        resolved_entry = _tier_entry_to_policy(entry)
        if tier_key not in merged:
            # tiers.yaml may define tiers that have no in-code default.
            merged[tier_key] = {}
        merged[tier_key] = _deep_merge(merged[tier_key], resolved_entry)

    return merged
355
+
356
+
357
def get_tier_policies(*, config_root: str | None = None) -> dict[str, dict[str, Any]]:
    """Return tier policies loaded from runtime tiers.yaml (with safe defaults).

    When *config_root* is not given, the ``INVARLOCK_CONFIG_ROOT`` environment
    variable is consulted (empty string counts as unset).
    """
    if config_root is not None:
        return _load_tier_policies_cached(config_root)
    env_root = os.getenv("INVARLOCK_CONFIG_ROOT") or None
    return _load_tier_policies_cached(env_root)
363
+
364
+
365
def clear_tier_policies_cache() -> None:
    """Drop the cached tier policies so the next lookup re-reads tiers.yaml."""
    _load_tier_policies_cached.cache_clear()
367
+
368
+
369
def _load_profile_overrides(
    profile: str | None, *, config_root: str | None
) -> dict[str, Any]:
    """Load guard overrides for a named runtime profile.

    Returns ``{}`` when *profile* is empty/None, when no matching profile
    YAML exists, or when the loaded document is not a mapping. The bare
    ``"ci"`` profile falls back to the packaged ``ci_cpu.yaml``.
    """
    if not profile:
        return {}
    prof = str(profile).strip().lower()
    candidate = _load_runtime_yaml(config_root, "profiles", f"{prof}.yaml")
    if candidate is None and prof == "ci":
        # Legacy alias: "ci" historically shipped as ci_cpu.yaml.
        candidate = _load_runtime_yaml(config_root, "profiles", "ci_cpu.yaml") or {}
    if not isinstance(candidate, dict):
        return {}
    return candidate
381
+
382
+
201
383
  def resolve_tier_policies(
202
384
  tier: str,
203
385
  edit_name: str | None = None,
204
386
  explicit_overrides: dict[str, dict[str, Any]] | None = None,
387
+ *,
388
+ profile: str | None = None,
389
+ config_root: str | None = None,
205
390
  ) -> dict[str, dict[str, Any]]:
206
391
  """
207
392
  Resolve tier-based guard policies with edit-specific adjustments and explicit overrides.
@@ -217,33 +402,45 @@ def resolve_tier_policies(
217
402
  Raises:
218
403
  ValueError: If tier is not recognized
219
404
  """
220
- if tier not in TIER_POLICIES:
405
+ tier_key = str(tier).lower()
406
+ tier_policies = get_tier_policies(config_root=config_root)
407
+ if tier_key not in tier_policies:
221
408
  raise ValueError(
222
- f"Unknown tier '{tier}'. Valid tiers: {list(TIER_POLICIES.keys())}"
409
+ f"Unknown tier '{tier}'. Valid tiers: {list(tier_policies.keys())}"
223
410
  )
224
411
 
225
412
  # Start with base tier policies
226
- policies: dict[str, dict[str, Any]] = copy.deepcopy(TIER_POLICIES[tier])
413
+ policies: dict[str, dict[str, Any]] = copy.deepcopy(tier_policies[tier_key])
414
+
415
+ # Apply profile overrides (when available)
416
+ overrides = _load_profile_overrides(profile, config_root=config_root)
417
+ guards = overrides.get("guards") if isinstance(overrides, dict) else None
418
+ if isinstance(guards, dict):
419
+ for guard_name, guard_overrides in guards.items():
420
+ key = str(guard_name).lower()
421
+ if not isinstance(guard_overrides, dict):
422
+ continue
423
+ if key in policies and isinstance(policies[key], dict):
424
+ policies[key] = _deep_merge(policies[key], guard_overrides)
425
+ else:
426
+ policies[key] = copy.deepcopy(guard_overrides)
227
427
 
228
428
  # Apply edit-specific adjustments
229
429
  if edit_name and edit_name in EDIT_ADJUSTMENTS:
230
430
  edit_adjustments = EDIT_ADJUSTMENTS[edit_name]
231
431
  for guard_name, adjustments in edit_adjustments.items():
232
- if guard_name in policies:
233
- guard_policy = policies[guard_name]
234
- assert isinstance(guard_policy, dict)
235
- guard_policy.update(adjustments)
432
+ if guard_name in policies and isinstance(policies.get(guard_name), dict):
433
+ policies[guard_name] = _deep_merge(policies[guard_name], adjustments)
236
434
 
237
435
  # Apply explicit overrides (highest precedence)
238
436
  if explicit_overrides:
239
437
  for guard_name, overrides in explicit_overrides.items():
240
- if guard_name in policies:
241
- guard_policy = policies[guard_name]
242
- assert isinstance(guard_policy, dict)
243
- guard_policy.update(overrides)
244
- else:
438
+ if guard_name in policies and isinstance(policies.get(guard_name), dict):
439
+ if isinstance(overrides, dict):
440
+ policies[guard_name] = _deep_merge(policies[guard_name], overrides)
441
+ elif isinstance(overrides, dict):
245
442
  # Create new guard policy if not in base tier
246
- policies[guard_name] = overrides.copy()
443
+ policies[guard_name] = copy.deepcopy(overrides)
247
444
 
248
445
  return policies
249
446
 
@@ -273,7 +470,7 @@ def get_tier_summary(tier: str, edit_name: str | None = None) -> dict[str, Any]:
273
470
  "tier": tier,
274
471
  "edit_name": edit_name,
275
472
  "error": str(e),
276
- "valid_tiers": list(TIER_POLICIES.keys()),
473
+ "valid_tiers": list(get_tier_policies().keys()),
277
474
  }
278
475
 
279
476
 
@@ -304,8 +501,9 @@ def validate_tier_config(config: Any) -> tuple[bool, str | None]:
304
501
  return False, "Missing 'tier' in auto configuration"
305
502
 
306
503
  tier = config["tier"]
307
- if tier not in TIER_POLICIES:
308
- valid_options = list(TIER_POLICIES.keys())
504
+ tier_policies = get_tier_policies()
505
+ if tier not in tier_policies:
506
+ valid_options = list(tier_policies.keys())
309
507
  return False, f"Invalid tier '{tier}'. Valid options: {valid_options}"
310
508
 
311
509
  if "enabled" in config and not isinstance(config["enabled"], bool):