PyPI - multi-forge - Versions diffs - 0.2.0__py3-none-any.whl - Mend

multi-forge 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (311) hide show

forge/__init__.py +3 -0
forge/_extensions/agents/.gitkeep +0 -0
forge/_extensions/commands/.gitkeep +0 -0
forge/_extensions/skills/analyze/SKILL.md +87 -0
forge/_extensions/skills/challenge/SKILL.md +91 -0
forge/_extensions/skills/consensus/SKILL.md +120 -0
forge/_extensions/skills/consensus/resources/code_consensus_evaluation.md +94 -0
forge/_extensions/skills/consensus/resources/consensus_evaluation.md +70 -0
forge/_extensions/skills/consensus/resources/synthesis.md +101 -0
forge/_extensions/skills/debate/SKILL.md +116 -0
forge/_extensions/skills/debate/resources/code_debate_evaluation.md +101 -0
forge/_extensions/skills/debate/resources/debate_evaluation.md +90 -0
forge/_extensions/skills/panel/SKILL.md +141 -0
forge/_extensions/skills/panel/resources/synthesis.md +103 -0
forge/_extensions/skills/qa/SKILL.md +704 -0
forge/_extensions/skills/qa/resources/checklist/0-enable.md +78 -0
forge/_extensions/skills/qa/resources/checklist/1-preflight.md +24 -0
forge/_extensions/skills/qa/resources/checklist/10-resume.md +143 -0
forge/_extensions/skills/qa/resources/checklist/11-config.md +150 -0
forge/_extensions/skills/qa/resources/checklist/12-search.md +58 -0
forge/_extensions/skills/qa/resources/checklist/13-guard.md +237 -0
forge/_extensions/skills/qa/resources/checklist/14-workflow.md +305 -0
forge/_extensions/skills/qa/resources/checklist/15-skills.md +155 -0
forge/_extensions/skills/qa/resources/checklist/16-handoff.md +224 -0
forge/_extensions/skills/qa/resources/checklist/17-info.md +50 -0
forge/_extensions/skills/qa/resources/checklist/18-disable.md +84 -0
forge/_extensions/skills/qa/resources/checklist/19-uninstall.md +146 -0
forge/_extensions/skills/qa/resources/checklist/2-extensions.md +188 -0
forge/_extensions/skills/qa/resources/checklist/20-cleanup.md +36 -0
forge/_extensions/skills/qa/resources/checklist/3-auth.md +234 -0
forge/_extensions/skills/qa/resources/checklist/4-proxy.md +481 -0
forge/_extensions/skills/qa/resources/checklist/5-session.md +541 -0
forge/_extensions/skills/qa/resources/checklist/6-hooks.md +275 -0
forge/_extensions/skills/qa/resources/checklist/7-costs.md +309 -0
forge/_extensions/skills/qa/resources/checklist/8-status-line.md +174 -0
forge/_extensions/skills/qa/resources/checklist/9-direct-commands.md +146 -0
forge/_extensions/skills/qa/resources/checklist.md +103 -0
forge/_extensions/skills/qa/resources/report-template.md +62 -0
forge/_extensions/skills/qa/scripts/start-container.sh +529 -0
forge/_extensions/skills/qa/scripts/walkthrough-state.py +1137 -0
forge/_extensions/skills/review/SKILL.md +125 -0
forge/_extensions/skills/review/references/claude-4.6.md +474 -0
forge/_extensions/skills/review/references/claude-4.7.md +710 -0
forge/_extensions/skills/review/references/gemini-3.1.md +546 -0
forge/_extensions/skills/review/references/gpt-5.5.md +490 -0
forge/_extensions/skills/review/references/skills-writing-guide.md +1588 -0
forge/_extensions/skills/review/resources/code-anthropic.md +160 -0
forge/_extensions/skills/review/resources/code-gemini.md +184 -0
forge/_extensions/skills/review/resources/code-openai.md +203 -0
forge/_extensions/skills/review/resources/code.md +160 -0
forge/_extensions/skills/review-docs/SKILL.md +121 -0
forge/_extensions/skills/review-docs/resources/docs-anthropic.md +170 -0
forge/_extensions/skills/review-docs/resources/docs-gemini.md +204 -0
forge/_extensions/skills/review-docs/resources/docs-openai.md +231 -0
forge/_extensions/skills/review-docs/resources/docs.md +170 -0
forge/_extensions/skills/smoke-test/SKILL.md +27 -0
forge/_extensions/skills/smoke-test/scripts/smoke-test.sh +118 -0
forge/_extensions/skills/understand/SKILL.md +148 -0
forge/_extensions/skills/understand/resources/code-anthropic.md +163 -0
forge/_extensions/skills/understand/resources/code-gemini.md +194 -0
forge/_extensions/skills/understand/resources/code-openai.md +181 -0
forge/_extensions/skills/understand/resources/code.md +163 -0
forge/_extensions/skills/understand/resources/docs-anthropic.md +177 -0
forge/_extensions/skills/understand/resources/docs-gemini.md +202 -0
forge/_extensions/skills/understand/resources/docs-openai.md +191 -0
forge/_extensions/skills/understand/resources/docs.md +177 -0
forge/_extensions/skills/walkthrough/SKILL.md +599 -0
forge/_extensions/skills/walkthrough/resources/checklist.md +765 -0
forge/_extensions/skills/walkthrough/scripts/run-in-repo.sh +118 -0
forge/_extensions/skills/walkthrough/scripts/setup-test-repo.sh +198 -0
forge/_extensions/skills/walkthrough/scripts/walkthrough-state.py +1137 -0
forge/backend/__init__.py +174 -0
forge/backend/adapters/__init__.py +38 -0
forge/backend/adapters/litellm.py +158 -0
forge/backend/creation.py +89 -0
forge/backend/registry.py +178 -0
forge/cli/__init__.py +16 -0
forge/cli/auth.py +483 -0
forge/cli/backend.py +298 -0
forge/cli/claude.py +411 -0
forge/cli/config_cmd.py +303 -0
forge/cli/extensions.py +1001 -0
forge/cli/gc.py +165 -0
forge/cli/guard.py +1018 -0
forge/cli/guards.py +106 -0
forge/cli/handoff.py +110 -0
forge/cli/hooks/__init__.py +36 -0
forge/cli/hooks/_group.py +20 -0
forge/cli/hooks/_helpers.py +149 -0
forge/cli/hooks/commands.py +1677 -0
forge/cli/hooks/direct_commands.py +1304 -0
forge/cli/hooks/install.py +232 -0
forge/cli/hooks/policy.py +151 -0
forge/cli/hooks/read_hygiene.py +74 -0
forge/cli/hooks/verification.py +370 -0
forge/cli/logs.py +406 -0
forge/cli/main.py +292 -0
forge/cli/proxy.py +1821 -0
forge/cli/proxy_costs.py +313 -0
forge/cli/search.py +416 -0
forge/cli/session.py +892 -0
forge/cli/session_addendum.py +81 -0
forge/cli/session_fork.py +750 -0
forge/cli/session_handoff.py +141 -0
forge/cli/session_lifecycle.py +2053 -0
forge/cli/session_manage.py +1336 -0
forge/cli/session_memory.py +201 -0
forge/cli/status_line.py +1398 -0
forge/cli/workflow.py +1964 -0
forge/config/__init__.py +110 -0
forge/config/dataclass_utils.py +88 -0
forge/config/defaults/__init__.py +0 -0
forge/config/defaults/backends/__init__.py +0 -0
forge/config/defaults/backends/litellm.yaml +196 -0
forge/config/defaults/templates/__init__.py +0 -0
forge/config/defaults/templates/litellm-anthropic-local.yaml +33 -0
forge/config/defaults/templates/litellm-anthropic.yaml +24 -0
forge/config/defaults/templates/litellm-gemini-flash-local.yaml +37 -0
forge/config/defaults/templates/litellm-gemini-local.yaml +32 -0
forge/config/defaults/templates/litellm-gemini-test.yaml +34 -0
forge/config/defaults/templates/litellm-gemini.yaml +21 -0
forge/config/defaults/templates/litellm-openai-codex-local.yaml +36 -0
forge/config/defaults/templates/litellm-openai-local.yaml +38 -0
forge/config/defaults/templates/litellm-openai.yaml +28 -0
forge/config/defaults/templates/openrouter-anthropic.yaml +23 -0
forge/config/defaults/templates/openrouter-deepseek.yaml +26 -0
forge/config/defaults/templates/openrouter-gemini-flash.yaml +26 -0
forge/config/defaults/templates/openrouter-gemini.yaml +23 -0
forge/config/defaults/templates/openrouter-glm.yaml +23 -0
forge/config/defaults/templates/openrouter-kimi.yaml +30 -0
forge/config/defaults/templates/openrouter-minimax.yaml +26 -0
forge/config/defaults/templates/openrouter-openai-codex.yaml +23 -0
forge/config/defaults/templates/openrouter-openai.yaml +28 -0
forge/config/defaults/templates/openrouter-qwen.yaml +25 -0
forge/config/loader.py +675 -0
forge/config/schema.py +448 -0
forge/core/__init__.py +5 -0
forge/core/auth/__init__.py +67 -0
forge/core/auth/capabilities.py +219 -0
forge/core/auth/credentials_file.py +244 -0
forge/core/auth/protocols.py +18 -0
forge/core/auth/secrets.py +243 -0
forge/core/auth/template_secrets.py +112 -0
forge/core/data/__init__.py +5 -0
forge/core/data/model_catalog.yaml +1522 -0
forge/core/data/pricing.yaml +140 -0
forge/core/data/system_prompt_addendums/__init__.py +0 -0
forge/core/data/system_prompt_addendums/gemini.md +330 -0
forge/core/data/system_prompt_addendums/openai.md +328 -0
forge/core/llm/__init__.py +231 -0
forge/core/llm/clients/__init__.py +14 -0
forge/core/llm/clients/base.py +115 -0
forge/core/llm/clients/litellm.py +619 -0
forge/core/llm/clients/openai_compat.py +244 -0
forge/core/llm/clients/openrouter.py +234 -0
forge/core/llm/credentials.py +439 -0
forge/core/llm/detection.py +86 -0
forge/core/llm/errors.py +44 -0
forge/core/llm/protocols.py +80 -0
forge/core/llm/types.py +176 -0
forge/core/logging.py +146 -0
forge/core/models/__init__.py +91 -0
forge/core/models/catalog.py +467 -0
forge/core/models/pricing.py +165 -0
forge/core/models/types.py +167 -0
forge/core/naming.py +212 -0
forge/core/ops/__init__.py +73 -0
forge/core/ops/context.py +141 -0
forge/core/ops/gc.py +802 -0
forge/core/ops/proxy.py +146 -0
forge/core/ops/resolution.py +135 -0
forge/core/ops/session.py +344 -0
forge/core/ops/session_context.py +548 -0
forge/core/paths.py +38 -0
forge/core/process.py +54 -0
forge/core/reactive/__init__.py +38 -0
forge/core/reactive/cost_tracking.py +300 -0
forge/core/reactive/env.py +180 -0
forge/core/reactive/proxy.py +78 -0
forge/core/reactive/routing.py +622 -0
forge/core/reactive/session_runner.py +185 -0
forge/core/reactive/structured_output.py +62 -0
forge/core/reactive/tagger.py +94 -0
forge/core/reactive/throttle.py +132 -0
forge/core/state/__init__.py +59 -0
forge/core/state/exceptions.py +59 -0
forge/core/state/io.py +140 -0
forge/core/state/lock.py +99 -0
forge/core/state/timestamps.py +60 -0
forge/core/transcript.py +78 -0
forge/core/typing_helpers.py +24 -0
forge/core/workqueue/__init__.py +67 -0
forge/core/workqueue/queue.py +552 -0
forge/core/workqueue/types.py +63 -0
forge/guard/__init__.py +26 -0
forge/guard/deterministic/__init__.py +26 -0
forge/guard/deterministic/base.py +158 -0
forge/guard/deterministic/coding_standards.py +256 -0
forge/guard/deterministic/registry.py +148 -0
forge/guard/deterministic/tdd.py +171 -0
forge/guard/engine.py +216 -0
forge/guard/protocols.py +91 -0
forge/guard/queries.py +96 -0
forge/guard/semantic/__init__.py +34 -0
forge/guard/semantic/promotion.py +18 -0
forge/guard/semantic/supervisor.py +813 -0
forge/guard/semantic/verdict.py +183 -0
forge/guard/store.py +124 -0
forge/guard/team/__init__.py +6 -0
forge/guard/team/config.py +24 -0
forge/guard/team/handlers.py +209 -0
forge/guard/team/prompts.py +41 -0
forge/guard/types.py +125 -0
forge/guard/workflow/__init__.py +17 -0
forge/guard/workflow/branches.py +67 -0
forge/guard/workflow/config.py +63 -0
forge/guard/workflow/divergence.py +113 -0
forge/guard/workflow/policy.py +87 -0
forge/guard/workflow/stages.py +205 -0
forge/install/__init__.py +55 -0
forge/install/cli.py +281 -0
forge/install/exceptions.py +163 -0
forge/install/hooks.py +109 -0
forge/install/installer.py +1037 -0
forge/install/models.py +321 -0
forge/install/preset.py +272 -0
forge/install/settings_merge.py +831 -0
forge/install/tracking.py +238 -0
forge/install/version.py +141 -0
forge/proxy/__init__.py +0 -0
forge/proxy/base_client.py +181 -0
forge/proxy/client_adapter.py +476 -0
forge/proxy/client_factory.py +531 -0
forge/proxy/converters.py +1206 -0
forge/proxy/cost_logger.py +132 -0
forge/proxy/cost_tracker.py +242 -0
forge/proxy/data_models.py +338 -0
forge/proxy/error_hints.py +92 -0
forge/proxy/metrics.py +222 -0
forge/proxy/model_spec.py +158 -0
forge/proxy/proxies.py +333 -0
forge/proxy/proxy_identity.py +134 -0
forge/proxy/proxy_orchestrator.py +1018 -0
forge/proxy/proxy_startup.py +54 -0
forge/proxy/server.py +1561 -0
forge/proxy/utils.py +537 -0
forge/review/__init__.py +6 -0
forge/review/adversarial.py +111 -0
forge/review/consensus.py +236 -0
forge/review/engine.py +356 -0
forge/review/models.py +437 -0
forge/review/resources/__init__.py +5 -0
forge/review/resources/codereview-performance.md +85 -0
forge/review/resources/codereview-quick.md +75 -0
forge/review/resources/codereview-security.md +92 -0
forge/review/resources/codereview.md +85 -0
forge/review/resources/docreview-quick.md +75 -0
forge/review/resources/docreview.md +86 -0
forge/review/resources/thinkdeep.md +89 -0
forge/review/routing.py +368 -0
forge/review/synthesis.py +73 -0
forge/runtime_config.py +438 -0
forge/search/__init__.py +55 -0
forge/search/bm25_store.py +264 -0
forge/search/content_store.py +197 -0
forge/search/engine.py +352 -0
forge/search/exceptions.py +51 -0
forge/search/extractor.py +234 -0
forge/search/index_state.py +295 -0
forge/search/store.py +215 -0
forge/search/tokenizer.py +24 -0
forge/session/__init__.py +130 -0
forge/session/active.py +339 -0
forge/session/artifacts.py +202 -0
forge/session/claude/__init__.py +50 -0
forge/session/claude/cleanup.py +105 -0
forge/session/claude/invoke.py +236 -0
forge/session/claude/paths.py +200 -0
forge/session/cleanup.py +216 -0
forge/session/config.py +34 -0
forge/session/direct_model.py +107 -0
forge/session/effective.py +169 -0
forge/session/exceptions.py +255 -0
forge/session/handoff.py +881 -0
forge/session/handoff_agent.py +544 -0
forge/session/hooks/__init__.py +35 -0
forge/session/hooks/models.py +73 -0
forge/session/hooks/session_start.py +507 -0
forge/session/identity.py +84 -0
forge/session/index.py +553 -0
forge/session/manager.py +1506 -0
forge/session/models.py +572 -0
forge/session/overrides.py +344 -0
forge/session/plan_resolution.py +286 -0
forge/session/prev_sessions.py +128 -0
forge/session/store.py +431 -0
forge/session/validation.py +47 -0
forge/session/worktree/__init__.py +65 -0
forge/session/worktree/cleanup.py +262 -0
forge/session/worktree/config_copy.py +203 -0
forge/session/worktree/create.py +332 -0
forge/sidecar/__init__.py +29 -0
forge/sidecar/container.py +161 -0
forge/sidecar/docker.py +86 -0
forge/sidecar/secrets.py +19 -0
multi_forge-0.2.0.dist-info/METADATA +242 -0
multi_forge-0.2.0.dist-info/RECORD +311 -0
multi_forge-0.2.0.dist-info/WHEEL +4 -0
multi_forge-0.2.0.dist-info/entry_points.txt +2 -0
multi_forge-0.2.0.dist-info/licenses/LICENSE +203 -0
multi_forge-0.2.0.dist-info/licenses/NOTICE +14 -0

forge/guard/deterministic/tdd.py ADDED Viewed

@@ -0,0 +1,171 @@
+"""TDD bundle policies.
+Enforces test-driven development workflow:
+- tests-before-impl: Must touch tests before implementing in src/
+- no-skip-tests: Blocks adding pytest.skip or similar patterns
+"""
+from __future__ import annotations
+from typing import Any
+from forge.guard.deterministic.base import (
+    DeterministicPolicy,
+    StatefulDeterministicPolicy,
+)
+from forge.guard.types import ActionContext, PolicyDecision, Violation
+# Regular-expression sources that indicate a test is being skipped.
+# NoSkipTestsPolicy passes this list, together with the content being written,
+# to _matches_any_pattern().
+# NOTE(review): the trailing \b keeps "skip" from matching longer names, so
+# unittest.skipIf / unittest.skipUnless are not covered; and the unanchored
+# unittest\.skip\b entry already matches everything @unittest\.skip\b does.
+# Confirm both are intended.
+SKIP_PATTERNS = [
+    r"pytest\.skip\(",  # imperative pytest.skip(...) call
+    r"@pytest\.mark\.skip\b",  # decorator; \b prevents this entry matching "skipif"
+    r"@pytest\.mark\.skipif\b",  # conditional-skip decorator
+    r"unittest\.skip\b",  # any reference to unittest.skip
+    r"@unittest\.skip\b",  # decorator form of unittest.skip
+]
+class TDDEnforcementPolicy(StatefulDeterministicPolicy):
+    """Enforce that tests are touched before implementation code.
+    State tracking:
+    - When Write/Edit targets tests/, record path in tests_touched
+    - When Write/Edit targets src/ and tests_touched is empty, deny (or warn)
+    This policy is stateful because it needs to remember across hook invocations
+    which test files have been touched in the current session.
+    """
+    def __init__(self, *, strict: bool = True) -> None:
+        """Initialize the policy.
+        Args:
+            strict: If True, deny impl without tests. If False, warn only.
+        """
+        self.strict = strict
+        self._tests_touched: set[str] = set()
+    @property
+    def policy_id(self) -> str:
+        return "tdd.tests-before-impl"
+    @property
+    def description(self) -> str:
+        mode = "strict" if self.strict else "permissive"
+        return f"Require test changes before implementation changes ({mode} mode)"
+    @property
+    def intent(self) -> str:
+        return (
+            "Test-driven development: write tests first to define expected behavior, "
+            "then implement. This catches design issues early and ensures every change "
+            "has test coverage from the start."
+        )
+    def applies_to(self, context: ActionContext) -> bool:
+        """Apply to Write/Edit on tests/ or src/ paths."""
+        if context.tool_name not in ("Write", "Edit"):
+            return False
+        path = context.target_path
+        if path is None:
+            return False
+        # Only care about tests/ and src/ directories
+        return self._is_under_directory(path, "tests") or self._is_under_directory(path, "src")
+    def _evaluate(self, context: ActionContext) -> PolicyDecision:
+        """Evaluate the TDD workflow.
+        Logic:
+        1. If writing to tests/, record the path and allow
+        2. If writing to src/ and no tests touched, deny (strict) or warn (permissive)
+        3. Otherwise, allow
+        """
+        path = context.target_path
+        if path is None:
+            return self._allow()
+        # Touching a test file - record it and allow
+        if self._is_under_directory(path, "tests"):
+            self._tests_touched.add(path)
+            return self._allow()
+        # Touching implementation - check if tests were touched first
+        if self._is_under_directory(path, "src"):
+            if not self._tests_touched:
+                violation = Violation(
+                    rule_id=self.policy_id,
+                    message="Implementation changes require test changes first",
+                    severity="high",
+                    evidence=f"Writing to {path} without touching any test files",
+                    suggested_fix="Write or update tests in tests/ directory before modifying src/ code",
+                )
+                if self.strict:
+                    return self._deny([violation])
+                else:
+                    return self._warn([violation.message])
+        return self._allow()
+    def get_state(self) -> dict[str, Any]:
+        """Return current state for persistence."""
+        return {"tests_touched": list(self._tests_touched)}
+    def set_state(self, state: dict[str, Any]) -> None:
+        """Restore state from persisted data."""
+        self._tests_touched = set(state.get("tests_touched", []))
+class NoSkipTestsPolicy(DeterministicPolicy):
+    """Block adding test skip patterns.
+    Prevents:
+    - pytest.skip()
+    - @pytest.mark.skip
+    - @pytest.mark.skipif
+    - unittest.skip
+    """
+    @property
+    def policy_id(self) -> str:
+        return "tdd.no-skip-tests"
+    @property
+    def description(self) -> str:
+        return "Block adding pytest.skip or similar test-skipping patterns"
+    @property
+    def intent(self) -> str:
+        return (
+            "Skipped tests hide broken functionality. Every test should either pass or "
+            "be deleted. If a test cannot run, fix the environment or the code rather "
+            "than skipping it."
+        )
+    def applies_to(self, context: ActionContext) -> bool:
+        """Apply to Write/Edit with content that might contain skip patterns."""
+        if context.tool_name not in ("Write", "Edit"):
+            return False
+        # Only check if there's content to analyze
+        return context.new_content is not None
+    def _evaluate(self, context: ActionContext) -> PolicyDecision:
+        """Check for skip patterns in content."""
+        matched = self._matches_any_pattern(context.new_content, SKIP_PATTERNS)
+        if matched:
+            violations = [
+                Violation(
+                    rule_id=self.policy_id,
+                    message="Test skip patterns are not allowed",
+                    severity="high",
+                    evidence=f"Found skip pattern(s): {', '.join(matched)}",
+                    suggested_fix="Remove the skip pattern and fix the underlying issue",
+                )
+            ]
+            return self._deny(violations)
+        return self._allow()

forge/guard/engine.py ADDED Viewed

@@ -0,0 +1,216 @@
+"""Policy composition engine.
+The PolicyEngine evaluates multiple policies against an action and
+composes their decisions using the "any deny blocks" rule.
+"""
+from __future__ import annotations
+import logging
+from dataclasses import dataclass, field
+from typing import Any
+from forge.core.state import now_iso
+from forge.guard.protocols import Policy, StatefulPolicy
+from forge.guard.types import (
+    ActionContext,
+    CompositeDecision,
+    DecisionType,
+    FailMode,
+    PolicyDecision,
+)
+_log = logging.getLogger(__name__)
+@dataclass
+class PolicyEngine:
+    """Composes multiple policies and produces a unified decision.
+    Composition rules:
+    - Policies are evaluated in registration order
+    - Any deny blocks the action (unless fail_mode is "open" and it's an error)
+    - needs_review is resolved by semantic supervisor when it participates
+    - Warnings accumulate from all policies
+    - State is collected from stateful policies for persistence
+    Attributes:
+        policies: List of registered policies
+        fail_mode: Default behavior on policy errors ("open" = allow, "closed" = deny)
+    """
+    policies: list[Policy] = field(default_factory=list)
+    fail_mode: FailMode = "open"
+    # Collected state from stateful policies (for persistence)
+    _collected_state: dict[str, dict[str, Any]] = field(default_factory=dict)
+    def register(self, policy: Policy) -> None:
+        """Register a policy with the engine."""
+        self.policies.append(policy)
+        _log.debug("Registered policy: %s", policy.policy_id)
+    def restore_state(self, persisted_state: dict[str, Any] | None) -> None:
+        """Restore state to all stateful policies.
+        Called at the start of evaluation to restore state from the session manifest.
+        Args:
+            persisted_state: Dict mapping policy_id to state dict
+        """
+        if persisted_state is None:
+            return
+        for policy in self.policies:
+            if isinstance(policy, StatefulPolicy):
+                policy_state = persisted_state.get(policy.policy_id)
+                if policy_state is not None:
+                    try:
+                        policy.set_state(policy_state)
+                        _log.debug("Restored state for %s", policy.policy_id)
+                    except Exception as e:
+                        _log.warning("Failed to restore state for %s: %s", policy.policy_id, e)
+    def get_collected_state(self) -> dict[str, dict[str, Any]]:
+        """Get collected state from all stateful policies.
+        Called after evaluation to persist state to the session manifest.
+        Returns:
+            Dict mapping policy_id to state dict
+        """
+        return self._collected_state.copy()
+    def evaluate(self, context: ActionContext) -> CompositeDecision:
+        """Evaluate all applicable policies and compose results.
+        Args:
+            context: The action being evaluated
+        Returns:
+            CompositeDecision with:
+            - final_decision: allow/deny/warn/needs_review based on composition
+            - decisions: individual policy decisions for debugging
+            - blocking_violations: violations that caused deny
+            - all_warnings: accumulated warnings
+        """
+        decisions: list[PolicyDecision] = []
+        blocking_violations: list = []
+        all_warnings: list[str] = []
+        needs_review = False
+        for policy in self.policies:
+            # Check if policy applies
+            try:
+                if not policy.applies_to(context):
+                    _log.debug(
+                        "Policy %s does not apply to %s",
+                        policy.policy_id,
+                        context.tool_name,
+                    )
+                    continue
+            except Exception as e:
+                _log.warning("Policy %s.applies_to() failed: %s", policy.policy_id, e)
+                if self.fail_mode == "closed":
+                    decisions.append(
+                        PolicyDecision(
+                            decision="deny",
+                            policy_id=policy.policy_id,
+                            warnings=[f"Policy applies_to() failed (fail-closed): {e}"],
+                        )
+                    )
+                continue
+            # Evaluate policy
+            try:
+                decision = policy.evaluate(context)
+                decision.evaluated_at = now_iso()
+                decisions.append(decision)
+                _log.debug(
+                    "Policy %s evaluated: %s (%d violations)",
+                    policy.policy_id,
+                    decision.decision,
+                    len(decision.violations),
+                )
+            except Exception as e:
+                _log.warning("Policy %s.evaluate() failed: %s", policy.policy_id, e)
+                if self.fail_mode == "open":
+                    decisions.append(
+                        PolicyDecision(
+                            decision="allow",
+                            policy_id=policy.policy_id,
+                            warnings=[f"Policy evaluation failed (fail-open): {e}"],
+                        )
+                    )
+                else:
+                    decisions.append(
+                        PolicyDecision(
+                            decision="deny",
+                            policy_id=policy.policy_id,
+                            warnings=[f"Policy evaluation failed (fail-closed): {e}"],
+                        )
+                    )
+                continue
+            # Collect state from stateful policies
+            if isinstance(policy, StatefulPolicy):
+                try:
+                    self._collected_state[policy.policy_id] = policy.get_state()
+                except Exception as e:
+                    _log.warning("Failed to get state from %s: %s", policy.policy_id, e)
+        # Compose decisions
+        final_decision: DecisionType = "allow"
+        for d in decisions:
+            all_warnings.extend(d.warnings)
+            if d.decision == "deny":
+                final_decision = "deny"
+                blocking_violations.extend(d.violations)
+            elif d.decision == "needs_review":
+                needs_review = True
+            elif d.decision == "warn" and final_decision == "allow":
+                final_decision = "warn"
+        review_resolved = any(d.policy_id == "semantic.supervisor" and d.decision != "needs_review" for d in decisions)
+        # If any policy needs review and no supervisor resolved it, escalate.
+        if needs_review and not review_resolved and final_decision not in ("deny",):
+            final_decision = "needs_review"
+        return CompositeDecision(
+            final_decision=final_decision,
+            decisions=decisions,
+            blocking_violations=blocking_violations,
+            all_warnings=all_warnings,
+        )
+def build_engine(
+    bundles: list[str],
+    fail_mode: FailMode = "open",
+    bundle_config: dict[str, dict[str, Any]] | None = None,
+) -> PolicyEngine:
+    """Build a PolicyEngine with policies from the specified bundles.
+    Args:
+        bundles: List of bundle names (e.g., ["tdd", "coding_standards"])
+        fail_mode: Behavior on policy errors
+        bundle_config: Per-bundle configuration (e.g., {"tdd": {"strict": False}}).
+    Returns:
+        Configured PolicyEngine
+    """
+    from forge.guard.deterministic.registry import get_bundle_policies
+    engine = PolicyEngine(fail_mode=fail_mode)
+    for bundle in bundles:
+        config = bundle_config.get(bundle) if bundle_config else None
+        for policy in get_bundle_policies(bundle, config=config):
+            engine.register(policy)
+    return engine

forge/guard/protocols.py ADDED Viewed

@@ -0,0 +1,91 @@
+"""Policy protocol definitions.
+All policies (deterministic and semantic) implement these protocols,
+enabling uniform composition in the PolicyEngine.
+"""
+from __future__ import annotations
+from typing import Any, Protocol, runtime_checkable
+from forge.guard.types import ActionContext, PolicyDecision
+@runtime_checkable
+class Policy(Protocol):
+    """Interface all policies must implement.
+    Policies are evaluated against an ActionContext and return a PolicyDecision.
+    The `applies_to` method enables filtering/short-circuiting before evaluation.
+    The protocol is structural: a class satisfies it by providing these members,
+    without inheriting from it. Because it is ``@runtime_checkable``,
+    ``isinstance(obj, Policy)`` only checks that the members exist; it does not
+    validate their signatures or return types.
+    Example:
+        class MyPolicy:
+            @property
+            def policy_id(self) -> str:
+                return "my-bundle.my-rule"
+            def applies_to(self, context: ActionContext) -> bool:
+                return context.tool_name == "Write"
+            def evaluate(self, context: ActionContext) -> PolicyDecision:
+                # Check something and return decision
+                return PolicyDecision(decision="allow", policy_id=self.policy_id)
+    """
+    @property
+    def policy_id(self) -> str:
+        """Unique identifier for this policy (e.g., 'tdd.tests-before-impl')."""
+        ...
+    @property
+    def description(self) -> str:
+        """Human-readable description of what this policy enforces."""
+        ...
+    def applies_to(self, context: ActionContext) -> bool:
+        """Return True if this policy should evaluate the given action.
+        Used for filtering/throttling before full evaluation. Policies that
+        don't apply to the action should return False to skip evaluation.
+        """
+        ...
+    def evaluate(self, context: ActionContext) -> PolicyDecision:
+        """Evaluate the action and return a decision.
+        For deterministic policies: synchronous, fast.
+        For semantic policies: may invoke LLM (should be throttled).
+        """
+        ...
+@runtime_checkable
+class StatefulPolicy(Policy, Protocol):
+    """Protocol for policies that track state across actions.
+    Stateful policies (e.g., TDD's "tests touched before impl") need to
+    persist state across hook invocations. Since hooks are short-lived
+    processes, state is persisted to the session manifest.
+    The PolicyEngine calls get_state() after evaluation to persist state,
+    and set_state() at the start to restore it.
+    Extends Policy, so implementers provide the Policy members as well as
+    get_state()/set_state().
+    Example:
+        class TDDEnforcementPolicy:
+            def __init__(self):
+                self._tests_touched: set[str] = set()
+            def get_state(self) -> dict[str, Any]:
+                return {"tests_touched": list(self._tests_touched)}
+            def set_state(self, state: dict[str, Any]) -> None:
+                self._tests_touched = set(state.get("tests_touched", []))
+    """
+    def get_state(self) -> dict[str, Any]:
+        """Return current policy state for persistence.
+        NOTE(review): presumably the result must be serializable into the session
+        manifest (the example converts its set to a list) - confirm the format.
+        """
+        ...
+    def set_state(self, state: dict[str, Any]) -> None:
+        """Restore policy state from persisted data.
+        Args:
+            state: A dict previously produced by get_state().
+        """
+        ...

forge/guard/queries.py ADDED Viewed

@@ -0,0 +1,96 @@
+"""Read-only queries about supervisor relationships and session policy state.
+Used by both the CLI (``forge guard status``) and direct commands
+(``%guard status``) to display supervisor metadata and discover
+supervised sessions.
+"""
+from __future__ import annotations
+import re
+from forge.session import SessionStore
+from forge.session.effective import compute_effective_intent
+from forge.session.models import SessionState
+# Matches a hyphenated 8-4-4-4-12 hexadecimal UUID string, in either letter case.
+_UUID_RE = re.compile(r"^[0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{4}-[0-9a-fA-F]{12}$")
+def read_scoped_supervisor_target(
+    resume_id: str,
+    supervisor_forge_root: str | None,
+    fallback_forge_root: str | None,
+) -> SessionState | None:
+    """Return supervisor target state, preferring the supervisor's stored scope.
+    Handles both session-name and raw-UUID resume_id values. UUIDs are
+    resolved via the index's reverse lookup (find_session_by_uuid).
+    """
+    try:
+        from forge.session.manager import SessionManager
+        mgr = SessionManager()
+        fr = supervisor_forge_root or fallback_forge_root
+        # Try name-based lookup first (common case)
+        if not _UUID_RE.fullmatch(resume_id):
+            return mgr.get_session(resume_id, forge_root=fr)
+        # UUID: reverse lookup through the index
+        result = mgr.index_store.find_session_by_uuid(resume_id)
+        if result is None:
+            return None
+        display_name, entry_fr = result
+        return mgr.get_session(display_name, forge_root=entry_fr)
+    except Exception:
+        return None
+def find_sessions_supervised_by(
+    target_name: str,
+    target_uuid: str | None,
+    target_forge_root: str | None,
+) -> list[str]:
+    """Find repo-scoped sessions whose supervisor points to the target.
+    Matches on session name or Claude UUID. Verifies forge_root alignment
+    when set to prevent false matches from duplicate names across projects.
+    Best-effort: skips broken manifests, never crashes.
+    Cost: O(N) manifest reads where N = repo-scoped sessions. Acceptable
+    for typical workflows (2-10 sessions per repo).
+    """
+    try:
+        from forge.session.manager import SessionManager
+        mgr = SessionManager()
+        if not target_forge_root:
+            return []
+        project_root = mgr.resolve_project_root(target_forge_root)
+        siblings = mgr.list_sessions(project_root_filter=project_root)
+    except Exception:
+        return []
+    supervised: list[str] = []
+    for sib_name, sib_entry in siblings:
+        if sib_name == target_name:
+            continue
+        try:
+            sib_store = SessionStore(sib_entry.forge_root or sib_entry.worktree_path, sib_name)
+            sib_state = sib_store.read()
+            effective = compute_effective_intent(sib_state)
+            if not effective.policy or not effective.policy.supervisor:
+                continue
+            sup = effective.policy.supervisor
+            if not sup.resume_id:
+                continue
+            matched = sup.resume_id == target_name or (target_uuid and sup.resume_id == target_uuid)
+            if not matched:
+                continue
+            if sup.forge_root and target_forge_root and sup.forge_root != target_forge_root:
+                continue
+            supervised.append(sib_name)
+        except Exception:
+            continue
+    return supervised

forge/guard/semantic/__init__.py ADDED Viewed

@@ -0,0 +1,34 @@
+"""Semantic policies for the Policy Engine.
+Semantic policies use LLM-based evaluation for nuanced judgment calls
+that cannot be expressed as deterministic rules. The primary use case
+is the Supervisor pattern:
+1. Planning session creates and approves a plan (ExitPlanMode)
+2. Session is forked and promoted to supervisor role
+3. Executor actions are validated against the plan by the supervisor
+4. Supervisor returns structured verdicts (aligned/divergent + confidence)
+Throttling and caching prevent excessive LLM calls:
+- Cache key: sha256(tool_name + file_path + content_hash)[:16]
+- Cached verdicts reused within throttle_seconds window
+- Fail-open on timeout/error (configurable)
+"""
+from forge.guard.semantic.supervisor import (
+    SemanticSupervisorPolicy,
+    invoke_supervisor,
+)
+from forge.guard.semantic.verdict import (
+    SupervisorVerdict,
+    parse_supervisor_verdict,
+    verdict_to_decision,
+)
+# Public names of this package, re-exported from the supervisor and verdict modules.
+__all__ = [
+    "SemanticSupervisorPolicy",
+    "SupervisorVerdict",
+    "invoke_supervisor",
+    "parse_supervisor_verdict",
+    "verdict_to_decision",
+]

forge/guard/semantic/promotion.py ADDED Viewed

@@ -0,0 +1,18 @@
+"""Supervisor promotion flow (deferred).
+The full "CLI-Fork Supervision" pattern from design.md §4.1.2 involves:
+1. Forking the planning session via SessionManager
+2. Establishing supervisor session UUID via claude --fork-session
+3. Recording supervisor configuration in the executor session
+The --fork-session flag is available in Claude Code v2.1.77 and later. The automated
+promotion flow (creating a dedicated supervisor session) is not yet implemented.
+Preferred approach (available now):
+    forge session fork planner --name executor --supervise   # At fork time
+    forge guard supervise planner                            # On existing session
+    %guard supervise planner                                 # In-session
+Manual approach (still works):
+    forge session set policy.supervisor.resume_id <name-or-uuid>
+"""