npm - @kontourai/flow-agents - Versions diffs - 0.1.2 → 0.3.0 - Mend

@kontourai/flow-agents 0.1.2 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (117) hide show

package/.github/dependabot.yml +23 -0
package/.github/workflows/release-please.yml +31 -0
package/.github/workflows/runtime-compat.yml +118 -0
package/CHANGELOG.md +46 -0
package/CONTRIBUTING.md +4 -0
package/README.md +80 -18
package/build/src/cli/flow-kit.js +9 -4
package/build/src/cli/init.js +215 -5
package/build/src/cli/runtime-adapter.js +9 -5
package/build/src/cli/telemetry-doctor.js +4 -1
package/build/src/cli/utterance-check.js +65 -1
package/build/src/runtime-adapters.js +34 -0
package/build/src/tools/build-universal-bundles.js +285 -0
package/build/src/tools/filter-installed-packs.js +3 -0
package/build/src/tools/validate-source-tree.js +5 -1
package/console.telemetry.json +115 -20
package/context/scripts/telemetry/lib/config.sh +5 -1
package/context/settings/flow-agents-settings.json +7 -0
package/docs/_layouts/default.html +2 -0
package/docs/context-map.md +1 -0
package/docs/index.md +53 -4
package/docs/integrations/conformance.md +246 -0
package/docs/integrations/framework-adapter.md +275 -0
package/docs/integrations/harness-install.md +213 -0
package/docs/integrations/index.md +58 -0
package/docs/integrations/knowledge-kit-live.md +211 -0
package/docs/kit-authoring-guide.md +169 -0
package/docs/north-star.md +2 -2
package/docs/spec/runtime-hook-surface.md +525 -0
package/docs/survey-utterance-check.md +211 -94
package/docs/vision.md +45 -0
package/evals/acceptance/run.sh +13 -2
package/evals/acceptance/test_knowledge_kit_live.sh +221 -0
package/evals/acceptance/test_opencode_harness.sh +121 -0
package/evals/acceptance/test_pi_harness.sh +113 -0
package/evals/integration/test_bundle_install.sh +226 -1
package/evals/integration/test_bundle_lifecycle.sh +641 -0
package/evals/integration/test_runtime_adapter_activation.sh +113 -1
package/evals/integration/test_utterance_check.sh +291 -44
package/evals/run.sh +2 -0
package/evals/static/test_universal_bundles.sh +137 -2
package/integrations/strands/README.md +256 -0
package/integrations/strands/example.py +74 -0
package/integrations/strands/examples/knowledge_kit_live.py +461 -0
package/integrations/strands/flow_agents_strands/__init__.py +27 -0
package/integrations/strands/flow_agents_strands/hooks.py +194 -0
package/integrations/strands/flow_agents_strands/policy.py +348 -0
package/integrations/strands/flow_agents_strands/steering.py +225 -0
package/integrations/strands/flow_agents_strands/telemetry.py +238 -0
package/integrations/strands/pyproject.toml +38 -0
package/integrations/strands/tests/__init__.py +0 -0
package/integrations/strands/tests/test_hooks.py +392 -0
package/integrations/strands/tests/test_policy.py +315 -0
package/integrations/strands/tests/test_telemetry.py +184 -0
package/integrations/strands-ts/README.md +224 -0
package/integrations/strands-ts/bin/conformance-shim.mjs +257 -0
package/integrations/strands-ts/package.json +53 -0
package/integrations/strands-ts/src/hooks.ts +312 -0
package/integrations/strands-ts/src/index.ts +22 -0
package/integrations/strands-ts/src/policy.ts +345 -0
package/integrations/strands-ts/src/telemetry.ts +251 -0
package/integrations/strands-ts/test/test-policy.ts +322 -0
package/integrations/strands-ts/test/test-steering.ts +159 -0
package/integrations/strands-ts/test/test-telemetry.ts +226 -0
package/integrations/strands-ts/tsconfig.json +20 -0
package/kits/catalog.json +6 -0
package/kits/knowledge/adapters/default-store/index.js +821 -0
package/kits/knowledge/adapters/flow-runner/index.js +1179 -0
package/kits/knowledge/adapters/flow-runner/telemetry.js +174 -0
package/kits/knowledge/docs/README.md +135 -0
package/kits/knowledge/docs/store-contract.md +526 -0
package/kits/knowledge/evals/consolidation/suite.test.js +1234 -0
package/kits/knowledge/evals/contract-suite/suite.test.js +670 -0
package/kits/knowledge/evals/ingest-compile/suite.test.js +574 -0
package/kits/knowledge/evals/synthesis/suite.test.js +909 -0
package/kits/knowledge/flows/compile.flow.json +60 -0
package/kits/knowledge/flows/consolidate.flow.json +77 -0
package/kits/knowledge/flows/ingest.flow.json +60 -0
package/kits/knowledge/flows/store-contract.flow.json +48 -0
package/kits/knowledge/flows/synthesize.flow.json +77 -0
package/kits/knowledge/kit.json +78 -0
package/package.json +7 -2
package/packaging/conformance/README.md +142 -0
package/packaging/conformance/fixtures/config-protection--allow-no-path.json +18 -0
package/packaging/conformance/fixtures/config-protection--allow-safe-file.json +20 -0
package/packaging/conformance/fixtures/config-protection--block-biome.json +20 -0
package/packaging/conformance/fixtures/config-protection--block-eslintrc.json +20 -0
package/packaging/conformance/fixtures/quality-gate--allow-no-path.json +17 -0
package/packaging/conformance/fixtures/quality-gate--allow-nonexistent-file.json +19 -0
package/packaging/conformance/fixtures/stop-goal-fit--allow-clean-cwd.json +17 -0
package/packaging/conformance/fixtures/stop-goal-fit--block-strict-mode.json +23 -0
package/packaging/conformance/fixtures/stop-goal-fit--warn-active-delivery.json +21 -0
package/packaging/conformance/fixtures/workflow-steering--allow-no-state.json +16 -0
package/packaging/conformance/fixtures/workflow-steering--inject-active-state.json +29 -0
package/packaging/conformance/fixtures/workflow-steering--inject-subagent-steering.json +25 -0
package/packaging/conformance/package.json +4 -0
package/packaging/conformance/run-conformance.js +322 -0
package/packaging/manifest.json +59 -0
package/schemas/flow-agents-settings.schema.json +48 -0
package/scripts/README.md +4 -0
package/scripts/dogfood.js +16 -0
package/scripts/hooks/opencode-hook-adapter.js +123 -0
package/scripts/hooks/opencode-telemetry-hook.js +101 -0
package/scripts/hooks/pi-hook-adapter.js +123 -0
package/scripts/hooks/pi-telemetry-hook.js +105 -0
package/scripts/hooks/run-hook.js +8 -0
package/scripts/hooks/utterance-check.js +124 -22
package/scripts/telemetry/lib/config.sh +5 -1
package/src/cli/flow-kit.ts +10 -4
package/src/cli/init.ts +219 -6
package/src/cli/runtime-adapter.ts +10 -5
package/src/cli/telemetry-doctor.ts +4 -1
package/src/cli/utterance-check.ts +71 -1
package/src/runtime-adapters.ts +35 -0
package/src/tools/build-universal-bundles.ts +283 -0
package/src/tools/filter-installed-packs.ts +3 -0
package/src/tools/validate-source-tree.ts +5 -1

package/docs/survey-utterance-check.md CHANGED Viewed

@@ -4,72 +4,206 @@ title: Survey Utterance Check Integration
 # Survey Utterance Check Integration
-Flow Agents can optionally check agent utterances for evidence coverage using `@kontourai/survey`. This integration is disabled by default and intentionally optional — ordinary Flow Agents workflows do not require Survey.
+When an agent says something factual — "test coverage is 92%", "the API is backward-compatible", "no breaking changes in this release" — that claim either has evidence behind it or it doesn't. The utterance check feature bridges Flow Agents hooks to `@kontourai/survey` so that every factual statement in an agent response is compared against a trust bundle and tagged with a badge. Statements with no backing evidence are flagged inline so the agent can acknowledge the gap rather than assert silently.
-The guiding rule mirrors the Veritas boundary: Flow Agents owns the hook wiring and badge guidance format; Survey owns the extraction, claim resolution, and trust report semantics.
+This document explains how to enable and configure the feature, what the workflow looks like end to end, and what to watch out for.
-## Background: ADR 0003 §9
+---
+## What actually happens
+Here is a concrete walkthrough from agent response to badge guidance:
+```
+Agent says: "The test coverage for auth-service is 92%.
+             All critical paths have been verified."
+Flow Agents hook (PostToolUse):
+  1. Captures the agent response text from the PostToolUse event.
+  2. Invokes the utterance-check CLI with the response text and your trust bundle.
+@kontourai/survey (inside the CLI):
+  3. Extractor splits the response into factual statements:
+       - "test coverage for auth-service is 92%"
+       - "All critical paths have been verified"
+  4. Each statement is resolved against the trust bundle.
+  5. Neither statement has a matching verified claim → both resolve as "unsupported".
+Flow Agents hook injects guidance into the agent context:
+  UTTERANCE CHECK: 2 statement(s) in this response lack evidence coverage.
+  Summary: unsupported:2
+    - [unsupported] "test coverage for auth-service is 92%"
+    - [unsupported] "All critical paths have been verified"
+  Evidence note: unsupported = no matching claim in the trust bundle; ...
+```
+The agent sees honest gap disclosure rather than silent pass-through. It can then cite sources, note the gap explicitly, or record a coverage claim via `@kontourai/survey`.
+---
+## Deciding between report and strict mode
+The hook has two modes:
+| Mode | Effect |
+|------|--------|
+| `report` (default) | Appends badge guidance to the agent context. Never blocks. Agent decides next step. |
+| `strict` | If any statement is `unsupported`, `disputed`, or `rejected`, the hook exits 2, which routes the Stop event back to the agent for revision. |
+Use **report** when you want visibility without gate behavior — good for exploratory sessions, onboarding, or repos where the trust bundle is still being built out. Use **strict** when you want the agent to revise or cite sources before completing a turn — appropriate for regulated workflows, production deployments, or repos with a well-populated bundle.
+The empty-bundle caveat: if you enable the hook without a `bundlePath`, every factual statement the extractor finds will resolve as `unsupported` because there are no claims to match against. In strict mode this means every response with factual statements will be blocked. Make sure you either provide a `bundlePath` or use report mode until you have a bundle.
+---
+## The trust bundle
+The trust bundle is a JSON file with a `claims` array. It is the authoritative record of what is considered evidenced for your codebase. Three practical sources:
+- **Veritas-generated bundle**: if your repo uses `@veritas/veritas`, it can produce a `trust.bundle.json` from `.veritas/evidence`. Point `bundlePath` at that output.
+- **Surface report**: the `@kontourai/surface` package can generate a trust bundle from a surface verification run. If your repo runs surface checks, look for the generated bundle in the surface output directory (e.g. `dist/trust-bundle.json` or a named artifact).
+- **Hand-authored bundle**: a minimal bundle is just `{ "claims": [] }`. Add claims incrementally as you record evidence.
+An empty or missing bundle means everything is unsupported. That is not necessarily wrong — it is an honest starting state — but it is only useful in report mode.
+---
+## Choosing an extractor
-ADR 0003 §9 designates agent-utterance extraction as a **Survey producer profile** — Survey pointed at agent prose instead of web sources. Each factual statement in agent output is extracted as a candidate claim and run through Survey's Inquiry pipeline. Flow Agents supplies the enforcement point (hooks) that ADR 0003 calls out. This integration is step 6 of the ADR sequencing and depends on the Inquiry pipeline already existing in Survey.
+The extractor is responsible for splitting the agent utterance into discrete factual statements. Two are available:
-## User-Facing Story
+| Extractor | How it works | Requirements |
+|-----------|-------------|--------------|
+| `reference` (default) | Pattern-based heuristics. Fast, no API call, no key needed. Works offline. Lower recall on complex prose. | `@kontourai/survey` installed |
+| `anthropic` | Model-backed extraction via `@kontourai/survey/anthropic`. Higher recall, understands context and nuance, can split compound claims. | `@kontourai/survey` + `@anthropic-ai/sdk` installed, `ANTHROPIC_API_KEY` set |
-```text
-Agent: "The test coverage for auth-service is 92%. All critical paths have been verified."
+For most exploratory use, `reference` is sufficient. Switch to `anthropic` when you find the reference extractor is missing statements that matter for your domain.
-Flow Agents (hook active):
-1. Captures the agent's response text from the PostToolUse event.
-2. Invokes the utterance-check CLI adapter with the response text.
-3. @kontourai/survey extracts factual statements: coverage:92%, paths:verified.
-4. Survey resolves each statement against the configured trust bundle.
-5. Statements without matching claims resolve as "unsupported".
-6. Flow Agents injects badge guidance into the agent context:
-   UTTERANCE CHECK: 2 statement(s) lack evidence coverage.
-   - [unsupported] "test coverage for auth-service is 92%"
-   - [unsupported] "All critical paths have been verified"
+The `anthropic` extractor fails open: if `ANTHROPIC_API_KEY` is missing or `@anthropic-ai/sdk` is not installed, the CLI emits `status: "not_configured"` (with a clear explanation in `summary`) and exits 0. The hook treats this as a silent pass-through. You will see a message in stderr explaining what is missing, but the hook will not block.
+---
+## Per-repo configuration
+The canonical way to enable utterance checking is a `context/settings/flow-agents-settings.json` file in the consumer repo. This is a peer to `context/settings/backlog-provider-settings.json` — the same directory, the same convention.
+**Minimal example (report mode, reference extractor):**
+```json
+{
+  "$schema": "../../node_modules/@kontourai/flow-agents/schemas/flow-agents-settings.schema.json",
+  "schema_version": "1.0",
+  "utteranceCheck": {
+    "enabled": true,
+    "mode": "report",
+    "extractor": "reference"
+  }
+}
 ```
-The agent sees honest gap disclosure rather than silent pass-through.
+**With a trust bundle and anthropic extractor:**
-## Ownership Split
+```json
+{
+  "$schema": "../../node_modules/@kontourai/flow-agents/schemas/flow-agents-settings.schema.json",
+  "schema_version": "1.0",
+  "utteranceCheck": {
+    "enabled": true,
+    "mode": "report",
+    "extractor": "anthropic",
+    "bundlePath": ".veritas/trust.bundle.json",
+    "model": "claude-haiku-4-5",
+    "agentId": "surface-agent"
+  }
+}
+```
-| Area | Flow Agents Owns | Survey Owns |
-| --- | --- | --- |
-| Hook wiring | PostToolUse/Stop hook, badge guidance format, enable/disable flags | None |
-| Extraction | Invoking the CLI adapter | Statement extraction, extractor interface |
-| Resolution | Passing the trust bundle path | Inquiry pipeline, claim resolution |
-| Output | Guidance text injected into agent context | UtteranceTrustReport with per-statement badges |
-| Packaging | Optional hook activation, CLI adapter | @kontourai/survey npm package |
+**Strict mode:**
-Flow Agents does not own trust claim models, inquiry semantics, or extractor implementations. Survey's `referenceUtteranceExtractor` is the default extractor; production use should inject `createAnthropicUtteranceExtractor` from `@kontourai/survey/anthropic` for model-backed extraction.
+```json
+{
+  "$schema": "../../node_modules/@kontourai/flow-agents/schemas/flow-agents-settings.schema.json",
+  "schema_version": "1.0",
+  "utteranceCheck": {
+    "enabled": true,
+    "mode": "strict",
+    "extractor": "anthropic",
+    "bundlePath": "dist/trust-bundle.json"
+  }
+}
+```
-## Enabling the Hook
+Config field reference:
-The hook is disabled by default. Set environment variables before starting the agent session:
+| Field | Type | Default | Description |
+|-------|------|---------|-------------|
+| `enabled` | boolean | `false` | Whether utterance checking is active for this repo. |
+| `mode` | `"report"` \| `"strict"` | `"report"` | How to handle concerning badges. See above. |
+| `extractor` | `"reference"` \| `"anthropic"` | `"reference"` | Extractor to use. See above. |
+| `bundlePath` | string | — | Repo-relative or absolute path to the trust bundle JSON. Omit to use an empty bundle. |
+| `model` | string | — | Model for the anthropic extractor. Only used when `extractor` is `"anthropic"`. |
+| `agentId` | string | `"flow-agents-hook"` | Agent identifier for provenance in the trust report. |
-```bash
-export FLOW_AGENTS_UTTERANCE_CHECK_ENABLED=true
+---
+## Environment variable overrides
+For one-off sessions or CI pipelines, you can override the config with environment variables. These take precedence over `flow-agents-settings.json`.
+| Variable | Effect |
+|----------|--------|
+| `FLOW_AGENTS_UTTERANCE_CHECK_ENABLED=true\|false` | Force the hook on or off, overriding the config `enabled` field. |
+| `FLOW_AGENTS_UTTERANCE_CHECK_STRICT=true` | Force strict mode. |
+| `FLOW_AGENTS_UTTERANCE_CHECK_BUNDLE_PATH=/path/to/bundle.json` | Override `bundlePath`. |
+| `FLOW_AGENTS_UTTERANCE_CHECK_AGENT_ID=my-agent` | Override `agentId`. |
+| `FLOW_AGENTS_UTTERANCE_CHECK_EXTRACTOR=anthropic\|reference` | Override `extractor`. |
+**When the config file is absent and no env vars are set**, the hook is disabled. This is the safe default — existing repos are not affected until they opt in.
+---
+## Registering the hook
+Add the utterance check to a Claude Code session via `.claude/settings.json`:
-# Optional: path to a trust bundle JSON file for claim resolution
-export FLOW_AGENTS_UTTERANCE_CHECK_BUNDLE_PATH=/path/to/trust-bundle.json
+```json
+{
+  "hooks": {
+    "PostToolUse": [
+      {
+        "matcher": ".*",
+        "hooks": [
+          {
+            "type": "command",
+            "command": "node scripts/hooks/claude-hook-adapter.js PostToolUse post:utterance-check utterance-check.js standard,strict"
+          }
+        ]
+      }
+    ]
+  }
+}
+```
-# Optional: agent identifier for provenance
-export FLOW_AGENTS_UTTERANCE_CHECK_AGENT_ID=my-codex-session
+Or run the hook directly (Kiro/Codex convention, exit 2 blocks):
-# Optional: strict mode — blocks Stop when concerning badges are present
-export FLOW_AGENTS_UTTERANCE_CHECK_STRICT=true
+```bash
+node scripts/hooks/run-hook.js post:utterance-check utterance-check.js standard,strict
 ```
-The hook runs through the standard `run-hook.js` runner and respects `SA_DISABLED_HOOKS` and `SA_HOOK_PROFILE`.
+The hook reads `context/settings/flow-agents-settings.json` relative to the repo root it detects from the hook event `cwd` or `process.cwd()`. No configuration is needed in the hook command itself.
+---
-## CLI Adapter Contract
+## CLI reference
 The utterance check CLI is available as:
 ```bash
 node build/src/cli.js utterance-check check \
   --utterance "The coverage is 92% and all tests pass." \
-  --bundle-path .surface/trust-bundle.json \
+  --bundle-path .veritas/trust.bundle.json \
+  --extractor anthropic \
+  --model claude-haiku-4-5 \
   --agent-id my-session
 ```
@@ -79,6 +213,8 @@ Options:
   --utterance TEXT      Utterance text to check (required unless --not-configured).
   --bundle-path FILE    Trust bundle JSON file. Omit for an empty bundle (all unsupported).
   --agent-id ID         Agent identifier for provenance (default: flow-agents-utterance-check).
+  --extractor NAME      'reference' (default) or 'anthropic'.
+  --model MODEL         Model for the anthropic extractor (e.g. claude-haiku-4-5).
   --not-configured      Skip survey call; output not_configured without error.
   --strict              Exit non-zero when any badge is disputed, rejected, or unsupported.
   --help                Show this help.
@@ -109,83 +245,64 @@ The CLI outputs a JSON report to stdout:
 Badge values:
 | Badge | Meaning |
-| --- | --- |
-| `verified` | Matched a claim with verified status |
-| `assumed` | Matched a claim with assumed status |
-| `stale` | Matched a claim that is stale |
-| `disputed` | Matched a claim with conflicting evidence |
-| `rejected` | Matched a claim that was rejected |
-| `unsupported` | No matching claim in the trust bundle |
+|-------|---------|
+| `verified` | Matched a claim with verified status. |
+| `assumed` | Matched a claim with assumed status. |
+| `stale` | Matched a claim that is stale. |
+| `disputed` | Matched a claim with conflicting evidence. |
+| `rejected` | Matched a claim that was rejected. |
+| `unsupported` | No matching claim in the trust bundle. |
-Exit codes: `0` = pass, `1` = survey unavailable, `2` = strict mode with concerning badges, `3` = usage error.
+Exit codes: `0` = pass (also returned when the anthropic extractor is `not_configured`, because it fails open), `1` = survey unavailable, `2` = strict mode with concerning badges, `3` = usage error.
-When `@kontourai/survey` is not installed, the CLI outputs `status: "not_configured"` and exits `1`. The hook treats `not_configured` as a silent pass-through.
+---
-## Registering the Hook
+## Installing dependencies
-Add the utterance check to a Claude Code session via `.claude/settings.json`:
-```json
-{
-  "hooks": {
-    "PostToolUse": [
-      {
-        "matcher": ".*",
-        "hooks": [
-          {
-            "type": "command",
-            "command": "node scripts/hooks/claude-hook-adapter.js PostToolUse post:utterance-check utterance-check.js standard,strict"
-          }
-        ]
-      }
-    ]
-  }
-}
-```
-Or run the hook directly (Kiro/Codex convention, exit 2 blocks):
+The CLI adapter uses dynamic imports so flow-agents itself does not list `@kontourai/survey` as a dependency. Install in the target workspace:
 ```bash
-node scripts/hooks/run-hook.js post:utterance-check utterance-check.js standard,strict
-```
+# Reference extractor only (default)
+npm install @kontourai/survey
-## Installing @kontourai/survey
+# Anthropic extractor (model-backed)
+npm install @kontourai/survey @anthropic-ai/sdk
+```
-The CLI adapter uses a dynamic import so flow-agents itself does not list `@kontourai/survey` as a dependency. Install it in the target workspace:
+---
-```bash
-npm install @kontourai/survey
-```
+## Ownership split
-For model-backed extraction (production-quality, requires `@anthropic-ai/sdk`):
+| Area | Flow Agents owns | Survey owns |
+|------|-----------------|-------------|
+| Hook wiring | PostToolUse/Stop hook, badge guidance format, config loading | None |
+| Extraction | Invoking the CLI, extractor selection, fail-open handling | Statement extraction, extractor interface, anthropic integration |
+| Resolution | Passing the trust bundle path | Inquiry pipeline, claim resolution |
+| Output | Guidance text injected into agent context | UtteranceTrustReport with per-statement badges |
+| Config | Per-repo `flow-agents-settings.json`, env var overrides | None |
-```bash
-npm install @kontourai/survey @anthropic-ai/sdk
-```
+Flow Agents does not own trust claim models, inquiry semantics, or extractor implementations.
-Then inject the Anthropic extractor by extending the CLI adapter or creating a wrapper script that calls `surveyAgentUtterance` with `createAnthropicUtteranceExtractor`.
+---
-## Non-Goals
+## Non-goals
 - Do not make `@kontourai/survey` a mandatory dependency of flow-agents.
 - Do not copy Survey's extraction or inquiry schemas into flow-agents.
 - Do not auto-register the hook in the default pack; it is opt-in only.
-- Do not make the hook blocking without explicit `--strict` / `FLOW_AGENTS_UTTERANCE_CHECK_STRICT=true`.
+- Do not make the hook blocking without explicit `mode: "strict"` or the env override.
 - Do not silently decide anything. The hook injects guidance; the agent decides next steps.
-## Current Integration Shape
+---
-The integration delivers:
+## Current integration shape
-1. `src/cli/utterance-check.ts` — TypeScript CLI adapter. Accepts utterance text, optional bundle path, and agent ID. Dynamically imports `@kontourai/survey`. Outputs a JSON badge report to stdout and human-readable guidance to stderr. Mirrors the `veritas-governance` adapter pattern.
+The integration delivers:
-2. `scripts/hooks/utterance-check.js` — CJS hook script. PostToolUse/Stop, non-blocking by default. Reads agent output text from the hook event, invokes the CLI adapter when `FLOW_AGENTS_UTTERANCE_CHECK_ENABLED=true`, and injects badge guidance into the agent context. Always fails open.
+1. `src/cli/utterance-check.ts` — TypeScript CLI adapter. Accepts utterance text, optional bundle path, agent ID, extractor name, and model. Dynamically imports `@kontourai/survey` (and optionally `@kontourai/survey/anthropic`). Outputs a JSON badge report to stdout and human-readable guidance to stderr.
-The forward path (out of scope for this slice):
+2. `scripts/hooks/utterance-check.js` — CJS hook script. PostToolUse/Stop, non-blocking in report mode. Reads per-repo policy from `context/settings/flow-agents-settings.json`, uses env vars as overrides. Resolves repo root from hook event `cwd`. Always fails open.
-- Register the hook in a dedicated `survey` pack for opt-in activation.
-- Support injecting the Anthropic extractor via `FLOW_AGENTS_UTTERANCE_CHECK_EXTRACTOR=anthropic`.
-- Surface badge results as evidence sidecar entries (linking utterance coverage to workflow evidence).
-- Auto-propose new claim mappings from unsupported statements via the Survey mapping proposer.
+3. `schemas/flow-agents-settings.schema.json` — JSON Schema for the per-repo settings file.
 Survey source and API details: https://github.com/kontourai/survey

package/docs/vision.md ADDED Viewed

@@ -0,0 +1,45 @@
+---
+title: Flow Agents Vision and Direction
+---
+# Vision and Direction
+This page captures where Flow Agents is headed, clearly labeled as direction rather than shipped capability. Shipped artifacts are documented in the [Runtime Hook Surface spec](spec/runtime-hook-surface.html) and the [Runtime and support matrix](index.html#runtime-and-support-matrix) on the overview page.
+---
+## What ships today
+Flow Agents currently ships as a harness adapter layer: six core harness runtimes (base, Claude Code, Codex, Kiro, opencode, pi) receive bundled agents, skills, context, scripts, and hook wiring through the `npx @kontourai/flow-agents init` installer. The four canonical policy classes — workflow steering, quality gate, stop-goal-fit, and config protection — are implemented as canonical scripts under `scripts/hooks/` and wired to each host's native event surface at conformance levels L0, L1, or L2.
+One official framework adapter spike exists: `integrations/strands/` is a Python `HookProvider` for AWS Strands that emits the canonical telemetry taxonomy and enforces config protection via tool-call cancellation. It is preview-status with documented limitations.
+---
+## Direction
+The items below are direction, not committed delivery dates. They record the intended shape of where this work goes.
+### Kits beyond coding
+The process-discipline layer is not coding-specific. The canonical policies, sidecar state model, and evidence taxonomy are defined without reference to source code, build systems, or CI. The direction is deployable agentic workflows — Flow Kits for domains beyond software delivery: knowledge work, research, operations, sales contexts, and personal productivity. The [North Star](north-star.html) records the broader scope.
+### TypeScript framework adapters
+The Strands Python spike proves the thesis: the policy engine is not harness-specific. The direction is TypeScript framework adapters that consume the canonical policy engine natively via the published `@kontourai/flow-agents` npm package, rather than shelling out to bash scripts. Candidate frameworks include LangGraph, VoltAgent, and the OpenAI Agents SDK. The [Runtime Hook Surface spec](spec/runtime-hook-surface.html) documents the adapter contract and the framework event mapping tables for each.
+### Kontour Console as the unifying telemetry surface
+Today, telemetry writes to local JSONL files by default, with optional sinks to a local or hosted Kontour Console. The direction is Kontour Console as the unifying surface that spans both harness sessions (Claude Code, Codex, Kiro, opencode, pi) and deployed framework agents (Strands, LangGraph, etc.) — so the same workflow state, evidence, and hook telemetry are visible regardless of which runtime executed the work.
+### Conformance kit for community adapters
+The runtime matrix includes a "conformance-certified" tier for community and third-party adapters that self-certify at a declared L0, L1, or L2 level. A conformance kit — a test suite and declaration format — is in development. It does not yet ship.
+---
+## What this is not
+Flow Agents is not building another agent runtime, coding assistant, workflow engine, or orchestration control plane. The model, the runtime, the IDE, the agent UI, the workflow engine, and the repo governance engine are all deliberately out of scope. Flow Agents owns the glue: discovery, just-in-time guidance, scoped delegation, Flow-backed workflow state inside agent runtimes, evidence-backed completion, and feedback loops.
+See the [North Star](north-star.html) for the full design principles and the [Developer Architecture](developer-architecture.html) for the product boundary map.

package/evals/acceptance/run.sh CHANGED Viewed

@@ -11,19 +11,30 @@ run_one() {
   bash "$ACCEPT_DIR/test_${name}_harness.sh"
 }
+run_knowledge_kit_live() {
+  echo ""
+  bash "$ACCEPT_DIR/test_knowledge_kit_live.sh"
+}
 case "$TARGET" in
-  kiro|claude|codex)
+  kiro|claude|codex|opencode|pi)
     run_one "$TARGET"
     ;;
+  knowledge-kit-live)
+    run_knowledge_kit_live
+    ;;
   all)
     status=0
     run_one kiro || status=1
     run_one claude || status=1
     run_one codex || status=1
+    run_one opencode || status=1
+    run_one pi || status=1
+    run_knowledge_kit_live || status=1
     exit "$status"
     ;;
   *)
-    echo "Usage: bash evals/acceptance/run.sh [all|kiro|claude|codex]"
+    echo "Usage: bash evals/acceptance/run.sh [all|kiro|claude|codex|opencode|pi|knowledge-kit-live]"
     exit 1
     ;;
 esac