npm - @kontourai/flow-agents - Versions diffs - 1.3.0 → 2.0.0 - Mend

@kontourai/flow-agents 1.3.0 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (214) hide show

package/.github/CODEOWNERS +29 -0
package/.github/actions/trust-verify/action.yml +145 -0
package/.github/workflows/ci.yml +11 -4
package/.github/workflows/kit-gates-demo.yml +2 -2
package/.github/workflows/publish-npm.yml +10 -2
package/.github/workflows/release-please.yml +1 -1
package/.github/workflows/trust-reconcile.yml +113 -0
package/AGENTS.md +13 -0
package/CHANGELOG.md +103 -0
package/CONTRIBUTING.md +4 -4
package/README.md +1 -0
package/agents/tool-planner.json +1 -1
package/build/src/cli/console-learning-projection.d.ts +1 -0
package/build/src/cli/effective-backlog-settings.d.ts +1 -0
package/build/src/cli/fixture-retirement-audit.d.ts +2 -0
package/build/src/cli/init.d.ts +17 -0
package/build/src/cli/init.js +242 -20
package/build/src/cli/kit.d.ts +1 -0
package/build/src/cli/promote-workflow-artifact.d.ts +1 -0
package/build/src/cli/publish-change-helper.d.ts +1 -0
package/build/src/cli/pull-work-provider.d.ts +1 -0
package/build/src/cli/runtime-adapter.d.ts +1 -0
package/build/src/cli/telemetry-doctor.d.ts +1 -0
package/build/src/cli/usage-feedback.d.ts +1 -0
package/build/src/cli/utterance-check.d.ts +1 -0
package/build/src/cli/validate-hook-influence.d.ts +1 -0
package/build/src/cli/validate-source-tree.d.ts +1 -0
package/build/src/cli/validate-workflow-artifacts.d.ts +2 -0
package/build/src/cli/validate-workflow-artifacts.js +19 -2
package/build/src/cli/verify.d.ts +1 -0
package/build/src/cli/verify.js +90 -0
package/build/src/cli/veritas-governance.d.ts +1 -0
package/build/src/cli/workflow-artifact-cleanup-audit.d.ts +1 -0
package/build/src/cli/workflow-sidecar.d.ts +324 -0
package/build/src/cli/workflow-sidecar.js +1973 -90
package/build/src/cli.d.ts +2 -0
package/build/src/cli.js +2 -3
package/build/src/flow-kit/validate.d.ts +81 -0
package/build/src/index.d.ts +5 -0
package/build/src/index.js +36 -0
package/build/src/lib/args.d.ts +8 -0
package/build/src/lib/flow-resolver.d.ts +82 -0
package/build/src/lib/flow-resolver.js +237 -0
package/build/src/lib/fs.d.ts +7 -0
package/build/src/lib/workflow-learning-projection.d.ts +132 -0
package/build/src/runtime-adapters.d.ts +18 -0
package/build/src/tools/build-universal-bundles.d.ts +2 -0
package/build/src/tools/build-universal-bundles.js +34 -22
package/build/src/tools/common.d.ts +9 -0
package/build/src/tools/generate-context-map.d.ts +2 -0
package/build/src/tools/generate-context-map.js +3 -16
package/build/src/tools/validate-package.d.ts +2 -0
package/build/src/tools/validate-source-tree.d.ts +2 -0
package/build/src/tools/validate-source-tree.js +42 -162
package/context/contracts/artifact-contract.md +10 -0
package/context/contracts/delivery-contract.md +1 -0
package/context/contracts/review-contract.md +1 -0
package/context/contracts/verification-contract.md +2 -0
package/context/gate-awareness.md +39 -0
package/context/scripts/hooks/stop-goal-fit.js +632 -70
package/docs/adr/0001-flow-agents-consumes-flow.md +1 -1
package/docs/adr/0002-flow-kits-as-extension-unit.md +1 -1
package/docs/adr/0004-gates-expect-surface-claims.md +2 -0
package/docs/adr/0005-kubernetes-inspired-resource-contracts.md +2 -0
package/docs/adr/0007-skill-audit.md +1 -1
package/docs/adr/0009-canonical-hook-core-kit-boundary.md +95 -0
package/docs/adr/0010-workflow-trust-state-as-hachure-bundle.md +139 -0
package/docs/adr/0011-mcp-posture.md +100 -0
package/docs/adr/0012-agent-coordination-as-liveness-claims.md +119 -0
package/docs/adr/0013-context-lifecycle.md +151 -0
package/docs/adr/0014-core-vs-domain-kit-boundary.md +143 -0
package/docs/adr/0015-flow-flow-agents-boundary-reconciliation.md +120 -0
package/docs/adr/0016-three-hard-boundary-model.md +71 -0
package/docs/adr/0017-anti-gaming-trust-security-model.md +155 -0
package/docs/agent-system-guidebook.md +5 -12
package/docs/context-map.md +4 -10
package/docs/developer-architecture.md +14 -0
package/docs/index.md +3 -2
package/docs/integrations/framework-adapter.md +19 -6
package/docs/integrations/index.md +2 -2
package/docs/north-star.md +4 -4
package/docs/operating-layers.md +3 -3
package/docs/plans/adr-0010-phase2-gate-recompute.md +55 -0
package/docs/repository-structure.md +2 -2
package/docs/skills-map.md +1 -0
package/docs/spec/runtime-hook-surface.md +78 -10
package/docs/standards-register.md +3 -3
package/docs/survey-utterance-check.md +1 -1
package/docs/trust-anchor-adoption.md +197 -0
package/docs/verifiable-trust.md +95 -0
package/docs/veritas-integration.md +2 -2
package/docs/workflow-usage-guide.md +69 -0
package/evals/acceptance/DEMO-false-completion.md +144 -0
package/evals/acceptance/demo-cast.sh +92 -0
package/evals/acceptance/demo-false-completion.sh +72 -0
package/evals/acceptance/demo-real-evidence.sh +104 -0
package/evals/acceptance/demo.tape +29 -0
package/evals/acceptance/prove-capture-teeth-declared.sh +335 -0
package/evals/acceptance/prove-capture-teeth.sh +114 -0
package/evals/acceptance/prove-teeth.sh +105 -0
package/evals/ci/antigaming-suite.sh +54 -0
package/evals/ci/run-baseline.sh +2 -0
package/evals/fixtures/flow-kit-repository/invalid-missing-extension-asset/flows/review.flow.json +26 -0
package/evals/fixtures/flow-kit-repository/invalid-missing-extension-asset/kit.json +20 -0
package/evals/fixtures/flow-kit-repository/valid-unknown-extension/flows/review.flow.json +26 -0
package/evals/fixtures/flow-kit-repository/valid-unknown-extension/kit.json +18 -0
package/evals/integration/test_builder_step_producers.sh +379 -0
package/evals/integration/test_bundle_install.sh +35 -71
package/evals/integration/test_bundle_lifecycle.sh +39 -2
package/evals/integration/test_captured_fail_reconciliation.sh +820 -0
package/evals/integration/test_checkpoint_signing.sh +489 -0
package/evals/integration/test_claim_lookup.sh +352 -0
package/evals/integration/test_command_log_integrity.sh +275 -0
package/evals/integration/test_context_map.sh +0 -2
package/evals/integration/test_dual_emit_flow_step.sh +278 -0
package/evals/integration/test_enforcer_expects_driven.sh +281 -0
package/evals/integration/test_evidence_capture_hook.sh +185 -0
package/evals/integration/test_flow_kit_repository.sh +2 -0
package/evals/integration/test_flowdef_session_activation.sh +273 -0
package/evals/integration/test_flowdef_session_history_preservation.sh +250 -0
package/evals/integration/test_gate_bypass_chain.sh +448 -0
package/evals/integration/test_gate_lockdown.sh +1137 -0
package/evals/integration/test_gate_review_inquiry_records.sh +399 -0
package/evals/integration/test_goal_fit_escape_hatch.sh +73 -0
package/evals/integration/test_goal_fit_hook.sh +69 -4
package/evals/integration/test_goal_fit_rederive.sh +263 -0
package/evals/integration/test_hook_category_behaviors.sh +14 -0
package/evals/integration/test_install_merge.sh +1176 -0
package/evals/integration/test_mint_attestation.sh +373 -0
package/evals/integration/test_phase_map_and_gate_claim.sh +365 -0
package/evals/integration/test_publish_delivery.sh +269 -0
package/evals/integration/test_reconcile_soundness.sh +528 -0
package/evals/integration/test_resolvefirststep_security.sh +208 -0
package/evals/integration/test_session_resume_roundtrip.sh +286 -0
package/evals/integration/test_trust_checkpoint.sh +325 -0
package/evals/integration/test_trust_reconcile.sh +293 -0
package/evals/integration/test_verify_cli.sh +208 -0
package/evals/integration/test_workflow_sidecar_writer.sh +549 -34
package/evals/lib/node.sh +0 -6
package/evals/run.sh +47 -0
package/evals/static/test_library_exports.sh +85 -0
package/evals/static/test_universal_bundles.sh +15 -0
package/evals/static/test_workflow_skills.sh +6 -13
package/install.sh +0 -7
package/integrations/strands-ts/README.md +25 -15
package/integrations/veritas/flow-agents.adapter.json +1 -2
package/kits/builder/flows/build.flow.json +59 -12
package/kits/builder/kit.json +85 -15
package/kits/builder/skills/continue-work/SKILL.md +116 -0
package/kits/builder/skills/deliver/SKILL.md +36 -6
package/kits/builder/skills/design-probe/SKILL.md +28 -0
package/kits/builder/skills/execute-plan/SKILL.md +9 -1
package/kits/builder/skills/gate-review/SKILL.md +234 -0
package/kits/builder/skills/learning-review/SKILL.md +30 -0
package/kits/builder/skills/pickup-probe/SKILL.md +29 -0
package/kits/builder/skills/plan-work/SKILL.md +13 -1
package/kits/builder/skills/pull-work/SKILL.md +19 -0
package/kits/knowledge/adapters/default-store/index.js +38 -0
package/kits/knowledge/adapters/flow-runner/index.js +1620 -0
package/kits/knowledge/adapters/obsidian-store/index.js +36 -6
package/kits/knowledge/docs/store-contract.md +314 -0
package/kits/knowledge/evals/audit-freshness/suite.test.js +368 -0
package/kits/knowledge/evals/canonicalize-category/suite.test.js +383 -0
package/kits/knowledge/evals/contract-suite/suite.test.js +111 -0
package/kits/knowledge/evals/detect-contradictions/suite.test.js +324 -0
package/kits/knowledge/evals/entities/suite.test.js +40 -0
package/kits/knowledge/evals/glossary-sync/suite.test.js +416 -0
package/kits/knowledge/evals/hygiene-review/suite.test.js +396 -0
package/kits/knowledge/evals/retirement/suite.test.js +145 -0
package/kits/knowledge/flows/audit-freshness.flow.json +44 -0
package/kits/knowledge/flows/canonicalize-category.flow.json +44 -0
package/kits/knowledge/flows/detect-contradictions.flow.json +44 -0
package/kits/knowledge/flows/glossary-sync.flow.json +61 -0
package/kits/knowledge/flows/hygiene-review.flow.json +43 -0
package/kits/knowledge/kit.json +51 -1
package/package.json +13 -4
package/packaging/conformance/README.md +10 -2
package/packaging/conformance/fixtures/evidence-capture--allow-records-command.json +29 -0
package/packaging/conformance/fixtures/stop-goal-fit--block-bundle-disputed-claim.json +29 -0
package/packaging/conformance/fixtures/stop-goal-fit--block-capture-contradicts-claimed-pass.json +30 -0
package/packaging/conformance/fixtures/stop-goal-fit--block-mode.json +23 -0
package/packaging/conformance/fixtures/stop-goal-fit--off-mode.json +24 -0
package/packaging/conformance/fixtures/stop-goal-fit--warn-active-delivery.json +5 -2
package/packaging/conformance/fixtures/stop-goal-fit--warn-no-bundle.json +23 -0
package/packaging/conformance/fixtures/workflow-steering--reground-active-prompt.json +30 -0
package/packaging/conformance/fixtures/workflow-steering--reground-session-start.json +30 -0
package/packaging/conformance/run-conformance.js +1 -1
package/scripts/README.md +2 -1
package/scripts/build-universal-bundles.js +0 -1
package/scripts/ci/mint-attestation.js +221 -0
package/scripts/ci/trust-reconcile.js +545 -0
package/scripts/hooks/config-protection.js +423 -1
package/scripts/hooks/evidence-capture.js +348 -0
package/scripts/hooks/lib/liveness-read.js +113 -0
package/scripts/hooks/run-hook.js +6 -1
package/scripts/hooks/stop-goal-fit.js +1471 -79
package/scripts/hooks/workflow-steering.js +135 -5
package/scripts/install-codex-home.sh +39 -0
package/scripts/install-merge.js +330 -0
package/src/cli/init.ts +218 -20
package/src/cli/validate-workflow-artifacts.ts +18 -2
package/src/cli/verify.ts +100 -0
package/src/cli/workflow-sidecar.ts +2093 -84
package/src/cli.ts +2 -3
package/src/index.ts +53 -0
package/src/lib/flow-resolver.ts +284 -0
package/src/tools/build-universal-bundles.ts +34 -21
package/src/tools/generate-context-map.ts +3 -17
package/src/tools/validate-source-tree.ts +44 -104
package/tsconfig.json +1 -0
package/build/src/tools/filter-installed-packs.js +0 -135
package/packaging/packs.json +0 -49
package/scripts/filter-installed-packs.js +0 -2
package/src/tools/filter-installed-packs.ts +0 -132

package/kits/builder/skills/pickup-probe/SKILL.md CHANGED Viewed

@@ -84,6 +84,35 @@ Planning is ready only when:
 - The route reason and next action are recorded in an artifact that can be recovered without chat memory.
 If the gate fails, stop before `plan-work` and update the artifact with the blocker or decision gap.
+## Gate Claims: Record Pickup Probe Results
+When the Planning Gate passes, record the two gate claims for the Builder Kit `design-probe` step before handing off to `plan-work`. These satisfy the `builder.design-probe.pickup-readiness` and `builder.design-probe.decisions` gate expectations.
+**Claim 1 — Pickup readiness** (probe passed, goal fit and scope confirmed):
+```bash
+npm run workflow:sidecar -- record-gate-claim .flow-agents/<slug> \
+  --expectation pickup-probe-readiness \
+  --status pass \
+  --summary "Pickup probe passed: goal fit confirmed, blockers checked, dependencies reviewed, acceptance criteria verified." \
+  --evidence-ref-json '{"kind":"artifact","file":".flow-agents/<slug>/<slug>--pull-work.md","summary":"Pull-work artifact recording probe status, scope, and planning readiness."}'
+```
+**Claim 2 — Probe decisions captured** (decisions, accepted gaps, and planning readiness are recorded):
+```bash
+npm run workflow:sidecar -- record-gate-claim .flow-agents/<slug> \
+  --expectation probe-decisions-or-accepted-gaps \
+  --status pass \
+  --summary "Probe decisions recorded: <decision-count> decisions, <gap-count> accepted gaps. Planning readiness: <ready|accepted_gap_ready>." \
+  --evidence-ref-json '{"kind":"artifact","file":".flow-agents/<slug>/<slug>--pull-work.md","summary":"Pull-work artifact with decisions, accepted gaps, and planning handoff."}'
+```
+Record both claims together immediately when the gate passes. Use `--status fail` when the gate fails (unresolved blocker or decision gap). Use `--status not_verified` only when the session has no active flow step.
+When the gate fails, record `--status fail` for `--expectation pickup-probe-readiness` with a `--summary` that names the blocker, and omit or defer the decisions claim until the blocker is resolved.
 ## Docs And ADR Policy

package/kits/builder/skills/plan-work/SKILL.md CHANGED Viewed

@@ -33,7 +33,18 @@ Before delegating to tool-planner, check if the goal can be solved with existing
 2. If the goal involves adding new capabilities, invoke the search-first skill
 3. Pass research findings to tool-planner as additional context
-Skip this step if the goal is purely about modifying existing code (bug fixes, refactors).
+**Survey existing concepts before designing new ones.** Before the plan introduces a new
+artifact, schema, type, data shape, status, or derivation/algorithm, check what the project's
+**dependencies and contracts already define** — not just the local codebase. Inspect exported
+types, schemas, and builders from dependencies (e.g. `@kontourai/*` packages and vendored
+schemas) and the resource/data contracts under `context/contracts/`. Prefer **consuming the
+canonical concept over inventing a parallel one**: follow existing patterns, understand the
+dependency surface, and leverage existing concepts. If a planned shape resembles a dependency's
+existing concept, consume theirs and record which one. This operationalizes the consume-never-fork
+guardrail of ADR 0008 and ADR 0010 at planning time — the cheapest place to catch a fork.
+Skip the codebase-similarity search for pure bug-fix/refactor goals, but still apply the
+survey-existing-concepts check whenever the plan would add a new shape or algorithm.
 ## Input
@@ -92,6 +103,7 @@ The `tool-planner` prompt context must include the latest-base confirmation and
    - `status: planning`, `type: plan-work`
    - Create or update `state.json` with phase `planning`
    - use `npm run workflow:sidecar -- ensure-session --source-request ... --summary ... --criterion ...` when the repository provides it; this also writes `.flow-agents/current.json`
+   - **Builder Kit build flow**: add `--flow-id builder.build` to the `ensure-session` call when `plan-work` is invoked from `deliver`, from the Builder Kit `build` flow, or from a pick-up-and-build request after `pull-work`. This activates the FlowDefinition-driven path so producers fire and gates enforce on builder.* claims. Do NOT add `--flow-id` for direct/ad-hoc primitive `plan-work` invocations that are not part of a builder-flow.
 2. Delegate to `tool-planner`:
    ```
    Goal: <goal>

package/kits/builder/skills/pull-work/SKILL.md CHANGED Viewed

@@ -291,6 +291,25 @@ Selected work is ready when:
 If the gate fails, update the artifact and stop with the blocker.
 After a merge, automatic continuation may inspect the queue and write a new pull-work artifact, but it cannot enter planning or execution for the next work item until a fresh pickup Probe record exists for that newly selected item or justified group.
+## Gate Claim: Record Selected Work
+When the Pickup Gate passes and work is selected (not just a shepherding scan or WIP-only audit), record the gate claim for the Builder Kit `pull-work` step before handing off to `design-probe` or `plan-work`. This satisfies the `builder.pull-work.selected` gate expectation.
+Use the pull-work artifact that records the `selected_item_ids` as the evidence ref, and confirm that scope and acceptance criteria are present in that artifact:
+```bash
+npm run workflow:sidecar -- record-gate-claim .flow-agents/<slug> \
+  --expectation selected-work \
+  --status pass \
+  --summary "Selected <work-item-ref>: scope clear, acceptance criteria present." \
+  --evidence-ref-json '{"kind":"artifact","file":".flow-agents/<slug>/<slug>--pull-work.md","summary":"Pull-work artifact with selected_item_ids, scope, and acceptance criteria."}'
+```
+Use `--status fail` when the gate fails (blocker recorded but no selection made). Use `--status not_verified` only when the session has no active flow step (non-Builder-Kit usage).
+Record `--status fail` with a summary naming the blocker when stopping before selection. Do not record `pass` until `selected_item_ids` are confirmed and the pickup gate criteria above are met.
 ## Flow Validation Boundary

package/kits/knowledge/adapters/default-store/index.js CHANGED Viewed

@@ -297,6 +297,16 @@ function removeLinksFromGraph(graph, sourceId) {
   delete graph.forward[sourceId];
 }
+// Order-independent canonical form of a graph index, for drift comparison: returns a JSON string built from the graph's `forward` and `reverse` maps with sorted keys and sorted, serialized entries.
+function canonicalGraph(graph) {
+  const norm = (obj) => // normalizes one adjacency map; a missing/falsy map is treated as {}
+    Object.keys(obj || {}).sort().reduce((acc, k) => { // keys are visited in sorted order, so key insertion order does not affect the result
+      acc[k] = (obj[k] || []).map((e) => JSON.stringify(e)).sort(); // each entry is serialized, then the strings are sorted so entry order does not matter; a falsy list becomes []
+      return acc;
+    }, {});
+  return JSON.stringify({ forward: norm(graph.forward), reverse: norm(graph.reverse) }); // only `forward` and `reverse` are read; `graph` itself must be non-null
+}
 // ---------------------------------------------------------------------------
 // Validation helpers
 // ---------------------------------------------------------------------------
@@ -882,6 +892,34 @@ export class DefaultKnowledgeStore {
     );
   }
+  // -------------------------------------------------------------------------
+  // reindex — rebuild graph-index.json from records' links (recovery path)
+  // -------------------------------------------------------------------------
+  /**
+   * Rebuild the graph index authoritatively from the records' own `links`.
+   * Records are the source of truth; the index is a derived cache. Use this to
+   * recover from a lost, hand-edited, or drifted `graph-index.json` (issue #106).
+   *
+   * The rebuilt graph is always written to `this._graphPath`, whether or not it
+   * differs from what was loaded from that path. A record whose `links` is not
+   * an array contributes no links.
+   *
+   * Result fields: `records` is the number of records read; `links` is the sum
+   * of the lengths of every list in the rebuilt `forward` map; `forwardSources`
+   * and `reverseTargets` are the key counts of the rebuilt `forward` and
+   * `reverse` maps; `changed` is true when the canonical form of the graph
+   * loaded before saving differs from the canonical form of the rebuilt graph.
+   * @returns {Promise<{records:number, links:number, forwardSources:number, reverseTargets:number, changed:boolean}>}
+   */
+  async reindex() { // contains no `await`; `async` only wraps the result in a Promise
+    const records = this._allRecords().sort((a, b) => a.id.localeCompare(b.id)); // sorts the array returned by _allRecords() in place, by id — presumably for a deterministic rebuild order; confirm
+    const rebuilt = emptyGraph();
+    for (const record of records) {
+      addLinksToGraph(rebuilt, record.id, Array.isArray(record.links) ? record.links : []); // non-array `links` falls back to an empty list
+    }
+    const links = Object.values(rebuilt.forward).reduce((n, arr) => n + arr.length, 0); // total across all forward lists
+    const changed = canonicalGraph(loadGraph(this._graphPath)) !== canonicalGraph(rebuilt); // must be computed before saveGraph overwrites the file
+    saveGraph(this._graphPath, rebuilt); // written unconditionally, even when `changed` is false
+    return {
+      records: records.length,
+      links,
+      forwardSources: Object.keys(rebuilt.forward).length,
+      reverseTargets: Object.keys(rebuilt.reverse).length,
+      changed,
+    };
+  }
   // -------------------------------------------------------------------------
   // Internal: read all records
   // -------------------------------------------------------------------------