npm - nubos-pilot - Versions diffs - 1.1.1 → 1.2.0 - Mend

nubos-pilot 1.1.1 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (210) hide show

package/CHANGELOG.md +23 -0
package/LICENSE +21 -0
package/README.md +37 -6
package/SECURITY.md +60 -0
package/agents/np-architect.md +1 -1
package/agents/np-build-fixer.md +4 -4
package/agents/np-executor.md +1 -1
package/agents/np-plan-checker.md +5 -5
package/agents/np-planner.md +2 -2
package/agents/np-researcher.md +2 -2
package/bin/check-workflows.cjs +1 -8
package/bin/install.js +113 -62
package/bin/np-tools/_args.cjs +16 -2
package/bin/np-tools/_commands.cjs +4 -8
package/bin/np-tools/_commands.test.cjs +31 -0
package/bin/np-tools/_memory-resolve.cjs +4 -4
package/bin/np-tools/askuser.cjs +2 -8
package/bin/np-tools/checkpoint.cjs +1 -1
package/bin/np-tools/close-project.cjs +3 -29
package/bin/np-tools/commit-task.cjs +31 -37
package/bin/np-tools/commit.cjs +2 -11
package/bin/np-tools/config.cjs +6 -21
package/bin/np-tools/discuss-phase.cjs +4 -27
package/bin/np-tools/discuss-project.cjs +0 -27
package/bin/np-tools/doctor.cjs +79 -30
package/bin/np-tools/doctor.test.cjs +14 -0
package/bin/np-tools/execute-milestone.cjs +6 -27
package/bin/np-tools/handoff-write.cjs +16 -2
package/bin/np-tools/help.cjs +5 -2
package/bin/np-tools/init-dispatch.test.cjs +21 -0
package/bin/np-tools/knowledge-search.cjs +7 -1
package/bin/np-tools/lang-directive.cjs +2 -8
package/bin/np-tools/learning-list.cjs +0 -2
package/bin/np-tools/learning-log.cjs +6 -16
package/bin/np-tools/loop-audit-tool-use.cjs +1 -11
package/bin/np-tools/loop-preflight.cjs +4 -8
package/bin/np-tools/loop-run-round.cjs +51 -148
package/bin/np-tools/loop-state-read.cjs +1 -5
package/bin/np-tools/loop-state-record.cjs +1 -27
package/bin/np-tools/loop-stuck.cjs +1 -8
package/bin/np-tools/messages-send.cjs +16 -2
package/bin/np-tools/metrics.test.cjs +4 -4
package/bin/np-tools/new-milestone.cjs +14 -3
package/bin/np-tools/new-project.cjs +4 -2
package/bin/np-tools/new-project.test.cjs +12 -0
package/bin/np-tools/park.cjs +3 -2
package/bin/np-tools/plan-lint.cjs +0 -19
package/bin/np-tools/plan-milestone.cjs +9 -30
package/bin/np-tools/propose-milestones.cjs +14 -3
package/bin/np-tools/propose-milestones.test.cjs +27 -0
package/bin/np-tools/research-phase.cjs +8 -41
package/bin/np-tools/research-phase.test.cjs +2 -1
package/bin/np-tools/researcher-reconcile.cjs +3 -21
package/bin/np-tools/reset-slice.cjs +12 -18
package/bin/np-tools/resolve-model.cjs +21 -26
package/bin/np-tools/resolve-model.test.cjs +15 -5
package/bin/np-tools/resume-work.cjs +1 -7
package/bin/np-tools/scan-codebase.test.cjs +1 -1
package/bin/np-tools/skip.cjs +3 -2
package/bin/np-tools/spawn-headless.cjs +138 -19
package/bin/np-tools/spawn-headless.test.cjs +310 -0
package/bin/np-tools/state.cjs +3 -4
package/bin/np-tools/state.test.cjs +2 -2
package/bin/np-tools/stats.cjs +3 -9
package/bin/np-tools/template-path.cjs +2 -8
package/bin/np-tools/text-mode.cjs +2 -8
package/bin/np-tools/undo-task.cjs +3 -2
package/bin/np-tools/undo.cjs +7 -5
package/bin/np-tools/unpark.cjs +3 -2
package/bin/np-tools/update-docs.test.cjs +1 -1
package/bin/np-tools/verify-work.cjs +82 -25
package/bin/np-tools/verify-work.test.cjs +211 -1
package/bin/researcher-merge.cjs +9 -2
package/bin/researcher-merge.test.cjs +14 -0
package/lib/agents-registry.cjs +32 -0
package/lib/agents.cjs +16 -6
package/lib/agents.test.cjs +44 -0
package/lib/archive.cjs +105 -39
package/lib/archive.test.cjs +147 -5
package/lib/checkpoint.cjs +43 -27
package/lib/checkpoint.test.cjs +67 -6
package/lib/codebase-docs.cjs +7 -9
package/lib/codebase-docs.test.cjs +2 -2
package/lib/codebase-manifest.cjs +2 -0
package/lib/commit-policy.cjs +6 -29
package/lib/commit-policy.test.cjs +6 -0
package/lib/config-defaults.cjs +5 -2
package/lib/config-defaults.test.cjs +71 -0
package/lib/config-schema.cjs +204 -0
package/lib/config-schema.test.cjs +148 -0
package/lib/config.cjs +194 -9
package/lib/config.test.cjs +234 -0
package/lib/core.cjs +231 -47
package/lib/core.test.cjs +193 -10
package/lib/dashboard.cjs +0 -12
package/lib/frontmatter.cjs +12 -18
package/lib/git.cjs +34 -56
package/lib/git.test.cjs +11 -3
package/lib/handoff.cjs +19 -20
package/lib/handoff.test.cjs +24 -0
package/lib/ids.cjs +6 -0
package/lib/init-emit.cjs +33 -0
package/lib/install/backup.cjs +19 -14
package/lib/install/claude-hooks.cjs +46 -25
package/lib/install/claude-hooks.test.cjs +64 -0
package/lib/install/codex-toml.cjs +15 -66
package/lib/install/manifest.cjs +19 -0
package/lib/install/manifest.test.cjs +107 -0
package/lib/install/runtime-assets.cjs +4 -3
package/lib/install/runtime-detect.cjs +1 -1
package/lib/install/runtimes-registry.cjs +0 -5
package/lib/knowledge-adapter.cjs +4 -57
package/lib/knowledge-adapter.test.cjs +0 -20
package/lib/knowledge.cjs +21 -5
package/lib/language.cjs +3 -19
package/lib/learnings.cjs +3 -108
package/lib/logger.cjs +157 -0
package/lib/logger.test.cjs +159 -0
package/lib/memory-index-usearch.cjs +9 -12
package/lib/memory-provider-local.cjs +8 -0
package/lib/memory.cjs +90 -23
package/lib/memory.test.cjs +135 -0
package/lib/messaging.cjs +155 -83
package/lib/metrics-aggregate.cjs +28 -28
package/lib/metrics.cjs +10 -4
package/lib/metrics.test.cjs +6 -5
package/lib/migrations.cjs +89 -0
package/lib/migrations.test.cjs +82 -0
package/lib/milestone-meta.cjs +70 -0
package/lib/model-profiles.cjs +2 -0
package/lib/nubosloop-audit.cjs +244 -0
package/lib/nubosloop.cjs +79 -412
package/lib/nubosloop.test.cjs +52 -21
package/lib/output-lint.cjs +1 -1
package/lib/plan-lint.cjs +0 -67
package/lib/researcher-reconciler.cjs +5 -10
package/lib/researcher-swarm.cjs +54 -101
package/lib/roadmap-render.cjs +108 -34
package/lib/roadmap-schema.cjs +42 -0
package/lib/roadmap.cjs +99 -35
package/lib/roadmap.test.cjs +215 -0
package/lib/run-context.cjs +54 -0
package/lib/run-context.test.cjs +53 -0
package/lib/runtime/_factory.cjs +19 -0
package/lib/runtime/antigravity.cjs +4 -12
package/lib/runtime/augment.cjs +4 -12
package/lib/runtime/claude.cjs +2 -0
package/lib/runtime/cline.cjs +4 -12
package/lib/runtime/codebuddy.cjs +4 -12
package/lib/runtime/codex.cjs +4 -12
package/lib/runtime/copilot.cjs +4 -12
package/lib/runtime/cursor.cjs +4 -12
package/lib/runtime/gemini.cjs +4 -12
package/lib/runtime/index.cjs +7 -10
package/lib/runtime/index.test.cjs +13 -1
package/lib/runtime/kilo.cjs +4 -12
package/lib/runtime/opencode.cjs +4 -12
package/lib/runtime/qwen.cjs +4 -12
package/lib/runtime/trae.cjs +4 -12
package/lib/runtime/windsurf.cjs +4 -12
package/lib/safe-path.cjs +156 -0
package/lib/safe-path.test.cjs +164 -0
package/lib/state.cjs +33 -10
package/lib/state.test.cjs +90 -21
package/lib/tasks.cjs +92 -14
package/lib/tasks.test.cjs +65 -0
package/lib/template.cjs +0 -1
package/lib/text-mode.cjs +4 -30
package/lib/todo.cjs +7 -5
package/lib/verify.cjs +47 -16
package/lib/workspace-scan.cjs +2 -0
package/lib/worktree.cjs +3 -9
package/lib/yaml.cjs +44 -0
package/lib/yaml.test.cjs +65 -0
package/np-tools.cjs +39 -50
package/package.json +7 -6
package/templates/COMPLETENESS.md +3 -3
package/workflows/add-tests.md +1 -1
package/workflows/architect-phase.md +1 -1
package/workflows/doctor.md +7 -5
package/workflows/execute-phase.md +13 -9
package/workflows/plan-phase.md +3 -3
package/workflows/research-phase.md +2 -2
package/bin/np-tools/research-merge.cjs +0 -105
package/bin/np-tools/research-merge.test.cjs +0 -166
package/docs/adr/0001-no-daemon-invariant.md +0 -82
package/docs/adr/0002-zero-runtime-dependencies.md +0 -91
package/docs/adr/0003-max-six-unit-types.md +0 -85
package/docs/adr/0004-atomic-commit-per-unit.md +0 -102
package/docs/adr/0005-three-orthogonal-file-trees.md +0 -98
package/docs/adr/0006-yaml-dependency-amendment.md +0 -60
package/docs/adr/0007-codebase-docs-layer.md +0 -273
package/docs/adr/0008-worktree-isolation-per-slice.md +0 -140
package/docs/adr/0009-tui-framework-for-dashboard.md +0 -95
package/docs/adr/0010-nubosloop.md +0 -244
package/docs/adr/0011-researcher-swarm-consensus.md +0 -84
package/docs/adr/0012-completeness-doctrine.md +0 -85
package/docs/adr/0013-learnings-store-schema-evolution.md +0 -128
package/docs/adr/0013-plan-trust-layer.md +0 -95
package/docs/adr/0014-vector-memory-layer.md +0 -175
package/docs/adr/0015-named-agent-messaging.md +0 -162
package/docs/adr/README.md +0 -37
package/docs/agent-frontmatter-schema.md +0 -105
package/docs/phase-artifact-schemas.md +0 -292
package/docs/phase-directory-layout.md +0 -82
package/lib/install/mcp-writer.cjs +0 -127
package/mcp-configs/README.md +0 -41
package/mcp-configs/claude-code.example.json +0 -27
package/mcp-configs/codex.example.toml +0 -17
package/mcp-configs/nubos-knowledge.notes.md +0 -42

package/CHANGELOG.md ADDED Viewed

@@ -0,0 +1,23 @@
+# Changelog
+All notable changes to nubos-pilot are documented in this file. Format
+follows [Keep a Changelog](https://keepachangelog.com/en/1.1.0/); versioning
+follows [SemVer](https://semver.org/spec/v2.0.0.html).
+## [1.1.4] — 2026-05-25
+Public release.
+- Plan, execute, and verify code changes through a researcher + critic
+  agent loop.
+- Wave-based milestone execution; one atomic git commit per task.
+- Multi-runtime install for 14 host CLIs (Claude Code, Codex, Gemini,
+  OpenCode, Cursor, and more) via `npx nubos-pilot`.
+- Local vector memory for cross-task learnings.
+- Inter-agent messages, handoffs, and project archive with crash-safe
+  resume.
+- Hardened filesystem operations: symlink-rejecting locks, restricted
+  permissions on audit logs, path containment for file-input flags,
+  frontmatter sanitisation, and a memory-model allow-list.
+Full documentation at <https://pilot.nubos.cloud>.

package/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2025 Nubos AI
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

package/README.md CHANGED Viewed

@@ -5,7 +5,7 @@ AI-driven planning and execution tool for code projects. Installs into 14 host C
 - **No daemon.** Every command runs as a short-lived `node` invocation.
 - **Markdown-first.** Workflows and agents are plain `.md` files — the host reads them directly.
 - **Atomic per-task commits.** One `task(M<NNN>-S<NNN>-T<NNNN>): …` commit per unit of work. `/np:undo-task` and `/np:undo` are mechanical reverts.
-- **Multi-runtime.** One source tree, one install payload, four first-class host CLIs.
+- **Multi-runtime.** One source tree, one install payload, fourteen supported host CLIs.
 ## Install
@@ -95,16 +95,18 @@ task(M001-S001-T0002): wire login handler
 ## Agents
-Eleven subagents are installed into the host's agent directory:
+Thirteen spawnable subagents are installed into the host's agent directory (alongside three `np-critic-*` audit modules consumed by `np-critic`):
 - `np-planner` (opus) — breaks a milestone into slices + tasks
 - `np-plan-checker` (opus) — adversarial goal-backward review before execution
 - `np-architect` (sonnet) — optional ADR-style decisions before planning
 - `np-researcher` (sonnet) — milestone-level stack + pitfalls research
+- `np-researcher-reconciler` (sonnet) — reconciles disagreements across researcher-swarm outputs
 - `np-sc-extractor` (haiku) — derives observable Success Criteria from goal + CONTEXT
 - `np-codebase-documenter` (sonnet) — maintains `.nubos-pilot/codebase/` module docs
 - `np-executor` (sonnet) — one task per spawn, one commit per task
 - `np-build-fixer` (sonnet) — recovery patcher for executor verify failures (manual spawn)
+- `np-critic` (sonnet) — Nubosloop critic; audits executor output across style, tests and acceptance
 - `np-verifier` (sonnet) — post-execution Pass/Fail/Defer per success_criterion
 - `np-nyquist-auditor` (haiku) — requirement test-coverage audit
 - `np-security-reviewer` (sonnet) — OWASP-aligned read-only audit (manual spawn)
@@ -113,7 +115,7 @@ Every spawn runs with an **explicit tier** (`haiku` / `sonnet` / `opus`) resolve
 ## Model profile
-Five profiles (`frontier`, `quality`, `balanced`, `budget`, `inherit`) map each tier (`haiku` / `sonnet` / `opus`) to a concrete model. Set at install time (`Model-Profile?` prompt) or in `.nubos-pilot/config.json`. Full matrix in `docs/agent-frontmatter-schema.md`.
+Five profiles (`frontier`, `quality`, `balanced`, `budget`, `inherit`) map each tier (`haiku` / `sonnet` / `opus`) to a concrete model. Set at install time (`Model-Profile?` prompt) or in `.nubos-pilot/config.json`.
 ## Requirements
@@ -131,11 +133,11 @@ node np-tools.cjs help           # JSON: { commands: [ { name, category, descrip
 ## Doctor
 ```bash
-npx nubos-pilot doctor           # 6-check integrity scan
+npx nubos-pilot doctor           # 12-check integrity scan
 npx nubos-pilot doctor --fix     # auto-fix what's safely fixable
 ```
-Checks: payload manifest integrity, version mismatch, hooks presence, codex-toml sanity, askuser runtime availability, codebase docs freshness, milestone/slice directory layout.
+Checks: payload manifest integrity, version mismatch, hooks presence, codex-toml sanity, askuser runtime availability, codebase docs freshness, milestone/slice directory layout, the three Nubosloop checks (critics present, knowledge store, config), orphan temp files, and output schemas.
 ## Development
@@ -144,6 +146,35 @@ npm test                         # all unit tests via node:test
 node bin/check-workflows.cjs     # workflow linter
 ```
+See [`CONTRIBUTING.md`](./CONTRIBUTING.md) for setup, code conventions, ADR
+map and commit format.
+## Architecture Decisions
+ADRs live in the VitePress documentation site at
+[`pilot.nubos.cloud/v1/adr/`](https://pilot.nubos.cloud/v1/adr/). The
+load-bearing ones for users and contributors:
+| ADR | What it pins |
+|---|---|
+| 0004 | `workflow.commit_artifacts` controls whether `.nubos-pilot/` is committed |
+| 0010 | Nubosloop — researcher → executor → critic-swarm is mandatory in `/np:execute-phase` |
+| 0012 | Completeness doctrine (12 rules in `templates/COMPLETENESS.md`) |
+| 0013 | Learnings-store schema evolution |
+| 0017 | Strict output-schema enforcement |
+| 0019 | Plan-side trust layer (`lib/plan-lint.cjs`) |
+## Security
+See [`SECURITY.md`](./SECURITY.md) for the vulnerability disclosure policy
+and threat model.
+## Support
+- Bugs / features: [GitHub issues](https://github.com/Nubos-AI/nubos-pilot/issues)
+- Security: `security@nubos.ai` (see [`SECURITY.md`](./SECURITY.md))
+- Docs: <https://pilot.nubos.cloud>
 ## License
-MIT
+MIT — see [`LICENSE`](./LICENSE).

package/SECURITY.md ADDED Viewed

@@ -0,0 +1,60 @@
+# Security Policy
+## Reporting a Vulnerability
+If you discover a security issue in nubos-pilot, **do not open a public issue**.
+Email **security@nubos.ai** with:
+- A description of the issue and its impact.
+- Steps to reproduce (PoC if possible).
+- The affected version (`npx nubos-pilot --version` or check `package.json`).
+- Your preferred contact channel for follow-up.
+We will acknowledge receipt within **3 business days** and provide a
+resolution plan within **14 business days**. Fixes are released as patch
+versions and announced in `CHANGELOG.md`.
+## Supported Versions
+| Version | Supported |
+|---------|-----------|
+| 0.2.x   | ✅ active |
+| < 0.2   | ❌ end of life |
+Only the latest minor on the current major receives security patches until
+1.0 is reached.
+## Threat Model
+nubos-pilot is a **local CLI** distributed via npm to developer workstations
+and CI. It is **not** a hosted service. The threat surface and assumptions:
+| What nubos-pilot reads | What it writes | What it executes |
+|---|---|---|
+| `.nubos-pilot/`, project source for context | `.nubos-pilot/` state, `~/.codex/`, `~/.claude/` config (install only) | `git`, `claude`/`codex` headless via `child_process.spawn` |
+**Trust boundaries:**
+- **Project source code** — untrusted in the sense that agent-authored
+  files (`PLAN.md`, `RESEARCH.md` etc.) may contain hostile YAML. nubos-pilot
+  rejects prototype-pollution keys, refuses symlink-escape via `safe-path`,
+  caps message bodies, and whitelists ML model identifiers.
+- **`.nubos-pilot/messages/`** — multi-agent inbox; entries are written
+  atomically with `O_CREAT|O_EXCL|O_NOFOLLOW` (POSIX) so a pre-planted
+  symlink cannot redirect writes.
+- **Subprocess spawn** — `claude`/`codex` are invoked via `spawnSync` (no
+  shell). The binary path is overridable via `NUBOS_PILOT_CLAUDE_BIN` /
+  `NUBOS_PILOT_CODEX_BIN`; treat operators who can set those env vars as
+  trusted.
+- **`workflow.commit_artifacts`** flag controls whether `.nubos-pilot/`
+  artifacts are committed to git. Default is `true`; downstream projects
+  that consider artifacts sensitive should set it to `false`.
+## What is Out of Scope
+- Vulnerabilities in `@huggingface/transformers`, `usearch`, or the
+  `yaml` package — report those upstream.
+- Operator-controlled config (`config.json`) that the operator themselves
+  wrote — config is trusted input from the project owner.
+- DoS from running nubos-pilot in obviously bad conditions
+  (no disk space, no Node 22+, broken `git`).

package/agents/np-architect.md CHANGED Viewed

@@ -70,7 +70,7 @@ If the project already documents a module/pattern that fits, extend it instead o
 ## Output Contract
-**Granularity (ADR-0013).** Architecture decisions are intent-level: which library, which boundary, which protocol. They do NOT prescribe implementation — no schema DDL, no exact framework-generated filenames, no code-style edicts. Those are executor-territory and downstream `np-planner` will refuse plans that bake them in (Plan-side Trust Layer, ADR-0013). If you find yourself describing how a controller method should be structured, stop — that's not architecture.
+**Granularity (ADR-0019).** Architecture decisions are intent-level: which library, which boundary, which protocol. They do NOT prescribe implementation — no schema DDL, no exact framework-generated filenames, no code-style edicts. Those are executor-territory and downstream `np-planner` will refuse plans that bake them in (Plan-side Trust Layer, ADR-0019). If you find yourself describing how a controller method should be structured, stop — that's not architecture.
 ```markdown
 # M<NNN> — <milestone name> — Architecture

package/agents/np-build-fixer.md CHANGED Viewed

@@ -58,9 +58,9 @@ The orchestrator provides these in your prompt context. Read every path it hands
    - `infra` (missing tool, network, env var) → STOP and emit `## INFRA BLOCKER` block; do not edit source.
 1a. **MANDATORY knowledge lookup (Rule 9 — non-optional, runs before any Edit).** Pick the failing symbol or error class from Step 1 and run:
     ```bash
-    node .nubos-pilot/bin/np-tools.cjs knowledge-search "<failing-symbol-or-error-class>" --limit 5
+    node .nubos-pilot/bin/np-tools.cjs knowledge-search "<failing-symbol-or-error-class>" --task <task-id> --limit 5
     ```
-    If a hit lives in `.nubos-pilot/codebase/<module>.md`, `Read` that doc before patching. Skipping this step stamps `rule-9-violation` in the Layer-C audit log and the loop routes back to the researcher swarm next round — it is **not** an opt-out.
+    The `--task <task-id>` flag is required: it records the Rule 9 evidence the tool-use audit cross-checks. A `knowledge-search` run without it leaves no ledger entry, so the audit treats the spawn as if it never searched (`rule-9-search-tool-unverified`). If a hit lives in `.nubos-pilot/codebase/<module>.md`, `Read` that doc before patching. Skipping this step stamps `rule-9-violation` in the Layer-C audit log and the loop routes back to the researcher swarm next round — it is **not** an opt-out.
 2. **Locate the failure surface** strictly inside `files_modified`. If the failure points outside that set, emit `## SCOPE EXPANSION REQUEST` and stop — do NOT edit out-of-scope files.
 3. **Propose the smallest patch** that addresses the root cause:
    - For `compile` / `lint`: edit the offending file directly.
@@ -72,10 +72,10 @@ The orchestrator provides these in your prompt context. Read every path it hands
 ## Mandatory Knowledge Lookup (Rule 9)
-**This is non-optional, not advisory.** Workflow Step 1a runs the lookup before any Edit. Skipping it stamps `rule-9-violation` in the audit log and forces a re-route to the researcher swarm.
+**This is non-optional, not advisory.** Workflow Step 1a runs the lookup before any Edit. Skipping it — or running it without `--task` — stamps `rule-9-violation` in the audit log and forces a re-route to the researcher swarm.
 ```bash
-node .nubos-pilot/bin/np-tools.cjs knowledge-search "<failing-symbol>" --limit 5
+node .nubos-pilot/bin/np-tools.cjs knowledge-search "<failing-symbol>" --task <task-id> --limit 5
 ```
 If a hit lives in `.nubos-pilot/codebase/<module>.md`, `Read` that doc before patching. Cross-task context belongs in `RULES.md` and `M<NNN>-CONTEXT.md`.

package/agents/np-executor.md CHANGED Viewed

@@ -31,7 +31,7 @@ This agent operates under [`templates/COMPLETENESS.md`](../templates/COMPLETENES
 - **Rule 3 — Do it with tests.** Every commit ships tests for the production code it adds or changes. No "trivial enough to skip tests" exceptions.
 - **Rule 4 — Do it with documentation.** Update `.nubos-pilot/codebase/<module>.md` after every commit (`update-docs` is mandatory, not optional).
 - **Rule 7 — Never leave a dangling thread.** Dead imports, unused symbols, half-renamed identifiers — clean them up in the same commit that introduces the change.
-- **Rule 9 — Search before building.** Run `knowledge-search` for the symbols you plan to introduce before writing them. Reuse beats reinvention.
+- **Rule 9 — Search before building.** Before writing any new symbol, run `node np-tools.cjs knowledge-search "<symbol>" --task <task-id>` via Bash. The `--task <task-id>` flag is mandatory — it records the evidence the Rule 9 tool-use audit cross-checks; a lookup without it counts as no search. Reuse beats reinvention.
 - **Rule 10 — Test before shipping.** Verify must be green before you call `commit-task`. Manual "I ran it once" is not proof of work.
 Refusal of any rule is a hard-stop. Surface the violation to the orchestrator verbatim and abort the spawn.

package/agents/np-plan-checker.md CHANGED Viewed

@@ -28,7 +28,7 @@ Refusal of any rule is a hard-stop. Surface the violation to the orchestrator ve
 ## Role
-Adversarial reader of milestone plans. You assume the planner made mistakes and look for them systematically. You enforce the canonical finding-category taxonomy published in `docs/agent-frontmatter-schema.md` — every issue you emit MUST use one of those codes verbatim.
+Adversarial reader of milestone plans. You assume the planner made mistakes and look for them systematically. You enforce the canonical finding-category taxonomy defined below — every issue you emit MUST use one of those codes verbatim.
 You are NOT the executor (`/np:execute-phase`) and NOT the post-execution verifier (`/np:validate-phase`). You verify plans WILL work before execution; the verifier confirms code DID work after execution. Same goal-backward methodology, different timing.
@@ -53,7 +53,7 @@ Additional context the orchestrator may inline in the prompt:
 ## Review Dimensions
-Each dimension maps to one or more canonical finding categories from `docs/agent-frontmatter-schema.md`. The 14 canonical codes are:
+Each dimension maps to one or more canonical finding categories. The 14 canonical codes are:
 - `missing-success-criterion` — a ROADMAP SC-X is not mapped to any task.
 - `non-atomic-task` — a task bundles multiple distinct deliverables that should be split.
@@ -66,9 +66,9 @@ Each dimension maps to one or more canonical finding categories from `docs/agent
 - `hook-field-present` — agent frontmatter contains `hooks:` (D-10).
 - `forbidden-agent-field` — agent frontmatter contains `model:` or `model_profile:` (D-10).
 - `unverified-assumption` — a slice plan's `<reality_check>` block is missing, empty, or contains an `<assumption>` without a non-empty `verified_by` attribute, OR a `<files_read>` path does not exist in the repo (Reality-Check rule, see Dimension 12).
-- `verify-command-unknown` — a `<verify>` block invokes a command that is not a known np-tools verb, declared composer/npm script, vendor binary, or POSIX baseline tool (Plan-side Trust Layer, ADR-0013). Mechanically detected by `np-tools.cjs plan-lint`; you mirror the verdict into your findings array so the loop handler treats it uniformly with semantic findings.
-- `parallel-task-implicit-dependency` — tasks marked `depends_on: []` in the same slice but one of them runs a working-tree-reading verify (`update-docs`, `phpstan analyse`, `git diff`, etc.) against files another sibling modifies. Implicit ordering must be made explicit (Plan-side Trust Layer, ADR-0013).
-- `plan-over-specifies-implementation` — PLAN.md body contains schema DDL, framework-controlled timestamped filenames, or large inline code snippets. Plans specify intent + boundary + acceptance, not implementation. Severity is `major` (advisory) — not a hard block, but you flag it so the planner course-corrects (Plan-side Granularity Doctrine, ADR-0013).
+- `verify-command-unknown` — a `<verify>` block invokes a command that is not a known np-tools verb, declared composer/npm script, vendor binary, or POSIX baseline tool (Plan-side Trust Layer, ADR-0019). Mechanically detected by `np-tools.cjs plan-lint`; you mirror the verdict into your findings array so the loop handler treats it uniformly with semantic findings.
+- `parallel-task-implicit-dependency` — tasks marked `depends_on: []` in the same slice but one of them runs a working-tree-reading verify (`update-docs`, `phpstan analyse`, `git diff`, etc.) against files another sibling modifies. Implicit ordering must be made explicit (Plan-side Trust Layer, ADR-0019).
+- `plan-over-specifies-implementation` — PLAN.md body contains schema DDL, framework-controlled timestamped filenames, or large inline code snippets. Plans specify intent + boundary + acceptance, not implementation. Severity is `major` (advisory) — not a hard block, but you flag it so the planner course-corrects (Plan-side Granularity Doctrine, ADR-0019).
 Note on the Nubosloop critic: as of 2026-05-05 a single `np-critic` agent covers style + tests + acceptance in one spawn (ADR-0010 §Single-Critic Revision). The legacy three-critic swarm (`np-critic-style`/`np-critic-tests`/`np-critic-acceptance`) is removed. References in older plans should be updated.

package/agents/np-planner.md CHANGED Viewed

@@ -277,7 +277,7 @@ Every PLAN.md you write will be consumed by an executor agent that:
 **Implications for your writing style:**
 - **Name the library, not the category.** "Use `jose` for JWT" > "use a JWT library".
-- **Name the file, not the area** — for *deterministic edits the planner can know up-front*. "Modify `src/api/auth/login.ts`" > "update the auth layer". For *scaffolding tasks where a framework generates files at install/publish time*, use a glob (`database/migrations/*_cashier_*.php`) or leave `files_modified` empty — the executor resolves the real paths from the actual publish output and `commit-task` falls back to `checkpoint.files_touched` (D-04, ADR-0013 Layer-D Granularity).
+- **Name the file, not the area** — for *deterministic edits the planner can know up-front*. "Modify `src/api/auth/login.ts`" > "update the auth layer". For *scaffolding tasks where a framework generates files at install/publish time*, use a glob (`database/migrations/*_cashier_*.php`) or leave `files_modified` empty — the executor resolves the real paths from the actual publish output and `commit-task` falls back to `checkpoint.files_touched` (D-04, ADR-0019 Layer-D Granularity).
 - **Name the command, not the intent.** "Run `npm test -- --filter=auth`" > "run the tests".
 - **Cite existing interfaces verbatim.** If `lib/core.cjs` exports `NubosPilotError(code, message, details)` — quote that signature in the task context so the executor doesn't mis-remember.
 - **Document deviations from canonical advice.** If you deviate from CONTEXT.md's stack choice, say so explicitly and note why.
@@ -286,7 +286,7 @@ If the executor has to stop and read three more files to figure out what you mea
 </downstream_awareness>
 <plan_granularity>
-## Plan Granularity Doctrine — Intent + Boundary + Acceptance, NOT Implementation (ADR-0013)
+## Plan Granularity Doctrine — Intent + Boundary + Acceptance, NOT Implementation (ADR-0019)
 A PLAN.md is a contract. It specifies **what** must be true at the end (intent), **where** the work is allowed to touch (boundary), and **how** success is measured (acceptance). It does NOT specify HOW the implementation looks. That's the executor's territory; you don't have ground-truth on it and pretending you do is the bug class that produced the M004 plan-bugs.

package/agents/np-researcher.md CHANGED Viewed

@@ -24,7 +24,7 @@ Your output is prescriptive, not exploratory: "Use library X at version Y" beats
 This agent operates under [`templates/COMPLETENESS.md`](../templates/COMPLETENESS.md). The rules that bind this role:
 - **Rule 5 — Aim to genuinely impress.** Prescriptive beats exploratory. "Use `jose@6.0.10`" beats "consider a JWT library". Vague research produces vague plans, vague plans produce vague software.
-- **Rule 9 — Search before building.** This is your core job. Before any new claim, search the local knowledge index (`knowledge-search`), the codebase docs (`.nubos-pilot/codebase/`), and Context7 / WebFetch. Reuse prior learnings.
+- **Rule 9 — Search before building.** This is your core job. Before any new claim, search the local knowledge index via `node np-tools.cjs knowledge-search "<query>"` (pass `--task <task-id>` when spawned inside the execute-loop so the Rule 9 audit ledger records the call), the codebase docs (`.nubos-pilot/codebase/`), and Context7 / WebFetch. Reuse prior learnings.
 - **Rule 11 — Ship the complete thing.** RESEARCH.md is a deliverable, not a draft. Every claim has provenance, every assumption is tagged `[ASSUMED]`, every gap is listed in `Open Questions`. No half-research.
 Refusal of any rule is a hard-stop. Surface the violation to the orchestrator verbatim and abort the spawn.
@@ -37,7 +37,7 @@ Your per-spawn output MUST conform to the **`researcher-output`** schema. The or
 Hard rules from the schema:
-- Frontmatter must include `schema_version`, `agent: np-researcher`, `spawn_index`, `seed_delta`, `task_query_hash`, plus count fields (`decision_count`, `risk_count`, etc.).
+- Frontmatter must include `schema_version`, `agent: np-researcher`, `spawn_index`, `seed_delta`, `task_query_hash`, plus count fields (`decision_count`, `risk_count`, etc.). `spawn_index` and `seed_delta` are **integers** — copy them verbatim from the `index` / `seed_delta` fields of your spawn spec. The prose perspective nudge arrives on the spawn spec's separate `seed_nudge` field; it shapes HOW you investigate and never goes into frontmatter.
 - Five body sections are mandatory (use `_None._` if empty): `## Decisions`, `## Risks`, `## Patterns`, `## Open Questions`, `## Sources`.
 - Every Decision / Risk / Pattern / Open Question / Source uses heading style `### <PREFIX>-N: <text>` where PREFIX ∈ {D, R, P, Q, S}.
 - **Every entry has a `**Reasoning:**` field** (mandatory). The Reasoning field documents what you weighed, what you discarded, and why this conclusion. The reconciler compares `Reasoning` traces across spawns to detect groupthink (identical reasoning → low independent evidence) vs orthogonal evidence (different reasoning paths to same conclusion → strong signal).

package/bin/check-workflows.cjs CHANGED Viewed

@@ -66,8 +66,6 @@ function _scanMetricsCoverage(files) {
     const raw = fs.readFileSync(file, 'utf-8');
     const lines = raw.split(/\r?\n/);
     let inAnyFence = false;
     let inBashFence = false;
     for (let i = 0; i < lines.length; i++) {
@@ -102,10 +100,6 @@ function _scanMetricsCoverage(files) {
   return warnings;
 }
-function _scan(dir) {
-  return _scanFiles(_walk(dir, [], { ext: ['.md'] }));
-}
 function _scanInstallerSurface(cwd) {
   const root = cwd || process.cwd();
   const files = [];
@@ -131,7 +125,7 @@ function checkWorkflows(dir) {
       violations.push(..._scanFiles(workflowFiles));
       warnings.push(..._scanMetricsCoverage(workflowFiles));
     }
-  } catch {  }
+  } catch {}
   violations.push(..._scanInstallerSurface());
   return { violations, warnings, exitCode: violations.length ? 1 : 0 };
 }
@@ -158,7 +152,6 @@ if (require.main === module) main();
 module.exports = {
   checkWorkflows,
-  _scan,
   _scanFiles,
   _scanInstallerSurface,
   _scanMetricsCoverage,