npm - muonroi-cli - Versions diffs - 1.4.1 → 1.6.0 - Mend

muonroi-cli 1.4.1 → 1.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (194) hide show

package/LICENSE +21 -21
package/README.md +122 -122
package/dist/packages/agent-harness-core/src/predicate.d.ts +1 -1
package/dist/src/agent-harness/__tests__/mock-model.spec.js +48 -1
package/dist/src/agent-harness/mock-model.d.ts +11 -0
package/dist/src/agent-harness/mock-model.js +21 -0
package/dist/src/cli/cost-forensics.js +12 -12
package/dist/src/council/__tests__/clarification-prompt.test.js +51 -0
package/dist/src/council/__tests__/clarifier-ready-gate.test.js +32 -0
package/dist/src/council/__tests__/decisions-lock.test.js +17 -1
package/dist/src/council/__tests__/oauth-reachable.test.d.ts +1 -0
package/dist/src/council/__tests__/oauth-reachable.test.js +31 -0
package/dist/src/council/__tests__/parse-outcome-fallback.test.js +11 -0
package/dist/src/council/clarifier.js +9 -1
package/dist/src/council/debate.js +5 -1
package/dist/src/council/decisions-lock.js +3 -3
package/dist/src/council/index.js +12 -5
package/dist/src/council/leader.d.ts +0 -17
package/dist/src/council/leader.js +22 -15
package/dist/src/council/planner.js +1 -1
package/dist/src/council/prompts.js +63 -57
package/dist/src/council/types.d.ts +7 -0
package/dist/src/ee/__tests__/ee-onboarding.test.d.ts +1 -0
package/dist/src/ee/__tests__/ee-onboarding.test.js +32 -0
package/dist/src/ee/artifact-cache.d.ts +56 -0
package/dist/src/ee/artifact-cache.js +155 -0
package/dist/src/ee/artifact-cache.test.d.ts +1 -0
package/dist/src/ee/artifact-cache.test.js +69 -0
package/dist/src/ee/auth.d.ts +9 -0
package/dist/src/ee/auth.js +19 -0
package/dist/src/ee/ee-onboarding.d.ts +5 -0
package/dist/src/ee/ee-onboarding.js +76 -0
package/dist/src/ee/search.js +7 -5
package/dist/src/ee/search.test.d.ts +1 -0
package/dist/src/ee/search.test.js +23 -0
package/dist/src/generated/version.d.ts +1 -1
package/dist/src/generated/version.js +1 -1
package/dist/src/headless/output.js +6 -4
package/dist/src/headless/output.test.js +4 -3
package/dist/src/index.js +20 -1
package/dist/src/mcp/__tests__/auto-setup.test.js +74 -0
package/dist/src/mcp/__tests__/client-pool.spec.d.ts +1 -0
package/dist/src/mcp/__tests__/client-pool.spec.js +98 -0
package/dist/src/mcp/__tests__/parallel-build.spec.d.ts +1 -0
package/dist/src/mcp/__tests__/parallel-build.spec.js +67 -0
package/dist/src/mcp/__tests__/smart-filter.test.js +56 -0
package/dist/src/mcp/auto-setup.js +56 -2
package/dist/src/mcp/client-pool.d.ts +46 -0
package/dist/src/mcp/client-pool.js +212 -0
package/dist/src/mcp/oauth-callback.js +2 -2
package/dist/src/mcp/parse-headers.test.js +14 -14
package/dist/src/mcp/runtime.d.ts +28 -0
package/dist/src/mcp/runtime.js +117 -51
package/dist/src/mcp/self-verify-runner.d.ts +14 -0
package/dist/src/mcp/self-verify-runner.js +38 -0
package/dist/src/mcp/setup-guide-text.d.ts +9 -0
package/dist/src/mcp/setup-guide-text.js +84 -0
package/dist/src/mcp/smart-filter.js +49 -0
package/dist/src/mcp/smoke.test.js +43 -43
package/dist/src/mcp/tools-server.d.ts +7 -0
package/dist/src/mcp/tools-server.js +19 -22
package/dist/src/models/catalog.json +349 -349
package/dist/src/ops/__tests__/doctor-ee-health.test.js +21 -0
package/dist/src/ops/doctor.d.ts +3 -2
package/dist/src/ops/doctor.js +47 -11
package/dist/src/ops/doctor.test.js +4 -3
package/dist/src/orchestrator/__tests__/mcp-capability-block.test.d.ts +1 -0
package/dist/src/orchestrator/__tests__/mcp-capability-block.test.js +39 -0
package/dist/src/orchestrator/__tests__/project-stack.test.d.ts +1 -0
package/dist/src/orchestrator/__tests__/project-stack.test.js +65 -0
package/dist/src/orchestrator/batch-turn-runner.js +7 -11
package/dist/src/orchestrator/compaction.d.ts +2 -0
package/dist/src/orchestrator/compaction.js +14 -1
package/dist/src/orchestrator/compaction.test.js +25 -1
package/dist/src/orchestrator/message-processor.js +72 -32
package/dist/src/orchestrator/orchestrator.js +26 -0
package/dist/src/orchestrator/prompts.d.ts +51 -0
package/dist/src/orchestrator/prompts.js +257 -134
package/dist/src/orchestrator/scope-ceiling.js +6 -1
package/dist/src/orchestrator/scope-reminder.d.ts +12 -0
package/dist/src/orchestrator/scope-reminder.js +16 -0
package/dist/src/orchestrator/scope-reminder.test.js +22 -1
package/dist/src/orchestrator/stream-runner.js +23 -15
package/dist/src/orchestrator/subagent-compactor.d.ts +14 -5
package/dist/src/orchestrator/subagent-compactor.js +30 -8
package/dist/src/orchestrator/subagent-compactor.spec.js +18 -0
package/dist/src/orchestrator/text-tool-call-detector.test.js +13 -13
package/dist/src/pil/__tests__/clarity-gate.test.js +24 -215
package/dist/src/pil/__tests__/config.test.js +1 -17
package/dist/src/pil/__tests__/discovery.test.js +144 -11
package/dist/src/pil/__tests__/layer1-intent-trace.test.js +7 -2
package/dist/src/pil/__tests__/layer1-intent.test.js +3 -0
package/dist/src/pil/__tests__/layer16-clarity.test.js +32 -116
package/dist/src/pil/__tests__/layer4-gsd.test.js +37 -0
package/dist/src/pil/__tests__/layer6-output.test.js +158 -18
package/dist/src/pil/__tests__/llm-classify.test.js +49 -2
package/dist/src/pil/__tests__/surface-compaction-artifacts.test.d.ts +1 -0
package/dist/src/pil/__tests__/surface-compaction-artifacts.test.js +112 -0
package/dist/src/pil/agent-operating-contract.d.ts +1 -1
package/dist/src/pil/agent-operating-contract.js +2 -0
package/dist/src/pil/agent-operating-contract.test.js +7 -2
package/dist/src/pil/cheap-model-playbook.js +35 -35
package/dist/src/pil/cheap-model-workbooks.js +16 -13
package/dist/src/pil/clarity-gate.d.ts +21 -19
package/dist/src/pil/clarity-gate.js +26 -153
package/dist/src/pil/config.d.ts +9 -1
package/dist/src/pil/config.js +15 -4
package/dist/src/pil/discovery.js +211 -136
package/dist/src/pil/layer1-intent.d.ts +12 -0
package/dist/src/pil/layer1-intent.js +283 -38
package/dist/src/pil/layer1-intent.test.js +210 -4
package/dist/src/pil/layer16-clarity.d.ts +25 -11
package/dist/src/pil/layer16-clarity.js +19 -306
package/dist/src/pil/layer3-ee-injection.d.ts +19 -0
package/dist/src/pil/layer3-ee-injection.js +96 -4
package/dist/src/pil/layer4-gsd.js +18 -6
package/dist/src/pil/layer6-output.d.ts +2 -0
package/dist/src/pil/layer6-output.js +151 -25
package/dist/src/pil/llm-classify.d.ts +26 -0
package/dist/src/pil/llm-classify.js +34 -5
package/dist/src/pil/native-capabilities-workbook.d.ts +1 -1
package/dist/src/pil/native-capabilities-workbook.js +82 -76
package/dist/src/pil/pipeline.js +15 -9
package/dist/src/pil/schema.d.ts +8 -0
package/dist/src/pil/schema.js +12 -1
package/dist/src/pil/task-tier-map.js +4 -0
package/dist/src/pil/types.d.ts +11 -1
package/dist/src/product-loop/done-gate.js +3 -3
package/dist/src/product-loop/loop-driver.js +18 -18
package/dist/src/product-loop/progress-snapshot.js +4 -4
package/dist/src/providers/auth/gemini-oauth.js +6 -15
package/dist/src/providers/auth/grok-oauth.js +6 -15
package/dist/src/providers/auth/openai-oauth.js +6 -15
package/dist/src/providers/mcp-vision-bridge.js +48 -48
package/dist/src/reporter/index.js +1 -1
package/dist/src/scaffold/bb-ecosystem-apply.js +47 -47
package/dist/src/scaffold/bb-quality-gate.js +5 -5
package/dist/src/scaffold/continuation-prompt.js +60 -60
package/dist/src/scaffold/init-new.js +453 -453
package/dist/src/self-qa/__tests__/scenario-planner.test.js +3 -3
package/dist/src/self-qa/agentic-loop.js +24 -19
package/dist/src/self-qa/spec-emitter.js +26 -23
package/dist/src/storage/__tests__/migrations.test.js +2 -2
package/dist/src/storage/interaction-log.js +5 -5
package/dist/src/storage/migrations.js +122 -122
package/dist/src/storage/sessions.js +42 -42
package/dist/src/storage/transcript.js +91 -84
package/dist/src/storage/usage.js +14 -14
package/dist/src/storage/workspaces.js +12 -12
package/dist/src/tools/__tests__/native-tools.test.d.ts +1 -0
package/dist/src/tools/__tests__/native-tools.test.js +53 -0
package/dist/src/tools/git-safety.d.ts +61 -0
package/dist/src/tools/git-safety.js +141 -0
package/dist/src/tools/git-safety.test.d.ts +1 -0
package/dist/src/tools/git-safety.test.js +111 -0
package/dist/src/tools/native-tools.d.ts +31 -0
package/dist/src/tools/native-tools.js +273 -0
package/dist/src/tools/registry-ee-query.test.js +18 -1
package/dist/src/tools/registry-git-safety.test.d.ts +7 -0
package/dist/src/tools/registry-git-safety.test.js +92 -0
package/dist/src/tools/registry.js +52 -6
package/dist/src/ui/__tests__/markdown-render.test.d.ts +1 -0
package/dist/src/ui/__tests__/markdown-render.test.js +48 -0
package/dist/src/ui/app.js +0 -0
package/dist/src/ui/components/message-view.js +4 -1
package/dist/src/ui/components/structured-response-view.js +7 -3
package/dist/src/ui/components/tool-group.js +7 -1
package/dist/src/ui/markdown-render.d.ts +41 -0
package/dist/src/ui/markdown-render.js +223 -0
package/dist/src/ui/markdown.d.ts +10 -0
package/dist/src/ui/markdown.js +12 -35
package/dist/src/ui/slash/council-inspect.js +4 -4
package/dist/src/ui/slash/export.js +4 -4
package/dist/src/ui/utils/text.d.ts +8 -0
package/dist/src/ui/utils/text.js +16 -0
package/dist/src/ui/utils/text.test.d.ts +1 -0
package/dist/src/ui/utils/text.test.js +23 -0
package/dist/src/usage/ledger.js +48 -15
package/dist/src/utils/__tests__/footprint-gitignore.test.d.ts +1 -0
package/dist/src/utils/__tests__/footprint-gitignore.test.js +50 -0
package/dist/src/utils/clipboard-image.js +23 -23
package/dist/src/utils/open-url.d.ts +56 -0
package/dist/src/utils/open-url.js +58 -0
package/dist/src/utils/open-url.test.d.ts +1 -0
package/dist/src/utils/open-url.test.js +86 -0
package/dist/src/utils/settings.d.ts +12 -0
package/dist/src/utils/settings.js +48 -0
package/dist/src/utils/side-question.js +2 -2
package/dist/src/utils/skills.js +3 -3
package/dist/src/verify/__tests__/coverage-parsers.test.js +30 -30
package/dist/src/verify/environment.js +2 -1
package/package.json +1 -1
package/dist/src/pil/layer16-clarity.test.js +0 -31
/package/dist/src/{pil/layer16-clarity.test.d.ts → council/__tests__/clarification-prompt.test.d.ts} +0 -0

package/dist/src/tools/git-safety.test.js ADDED Viewed

@@ -0,0 +1,111 @@
+import { mkdtempSync, rmSync, writeFileSync } from "node:fs";
+import { tmpdir } from "node:os";
+import { join } from "node:path";
+import { afterEach, beforeEach, describe, expect, it } from "vitest";
+import { __resetGitSafetyState, analyzeGitCommand, checkPushGate, detectSensitiveStaging, recordCommandOutcome, stagingWarning, } from "./git-safety.js";
+describe("analyzeGitCommand", () => {
+    it("detects git push (with flags and chained)", () => {
+        expect(analyzeGitCommand("git push").isPush).toBe(true);
+        expect(analyzeGitCommand("git push origin main").isPush).toBe(true);
+        expect(analyzeGitCommand("git -c x=y push --force").isPush).toBe(true);
+        expect(analyzeGitCommand("git add -A && git commit -m x && git push origin main").isPush).toBe(true);
+    });
+    it("does not match 'push' inside a quoted commit message", () => {
+        expect(analyzeGitCommand('git commit -m "fix git push regression"').isPush).toBe(false);
+    });
+    it("detects a real push on its own line in a multi-line script", () => {
+        expect(analyzeGitCommand("git config user.name x\ngit push origin main").isPush).toBe(true);
+    });
+    it("does not bleed across a newline into an unrelated command", () => {
+        // 'git status' then a separate line with the word 'push' is NOT a git push.
+        expect(analyzeGitCommand("git status\necho push-notification").isPush).toBe(false);
+        expect(analyzeGitCommand("git log\nrm push.txt").isPush).toBe(false);
+    });
+    it("detects broad staging (-A / . / --all / commit -a)", () => {
+        expect(analyzeGitCommand("git add -A").isBroadStage).toBe(true);
+        expect(analyzeGitCommand("git add .").isBroadStage).toBe(true);
+        expect(analyzeGitCommand("git add --all").isBroadStage).toBe(true);
+        expect(analyzeGitCommand("git commit -am 'x'").isBroadStage).toBe(true);
+        expect(analyzeGitCommand("git commit -a").isBroadStage).toBe(true);
+    });
+    it("detects broad staging even with git global options before the subcommand", () => {
+        expect(analyzeGitCommand("git -c core.editor=true commit -a").isBroadStage).toBe(true);
+        expect(analyzeGitCommand("git -c x=y add -A").isBroadStage).toBe(true);
+    });
+    it("does not flag explicit/narrow staging or non-staging flags", () => {
+        expect(analyzeGitCommand("git add src/foo.ts src/bar.ts").isBroadStage).toBe(false);
+        expect(analyzeGitCommand("git add ./src/foo.ts").isBroadStage).toBe(false);
+        expect(analyzeGitCommand("git commit -m 'message'").isBroadStage).toBe(false);
+        expect(analyzeGitCommand("git commit --amend").isBroadStage).toBe(false);
+        // -a must be a clean flag cluster — a malformed `-a--otherflag` is not `-a`.
+        expect(analyzeGitCommand("git commit -a--otherflag").isBroadStage).toBe(false);
+    });
+});
+describe("push gate", () => {
+    beforeEach(() => {
+        __resetGitSafetyState();
+        delete process.env.MUONROI_ALLOW_PUSH_ON_RED;
+    });
+    afterEach(() => {
+        delete process.env.MUONROI_ALLOW_PUSH_ON_RED;
+    });
+    it("does not block when no verification has failed", () => {
+        expect(checkPushGate("s1").blocked).toBe(false);
+    });
+    it("blocks push after a verification command fails", () => {
+        recordCommandOutcome("s1", "npm test", false);
+        const gate = checkPushGate("s1");
+        expect(gate.blocked).toBe(true);
+        expect(gate.failed).toContain("npm test");
+    });
+    it("clears the block when that same command re-runs green", () => {
+        recordCommandOutcome("s1", "npm test", false);
+        expect(checkPushGate("s1").blocked).toBe(true);
+        recordCommandOutcome("s1", "npm test", true);
+        expect(checkPushGate("s1").blocked).toBe(false);
+    });
+    it("a different verify passing does NOT clear an unrelated failed verify", () => {
+        recordCommandOutcome("s1", "npm test", false);
+        recordCommandOutcome("s1", "npm run build", true); // build green, tests still red
+        expect(checkPushGate("s1").blocked).toBe(true);
+        expect(checkPushGate("s1").failed).toEqual(["npm test"]);
+    });
+    it("is session-scoped (one session's failure does not gate another)", () => {
+        recordCommandOutcome("s1", "vitest run", false);
+        expect(checkPushGate("s1").blocked).toBe(true);
+        expect(checkPushGate("s2").blocked).toBe(false);
+    });
+    it("ignores non-verification command outcomes", () => {
+        recordCommandOutcome("s1", "git status", false);
+        recordCommandOutcome("s1", "ls -la", false);
+        expect(checkPushGate("s1").blocked).toBe(false);
+    });
+    it("respects the MUONROI_ALLOW_PUSH_ON_RED override", () => {
+        recordCommandOutcome("s1", "npm test", false);
+        process.env.MUONROI_ALLOW_PUSH_ON_RED = "1";
+        expect(checkPushGate("s1").blocked).toBe(false);
+    });
+});
+describe("sensitive staging detection", () => {
+    let dir;
+    beforeEach(() => {
+        dir = mkdtempSync(join(tmpdir(), "git-safety-"));
+    });
+    afterEach(() => {
+        rmSync(dir, { recursive: true, force: true });
+    });
+    it("flags .env and .muonroi-cli present in the repo root", () => {
+        writeFileSync(join(dir, ".env"), "SECRET=1");
+        writeFileSync(join(dir, ".muonroi-cli"), ""); // a file is enough for existsSync
+        const found = detectSensitiveStaging(dir);
+        expect(found).toContain(".env");
+        expect(found).toContain(".muonroi-cli");
+        expect(stagingWarning(dir)).toMatch(/WARNING/);
+    });
+    it("returns no warning for a clean repo", () => {
+        writeFileSync(join(dir, "README.md"), "# ok");
+        expect(detectSensitiveStaging(dir)).toEqual([]);
+        expect(stagingWarning(dir)).toBe("");
+    });
+});
+//# sourceMappingURL=git-safety.test.js.map

package/dist/src/tools/native-tools.d.ts ADDED Viewed

@@ -0,0 +1,31 @@
+/**
+ * src/tools/native-tools.ts
+ *
+ * NATIVE in-process builtins for the capabilities that muonroi-tools previously
+ * exposed only via a self-spawned MCP subprocess: ee_health, ee_feedback,
+ * usage_forensics, lsp_query, setup_guide, and selfverify_* (start/status/
+ * result/list/cancel).
+ *
+ * Why native: muonroi-tools is THIS CLI. Self-spawning a 137MB CLI as an MCP
+ * server per turn cold-started ~2-3.5s and overran the build deadline (and a
+ * seed-time bug once persisted a vitest-worker command that crashed on launch).
+ * For the CLI's OWN inner agent these tools should run in-process — no subprocess,
+ * no MCP round-trip, no cold-start. The muonroi-tools MCP server (tools-server.ts)
+ * stays for EXTERNAL agents (Claude Code etc.). `ee_query` is already native
+ * (registry.ts) and is intentionally NOT duplicated here.
+ *
+ * Each tool reuses the SAME core the MCP server wraps (ee/search, cli/cost-
+ * forensics, lsp/runtime, the shared self-verify JobManager), so behaviour is
+ * identical across the two surfaces.
+ */
+import { type ToolSet } from "ai";
+/** The native tool names this module registers — used by the MCP-twin dedup. */
+export declare const NATIVE_MUONROI_TOOL_NAMES: readonly ["ee_health", "ee_feedback", "usage_forensics", "lsp_query", "setup_guide", "selfverify_start", "selfverify_status", "selfverify_result", "selfverify_list", "selfverify_cancel"];
+export interface NativeToolOpts {
+    /** Workspace cwd for lsp_query. Defaults to process.cwd(). */
+    cwd?: string;
+}
+/**
+ * Add the native muonroi-tools builtins to `tools`. Mutates and returns it.
+ */
+export declare function registerNativeMuonroiTools(tools: ToolSet, opts?: NativeToolOpts): ToolSet;

package/dist/src/tools/native-tools.js ADDED Viewed

@@ -0,0 +1,273 @@
+/**
+ * src/tools/native-tools.ts
+ *
+ * NATIVE in-process builtins for the capabilities that muonroi-tools previously
+ * exposed only via a self-spawned MCP subprocess: ee_health, ee_feedback,
+ * usage_forensics, lsp_query, setup_guide, and selfverify_* (start/status/
+ * result/list/cancel).
+ *
+ * Why native: muonroi-tools is THIS CLI. Self-spawning a 137MB CLI as an MCP
+ * server per turn cold-started ~2-3.5s and overran the build deadline (and a
+ * seed-time bug once persisted a vitest-worker command that crashed on launch).
+ * For the CLI's OWN inner agent these tools should run in-process — no subprocess,
+ * no MCP round-trip, no cold-start. The muonroi-tools MCP server (tools-server.ts)
+ * stays for EXTERNAL agents (Claude Code etc.). `ee_query` is already native
+ * (registry.ts) and is intentionally NOT duplicated here.
+ *
+ * Each tool reuses the SAME core the MCP server wraps (ee/search, cli/cost-
+ * forensics, lsp/runtime, the shared self-verify JobManager), so behaviour is
+ * identical across the two surfaces.
+ */
+import { dynamicTool, jsonSchema } from "ai";
+import { LSP_TOOL_OPERATIONS } from "../lsp/types.js";
+import { getSelfVerifyJobManager } from "../mcp/self-verify-runner.js";
+import { SETUP_GUIDE_TEXT } from "../mcp/setup-guide-text.js";
+/** The native tool names this module registers — used by the MCP-twin dedup. */
+export const NATIVE_MUONROI_TOOL_NAMES = [
+    "ee_health",
+    "ee_feedback",
+    "usage_forensics",
+    "lsp_query",
+    "setup_guide",
+    "selfverify_start",
+    "selfverify_status",
+    "selfverify_result",
+    "selfverify_list",
+    "selfverify_cancel",
+];
+const json = (data) => JSON.stringify(data);
+const errLine = (error, message) => `ERROR ${error}: ${message}`;
+/**
+ * Add the native muonroi-tools builtins to `tools`. Mutates and returns it.
+ */
+export function registerNativeMuonroiTools(tools, opts = {}) {
+    // ── Experience Engine: health + feedback (ee_query is already native) ──────
+    tools.ee_health = dynamicTool({
+        description: "Check Experience Engine server reachability (returns {ok, status}).",
+        inputSchema: jsonSchema({ type: "object", properties: {}, additionalProperties: false }),
+        execute: async () => {
+            try {
+                const { healthEE } = await import("../ee/search.js");
+                return json(await healthEE());
+            }
+            catch (e) {
+                return errLine("ee_unavailable", e instanceof Error ? e.message : String(e));
+            }
+        },
+    });
+    tools.ee_feedback = dynamicTool({
+        description: "Rate an Experience Engine recall entry so the brain keeps what helped and prunes the rest. Call after " +
+            "acting on an ee_query result — once per `[id col]` you used or judged. verdict: 'followed' (you changed " +
+            "your approach because of it), 'ignored' (topical but did not apply this time), 'noise' (wrong by category — " +
+            "REQUIRES reason: wrong_repo | wrong_language | wrong_task | stale_rule). id may be a short prefix.",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: {
+                id: { type: "string", description: "Entry id (short prefix accepted)" },
+                collection: { type: "string", description: "EE collection the entry came from" },
+                verdict: { type: "string", enum: ["followed", "ignored", "noise"] },
+                reason: { type: "string", enum: ["wrong_repo", "wrong_language", "wrong_task", "stale_rule"] },
+            },
+            required: ["id", "collection", "verdict"],
+        }),
+        execute: async (input) => {
+            const id = typeof input?.id === "string" ? input.id.trim() : "";
+            const collection = typeof input?.collection === "string" ? input.collection.trim() : "";
+            const verdict = input?.verdict;
+            const reason = input?.reason;
+            if (!id || !collection || !verdict) {
+                return errLine("invalid_args", "ee_feedback requires id, collection, and verdict");
+            }
+            if (verdict === "noise" && !reason) {
+                return errLine("reason_required", "verdict 'noise' requires reason: wrong_repo | wrong_language | wrong_task | stale_rule");
+            }
+            try {
+                const { feedbackEE } = await import("../ee/search.js");
+                const { sessionRecallLedger } = await import("../ee/recall-ledger.js");
+                const result = await feedbackEE(id, collection, verdict, reason);
+                if (!result.ok)
+                    return errLine("feedback_failed", result.error ?? "feedback POST failed");
+                const clearedId = result.resolvedId ?? id;
+                sessionRecallLedger.clear(clearedId);
+                sessionRecallLedger.clear(id);
+                return json({
+                    ok: true,
+                    id: clearedId,
+                    verdict: result.verdict,
+                    ...(result.reason ? { reason: result.reason } : {}),
+                    pendingRemaining: sessionRecallLedger.pendingCount(),
+                });
+            }
+            catch (e) {
+                return errLine("feedback_failed", e instanceof Error ? e.message : String(e));
+            }
+        },
+    });
+    // ── Self-diagnostics: usage_forensics ─────────────────────────────────────
+    tools.usage_forensics = dynamicTool({
+        description: "Per-session token-cost forensics by session-id prefix: peak input, cache-hit ratio, per-event breakdown.",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: { prefix: { type: "string", description: "Session id prefix (1-100 chars)" } },
+            required: ["prefix"],
+        }),
+        execute: async (input) => {
+            const prefix = typeof input?.prefix === "string" ? input.prefix.trim() : "";
+            if (!prefix)
+                return errLine("invalid_args", "usage_forensics requires a non-empty prefix");
+            try {
+                const { resolveSessionIds, collectCostForensics } = await import("../cli/cost-forensics.js");
+                const ids = await resolveSessionIds(prefix);
+                if (ids.length === 0)
+                    return errLine("not_found", `no session matches prefix '${prefix}'`);
+                if (ids.length > 1)
+                    return errLine("ambiguous", `prefix '${prefix}' matched ${ids.length} sessions`);
+                return json(await collectCostForensics(ids[0]));
+            }
+            catch (e) {
+                return errLine("db_error", e instanceof Error ? e.message : String(e));
+            }
+        },
+    });
+    // ── Code intelligence: lsp_query ──────────────────────────────────────────
+    tools.lsp_query = dynamicTool({
+        description: "Semantic code intelligence via language servers. operation is one of: goToDefinition, findReferences, hover, documentSymbol, workspaceSymbol, goToImplementation, prepareCallHierarchy, incomingCalls, outgoingCalls. " +
+            "filePath: absolute, or relative to the workspace root. line/character: 1-based — required for position-based ops; omit for documentSymbol; use query (not position) for workspaceSymbol. Returns {success, output}.",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: {
+                operation: { type: "string", enum: [...LSP_TOOL_OPERATIONS] },
+                filePath: { type: "string", description: "Absolute or workspace-relative path" },
+                line: { type: "number", description: "1-based line (position ops)" },
+                character: { type: "number", description: "1-based character (position ops)" },
+                query: { type: "string", description: "Symbol query (workspaceSymbol)" },
+            },
+            required: ["operation", "filePath"],
+        }),
+        execute: async (input) => {
+            const cwd = opts.cwd ?? process.cwd();
+            try {
+                const { queryLsp, isLspToolEnabled } = await import("../lsp/runtime.js");
+                if (!(await isLspToolEnabled(cwd))) {
+                    return errLine("lsp_disabled", "LSP tool is disabled in settings (lsp.enabled / lsp.tool)");
+                }
+                return json(await queryLsp(cwd, input));
+            }
+            catch (e) {
+                return errLine("lsp_error", e instanceof Error ? e.message : String(e));
+            }
+        },
+    });
+    // ── Onboarding: setup_guide ───────────────────────────────────────────────
+    tools.setup_guide = dynamicTool({
+        description: "Returns the up-to-date setup / install / first-run / MCP wiring / verify guide for muonroi-cli. Call this " +
+            "when the user asks how to set up, install, or get started — instead of guessing, reading files, or shelling commands.",
+        inputSchema: jsonSchema({ type: "object", properties: {}, additionalProperties: false }),
+        execute: async () => SETUP_GUIDE_TEXT,
+    });
+    // ── Self-QA harness: selfverify_* (shared JobManager, in-process) ──────────
+    tools.selfverify_start = dynamicTool({
+        description: "Start a self-verify run (mode=tier1 heuristic, or mode=agentic LLM-driven). Returns {runId} immediately; " +
+            "poll selfverify_status, then selfverify_result.",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: {
+                mode: { type: "string", enum: ["tier1", "agentic"] },
+                since: { type: "string" },
+                max: { type: "number" },
+                emit: { type: "boolean" },
+                out: { type: "string" },
+                goal: { type: "string" },
+                llm: { type: "string" },
+                turns: { type: "number" },
+            },
+            required: ["mode"],
+        }),
+        execute: async (input) => {
+            const jm = getSelfVerifyJobManager();
+            if (input?.mode === "agentic") {
+                if (!input?.goal || !input?.llm)
+                    return errLine("invalid_args", "agentic mode requires both goal and llm");
+                const { getModelInfo } = await import("../models/registry.js");
+                if (!getModelInfo(input.llm))
+                    return errLine("unknown_model", `llm '${input.llm}' is not in catalog.json`);
+                return json({ runId: jm.start({ kind: "agentic", goal: input.goal, llm: input.llm, turns: input.turns }) });
+            }
+            return json({
+                runId: jm.start({ kind: "tier1", since: input?.since, max: input?.max, emit: input?.emit, out: input?.out }),
+            });
+        },
+    });
+    tools.selfverify_status = dynamicTool({
+        description: "Get status + log tail of a self-verify run.",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: { runId: { type: "string" } },
+            required: ["runId"],
+        }),
+        execute: async (input) => {
+            const job = getSelfVerifyJobManager().status(input?.runId);
+            if (!job)
+                return errLine("not_found", `runId ${input?.runId} not found`);
+            const summary = job.report && job.kind === "tier1" && "summary" in job.report
+                ? job.report.summary
+                : job.report && job.kind === "agentic" && "verdict" in job.report
+                    ? { verdict: job.report.verdict }
+                    : null;
+            return json({
+                runId: job.runId,
+                status: job.status,
+                kind: job.kind,
+                startedAt: job.startedAt,
+                finishedAt: job.finishedAt,
+                elapsedMs: (job.finishedAt ?? Date.now()) - job.startedAt,
+                logTail: job.logBuffer.slice(-40),
+                summary,
+                error: job.error,
+            });
+        },
+    });
+    tools.selfverify_result = dynamicTool({
+        description: "Fetch the full report of a completed self-verify run.",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: { runId: { type: "string" } },
+            required: ["runId"],
+        }),
+        execute: async (input) => {
+            const job = getSelfVerifyJobManager().status(input?.runId);
+            if (!job)
+                return errLine("not_found", `runId ${input?.runId} not found`);
+            if (job.status === "running")
+                return errLine("still_running", "run not finished; poll selfverify_status first");
+            if (job.status === "error")
+                return errLine("run_error", job.error ?? "unknown error");
+            if (job.status === "cancelled")
+                return errLine("cancelled", "run was cancelled");
+            return json(job.report ?? {});
+        },
+    });
+    tools.selfverify_list = dynamicTool({
+        description: "List recent self-verify runs.",
+        inputSchema: jsonSchema({ type: "object", properties: {}, additionalProperties: false }),
+        execute: async () => json(getSelfVerifyJobManager()
+            .list()
+            .map((j) => ({
+            runId: j.runId,
+            kind: j.kind,
+            status: j.status,
+            elapsedMs: (j.finishedAt ?? Date.now()) - j.startedAt,
+        }))),
+    });
+    tools.selfverify_cancel = dynamicTool({
+        description: "Cancel a running self-verify run (best-effort).",
+        inputSchema: jsonSchema({
+            type: "object",
+            properties: { runId: { type: "string" } },
+            required: ["runId"],
+        }),
+        execute: async (input) => json({ cancelled: getSelfVerifyJobManager().cancel(input?.runId) }),
+    });
+    return tools;
+}
+//# sourceMappingURL=native-tools.js.map

package/dist/src/tools/registry-ee-query.test.js CHANGED Viewed

@@ -9,7 +9,8 @@
  * (no network).
  */
 import os from "node:os";
-import { describe, expect, it } from "vitest";
+import { afterEach, describe, expect, it } from "vitest";
+import { __resetArtifactCacheForTests, recordArtifact } from "../ee/artifact-cache.js";
 import { BashTool } from "./bash.js";
 import { createBuiltinTools, isToolArtifactQuery } from "./registry.js";
 describe("ee_query builtin tool", () => {
@@ -45,4 +46,20 @@ describe("isToolArtifactQuery — ee_query intent routing", () => {
         expect(isToolArtifactQuery("tool-artifact storage design")).toBe(false);
     });
 });
+describe("ee_query — anti-mù rehydrate (local-first, durable when EE is down)", () => {
+    afterEach(() => __resetArtifactCacheForTests());
+    it("rehydrates a tool-artifact from the in-session cache with NO EE/network call", async () => {
+        // Simulates: the compactor elided this output earlier (recordArtifact), EE is
+        // now down. The agent's ee_query("tool-artifact id=X") must still return the
+        // full content from the local cache rather than an [ee_unavailable] note.
+        recordArtifact("call_42", "read_file", "FULL ELIDED CONTENT — line A\nline B\nline C");
+        const tools = createBuiltinTools(new BashTool(os.tmpdir()), "agent");
+        const t = tools.ee_query;
+        const out = String(await t.execute?.({ query: "tool-artifact id=call_42" }));
+        expect(out).toContain("rehydrated from in-session cache");
+        expect(out).toContain("tool=read_file");
+        expect(out).toContain("FULL ELIDED CONTENT");
+        expect(out).not.toMatch(/ee_unavailable/);
+    });
+});
 //# sourceMappingURL=registry-ee-query.test.js.map

package/dist/src/tools/registry-git-safety.test.d.ts ADDED Viewed

@@ -0,0 +1,7 @@
+/**
+ * Integration: git-safety guards wired into the bash tool (registry.ts).
+ * Unit logic lives in git-safety.test.ts; this asserts the WIRING — a blocked
+ * push returns the block message WITHOUT executing, and a broad stage appends
+ * the sensitive-path warning to the tool output.
+ */
+export {};

package/dist/src/tools/registry-git-safety.test.js ADDED Viewed

@@ -0,0 +1,92 @@
+/**
+ * Integration: git-safety guards wired into the bash tool (registry.ts).
+ * Unit logic lives in git-safety.test.ts; this asserts the WIRING — a blocked
+ * push returns the block message WITHOUT executing, and a broad stage appends
+ * the sensitive-path warning to the tool output.
+ */
+import { mkdtempSync, rmSync, writeFileSync } from "node:fs";
+import os from "node:os";
+import { join } from "node:path";
+import { afterEach, beforeEach, describe, expect, it } from "vitest";
+import { BashTool } from "./bash.js";
+import { clearBashOutputCache } from "./bash-output-cache.js";
+import { __resetGitSafetyState, recordCommandOutcome } from "./git-safety.js";
+import { createBuiltinTools } from "./registry.js";
+async function runBash(tools, args) {
+    const t = tools.bash;
+    if (!t?.execute)
+        throw new Error("bash tool has no execute");
+    const out = await t.execute(args);
+    return typeof out === "string" ? out : JSON.stringify(out);
+}
+describe("git-safety wiring in bash tool", () => {
+    beforeEach(() => {
+        clearBashOutputCache();
+        globalThis.__muonroiBashRepeatState = new Map();
+        __resetGitSafetyState();
+        delete process.env.MUONROI_ALLOW_PUSH_ON_RED;
+    });
+    afterEach(() => {
+        delete process.env.MUONROI_ALLOW_PUSH_ON_RED;
+    });
+    it("BLOCKS git push (without executing) after a verification failed this session", async () => {
+        const bash = new BashTool(os.tmpdir());
+        const tools = createBuiltinTools(bash, "agent", { sessionId: "GS1" });
+        // Simulate a failed test earlier in the session.
+        recordCommandOutcome("GS1", "npm test", false);
+        const out = await runBash(tools, { command: "git push origin main", timeout: 10_000 });
+        expect(out).toMatch(/^BLOCKED:/);
+        expect(out).toMatch(/npm test/);
+        // The distinctive block message proves git push never ran (a real push in
+        // tmpdir would fail with a git error like "not a git repository", not this).
+        expect(out).not.toMatch(/not a git repository|fatal:/i);
+    }, 20_000);
+    it("ALLOWS git push once the failed verification re-runs green", async () => {
+        const bash = new BashTool(os.tmpdir());
+        const tools = createBuiltinTools(bash, "agent", { sessionId: "GS2" });
+        recordCommandOutcome("GS2", "npm test", false);
+        recordCommandOutcome("GS2", "npm test", true); // re-ran green
+        const out = await runBash(tools, { command: "git push origin main", timeout: 10_000 });
+        expect(out).not.toMatch(/^BLOCKED:/);
+    }, 20_000);
+    it("respects MUONROI_ALLOW_PUSH_ON_RED override", async () => {
+        process.env.MUONROI_ALLOW_PUSH_ON_RED = "1";
+        const bash = new BashTool(os.tmpdir());
+        const tools = createBuiltinTools(bash, "agent", { sessionId: "GS3" });
+        recordCommandOutcome("GS3", "vitest run", false);
+        const out = await runBash(tools, { command: "git push", timeout: 10_000 });
+        expect(out).not.toMatch(/^BLOCKED:/);
+    }, 20_000);
+    it("blocks push across registry rebuilds even with NO sessionId (stable process key)", async () => {
+        // Regression for the anon-key false negative: createBuiltinTools() without a
+        // sessionId must still gate the push, because production call sites
+        // (message-processor) don't thread sessionId and rebuild the registry every
+        // turn. A failing verify in one anon registry must block a push in the next.
+        const bash = new BashTool(os.tmpdir());
+        // `npm test` is a recognized verification command and fails fast here
+        // (no package.json in a temp dir) → recorded as a failed verify under the
+        // stable process key.
+        const toolsA = createBuiltinTools(bash, "agent"); // no sessionId
+        const failOut = await runBash(toolsA, { command: "npm test", timeout: 20_000 });
+        expect(failOut).toMatch(/ERROR/); // the verify failed
+        // Fresh anon registry (simulates the per-turn rebuild).
+        const toolsB = createBuiltinTools(bash, "agent"); // no sessionId
+        const pushOut = await runBash(toolsB, { command: "git push origin main", timeout: 10_000 });
+        expect(pushOut).toMatch(/^BLOCKED:/);
+    }, 30_000);
+    it("appends a sensitive-path WARNING on a broad git add when secrets exist", async () => {
+        const dir = mkdtempSync(join(os.tmpdir(), "gs-stage-"));
+        writeFileSync(join(dir, ".env"), "API_KEY=secret");
+        try {
+            const bash = new BashTool(dir);
+            const tools = createBuiltinTools(bash, "agent", { sessionId: "GS4" });
+            const out = await runBash(tools, { command: "git add -A", timeout: 10_000 });
+            expect(out).toMatch(/\[WARNING:/);
+            expect(out).toMatch(/\.env/);
+        }
+        finally {
+            rmSync(dir, { recursive: true, force: true });
+        }
+    }, 20_000);
+});
+//# sourceMappingURL=registry-git-safety.test.js.map