npm - @pugi/cli - Versions diffs - 0.1.0-beta.5 → 0.1.0-beta.51 - Mend

@pugi/cli 0.1.0-beta.5 → 0.1.0-beta.51

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (264) hide show

package/THIRD_PARTY_NOTICES.md +40 -0
package/assets/pugi-mascot.ansi +15 -25
package/assets/pugi-prozr2-mascot.ansi +9 -0
package/bin/run.js +33 -1
package/dist/commands/jobs-watch.js +201 -0
package/dist/commands/jobs.js +15 -0
package/dist/commands/smoke.js +133 -0
package/dist/core/agent-progress/cleanup.js +134 -0
package/dist/core/agent-progress/schema.js +144 -0
package/dist/core/agent-progress/writer.js +101 -0
package/dist/core/artifact-chain/dispatcher.js +148 -0
package/dist/core/artifact-chain/exporter.js +164 -0
package/dist/core/artifact-chain/state.js +243 -0
package/dist/core/artifact-chain/steps.js +169 -0
package/dist/core/auth/ensure-authenticated.js +129 -0
package/dist/core/auth/env-provider.js +238 -0
package/dist/core/auto-update/channels.js +122 -0
package/dist/core/auto-update/checker.js +241 -0
package/dist/core/auto-update/state.js +235 -0
package/dist/core/bare-mode/index.js +107 -0
package/dist/core/bash-classifier.js +400 -4
package/dist/core/checkpoint/resumer.js +149 -0
package/dist/core/checkpoint/rewinder.js +291 -0
package/dist/core/codegraph/decision-store.js +248 -0
package/dist/core/codegraph/detect-repo.js +459 -0
package/dist/core/codegraph/install.js +134 -0
package/dist/core/codegraph/offer-hook.js +220 -0
package/dist/core/compact/auto-trigger.js +96 -0
package/dist/core/compact/buffer-rewriter.js +115 -0
package/dist/core/compact/summarizer.js +208 -0
package/dist/core/compact/token-counter.js +108 -0
package/dist/core/consensus/diff-capture.js +112 -3
package/dist/core/context/index.js +7 -0
package/dist/core/context/markdown-traverse.js +255 -0
package/dist/core/cost/rate-card.js +129 -0
package/dist/core/cost/tracker.js +221 -0
package/dist/core/denial-tracking/index.js +8 -0
package/dist/core/denial-tracking/state.js +264 -0
package/dist/core/diagnostics/probe-runner.js +93 -0
package/dist/core/diagnostics/probes/api.js +46 -0
package/dist/core/diagnostics/probes/auth.js +86 -0
package/dist/core/diagnostics/probes/bare-mode.js +42 -0
package/dist/core/diagnostics/probes/cli-version.js +127 -0
package/dist/core/diagnostics/probes/config.js +72 -0
package/dist/core/diagnostics/probes/denial-tracking.js +57 -0
package/dist/core/diagnostics/probes/disk.js +81 -0
package/dist/core/diagnostics/probes/git.js +65 -0
package/dist/core/diagnostics/probes/hooks.js +118 -0
package/dist/core/diagnostics/probes/mcp.js +75 -0
package/dist/core/diagnostics/probes/node.js +59 -0
package/dist/core/diagnostics/probes/pnpm.js +36 -0
package/dist/core/diagnostics/probes/pugi-md.js +89 -0
package/dist/core/diagnostics/probes/sandbox.js +40 -0
package/dist/core/diagnostics/probes/session.js +74 -0
package/dist/core/diagnostics/probes/status-snapshot.js +488 -0
package/dist/core/diagnostics/probes/workspace.js +63 -0
package/dist/core/diagnostics/types.js +70 -0
package/dist/core/dispatch/cache-cleanup.js +197 -0
package/dist/core/dispatch/cache-handoff.js +295 -0
package/dist/core/edits/dispatch.js +218 -2
package/dist/core/edits/journal.js +199 -0
package/dist/core/edits/layer-d-ast.js +557 -14
package/dist/core/edits/verify-hook.js +273 -0
package/dist/core/edits/worktree.js +322 -0
package/dist/core/engine/anvil-client.js +115 -5
package/dist/core/engine/auto-compact.js +179 -0
package/dist/core/engine/budgets.js +155 -0
package/dist/core/engine/context-prefix.js +155 -0
package/dist/core/engine/intent.js +260 -0
package/dist/core/engine/native-pugi.js +897 -211
package/dist/core/engine/prompts.js +88 -2
package/dist/core/engine/strip-internal-fields.js +124 -0
package/dist/core/engine/tool-bridge.js +1045 -36
package/dist/core/feedback/queue.js +177 -0
package/dist/core/feedback/submitter.js +145 -0
package/dist/core/file-cache.js +113 -1
package/dist/core/hooks/events.js +44 -0
package/dist/core/hooks/index.js +15 -0
package/dist/core/hooks/registry.js +213 -0
package/dist/core/hooks/runner.js +236 -0
package/dist/core/hooks/v2/event-emitter.js +115 -0
package/dist/core/hooks/v2/executor.js +282 -0
package/dist/core/hooks/v2/index.js +25 -0
package/dist/core/hooks/v2/lifecycle.js +104 -0
package/dist/core/hooks/v2/loader.js +216 -0
package/dist/core/hooks/v2/matcher.js +125 -0
package/dist/core/hooks/v2/trust.js +143 -0
package/dist/core/hooks/v2/types.js +86 -0
package/dist/core/lsp/cache.js +105 -0
package/dist/core/lsp/client.js +776 -0
package/dist/core/lsp/language-detect.js +66 -0
package/dist/core/lsp/post-edit-diagnostics.js +171 -0
package/dist/core/mcp/client.js +75 -6
package/dist/core/mcp/http-server.js +553 -0
package/dist/core/mcp/orchestrator-tools.js +662 -0
package/dist/core/mcp/permission.js +190 -0
package/dist/core/mcp/registry.js +24 -2
package/dist/core/mcp/server-tools.js +219 -0
package/dist/core/mcp/server.js +397 -0
package/dist/core/memory/dual-write.js +416 -0
package/dist/core/memory/phase1-kinds.js +20 -0
package/dist/core/memory-sync/queue.js +158 -0
package/dist/core/onboarding/ensure-initialized.js +133 -0
package/dist/core/onboarding/marker.js +111 -0
package/dist/core/onboarding/telemetry-state.js +108 -0
package/dist/core/output-style/presets.js +176 -0
package/dist/core/output-style/state.js +185 -0
package/dist/core/path-security.js +284 -2
package/dist/core/permissions/auto-classifier.js +124 -0
package/dist/core/permissions/circuit-breaker.js +83 -0
package/dist/core/permissions/gate.js +278 -0
package/dist/core/permissions/index.js +20 -0
package/dist/core/permissions/mode.js +174 -0
package/dist/core/permissions/state.js +241 -0
package/dist/core/permissions/tool-class.js +93 -0
package/dist/core/prd-check/parser.js +215 -0
package/dist/core/prd-check/reporter.js +127 -0
package/dist/core/prd-check/session-review.js +557 -0
package/dist/core/prd-check/verifiers.js +223 -0
package/dist/core/pugi-md/context-injector.js +76 -0
package/dist/core/pugi-md/walk-up.js +207 -0
package/dist/core/release-notes/parser.js +241 -0
package/dist/core/release-notes/state.js +116 -0
package/dist/core/repl/history.js +11 -1
package/dist/core/repl/model-pricing.js +135 -0
package/dist/core/repl/session.js +1897 -37
package/dist/core/repl/slash-commands.js +430 -15
package/dist/core/repl/store/session-store.js +31 -2
package/dist/core/repl/workspace-context.js +22 -0
package/dist/core/repo-map/build.js +125 -0
package/dist/core/repo-map/cache.js +185 -0
package/dist/core/repo-map/extractor.js +254 -0
package/dist/core/repo-map/formatter.js +145 -0
package/dist/core/repo-map/scanner.js +211 -0
package/dist/core/retry-budget/budget.js +284 -0
package/dist/core/retry-budget/index.js +5 -0
package/dist/core/session.js +92 -0
package/dist/core/settings.js +80 -0
package/dist/core/share/formatter.js +271 -0
package/dist/core/share/redactor.js +221 -0
package/dist/core/share/uploader.js +267 -0
package/dist/core/skills/defaults.js +457 -0
package/dist/core/smoke/headless-driver.js +174 -0
package/dist/core/smoke/orchestrator.js +194 -0
package/dist/core/smoke/runner.js +238 -0
package/dist/core/smoke/scenario-parser.js +316 -0
package/dist/core/subagents/dispatcher-real.js +600 -0
package/dist/core/subagents/dispatcher.js +113 -24
package/dist/core/subagents/index.js +18 -5
package/dist/core/subagents/isolation-matrix.js +213 -0
package/dist/core/subagents/spawn.js +19 -4
package/dist/core/telemetry/emitter.js +229 -0
package/dist/core/telemetry/queue.js +251 -0
package/dist/core/theme/context.js +91 -0
package/dist/core/theme/presets.js +228 -0
package/dist/core/theme/state.js +181 -0
package/dist/core/todos/invariant.js +10 -0
package/dist/core/todos/state.js +177 -0
package/dist/core/transport/version-interceptor.js +166 -0
package/dist/core/vim/keymap.js +288 -0
package/dist/core/vim/state.js +92 -0
package/dist/core/worktree-manager/cleanup.js +123 -0
package/dist/core/worktree-manager/manager.js +303 -0
package/dist/index.js +28 -0
package/dist/runtime/bootstrap.js +190 -0
package/dist/runtime/cli.js +3241 -343
package/dist/runtime/commands/cancel.js +231 -0
package/dist/runtime/commands/chain.js +489 -0
package/dist/runtime/commands/codegraph-status.js +227 -0
package/dist/runtime/commands/compact.js +297 -0
package/dist/runtime/commands/cost.js +199 -0
package/dist/runtime/commands/delegate.js +242 -11
package/dist/runtime/commands/dispatch.js +126 -0
package/dist/runtime/commands/doctor.js +412 -0
package/dist/runtime/commands/feedback.js +184 -0
package/dist/runtime/commands/hooks.js +184 -0
package/dist/runtime/commands/lsp.js +368 -0
package/dist/runtime/commands/mcp.js +879 -0
package/dist/runtime/commands/memory.js +508 -0
package/dist/runtime/commands/model.js +237 -0
package/dist/runtime/commands/onboarding.js +275 -0
package/dist/runtime/commands/patch.js +128 -0
package/dist/runtime/commands/permissions.js +112 -0
package/dist/runtime/commands/plan.js +143 -0
package/dist/runtime/commands/prd-check.js +285 -0
package/dist/runtime/commands/redo-blob-store.js +92 -0
package/dist/runtime/commands/redo.js +361 -0
package/dist/runtime/commands/release-notes.js +229 -0
package/dist/runtime/commands/repo-map.js +95 -0
package/dist/runtime/commands/report.js +299 -0
package/dist/runtime/commands/resume.js +118 -0
package/dist/runtime/commands/review-consensus.js +17 -2
package/dist/runtime/commands/rewind.js +333 -0
package/dist/runtime/commands/sessions.js +163 -0
package/dist/runtime/commands/share.js +316 -0
package/dist/runtime/commands/status.js +186 -0
package/dist/runtime/commands/stickers.js +82 -0
package/dist/runtime/commands/style.js +194 -0
package/dist/runtime/commands/theme.js +196 -0
package/dist/runtime/commands/undo.js +32 -0
package/dist/runtime/commands/update.js +289 -0
package/dist/runtime/commands/vim.js +140 -0
package/dist/runtime/commands/worktree.js +177 -0
package/dist/runtime/commands/worktrees.js +155 -0
package/dist/runtime/headless-repl.js +195 -0
package/dist/runtime/headless.js +543 -0
package/dist/runtime/load-hooks-or-exit.js +71 -0
package/dist/runtime/plan-decompose.js +531 -0
package/dist/runtime/version.js +65 -0
package/dist/tools/agent-tool.js +229 -0
package/dist/tools/apply-patch.js +556 -0
package/dist/tools/ask-user-question.js +213 -0
package/dist/tools/ask-user.js +115 -0
package/dist/tools/bash.js +203 -4
package/dist/tools/file-tools.js +85 -14
package/dist/tools/lsp-tools.js +189 -0
package/dist/tools/mcp-tool.js +260 -0
package/dist/tools/multi-edit.js +361 -0
package/dist/tools/powershell.js +268 -0
package/dist/tools/registry.js +51 -0
package/dist/tools/skill-tool.js +96 -0
package/dist/tools/tasks.js +208 -0
package/dist/tools/todo-write.js +184 -0
package/dist/tools/web-fetch.js +147 -2
package/dist/tools/web-search.js +458 -0
package/dist/tui/agent-progress-card.js +111 -0
package/dist/tui/agent-tree.js +10 -0
package/dist/tui/ask-modal.js +2 -2
package/dist/tui/ask-user-question-prompt.js +192 -0
package/dist/tui/compact-banner.js +81 -0
package/dist/tui/conversation-pane.js +82 -8
package/dist/tui/cost-table.js +111 -0
package/dist/tui/doctor-table.js +46 -0
package/dist/tui/feedback-prompt.js +156 -0
package/dist/tui/input-box.js +218 -3
package/dist/tui/markdown-render.js +4 -4
package/dist/tui/onboarding-wizard.js +240 -0
package/dist/tui/permissions-picker.js +86 -0
package/dist/tui/render.js +35 -0
package/dist/tui/repl-render.js +313 -35
package/dist/tui/repl-splash-art.js +1 -1
package/dist/tui/repl-splash-mascot.js +32 -8
package/dist/tui/repl-splash.js +2 -2
package/dist/tui/repl.js +85 -5
package/dist/tui/splash.js +1 -1
package/dist/tui/status-bar.js +94 -16
package/dist/tui/status-table.js +7 -0
package/dist/tui/stickers-art.js +136 -0
package/dist/tui/style-table.js +28 -0
package/dist/tui/theme-table.js +29 -0
package/dist/tui/thinking-spinner.js +123 -0
package/dist/tui/tool-stream-pane.js +52 -3
package/dist/tui/update-banner.js +27 -2
package/dist/tui/vim-input.js +267 -0
package/dist/tui/welcome-banner.js +107 -0
package/dist/tui/welcome-data.js +293 -0
package/docs/examples/codegraph.mcp.json +10 -0
package/package.json +13 -7
package/test/scenarios/codegen-create-file.scenario.txt +13 -0
package/test/scenarios/compact-force.scenario.txt +11 -0
package/test/scenarios/identity.scenario.txt +11 -0
package/test/scenarios/persona-handoff.scenario.txt +11 -0
package/test/scenarios/walkback.scenario.txt +12 -0
package/dist/core/engine/compaction-hook.js +0 -154

package/dist/tools/registry.js CHANGED Viewed

@@ -1,8 +1,36 @@
 const registry = [
+    // α7.7: unified-diff patch apply. Routes through the same security
+    // gate as Layer A/B/C, so the risk class matches `edit`/`write`
+    // (medium — writes inside the workspace, never to protected files).
+    { name: 'apply_patch', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
+    // Leak L5 (2026-05-27): structured multi-choice clarifier tool. Risk =
+    // low because the dispatch is a pure UI surface — no file writes, no
+    // shell, no network. Permission = none (no workspace access required).
+    // concurrencySafe = true because the prompt-budget gate runs in the
+    // engine loop, not via tool-side mutex (one prompt per turn is enforced
+    // by the persona system prompt + the engine's tool_calls budget).
+    { name: 'ask_user_question', permission: 'none', risk: 'low', concurrencySafe: true, m1: true },
     { name: 'bash', permission: 'bash', risk: 'high', concurrencySafe: false, m1: true },
     { name: 'edit', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
     { name: 'glob', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
     { name: 'grep', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
+    // α7.7: LSP read-only surface. Server runs locally, no Anvil
+    // round-trip. Concurrency-safe because every operation reads
+    // server state without mutating workspace files.
+    { name: 'lsp_definition', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
+    { name: 'lsp_diagnostics', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
+    { name: 'lsp_hover', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
+    { name: 'lsp_references', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
+    // β7 L5+T11: multi_edit dispatches an ordered batch of Layer A edits
+    // as a single transaction. Risk = medium (same chokepoints as `edit`).
+    // concurrencySafe = false because the journal serialises one dispatch
+    // per session.
+    { name: 'multi_edit', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
+    // Leak L6 (2026-05-28): PowerShell tool for Windows-first workflows. Same
+    // bash permission class — destructive-pattern classification fires the
+    // same gate. concurrencySafe = false because spawn-shell child cwd /
+    // env carry-over could race across parallel agent calls.
+    { name: 'powershell', permission: 'bash', risk: 'high', concurrencySafe: false, m1: false },
     { name: 'question', permission: 'none', risk: 'low', concurrencySafe: false, m1: true },
     { name: 'read', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
     { name: 'skill', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
@@ -10,7 +38,30 @@ const registry = [
     { name: 'task_get', permission: 'none', risk: 'low', concurrencySafe: true, m1: true },
     { name: 'task_list', permission: 'none', risk: 'low', concurrencySafe: true, m1: true },
     { name: 'task_update', permission: 'none', risk: 'low', concurrencySafe: false, m1: true },
+    // Leak L16 (2026-05-27): batch TodoWrite. Mirrors Claude Code's upstream
+    // surface — full board snapshot, single-in-progress invariant, atomic
+    // tmp+rename persistence to `.pugi/todos.json`. `concurrencySafe = false`
+    // because two concurrent writes could lose the loser's snapshot (the
+    // rename is atomic but the read-modify-write loop is not). Risk = low
+    // because the only filesystem mutation lands inside `.pugi/todos.json`,
+    // which is metadata, not source.
+    { name: 'todo_write', permission: 'none', risk: 'low', concurrencySafe: false, m1: true },
     { name: 'web_fetch', permission: 'network', risk: 'medium', concurrencySafe: true, m1: true },
+    // α7.7: scratch worktree management. `worktree_create` writes nothing
+    // dangerous (a clone under `.pugi/worktrees/`); `worktree_promote`
+    // applies a diff back to the main tree, so it shares the `edit`
+    // risk class. `worktree_drop` is the cleanup primitive.
+    //
+    // R1 fix (2026-05-26, PR #413 r1, Fix 9): raised `worktree_create`
+    // and `worktree_drop` from `low` to `medium`. `worktree_drop` runs
+    // `rmSync` on its target — even with the new path-containment gate
+    // in `core/edits/worktree.ts::dropWorktree`, a destructive primitive
+    // belongs in `medium` so the permission FSM prompts on every call.
+    // `worktree_create` is raised for disk-pressure parity (a runaway
+    // agent loop could fill the disk with abandoned scratch worktrees).
+    { name: 'worktree_create', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
+    { name: 'worktree_drop', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
+    { name: 'worktree_promote', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
     { name: 'write', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
 ];
 export const toolRegistry = registry.sort((a, b) => a.name.localeCompare(b.name));

package/dist/tools/skill-tool.js ADDED Viewed

@@ -0,0 +1,96 @@
+import { listSkills } from '../core/skills/loader.js';
+import { hashSkillDir, verifyTrust } from '../core/skills/trust.js';
+/** Byte threshold (32 KiB of UTF-8) above which `skillInvoke` marks a skill body as truncated. */
+export const SKILL_BODY_CAP_BYTES = 32 * 1024;
+/** Maximum number of de-duplicated entries `skillList` returns. */
+export const SKILL_LIST_CAP = 100;
+/**
+ * List the skills visible from the current workspace as lightweight summaries.
+ *
+ * @param {object} ctx - Tool context; `ctx.workspaceRoot` is forwarded to `listSkills`.
+ * @param {{ scope?: 'all' | 'global' | 'workspace' }} input - Which scope(s) to
+ *   enumerate; defaults to `'all'`.
+ * @returns {Array<{ name: string, description: *, scope: string }>} At most
+ *   `SKILL_LIST_CAP` entries, one per distinct skill name.
+ */
+export function skillList(ctx, input) {
+    const requested = input.scope ?? 'all';
+    const wants = (kind) => requested === 'all' || requested === kind;
+    // Global skills are gathered first so a same-named workspace skill is
+    // seen later and can replace them in the de-dup pass below.
+    const candidates = [
+        ...(wants('global') ? listSkills('global', ctx.workspaceRoot) : []),
+        ...(wants('workspace') ? listSkills('workspace', ctx.workspaceRoot) : []),
+    ];
+    // One winner per name: the first sighting is kept unless a
+    // workspace-scoped skill shows up, which always takes the slot.
+    const winners = new Map();
+    for (const candidate of candidates) {
+        if (candidate.scope !== 'workspace' && winners.has(candidate.name)) {
+            continue;
+        }
+        winners.set(candidate.name, candidate);
+    }
+    const summaries = [];
+    for (const winner of winners.values()) {
+        if (summaries.length >= SKILL_LIST_CAP) {
+            break;
+        }
+        summaries.push({
+            name: winner.name,
+            description: winner.frontmatter.description,
+            scope: winner.scope,
+        });
+    }
+    return summaries;
+}
+/**
+ * Resolve a skill by name, re-verify its on-disk payload against the trust
+ * registry, and return its body (capped at `SKILL_BODY_CAP_BYTES`).
+ *
+ * @param {object} ctx - Tool context; `ctx.workspaceRoot` is forwarded to `listSkills`.
+ * @param {{ name: string }} input - `name` must match `[a-zA-Z0-9_-]{1,128}`.
+ * @returns {Promise<{ name: string, scope: string, description: *, body: string, truncated: boolean }>}
+ * @throws {Error} When the name is missing or malformed, the skill is not
+ *   found, or the trust verdict is `unsigned` or `mismatch`.
+ */
+export async function skillInvoke(ctx, input) {
+    if (!input.name || typeof input.name !== 'string') {
+        throw new Error('skill: name is required');
+    }
+    // Defense-in-depth: skill loader already validates slugs but the
+    // tool surface is operator-controlled.
+    if (!/^[a-zA-Z0-9_-]{1,128}$/.test(input.name)) {
+        throw new Error(`skill: invalid skill name shape: "${input.name}"`);
+    }
+    // Workspace scope wins over global (operator override). The global
+    // listing is only consulted when no workspace skill matched.
+    const workspace = listSkills('workspace', ctx.workspaceRoot).find((s) => s.name === input.name);
+    const global = workspace
+        ? null
+        : listSkills('global', ctx.workspaceRoot).find((s) => s.name === input.name);
+    const skill = workspace ?? global;
+    if (!skill) {
+        throw new Error(`skill: not found: "${input.name}"`);
+    }
+    // β1a r1 (2026-05-26): re-verify the on-disk skill payload against
+    // the trust manifest sha256 on EVERY invoke, not just at install
+    // time. A post-install swap of the skill files would otherwise
+    // bypass the trust gate, and because the body lands directly in the
+    // model's tool result a mutated body is a prompt-injection vector.
+    //
+    // Posture:
+    //   - `unsigned`  → refuse: the operator never approved this skill
+    //     (fail-closed for directories dropped in by hand).
+    //   - `mismatch`  → refuse + surface the recorded vs actual hashes
+    //     so the operator can decide between re-trust and revoke.
+    //   - anything else → proceed.
+    // NOTE(review): only these two statuses are rejected; if `verifyTrust`
+    // can ever return a status other than `trusted`, confirm that letting
+    // it through is intended.
+    const actualHash = hashSkillDir(skill.dir);
+    const verdict = await verifyTrust('skill', skill.scope, skill.name, actualHash);
+    if (verdict.status === 'unsigned') {
+        throw new Error(`skill: refused to invoke "${skill.name}" — no trust entry (run \`pugi skills trust ${skill.name}\` to approve)`);
+    }
+    if (verdict.status === 'mismatch') {
+        throw new Error(`skill: refused to invoke "${skill.name}" — sha256 mismatch (recorded ${verdict.recorded.slice(0, 12)}…, actual ${verdict.actual.slice(0, 12)}…). Re-trust via \`pugi skills trust ${skill.name}\`.`);
+    }
+    // The cap is expressed in BYTES, so the cut is made on the UTF-8
+    // encoding. Slicing the string itself would count UTF-16 code units
+    // and let a mostly non-ASCII body through well above the cap.
+    const encoded = Buffer.from(skill.body, 'utf8');
+    const truncated = encoded.byteLength > SKILL_BODY_CAP_BYTES;
+    let cappedBody = skill.body;
+    if (truncated) {
+        // Back up while the first dropped byte is a UTF-8 continuation
+        // byte (0b10xxxxxx) so a multi-byte character is never torn.
+        let end = SKILL_BODY_CAP_BYTES;
+        while (end > 0 && (encoded[end] & 0xc0) === 0x80) {
+            end -= 1;
+        }
+        const head = encoded.subarray(0, end).toString('utf8');
+        cappedBody = `${head}\n\n(... truncated at ${SKILL_BODY_CAP_BYTES} bytes — see \`pugi skills info ${skill.name}\` for full text)`;
+    }
+    return {
+        name: skill.name,
+        scope: skill.scope,
+        description: skill.frontmatter.description,
+        body: cappedBody,
+        truncated,
+    };
+}
+//# sourceMappingURL=skill-tool.js.map

package/dist/tools/tasks.js ADDED Viewed

@@ -0,0 +1,208 @@
+/**
+ * task_* tool family — β1 T1/T6 (TodoWrite + agent task ledger).
+ *
+ * Mirrors Claude Code's TodoWrite tool surface so a model trained on
+ * the upstream tool grammar speaks Pugi's variant verbatim. Four ops:
+ *
+ *   - `task_create` — append a new task to the session's todo ledger.
+ *     Returns the assigned id.
+ *   - `task_get`    — fetch a single task by id.
+ *   - `task_list`   — list every task in the current session, ordered
+ *                     by createdAt ascending.
+ *   - `task_update` — mutate status/title/notes of an existing task.
+ *                     Append-only journal — every mutation lands as a
+ *                     fresh JSONL line and the latest line per id wins
+ *                     on `task_list` / `task_get` reads.
+ *
+ * Persistence: append-only JSONL at
+ * `.pugi/sessions/<sessionId>/tasks.jsonl`. Append-only keeps crash
+ * recovery trivial — a partial write at the end of the file is the
+ * worst case and the parser drops the malformed tail line.
+ *
+ * Scope: this is the local-side ledger surface. Anvil-side mirror
+ * (cabinet `/projects/[id]/tasks` page) ships in β5 once the session-
+ * memory hook lands; until then the ledger is purely local.
+ */
+import { appendFileSync, chmodSync, existsSync, mkdirSync, readFileSync, } from 'node:fs';
+import { dirname, join } from 'node:path';
+import { randomUUID } from 'node:crypto';
+/**
+ * Build the path of the per-session task ledger file.
+ *
+ * @param {{ workspaceRoot: string, sessionId: string }} ctx
+ * @returns {string} `<workspaceRoot>/.pugi/sessions/<sessionId>/tasks.jsonl`
+ * @throws {Error} When `sessionId` is not 1-128 characters of `[a-zA-Z0-9_-]`.
+ */
+function ledgerPath(ctx) {
+    // The id becomes a path segment, so only a conservative slug alphabet
+    // is accepted — no separators, dots, or wildcard characters.
+    const sessionIdShape = /^[a-zA-Z0-9_-]{1,128}$/;
+    if (sessionIdShape.test(ctx.sessionId)) {
+        return join(ctx.workspaceRoot, '.pugi', 'sessions', ctx.sessionId, 'tasks.jsonl');
+    }
+    throw new Error(`task_*: invalid sessionId shape: "${ctx.sessionId}"`);
+}
+/**
+ * Current timestamp as an ISO-8601 string.
+ *
+ * @param {{ now?: () => Date }} ctx - When `ctx.now` is set it supplies the
+ *   Date (an injectable clock); otherwise the system clock is used.
+ * @returns {string}
+ */
+function nowIso(ctx) {
+    if (ctx.now) {
+        return ctx.now().toISOString();
+    }
+    return new Date().toISOString();
+}
+/**
+ * Make sure the directory that will contain `path` exists.
+ *
+ * A directory created here is additionally chmod-ed to 0o700; an
+ * already-existing directory is left untouched.
+ *
+ * @param {string} path - File path whose parent directory is required.
+ */
+function ensureDir(path) {
+    // `dirname` (rather than manual '/' slicing) keeps this correct for
+    // both path-separator conventions.
+    const parent = dirname(path);
+    if (existsSync(parent)) {
+        return;
+    }
+    mkdirSync(parent, { recursive: true });
+    try {
+        chmodSync(parent, 0o700);
+    }
+    catch {
+        // Best-effort hardening only: a failure to tighten the directory
+        // mode must not block the ledger write. The JSONL file is written
+        // with its own 0o600 mode, so this is defense in depth.
+    }
+}
+/**
+ * Load every well-formed journal entry for the session, in file order.
+ *
+ * @param {object} ctx - Tool context used to locate the ledger file.
+ * @returns {Array<object>} Entries whose `op` is `'create'` or `'update'` and
+ *   whose `id` and `at` are strings. Returns `[]` when the ledger file does
+ *   not exist.
+ */
+function readJournal(ctx) {
+    const file = ledgerPath(ctx);
+    if (!existsSync(file)) {
+        return [];
+    }
+    const entries = [];
+    const lines = readFileSync(file, 'utf8').split('\n');
+    for (const text of lines) {
+        if (text.trim() === '') {
+            continue;
+        }
+        try {
+            const candidate = JSON.parse(text);
+            const knownOp = candidate.op === 'create' || candidate.op === 'update';
+            const hasStamps = typeof candidate.id === 'string' && typeof candidate.at === 'string';
+            if (knownOp && hasStamps) {
+                entries.push(candidate);
+            }
+        }
+        catch {
+            // Unparseable lines (e.g. a partially written tail) and JSON
+            // values that cannot be inspected (such as `null`) are dropped
+            // so one bad line never poisons the rest of the ledger.
+        }
+    }
+    return entries;
+}
+/**
+ * Replay journal entries into the latest state of every task.
+ *
+ * @param {Array<object>} journal - Entries in the order they were appended.
+ * @returns {Map<string, object>} Task id → task record, keyed in the order
+ *   each id was first created.
+ */
+function fold(journal) {
+    const tasks = new Map();
+    for (const record of journal) {
+        if (record.op !== 'create') {
+            const current = tasks.get(record.id);
+            if (!current) {
+                // An update for an id that was never created is ignored.
+                continue;
+            }
+            // Only fields actually present on the update override the
+            // previous state; `updatedAt` always advances.
+            const next = { ...current };
+            if (record.title !== undefined) {
+                next.title = record.title;
+            }
+            if (record.status !== undefined) {
+                next.status = record.status;
+            }
+            if (record.notes !== undefined) {
+                next.notes = record.notes;
+            }
+            next.updatedAt = record.at;
+            tasks.set(record.id, next);
+            continue;
+        }
+        if (!record.title) {
+            // A create without a title is not a usable task.
+            continue;
+        }
+        const task = {
+            id: record.id,
+            title: record.title,
+            status: record.status ?? 'pending',
+        };
+        if (record.notes !== undefined) {
+            task.notes = record.notes;
+        }
+        task.createdAt = record.at;
+        task.updatedAt = record.at;
+        tasks.set(record.id, task);
+    }
+    return tasks;
+}
+/**
+ * Append one journal entry to the session ledger as a single JSON line.
+ *
+ * @param {object} ctx - Tool context used to locate the ledger file.
+ * @param {object} entry - Journal entry; serialised with `JSON.stringify`.
+ */
+function appendEntry(ctx, entry) {
+    const target = ledgerPath(ctx);
+    ensureDir(target);
+    // 0o600 is passed as the file mode so the ledger is requested as
+    // owner-only when the append has to create it.
+    const writeOptions = { encoding: 'utf8', mode: 0o600 };
+    appendFileSync(target, `${JSON.stringify(entry)}\n`, writeOptions);
+}
+/**
+ * Create a task and append it to the session ledger.
+ *
+ * @param {object} ctx - Tool context (ledger location, optional clock).
+ * @param {{ title: string, status?: string, notes?: * }} input
+ * @returns {{ id: string, title: string, status: string, notes?: *, createdAt: string, updatedAt: string }}
+ * @throws {Error} When the title is missing/blank, exceeds 2000 characters,
+ *   or the status is not one of the accepted values.
+ */
+export function taskCreate(ctx, input) {
+    const title = input.title?.trim();
+    if (!title) {
+        throw new Error('task_create: title is required');
+    }
+    if (title.length > 2_000) {
+        throw new Error('task_create: title exceeds 2000 char cap');
+    }
+    const status = input.status ?? 'pending';
+    if (!isValidStatus(status)) {
+        throw new Error(`task_create: invalid status "${status}"`);
+    }
+    const id = `task-${randomUUID()}`;
+    const at = nowIso(ctx);
+    // `notes` is only carried when the caller supplied it, so it never
+    // appears as an explicit `undefined` in the journal or the result.
+    const notesPart = input.notes === undefined ? {} : { notes: input.notes };
+    appendEntry(ctx, { op: 'create', id, title, status, at, ...notesPart });
+    return { id, title, status, ...notesPart, createdAt: at, updatedAt: at };
+}
+/**
+ * Fetch the current state of one task.
+ *
+ * @param {object} ctx - Tool context used to locate the ledger file.
+ * @param {string} id - Task id; must be a non-empty string.
+ * @returns {object|null} The task, or `null` when the id is unknown.
+ * @throws {Error} When `id` is not a non-empty string.
+ */
+export function taskGet(ctx, id) {
+    const usable = typeof id === 'string' && id.length > 0;
+    if (!usable) {
+        throw new Error('task_get: id is required');
+    }
+    const task = fold(readJournal(ctx)).get(id);
+    return task ?? null;
+}
+/**
+ * List every task in the session, ordered by `createdAt` ascending.
+ *
+ * @param {object} ctx - Tool context used to locate the ledger file.
+ * @returns {Array<object>}
+ */
+export function taskList(ctx) {
+    const tasks = [...fold(readJournal(ctx)).values()];
+    tasks.sort((left, right) => left.createdAt.localeCompare(right.createdAt));
+    return tasks;
+}
+/**
+ * Update the title, status and/or notes of an existing task by appending an
+ * `update` entry to the session ledger.
+ *
+ * The title is normalised the same way `task_create` does it: surrounding
+ * whitespace is trimmed before it is validated and stored, and it is held
+ * to the same 2000-character cap.
+ *
+ * @param {object} ctx - Tool context (ledger location, optional clock).
+ * @param {{ id: string, title?: string, status?: string, notes?: * }} input
+ * @returns {object} The task as it looks after the update.
+ * @throws {Error} When `id` is missing or unknown, the status is invalid, or
+ *   the title is blank or longer than 2000 characters.
+ */
+export function taskUpdate(ctx, input) {
+    if (!input.id)
+        throw new Error('task_update: id is required');
+    const existing = fold(readJournal(ctx)).get(input.id);
+    if (!existing) {
+        throw new Error(`task_update: unknown id "${input.id}"`);
+    }
+    if (input.status !== undefined && !isValidStatus(input.status)) {
+        throw new Error(`task_update: invalid status "${input.status}"`);
+    }
+    // Trim once and use the trimmed value everywhere, so the journal and
+    // the returned task never carry padding that task_create would strip.
+    const title = input.title === undefined ? undefined : input.title.trim();
+    if (title !== undefined && title.length === 0) {
+        throw new Error('task_update: title cannot be empty');
+    }
+    if (title !== undefined && title.length > 2_000) {
+        throw new Error('task_update: title exceeds 2000 char cap');
+    }
+    const at = nowIso(ctx);
+    // Only fields the caller supplied are journaled, so replaying the
+    // entry leaves the untouched fields as they were.
+    const changes = {
+        ...(title !== undefined ? { title } : {}),
+        ...(input.status !== undefined ? { status: input.status } : {}),
+        ...(input.notes !== undefined ? { notes: input.notes } : {}),
+    };
+    appendEntry(ctx, { op: 'update', id: input.id, at, ...changes });
+    return { ...existing, ...changes, updatedAt: at };
+}
+/**
+ * Whether `status` is one of the four accepted task statuses.
+ *
+ * @param {*} status
+ * @returns {boolean}
+ */
+function isValidStatus(status) {
+    switch (status) {
+        case 'pending':
+        case 'in_progress':
+        case 'completed':
+        case 'cancelled':
+            return true;
+        default:
+            return false;
+    }
+}
+//# sourceMappingURL=tasks.js.map

package/dist/tools/todo-write.js ADDED Viewed

@@ -0,0 +1,184 @@
+/**
+ * todo_write tool — Leak L16 (TodoWrite single-in-progress invariant).
+ *
+ * Mirrors Claude Code's `TodoWrite` tool 1:1 so a model trained on the
+ * upstream grammar speaks Pugi's variant verbatim. The tool dispatches
+ * a BATCH replace of the workspace todo board (not an incremental
+ * mutation — the model emits the FULL list every call). At most ONE
+ * todo may carry `status: 'in_progress'` at any time; violations
+ * reject with the `TODO_INVARIANT_VIOLATED` sentinel and the board on
+ * disk is left unchanged.
+ *
+ * Relationship to `task_*` (β1 T1/T6, tools/tasks.ts):
+ *   - `task_*` is GRANULAR (create/get/list/update one task at a
+ *     time) with an append-only JSONL journal scoped to the SESSION.
+ *   - `todo_write` is BATCH (snapshot the whole board) with an atomic
+ *     JSON snapshot scoped to the WORKSPACE.
+ *   They are complementary surfaces: agents that prefer the upstream
+ *   TodoWrite grammar use `todo_write`; agents that want a fine-grained
+ *   audit trail use `task_*`.
+ *
+ * Hard rules (enforced by Zod + dispatcher):
+ *   - `todos.length` ≤ 50 (board overload guard).
+ *   - Every item: id (≥1 char, ≤128), content (≥1 char, ≤2,000),
+ *     optional activeForm (same bounds as content), status enum.
+ *   - At most ONE item with `status === 'in_progress'`.
+ *   - All ids unique within the batch.
+ *
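+ * Dispatch returns the persisted board as JSON; callers can read
+ * `todos: [...]` directly. Schema rejections are returned as an
+ * `INVALID_ARGS: ...` string, while invariant and duplicate-id
+ * violations are thrown by `saveTodoBoard` with their sentinel-prefixed
+ * message, so the engine adapter can pattern-match in both cases.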
+ */
+import { z } from 'zod';
+import { saveTodoBoard } from '../core/todos/state.js';
+/** Cap matches the `task_*` family's title cap for parity. */
+export const TODO_CONTENT_MAX = 2_000;
+/** id is opaque to us but must be slug-safe so file paths could embed it. */
+export const TODO_ID_MIN = 1;
+export const TODO_ID_MAX = 128;
+/** Hard cap on board size. Beyond this the operator should split work. */
+export const TODO_BATCH_MAX = 50;
+export const todoItemSchema = z
+    .strictObject({
+    id: z
+        .string()
+        .min(TODO_ID_MIN)
+        .max(TODO_ID_MAX)
+        .describe('Stable id for this todo. Opaque, ≤128 chars.'),
+    content: z
+        .string()
+        .min(1)
+        .max(TODO_CONTENT_MAX)
+        .describe('Imperative task description. E.g. "Add invariant check".'),
+    status: z
+        .enum(['pending', 'in_progress', 'completed'])
+        .describe('Lifecycle status. At most ONE in_progress per board.'),
+    activeForm: z
+        .string()
+        .min(1)
+        .max(TODO_CONTENT_MAX)
+        .optional()
+        .describe('Present-continuous form. E.g. "Adding invariant check".'),
+});
+export const todoWriteArgsSchema = z.strictObject({
+    todos: z
+        .array(todoItemSchema)
+        .max(TODO_BATCH_MAX)
+        .describe(`Full todo board (batch replace, not incremental). Max ${TODO_BATCH_MAX} items. ` +
+        `At most ONE item may carry status="in_progress".`),
+});
+/**
+ * JSON-Schema fragment surfaced to the model via the tool-bridge
+ * `parameters` field. Mirrors the Zod schema 1:1 — kept hand-written
+ * (same convention as ask_user_question) because the runtime engine
+ * wires OpenAI-compatible JSON Schema and we have not greenlit the
+ * zod-to-json-schema transitive dep. Keep both in lockstep.
+ */
+export const todoWriteJsonSchema = {
+    type: 'object',
+    additionalProperties: false,
+    required: ['todos'],
+    properties: {
+        todos: {
+            type: 'array',
+            maxItems: TODO_BATCH_MAX,
+            description: `Full todo board (batch replace, not incremental). Max ${TODO_BATCH_MAX} items. ` +
+                `At most ONE item may carry status="in_progress".`,
+            items: {
+                type: 'object',
+                additionalProperties: false,
+                required: ['id', 'content', 'status'],
+                properties: {
+                    id: {
+                        type: 'string',
+                        minLength: TODO_ID_MIN,
+                        maxLength: TODO_ID_MAX,
+                        description: 'Stable id for this todo. Opaque, ≤128 chars.',
+                    },
+                    content: {
+                        type: 'string',
+                        minLength: 1,
+                        maxLength: TODO_CONTENT_MAX,
+                        description: 'Imperative task description.',
+                    },
+                    status: {
+                        type: 'string',
+                        enum: ['pending', 'in_progress', 'completed'],
+                        description: 'Lifecycle status. At most ONE in_progress per board.',
+                    },
+                    activeForm: {
+                        type: 'string',
+                        minLength: 1,
+                        maxLength: TODO_CONTENT_MAX,
+                        description: 'Present-continuous form.',
+                    },
+                },
+            },
+        },
+    },
+};
+/**
+ * Sentinel prefix the dispatcher returns when Zod schema validation
+ * rejects the raw arguments. Distinct from `TODO_INVARIANT_VIOLATED`
+ * (>1 in_progress) and `TODO_DUPLICATE_ID` (collision within batch),
+ * which are emitted from `saveTodoBoard` AFTER schema parsing.
+ *
+ * Surfaced as a return string (not a throw) so the engine adapter sees
+ * a recoverable tool error and the model can self-correct its args,
+ * instead of the engine loop tearing down on an uncaught ZodError.
+ */
+export const TODO_INVALID_ARGS = 'INVALID_ARGS';
+/**
+ * Render a ZodError into a deterministic `INVALID_ARGS: ...` sentinel
+ * the model can pattern-match. Each issue contributes one
+ * `path: message` clause; clauses are joined with `; ` so the model
+ * sees every offence in a single line. Path with the root scope is
+ * rendered as `<root>` to avoid an empty colon.
+ */
+function renderZodIssues(error) {
+    const parts = error.issues.map((issue) => {
+        const path = issue.path.length === 0 ? '<root>' : issue.path.join('.');
+        return `${path}: ${issue.message}`;
+    });
+    return `${TODO_INVALID_ARGS}: ${parts.join('; ')}`;
+}
+/**
+ * Validate via Zod + persist atomically. Surfaces three sentinel
+ * families the dispatcher pattern-matches on:
+ *   - `INVALID_ARGS: <path>: <issue>; ...`        — Zod schema rejected
+ *     the raw arguments (returned as STRING, not thrown).
+ *   - `TODO_INVARIANT_VIOLATED: ...`              — >1 in_progress
+ *     (thrown by `saveTodoBoard`).
+ *   - `TODO_DUPLICATE_ID: ...`                    — collision within batch
+ *     (thrown by `saveTodoBoard`).
+ *
+ * Why the asymmetry: schema rejection means the model emitted malformed
+ * structure (missing field, wrong type) and CAN self-correct given a
+ * clear breakdown of the offending path. The invariant + duplicate-id
+ * paths mean the model emitted structurally-valid but semantically
+ * conflicting state — those still throw so the engine loop's tool-error
+ * hook can surface them through `PostToolUseFailure` for observability,
+ * mirroring how the file-tools layer surfaces `STALE_READ` / `PermissionDenied`.
+ */
+export function dispatchTodoWrite(ctx, rawArgs) {
+    // L16 P1 fix (2026-05-27): `.parse` throws a `ZodError` on validation
+    // failure. The previous implementation let that throw bubble through
+    // the engine adapter's catch arm as a free-form `error.message`,
+    // which (a) loses the issue-by-issue structure the model needs to
+    // self-correct, and (b) tears down the tool-call as a hard failure
+    // rather than a recoverable tool result. Switch to `safeParse` and
+    // emit a structured `INVALID_ARGS: <path>: <issue>; ...` sentinel
+    // string instead — the engine sees a successful tool call, the model
+    // sees the offending paths, and the dispatcher's catch arm reserves
+    // throws for the genuine semantic conflicts emitted by `saveTodoBoard`.
+    const parsed = todoWriteArgsSchema.safeParse(rawArgs);
+    if (!parsed.success) {
+        return renderZodIssues(parsed.error);
+    }
+    const stateCtx = {
+        workspaceRoot: ctx.workspaceRoot,
+        ...(ctx.now ? { now: ctx.now } : {}),
+    };
+    const board = saveTodoBoard(stateCtx, parsed.data.todos);
+    return JSON.stringify(board);
+}
+//# sourceMappingURL=todo-write.js.map