@pugi/cli 0.1.0-beta.5 → 0.1.0-beta.51

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (264) hide show
  1. package/THIRD_PARTY_NOTICES.md +40 -0
  2. package/assets/pugi-mascot.ansi +15 -25
  3. package/assets/pugi-prozr2-mascot.ansi +9 -0
  4. package/bin/run.js +33 -1
  5. package/dist/commands/jobs-watch.js +201 -0
  6. package/dist/commands/jobs.js +15 -0
  7. package/dist/commands/smoke.js +133 -0
  8. package/dist/core/agent-progress/cleanup.js +134 -0
  9. package/dist/core/agent-progress/schema.js +144 -0
  10. package/dist/core/agent-progress/writer.js +101 -0
  11. package/dist/core/artifact-chain/dispatcher.js +148 -0
  12. package/dist/core/artifact-chain/exporter.js +164 -0
  13. package/dist/core/artifact-chain/state.js +243 -0
  14. package/dist/core/artifact-chain/steps.js +169 -0
  15. package/dist/core/auth/ensure-authenticated.js +129 -0
  16. package/dist/core/auth/env-provider.js +238 -0
  17. package/dist/core/auto-update/channels.js +122 -0
  18. package/dist/core/auto-update/checker.js +241 -0
  19. package/dist/core/auto-update/state.js +235 -0
  20. package/dist/core/bare-mode/index.js +107 -0
  21. package/dist/core/bash-classifier.js +400 -4
  22. package/dist/core/checkpoint/resumer.js +149 -0
  23. package/dist/core/checkpoint/rewinder.js +291 -0
  24. package/dist/core/codegraph/decision-store.js +248 -0
  25. package/dist/core/codegraph/detect-repo.js +459 -0
  26. package/dist/core/codegraph/install.js +134 -0
  27. package/dist/core/codegraph/offer-hook.js +220 -0
  28. package/dist/core/compact/auto-trigger.js +96 -0
  29. package/dist/core/compact/buffer-rewriter.js +115 -0
  30. package/dist/core/compact/summarizer.js +208 -0
  31. package/dist/core/compact/token-counter.js +108 -0
  32. package/dist/core/consensus/diff-capture.js +112 -3
  33. package/dist/core/context/index.js +7 -0
  34. package/dist/core/context/markdown-traverse.js +255 -0
  35. package/dist/core/cost/rate-card.js +129 -0
  36. package/dist/core/cost/tracker.js +221 -0
  37. package/dist/core/denial-tracking/index.js +8 -0
  38. package/dist/core/denial-tracking/state.js +264 -0
  39. package/dist/core/diagnostics/probe-runner.js +93 -0
  40. package/dist/core/diagnostics/probes/api.js +46 -0
  41. package/dist/core/diagnostics/probes/auth.js +86 -0
  42. package/dist/core/diagnostics/probes/bare-mode.js +42 -0
  43. package/dist/core/diagnostics/probes/cli-version.js +127 -0
  44. package/dist/core/diagnostics/probes/config.js +72 -0
  45. package/dist/core/diagnostics/probes/denial-tracking.js +57 -0
  46. package/dist/core/diagnostics/probes/disk.js +81 -0
  47. package/dist/core/diagnostics/probes/git.js +65 -0
  48. package/dist/core/diagnostics/probes/hooks.js +118 -0
  49. package/dist/core/diagnostics/probes/mcp.js +75 -0
  50. package/dist/core/diagnostics/probes/node.js +59 -0
  51. package/dist/core/diagnostics/probes/pnpm.js +36 -0
  52. package/dist/core/diagnostics/probes/pugi-md.js +89 -0
  53. package/dist/core/diagnostics/probes/sandbox.js +40 -0
  54. package/dist/core/diagnostics/probes/session.js +74 -0
  55. package/dist/core/diagnostics/probes/status-snapshot.js +488 -0
  56. package/dist/core/diagnostics/probes/workspace.js +63 -0
  57. package/dist/core/diagnostics/types.js +70 -0
  58. package/dist/core/dispatch/cache-cleanup.js +197 -0
  59. package/dist/core/dispatch/cache-handoff.js +295 -0
  60. package/dist/core/edits/dispatch.js +218 -2
  61. package/dist/core/edits/journal.js +199 -0
  62. package/dist/core/edits/layer-d-ast.js +557 -14
  63. package/dist/core/edits/verify-hook.js +273 -0
  64. package/dist/core/edits/worktree.js +322 -0
  65. package/dist/core/engine/anvil-client.js +115 -5
  66. package/dist/core/engine/auto-compact.js +179 -0
  67. package/dist/core/engine/budgets.js +155 -0
  68. package/dist/core/engine/context-prefix.js +155 -0
  69. package/dist/core/engine/intent.js +260 -0
  70. package/dist/core/engine/native-pugi.js +897 -211
  71. package/dist/core/engine/prompts.js +88 -2
  72. package/dist/core/engine/strip-internal-fields.js +124 -0
  73. package/dist/core/engine/tool-bridge.js +1045 -36
  74. package/dist/core/feedback/queue.js +177 -0
  75. package/dist/core/feedback/submitter.js +145 -0
  76. package/dist/core/file-cache.js +113 -1
  77. package/dist/core/hooks/events.js +44 -0
  78. package/dist/core/hooks/index.js +15 -0
  79. package/dist/core/hooks/registry.js +213 -0
  80. package/dist/core/hooks/runner.js +236 -0
  81. package/dist/core/hooks/v2/event-emitter.js +115 -0
  82. package/dist/core/hooks/v2/executor.js +282 -0
  83. package/dist/core/hooks/v2/index.js +25 -0
  84. package/dist/core/hooks/v2/lifecycle.js +104 -0
  85. package/dist/core/hooks/v2/loader.js +216 -0
  86. package/dist/core/hooks/v2/matcher.js +125 -0
  87. package/dist/core/hooks/v2/trust.js +143 -0
  88. package/dist/core/hooks/v2/types.js +86 -0
  89. package/dist/core/lsp/cache.js +105 -0
  90. package/dist/core/lsp/client.js +776 -0
  91. package/dist/core/lsp/language-detect.js +66 -0
  92. package/dist/core/lsp/post-edit-diagnostics.js +171 -0
  93. package/dist/core/mcp/client.js +75 -6
  94. package/dist/core/mcp/http-server.js +553 -0
  95. package/dist/core/mcp/orchestrator-tools.js +662 -0
  96. package/dist/core/mcp/permission.js +190 -0
  97. package/dist/core/mcp/registry.js +24 -2
  98. package/dist/core/mcp/server-tools.js +219 -0
  99. package/dist/core/mcp/server.js +397 -0
  100. package/dist/core/memory/dual-write.js +416 -0
  101. package/dist/core/memory/phase1-kinds.js +20 -0
  102. package/dist/core/memory-sync/queue.js +158 -0
  103. package/dist/core/onboarding/ensure-initialized.js +133 -0
  104. package/dist/core/onboarding/marker.js +111 -0
  105. package/dist/core/onboarding/telemetry-state.js +108 -0
  106. package/dist/core/output-style/presets.js +176 -0
  107. package/dist/core/output-style/state.js +185 -0
  108. package/dist/core/path-security.js +284 -2
  109. package/dist/core/permissions/auto-classifier.js +124 -0
  110. package/dist/core/permissions/circuit-breaker.js +83 -0
  111. package/dist/core/permissions/gate.js +278 -0
  112. package/dist/core/permissions/index.js +20 -0
  113. package/dist/core/permissions/mode.js +174 -0
  114. package/dist/core/permissions/state.js +241 -0
  115. package/dist/core/permissions/tool-class.js +93 -0
  116. package/dist/core/prd-check/parser.js +215 -0
  117. package/dist/core/prd-check/reporter.js +127 -0
  118. package/dist/core/prd-check/session-review.js +557 -0
  119. package/dist/core/prd-check/verifiers.js +223 -0
  120. package/dist/core/pugi-md/context-injector.js +76 -0
  121. package/dist/core/pugi-md/walk-up.js +207 -0
  122. package/dist/core/release-notes/parser.js +241 -0
  123. package/dist/core/release-notes/state.js +116 -0
  124. package/dist/core/repl/history.js +11 -1
  125. package/dist/core/repl/model-pricing.js +135 -0
  126. package/dist/core/repl/session.js +1897 -37
  127. package/dist/core/repl/slash-commands.js +430 -15
  128. package/dist/core/repl/store/session-store.js +31 -2
  129. package/dist/core/repl/workspace-context.js +22 -0
  130. package/dist/core/repo-map/build.js +125 -0
  131. package/dist/core/repo-map/cache.js +185 -0
  132. package/dist/core/repo-map/extractor.js +254 -0
  133. package/dist/core/repo-map/formatter.js +145 -0
  134. package/dist/core/repo-map/scanner.js +211 -0
  135. package/dist/core/retry-budget/budget.js +284 -0
  136. package/dist/core/retry-budget/index.js +5 -0
  137. package/dist/core/session.js +92 -0
  138. package/dist/core/settings.js +80 -0
  139. package/dist/core/share/formatter.js +271 -0
  140. package/dist/core/share/redactor.js +221 -0
  141. package/dist/core/share/uploader.js +267 -0
  142. package/dist/core/skills/defaults.js +457 -0
  143. package/dist/core/smoke/headless-driver.js +174 -0
  144. package/dist/core/smoke/orchestrator.js +194 -0
  145. package/dist/core/smoke/runner.js +238 -0
  146. package/dist/core/smoke/scenario-parser.js +316 -0
  147. package/dist/core/subagents/dispatcher-real.js +600 -0
  148. package/dist/core/subagents/dispatcher.js +113 -24
  149. package/dist/core/subagents/index.js +18 -5
  150. package/dist/core/subagents/isolation-matrix.js +213 -0
  151. package/dist/core/subagents/spawn.js +19 -4
  152. package/dist/core/telemetry/emitter.js +229 -0
  153. package/dist/core/telemetry/queue.js +251 -0
  154. package/dist/core/theme/context.js +91 -0
  155. package/dist/core/theme/presets.js +228 -0
  156. package/dist/core/theme/state.js +181 -0
  157. package/dist/core/todos/invariant.js +10 -0
  158. package/dist/core/todos/state.js +177 -0
  159. package/dist/core/transport/version-interceptor.js +166 -0
  160. package/dist/core/vim/keymap.js +288 -0
  161. package/dist/core/vim/state.js +92 -0
  162. package/dist/core/worktree-manager/cleanup.js +123 -0
  163. package/dist/core/worktree-manager/manager.js +303 -0
  164. package/dist/index.js +28 -0
  165. package/dist/runtime/bootstrap.js +190 -0
  166. package/dist/runtime/cli.js +3241 -343
  167. package/dist/runtime/commands/cancel.js +231 -0
  168. package/dist/runtime/commands/chain.js +489 -0
  169. package/dist/runtime/commands/codegraph-status.js +227 -0
  170. package/dist/runtime/commands/compact.js +297 -0
  171. package/dist/runtime/commands/cost.js +199 -0
  172. package/dist/runtime/commands/delegate.js +242 -11
  173. package/dist/runtime/commands/dispatch.js +126 -0
  174. package/dist/runtime/commands/doctor.js +412 -0
  175. package/dist/runtime/commands/feedback.js +184 -0
  176. package/dist/runtime/commands/hooks.js +184 -0
  177. package/dist/runtime/commands/lsp.js +368 -0
  178. package/dist/runtime/commands/mcp.js +879 -0
  179. package/dist/runtime/commands/memory.js +508 -0
  180. package/dist/runtime/commands/model.js +237 -0
  181. package/dist/runtime/commands/onboarding.js +275 -0
  182. package/dist/runtime/commands/patch.js +128 -0
  183. package/dist/runtime/commands/permissions.js +112 -0
  184. package/dist/runtime/commands/plan.js +143 -0
  185. package/dist/runtime/commands/prd-check.js +285 -0
  186. package/dist/runtime/commands/redo-blob-store.js +92 -0
  187. package/dist/runtime/commands/redo.js +361 -0
  188. package/dist/runtime/commands/release-notes.js +229 -0
  189. package/dist/runtime/commands/repo-map.js +95 -0
  190. package/dist/runtime/commands/report.js +299 -0
  191. package/dist/runtime/commands/resume.js +118 -0
  192. package/dist/runtime/commands/review-consensus.js +17 -2
  193. package/dist/runtime/commands/rewind.js +333 -0
  194. package/dist/runtime/commands/sessions.js +163 -0
  195. package/dist/runtime/commands/share.js +316 -0
  196. package/dist/runtime/commands/status.js +186 -0
  197. package/dist/runtime/commands/stickers.js +82 -0
  198. package/dist/runtime/commands/style.js +194 -0
  199. package/dist/runtime/commands/theme.js +196 -0
  200. package/dist/runtime/commands/undo.js +32 -0
  201. package/dist/runtime/commands/update.js +289 -0
  202. package/dist/runtime/commands/vim.js +140 -0
  203. package/dist/runtime/commands/worktree.js +177 -0
  204. package/dist/runtime/commands/worktrees.js +155 -0
  205. package/dist/runtime/headless-repl.js +195 -0
  206. package/dist/runtime/headless.js +543 -0
  207. package/dist/runtime/load-hooks-or-exit.js +71 -0
  208. package/dist/runtime/plan-decompose.js +531 -0
  209. package/dist/runtime/version.js +65 -0
  210. package/dist/tools/agent-tool.js +229 -0
  211. package/dist/tools/apply-patch.js +556 -0
  212. package/dist/tools/ask-user-question.js +213 -0
  213. package/dist/tools/ask-user.js +115 -0
  214. package/dist/tools/bash.js +203 -4
  215. package/dist/tools/file-tools.js +85 -14
  216. package/dist/tools/lsp-tools.js +189 -0
  217. package/dist/tools/mcp-tool.js +260 -0
  218. package/dist/tools/multi-edit.js +361 -0
  219. package/dist/tools/powershell.js +268 -0
  220. package/dist/tools/registry.js +51 -0
  221. package/dist/tools/skill-tool.js +96 -0
  222. package/dist/tools/tasks.js +208 -0
  223. package/dist/tools/todo-write.js +184 -0
  224. package/dist/tools/web-fetch.js +147 -2
  225. package/dist/tools/web-search.js +458 -0
  226. package/dist/tui/agent-progress-card.js +111 -0
  227. package/dist/tui/agent-tree.js +10 -0
  228. package/dist/tui/ask-modal.js +2 -2
  229. package/dist/tui/ask-user-question-prompt.js +192 -0
  230. package/dist/tui/compact-banner.js +81 -0
  231. package/dist/tui/conversation-pane.js +82 -8
  232. package/dist/tui/cost-table.js +111 -0
  233. package/dist/tui/doctor-table.js +46 -0
  234. package/dist/tui/feedback-prompt.js +156 -0
  235. package/dist/tui/input-box.js +218 -3
  236. package/dist/tui/markdown-render.js +4 -4
  237. package/dist/tui/onboarding-wizard.js +240 -0
  238. package/dist/tui/permissions-picker.js +86 -0
  239. package/dist/tui/render.js +35 -0
  240. package/dist/tui/repl-render.js +313 -35
  241. package/dist/tui/repl-splash-art.js +1 -1
  242. package/dist/tui/repl-splash-mascot.js +32 -8
  243. package/dist/tui/repl-splash.js +2 -2
  244. package/dist/tui/repl.js +85 -5
  245. package/dist/tui/splash.js +1 -1
  246. package/dist/tui/status-bar.js +94 -16
  247. package/dist/tui/status-table.js +7 -0
  248. package/dist/tui/stickers-art.js +136 -0
  249. package/dist/tui/style-table.js +28 -0
  250. package/dist/tui/theme-table.js +29 -0
  251. package/dist/tui/thinking-spinner.js +123 -0
  252. package/dist/tui/tool-stream-pane.js +52 -3
  253. package/dist/tui/update-banner.js +27 -2
  254. package/dist/tui/vim-input.js +267 -0
  255. package/dist/tui/welcome-banner.js +107 -0
  256. package/dist/tui/welcome-data.js +293 -0
  257. package/docs/examples/codegraph.mcp.json +10 -0
  258. package/package.json +13 -7
  259. package/test/scenarios/codegen-create-file.scenario.txt +13 -0
  260. package/test/scenarios/compact-force.scenario.txt +11 -0
  261. package/test/scenarios/identity.scenario.txt +11 -0
  262. package/test/scenarios/persona-handoff.scenario.txt +11 -0
  263. package/test/scenarios/walkback.scenario.txt +12 -0
  264. package/dist/core/engine/compaction-hook.js +0 -154
@@ -1,8 +1,36 @@
1
1
  const registry = [
2
+ // α7.7: unified-diff patch apply. Routes through the same security
3
+ // gate as Layer A/B/C, so the risk class matches `edit`/`write`
4
+ // (medium — writes inside the workspace, never to protected files).
5
+ { name: 'apply_patch', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
6
+ // Leak L5 (2026-05-27): structured multi-choice clarifier tool. Risk =
7
+ // low because the dispatch is a pure UI surface — no file writes, no
8
+ // shell, no network. Permission = none (no workspace access required).
9
+ // concurrencySafe = true because the prompt-budget gate runs in the
10
+ // engine loop, not via tool-side mutex (one prompt per turn is enforced
11
+ // by the persona system prompt + the engine's tool_calls budget).
12
+ { name: 'ask_user_question', permission: 'none', risk: 'low', concurrencySafe: true, m1: true },
2
13
  { name: 'bash', permission: 'bash', risk: 'high', concurrencySafe: false, m1: true },
3
14
  { name: 'edit', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
4
15
  { name: 'glob', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
5
16
  { name: 'grep', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
17
+ // α7.7: LSP read-only surface. Server runs locally, no Anvil
18
+ // round-trip. Concurrency-safe because every operation reads
19
+ // server state without mutating workspace files.
20
+ { name: 'lsp_definition', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
21
+ { name: 'lsp_diagnostics', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
22
+ { name: 'lsp_hover', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
23
+ { name: 'lsp_references', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
24
+ // β7 L5+T11: multi_edit dispatches an ordered batch of Layer A edits
25
+ // as a single transaction. Risk = medium (same chokepoints as `edit`).
26
+ // concurrencySafe = false because the journal serialises one dispatch
27
+ // per session.
28
+ { name: 'multi_edit', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
29
+ // Leak L6 (2026-05-28): PowerShell tool for Windows-first workflows. Same
30
+ // bash permission class — destructive-pattern classification fires the
31
+ // same gate. concurrencySafe = false because spawn-shell child cwd /
32
+ // env carry-over could race across parallel agent calls.
33
+ { name: 'powershell', permission: 'bash', risk: 'high', concurrencySafe: false, m1: false },
6
34
  { name: 'question', permission: 'none', risk: 'low', concurrencySafe: false, m1: true },
7
35
  { name: 'read', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
8
36
  { name: 'skill', permission: 'read', risk: 'low', concurrencySafe: true, m1: true },
@@ -10,7 +38,30 @@ const registry = [
10
38
  { name: 'task_get', permission: 'none', risk: 'low', concurrencySafe: true, m1: true },
11
39
  { name: 'task_list', permission: 'none', risk: 'low', concurrencySafe: true, m1: true },
12
40
  { name: 'task_update', permission: 'none', risk: 'low', concurrencySafe: false, m1: true },
41
+ // Leak L16 (2026-05-27): batch TodoWrite. Mirrors Claude Code's upstream
42
+ // surface — full board snapshot, single-in-progress invariant, atomic
43
+ // tmp+rename persistence to `.pugi/todos.json`. `concurrencySafe = false`
44
+ // because two concurrent writes could lose the loser's snapshot (the
45
+ // rename is atomic but the read-modify-write loop is not). Risk = low
46
+ // because the only filesystem mutation lands inside `.pugi/todos.json`,
47
+ // which is metadata, not source.
48
+ { name: 'todo_write', permission: 'none', risk: 'low', concurrencySafe: false, m1: true },
13
49
  { name: 'web_fetch', permission: 'network', risk: 'medium', concurrencySafe: true, m1: true },
50
+ // α7.7: scratch worktree management. `worktree_create` writes nothing
51
+ // dangerous (a clone under `.pugi/worktrees/`); `worktree_promote`
52
+ // applies a diff back to the main tree, so it shares the `edit`
53
+ // risk class. `worktree_drop` is the cleanup primitive.
54
+ //
55
+ // R1 fix (2026-05-26, PR #413 r1, Fix 9): raised `worktree_create`
56
+ // and `worktree_drop` from `low` to `medium`. `worktree_drop` runs
57
+ // `rmSync` on its target — even with the new path-containment gate
58
+ // in `core/edits/worktree.ts::dropWorktree`, a destructive primitive
59
+ // belongs in `medium` so the permission FSM prompts on every call.
60
+ // `worktree_create` is raised for disk-pressure parity (a runaway
61
+ // agent loop could fill the disk with abandoned scratch worktrees).
62
+ { name: 'worktree_create', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
63
+ { name: 'worktree_drop', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
64
+ { name: 'worktree_promote', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
14
65
  { name: 'write', permission: 'edit', risk: 'medium', concurrencySafe: false, m1: true },
15
66
  ];
16
67
  export const toolRegistry = registry.sort((a, b) => a.name.localeCompare(b.name));
@@ -0,0 +1,96 @@
1
+ import { listSkills } from '../core/skills/loader.js';
2
+ import { hashSkillDir, verifyTrust } from '../core/skills/trust.js';
3
+ export const SKILL_BODY_CAP_BYTES = 32 * 1024;
4
+ export const SKILL_LIST_CAP = 100;
5
+ export function skillList(ctx, input) {
6
+ const scope = input.scope ?? 'all';
7
+ const all = [];
8
+ if (scope === 'all' || scope === 'global') {
9
+ all.push(...listSkills('global', ctx.workspaceRoot));
10
+ }
11
+ if (scope === 'all' || scope === 'workspace') {
12
+ all.push(...listSkills('workspace', ctx.workspaceRoot));
13
+ }
14
+ // Dedup by name, prefer workspace scope when both exist (workspace
15
+ // overrides global per skills loader convention).
16
+ const byName = new Map();
17
+ for (const skill of all) {
18
+ const prev = byName.get(skill.name);
19
+ if (!prev || skill.scope === 'workspace') {
20
+ byName.set(skill.name, skill);
21
+ }
22
+ }
23
+ return Array.from(byName.values())
24
+ .slice(0, SKILL_LIST_CAP)
25
+ .map((skill) => ({
26
+ name: skill.name,
27
+ description: skill.frontmatter.description,
28
+ scope: skill.scope,
29
+ }));
30
+ }
31
+ export async function skillInvoke(ctx, input) {
32
+ if (!input.name || typeof input.name !== 'string') {
33
+ throw new Error('skill: name is required');
34
+ }
35
+ // Defense-in-depth: skill loader already validates slugs but the
36
+ // tool surface is operator-controlled.
37
+ if (!/^[a-zA-Z0-9_-]{1,128}$/.test(input.name)) {
38
+ throw new Error(`skill: invalid skill name shape: "${input.name}"`);
39
+ }
40
+ // Workspace scope wins over global (operator override). Mirrors
41
+ // SkillLoader convention.
42
+ const workspace = listSkills('workspace', ctx.workspaceRoot).find((s) => s.name === input.name);
43
+ const global = workspace
44
+ ? null
45
+ : listSkills('global', ctx.workspaceRoot).find((s) => s.name === input.name);
46
+ const skill = workspace ?? global;
47
+ if (!skill) {
48
+ throw new Error(`skill: not found: "${input.name}"`);
49
+ }
50
+ // β1a r1 (2026-05-26): re-verify the on-disk skill payload against
51
+ // the trust manifest sha256 on EVERY invoke, not just at install
52
+ // time. Before this fix a post-install swap (malicious npm dep that
53
+ // touches `~/.pugi/skills/<name>/SKILL.md` after the operator
54
+ // approved the install) would bypass the trust gate — `listSkills`
55
+ // reads the body fresh from disk and the loader does no integrity
56
+ // check. The skill body lands directly in the model's tool result,
57
+ // so a mutated body is a prompt-injection vector against the agent
58
+ // loop's tool surface.
59
+ //
60
+ // Posture:
61
+ // - `trusted` → proceed (body is hash-pinned).
62
+ // - `unsigned` → refuse: the operator never approved this skill.
63
+ // This catches the case where a skill directory was dropped in
64
+ // manually (no `pugi skills install`) and the loader picked it
65
+ // up. Refusing is fail-closed.
66
+ // - `mismatch` → refuse + surface the recorded vs actual hashes
67
+ // so the operator can decide between re-trust and revoke.
68
+ //
69
+ // Performance: `hashSkillDir` walks the skill directory on every
70
+ // invoke. Skills are small (median 4-8 files, <50KB total) so the
71
+ // cost is sub-millisecond on warm cache. The β1a r1 spec exercises
72
+ // a mutated-body case; the existing skill-tool.spec.ts cases for
73
+ // happy-path use the `recordTrust` helper to seed the registry.
74
+ const actualHash = hashSkillDir(skill.dir);
75
+ const verdict = await verifyTrust('skill', skill.scope, skill.name, actualHash);
76
+ if (verdict.status === 'unsigned') {
77
+ throw new Error(`skill: refused to invoke "${skill.name}" — no trust entry (run \`pugi skills trust ${skill.name}\` to approve)`);
78
+ }
79
+ if (verdict.status === 'mismatch') {
80
+ throw new Error(`skill: refused to invoke "${skill.name}" — sha256 mismatch (recorded ${verdict.recorded.slice(0, 12)}…, actual ${verdict.actual.slice(0, 12)}…). Re-trust via \`pugi skills trust ${skill.name}\`.`);
81
+ }
82
+ const body = skill.body;
83
+ const truncated = Buffer.byteLength(body, 'utf8') > SKILL_BODY_CAP_BYTES;
84
+ const cappedBody = truncated
85
+ ? body.slice(0, SKILL_BODY_CAP_BYTES) +
86
+ `\n\n(... truncated at ${SKILL_BODY_CAP_BYTES} bytes — see \`pugi skills info ${skill.name}\` for full text)`
87
+ : body;
88
+ return {
89
+ name: skill.name,
90
+ scope: skill.scope,
91
+ description: skill.frontmatter.description,
92
+ body: cappedBody,
93
+ truncated,
94
+ };
95
+ }
96
+ //# sourceMappingURL=skill-tool.js.map
@@ -0,0 +1,208 @@
1
+ /**
2
+ * task_* tool family — β1 T1/T6 (TodoWrite + agent task ledger).
3
+ *
4
+ * Mirrors Claude Code's TodoWrite tool surface so a model trained on
5
+ * the upstream tool grammar speaks Pugi's variant verbatim. Four ops:
6
+ *
7
+ * - `task_create` — append a new task to the session's todo ledger.
8
+ * Returns the assigned id.
9
+ * - `task_get` — fetch a single task by id.
10
+ * - `task_list` — list every task in the current session, ordered
11
+ * by createdAt ascending.
12
+ * - `task_update` — mutate status/title/notes of an existing task.
13
+ * Append-only journal — every mutation lands as a
14
+ * fresh JSONL line and the latest line per id wins
15
+ * on `task_list` / `task_get` reads.
16
+ *
17
+ * Persistence: append-only JSONL at
18
+ * `.pugi/sessions/<sessionId>/tasks.jsonl`. Append-only keeps crash
19
+ * recovery trivial — a partial write at the end of the file is the
20
+ * worst case and the parser drops the malformed tail line.
21
+ *
22
+ * Scope: this is the local-side ledger surface. Anvil-side mirror
23
+ * (cabinet `/projects/[id]/tasks` page) ships in β5 once the session-
24
+ * memory hook lands; until then the ledger is purely local.
25
+ */
26
+ import { appendFileSync, chmodSync, existsSync, mkdirSync, readFileSync, } from 'node:fs';
27
+ import { dirname, join } from 'node:path';
28
+ import { randomUUID } from 'node:crypto';
29
+ function ledgerPath(ctx) {
30
+ // Defense-in-depth: the sessionId is supposed to be a UUID minted by
31
+ // openSession() but the tool surface is operator-facing. Validate the
32
+ // shape before composing a path — refuse anything that contains
33
+ // separators or shell wildcards.
34
+ if (!/^[a-zA-Z0-9_-]{1,128}$/.test(ctx.sessionId)) {
35
+ throw new Error(`task_*: invalid sessionId shape: "${ctx.sessionId}"`);
36
+ }
37
+ return join(ctx.workspaceRoot, '.pugi', 'sessions', ctx.sessionId, 'tasks.jsonl');
38
+ }
39
+ function nowIso(ctx) {
40
+ return (ctx.now ? ctx.now() : new Date()).toISOString();
41
+ }
42
+ function ensureDir(path) {
43
+ // β1a r1 (2026-05-26): switched from POSIX-only
44
+ // `path.slice(0, path.lastIndexOf('/'))` to `path.dirname()` so
45
+ // Windows path separators (`\`) work. Also chmod the per-session
46
+ // directory to 0o700 — the tasks ledger carries operator-confidential
47
+ // brief text, status notes, and timing metadata that should not be
48
+ // world-readable through an inherited umask.
49
+ const dir = dirname(path);
50
+ if (!existsSync(dir)) {
51
+ mkdirSync(dir, { recursive: true });
52
+ try {
53
+ chmodSync(dir, 0o700);
54
+ }
55
+ catch {
56
+ // Best-effort. POSIX permission setting is a no-op on Windows
57
+ // NTFS, and the dir-creation race with another concurrent task
58
+ // tool call is the only realistic failure case. The 0o600 mode
59
+ // on the JSONL file itself remains the primary guard; the dir
60
+ // chmod is defense in depth for tools that walk `.pugi/`.
61
+ }
62
+ }
63
+ }
64
+ function readJournal(ctx) {
65
+ const path = ledgerPath(ctx);
66
+ if (!existsSync(path))
67
+ return [];
68
+ const raw = readFileSync(path, 'utf8');
69
+ const out = [];
70
+ for (const line of raw.split('\n')) {
71
+ if (!line.trim())
72
+ continue;
73
+ try {
74
+ const parsed = JSON.parse(line);
75
+ if ((parsed.op === 'create' || parsed.op === 'update') &&
76
+ typeof parsed.id === 'string' &&
77
+ typeof parsed.at === 'string') {
78
+ out.push(parsed);
79
+ }
80
+ }
81
+ catch {
82
+ // Drop malformed line (partial-write tail or external corruption).
83
+ // The append-only design guarantees only the LAST line can be bad
84
+ // — everything before it is whole.
85
+ }
86
+ }
87
+ return out;
88
+ }
89
+ function fold(journal) {
90
+ const out = new Map();
91
+ for (const entry of journal) {
92
+ if (entry.op === 'create') {
93
+ if (!entry.title)
94
+ continue;
95
+ out.set(entry.id, {
96
+ id: entry.id,
97
+ title: entry.title,
98
+ status: entry.status ?? 'pending',
99
+ ...(entry.notes !== undefined ? { notes: entry.notes } : {}),
100
+ createdAt: entry.at,
101
+ updatedAt: entry.at,
102
+ });
103
+ }
104
+ else {
105
+ const prev = out.get(entry.id);
106
+ if (!prev)
107
+ continue; // update before create — drop silently
108
+ out.set(entry.id, {
109
+ ...prev,
110
+ ...(entry.title !== undefined ? { title: entry.title } : {}),
111
+ ...(entry.status !== undefined ? { status: entry.status } : {}),
112
+ ...(entry.notes !== undefined ? { notes: entry.notes } : {}),
113
+ updatedAt: entry.at,
114
+ });
115
+ }
116
+ }
117
+ return out;
118
+ }
119
+ function appendEntry(ctx, entry) {
120
+ const path = ledgerPath(ctx);
121
+ ensureDir(path);
122
+ appendFileSync(path, `${JSON.stringify(entry)}\n`, {
123
+ encoding: 'utf8',
124
+ mode: 0o600,
125
+ });
126
+ }
127
+ export function taskCreate(ctx, input) {
128
+ const title = input.title?.trim();
129
+ if (!title) {
130
+ throw new Error('task_create: title is required');
131
+ }
132
+ if (title.length > 2_000) {
133
+ throw new Error('task_create: title exceeds 2000 char cap');
134
+ }
135
+ const status = input.status ?? 'pending';
136
+ if (!isValidStatus(status)) {
137
+ throw new Error(`task_create: invalid status "${status}"`);
138
+ }
139
+ const id = `task-${randomUUID()}`;
140
+ const at = nowIso(ctx);
141
+ const entry = {
142
+ op: 'create',
143
+ id,
144
+ title,
145
+ status,
146
+ at,
147
+ ...(input.notes !== undefined ? { notes: input.notes } : {}),
148
+ };
149
+ appendEntry(ctx, entry);
150
+ return {
151
+ id,
152
+ title,
153
+ status,
154
+ ...(input.notes !== undefined ? { notes: input.notes } : {}),
155
+ createdAt: at,
156
+ updatedAt: at,
157
+ };
158
+ }
159
+ export function taskGet(ctx, id) {
160
+ if (typeof id !== 'string' || id.length === 0) {
161
+ throw new Error('task_get: id is required');
162
+ }
163
+ const folded = fold(readJournal(ctx));
164
+ return folded.get(id) ?? null;
165
+ }
166
+ export function taskList(ctx) {
167
+ const folded = fold(readJournal(ctx));
168
+ return Array.from(folded.values()).sort((a, b) => a.createdAt.localeCompare(b.createdAt));
169
+ }
170
+ export function taskUpdate(ctx, input) {
171
+ if (!input.id)
172
+ throw new Error('task_update: id is required');
173
+ const folded = fold(readJournal(ctx));
174
+ const existing = folded.get(input.id);
175
+ if (!existing) {
176
+ throw new Error(`task_update: unknown id "${input.id}"`);
177
+ }
178
+ if (input.status !== undefined && !isValidStatus(input.status)) {
179
+ throw new Error(`task_update: invalid status "${input.status}"`);
180
+ }
181
+ if (input.title !== undefined && input.title.trim().length === 0) {
182
+ throw new Error('task_update: title cannot be empty');
183
+ }
184
+ const at = nowIso(ctx);
185
+ const entry = {
186
+ op: 'update',
187
+ id: input.id,
188
+ at,
189
+ ...(input.title !== undefined ? { title: input.title } : {}),
190
+ ...(input.status !== undefined ? { status: input.status } : {}),
191
+ ...(input.notes !== undefined ? { notes: input.notes } : {}),
192
+ };
193
+ appendEntry(ctx, entry);
194
+ return {
195
+ ...existing,
196
+ ...(input.title !== undefined ? { title: input.title } : {}),
197
+ ...(input.status !== undefined ? { status: input.status } : {}),
198
+ ...(input.notes !== undefined ? { notes: input.notes } : {}),
199
+ updatedAt: at,
200
+ };
201
+ }
202
+ function isValidStatus(status) {
203
+ return (status === 'pending' ||
204
+ status === 'in_progress' ||
205
+ status === 'completed' ||
206
+ status === 'cancelled');
207
+ }
208
+ //# sourceMappingURL=tasks.js.map
@@ -0,0 +1,184 @@
1
+ /**
2
+ * todo_write tool — Leak L16 (TodoWrite single-in-progress invariant).
3
+ *
4
+ * Mirrors Claude Code's `TodoWrite` tool 1:1 so a model trained on the
5
+ * upstream grammar speaks Pugi's variant verbatim. The tool dispatches
6
+ * a BATCH replace of the workspace todo board (not an incremental
7
+ * mutation — the model emits the FULL list every call). At most ONE
8
+ * todo may carry `status: 'in_progress'` at any time; violations
9
+ * reject with the `TODO_INVARIANT_VIOLATED` sentinel and the board on
10
+ * disk is left unchanged.
11
+ *
12
+ * Relationship to `task_*` (β1 T1/T6, tools/tasks.ts):
13
+ * - `task_*` is GRANULAR (create/get/list/update one task at a
14
+ * time) with an append-only JSONL journal scoped to the SESSION.
15
+ * - `todo_write` is BATCH (snapshot the whole board) with an atomic
16
+ * JSON snapshot scoped to the WORKSPACE.
17
+ * They are complementary surfaces: agents that prefer the upstream
18
+ * TodoWrite grammar use `todo_write`; agents that want a fine-grained
19
+ * audit trail use `task_*`.
20
+ *
21
+ * Hard rules (enforced by Zod + dispatcher):
22
+ * - `todos.length` ≤ 50 (board overload guard).
23
+ * - Every item: id (≥1 char, ≤128), content (≥1 char), status enum.
24
+ * - At most ONE item with `status === 'in_progress'`.
25
+ * - All ids unique within the batch.
26
+ *
27
+ * Dispatch returns the persisted board as JSON; callers can read
28
+ * `todos: [...]` directly. Errors return the sentinel-prefixed message
29
+ * so the engine adapter can pattern-match.
30
+ */
31
+ import { z } from 'zod';
32
+ import { saveTodoBoard } from '../core/todos/state.js';
33
+ /** Cap matches the `task_*` family's title cap for parity. */
34
+ export const TODO_CONTENT_MAX = 2_000;
35
+ /** id is opaque to us but must be slug-safe so file paths could embed it. */
36
+ export const TODO_ID_MIN = 1;
37
+ export const TODO_ID_MAX = 128;
38
+ /** Hard cap on board size. Beyond this the operator should split work. */
39
+ export const TODO_BATCH_MAX = 50;
40
+ export const todoItemSchema = z
41
+ .strictObject({
42
+ id: z
43
+ .string()
44
+ .min(TODO_ID_MIN)
45
+ .max(TODO_ID_MAX)
46
+ .describe('Stable id for this todo. Opaque, ≤128 chars.'),
47
+ content: z
48
+ .string()
49
+ .min(1)
50
+ .max(TODO_CONTENT_MAX)
51
+ .describe('Imperative task description. E.g. "Add invariant check".'),
52
+ status: z
53
+ .enum(['pending', 'in_progress', 'completed'])
54
+ .describe('Lifecycle status. At most ONE in_progress per board.'),
55
+ activeForm: z
56
+ .string()
57
+ .min(1)
58
+ .max(TODO_CONTENT_MAX)
59
+ .optional()
60
+ .describe('Present-continuous form. E.g. "Adding invariant check".'),
61
+ });
62
+ export const todoWriteArgsSchema = z.strictObject({
63
+ todos: z
64
+ .array(todoItemSchema)
65
+ .max(TODO_BATCH_MAX)
66
+ .describe(`Full todo board (batch replace, not incremental). Max ${TODO_BATCH_MAX} items. ` +
67
+ `At most ONE item may carry status="in_progress".`),
68
+ });
69
+ /**
70
+ * JSON-Schema fragment surfaced to the model via the tool-bridge
71
+ * `parameters` field. Mirrors the Zod schema 1:1 — kept hand-written
72
+ * (same convention as ask_user_question) because the runtime engine
73
+ * wires OpenAI-compatible JSON Schema and we have not greenlit the
74
+ * zod-to-json-schema transitive dep. Keep both in lockstep.
75
+ */
76
+ export const todoWriteJsonSchema = {
77
+ type: 'object',
78
+ additionalProperties: false,
79
+ required: ['todos'],
80
+ properties: {
81
+ todos: {
82
+ type: 'array',
83
+ maxItems: TODO_BATCH_MAX,
84
+ description: `Full todo board (batch replace, not incremental). Max ${TODO_BATCH_MAX} items. ` +
85
+ `At most ONE item may carry status="in_progress".`,
86
+ items: {
87
+ type: 'object',
88
+ additionalProperties: false,
89
+ required: ['id', 'content', 'status'],
90
+ properties: {
91
+ id: {
92
+ type: 'string',
93
+ minLength: TODO_ID_MIN,
94
+ maxLength: TODO_ID_MAX,
95
+ description: 'Stable id for this todo. Opaque, ≤128 chars.',
96
+ },
97
+ content: {
98
+ type: 'string',
99
+ minLength: 1,
100
+ maxLength: TODO_CONTENT_MAX,
101
+ description: 'Imperative task description.',
102
+ },
103
+ status: {
104
+ type: 'string',
105
+ enum: ['pending', 'in_progress', 'completed'],
106
+ description: 'Lifecycle status. At most ONE in_progress per board.',
107
+ },
108
+ activeForm: {
109
+ type: 'string',
110
+ minLength: 1,
111
+ maxLength: TODO_CONTENT_MAX,
112
+ description: 'Present-continuous form.',
113
+ },
114
+ },
115
+ },
116
+ },
117
+ },
118
+ };
119
+ /**
120
+ * Sentinel prefix the dispatcher returns when Zod schema validation
121
+ * rejects the raw arguments. Distinct from `TODO_INVARIANT_VIOLATED`
122
+ * (>1 in_progress) and `TODO_DUPLICATE_ID` (collision within batch),
123
+ * which are emitted from `saveTodoBoard` AFTER schema parsing.
124
+ *
125
+ * Surfaced as a return string (not a throw) so the engine adapter sees
126
+ * a recoverable tool error and the model can self-correct its args,
127
+ * instead of the engine loop tearing down on an uncaught ZodError.
128
+ */
129
+ export const TODO_INVALID_ARGS = 'INVALID_ARGS';
130
+ /**
131
+ * Render a ZodError into a deterministic `INVALID_ARGS: ...` sentinel
132
+ * the model can pattern-match. Each issue contributes one
133
+ * `path: message` clause; clauses are joined with `; ` so the model
134
+ * sees every offence in a single line. Path with the root scope is
135
+ * rendered as `<root>` to avoid an empty colon.
136
+ */
137
+ function renderZodIssues(error) {
138
+ const parts = error.issues.map((issue) => {
139
+ const path = issue.path.length === 0 ? '<root>' : issue.path.join('.');
140
+ return `${path}: ${issue.message}`;
141
+ });
142
+ return `${TODO_INVALID_ARGS}: ${parts.join('; ')}`;
143
+ }
144
+ /**
145
+ * Validate via Zod + persist atomically. Surfaces three sentinel
146
+ * families the dispatcher pattern-matches on:
147
+ * - `INVALID_ARGS: <path>: <issue>; ...` — Zod schema rejected
148
+ * the raw arguments (returned as STRING, not thrown).
149
+ * - `TODO_INVARIANT_VIOLATED: ...` — >1 in_progress
150
+ * (thrown by `saveTodoBoard`).
151
+ * - `TODO_DUPLICATE_ID: ...` — collision within batch
152
+ * (thrown by `saveTodoBoard`).
153
+ *
154
+ * Why the asymmetry: schema rejection means the model emitted malformed
155
+ * structure (missing field, wrong type) and CAN self-correct given a
156
+ * clear breakdown of the offending path. The invariant + duplicate-id
157
+ * paths mean the model emitted structurally-valid but semantically
158
+ * conflicting state — those still throw so the engine loop's tool-error
159
+ * hook can surface them through `PostToolUseFailure` for observability,
160
+ * mirroring how the file-tools layer surfaces `STALE_READ` / `PermissionDenied`.
161
+ */
162
+ export function dispatchTodoWrite(ctx, rawArgs) {
163
+ // L16 P1 fix (2026-05-27): `.parse` throws a `ZodError` on validation
164
+ // failure. The previous implementation let that throw bubble through
165
+ // the engine adapter's catch arm as a free-form `error.message`,
166
+ // which (a) loses the issue-by-issue structure the model needs to
167
+ // self-correct, and (b) tears down the tool-call as a hard failure
168
+ // rather than a recoverable tool result. Switch to `safeParse` and
169
+ // emit a structured `INVALID_ARGS: <path>: <issue>; ...` sentinel
170
+ // string instead — the engine sees a successful tool call, the model
171
+ // sees the offending paths, and the dispatcher's catch arm reserves
172
+ // throws for the genuine semantic conflicts emitted by `saveTodoBoard`.
173
+ const parsed = todoWriteArgsSchema.safeParse(rawArgs);
174
+ if (!parsed.success) {
175
+ return renderZodIssues(parsed.error);
176
+ }
177
+ const stateCtx = {
178
+ workspaceRoot: ctx.workspaceRoot,
179
+ ...(ctx.now ? { now: ctx.now } : {}),
180
+ };
181
+ const board = saveTodoBoard(stateCtx, parsed.data.todos);
182
+ return JSON.stringify(board);
183
+ }
184
+ //# sourceMappingURL=todo-write.js.map