@pugi/cli 0.1.0-beta.8 → 0.1.0-beta.88

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (405) hide show
  1. package/CHANGELOG.md +132 -0
  2. package/LICENSE +1 -1
  3. package/THIRD_PARTY_NOTICES.md +40 -0
  4. package/assets/pugi-prozr2-mascot.ansi +9 -0
  5. package/bin/run.js +33 -1
  6. package/dist/commands/deploy.js +40 -40
  7. package/dist/commands/flatten.js +191 -0
  8. package/dist/commands/jobs-watch.js +201 -0
  9. package/dist/commands/jobs.js +42 -27
  10. package/dist/commands/smoke.js +133 -0
  11. package/dist/core/agent-progress/cleanup.js +134 -0
  12. package/dist/core/agent-progress/schema.js +144 -0
  13. package/dist/core/agent-progress/writer.js +101 -0
  14. package/dist/core/agents/adaptive-router.js +330 -0
  15. package/dist/core/agents/query-decomposer.js +297 -0
  16. package/dist/core/agents/registry.js +3 -3
  17. package/dist/core/approvals/shortcut-resolver.js +98 -0
  18. package/dist/core/artifact-chain/dispatcher.js +148 -0
  19. package/dist/core/artifact-chain/exporter.js +164 -0
  20. package/dist/core/artifact-chain/state.js +243 -0
  21. package/dist/core/artifact-chain/steps.js +169 -0
  22. package/dist/core/ask-user/question.js +92 -0
  23. package/dist/core/audit/audit-trail.js +275 -0
  24. package/dist/core/auth/ensure-authenticated.js +129 -0
  25. package/dist/core/auth/env-provider.js +238 -0
  26. package/dist/core/auto-open-browser.js +4 -4
  27. package/dist/core/auto-update/channels.js +122 -0
  28. package/dist/core/auto-update/checker.js +241 -0
  29. package/dist/core/auto-update/state.js +235 -0
  30. package/dist/core/bare-mode/index.js +107 -0
  31. package/dist/core/bash/redirect.js +281 -0
  32. package/dist/core/bash-classifier.js +436 -40
  33. package/dist/core/checkpoint/resumer.js +149 -0
  34. package/dist/core/checkpoint/rewinder.js +291 -0
  35. package/dist/core/checkpoints/shadow-git.js +670 -0
  36. package/dist/core/citations/parser.js +109 -0
  37. package/dist/core/classifier/yolo-classifier.js +88 -0
  38. package/dist/core/codegraph/decision-store.js +248 -0
  39. package/dist/core/codegraph/detect-repo.js +459 -0
  40. package/dist/core/codegraph/install.js +134 -0
  41. package/dist/core/codegraph/offer-hook.js +220 -0
  42. package/dist/core/compact/auto-trigger.js +96 -0
  43. package/dist/core/compact/buffer-rewriter.js +115 -0
  44. package/dist/core/compact/summarizer.js +208 -0
  45. package/dist/core/compact/token-counter.js +108 -0
  46. package/dist/core/consensus/anvil-fanout.js +25 -25
  47. package/dist/core/consensus/diff-capture.js +121 -12
  48. package/dist/core/consensus/rubric.js +21 -21
  49. package/dist/core/context/builder.js +6 -6
  50. package/dist/core/context/compaction-events.js +8 -8
  51. package/dist/core/context/compaction.js +31 -31
  52. package/dist/core/context/index.js +15 -8
  53. package/dist/core/context/invariants.js +51 -51
  54. package/dist/core/context/markdown-loader.js +28 -10
  55. package/dist/core/context/markdown-traverse.js +255 -0
  56. package/dist/core/context/pugiignore.js +41 -41
  57. package/dist/core/context/repo-skeleton.js +37 -37
  58. package/dist/core/context/tool-eviction.js +55 -0
  59. package/dist/core/context/watcher.js +32 -32
  60. package/dist/core/context/working-set.js +23 -23
  61. package/dist/core/coordinator/agent-tools.js +77 -0
  62. package/dist/core/coordinator/agent-toolset.js +65 -0
  63. package/dist/core/coordinator/fsm.js +73 -0
  64. package/dist/core/coordinator/mode-fsm.js +70 -0
  65. package/dist/core/cost/rate-card.js +129 -0
  66. package/dist/core/cost/tracker.js +221 -0
  67. package/dist/core/credentials.js +12 -12
  68. package/dist/core/cron/scheduler.js +138 -0
  69. package/dist/core/denial-tracking/index.js +8 -0
  70. package/dist/core/denial-tracking/state.js +264 -0
  71. package/dist/core/diagnostics/probe-runner.js +93 -0
  72. package/dist/core/diagnostics/probes/api.js +46 -0
  73. package/dist/core/diagnostics/probes/auth.js +93 -0
  74. package/dist/core/diagnostics/probes/bare-mode.js +42 -0
  75. package/dist/core/diagnostics/probes/cli-version.js +127 -0
  76. package/dist/core/diagnostics/probes/config.js +72 -0
  77. package/dist/core/diagnostics/probes/denial-tracking.js +57 -0
  78. package/dist/core/diagnostics/probes/disk.js +81 -0
  79. package/dist/core/diagnostics/probes/engine-live.js +46 -0
  80. package/dist/core/diagnostics/probes/git.js +65 -0
  81. package/dist/core/diagnostics/probes/hooks.js +118 -0
  82. package/dist/core/diagnostics/probes/mcp.js +75 -0
  83. package/dist/core/diagnostics/probes/node.js +59 -0
  84. package/dist/core/diagnostics/probes/pnpm.js +36 -0
  85. package/dist/core/diagnostics/probes/pugi-md.js +89 -0
  86. package/dist/core/diagnostics/probes/sandbox.js +40 -0
  87. package/dist/core/diagnostics/probes/session.js +74 -0
  88. package/dist/core/diagnostics/probes/status-snapshot.js +488 -0
  89. package/dist/core/diagnostics/probes/workspace.js +63 -0
  90. package/dist/core/diagnostics/types.js +70 -0
  91. package/dist/core/dispatch/cache-cleanup.js +197 -0
  92. package/dist/core/dispatch/cache-handoff.js +295 -0
  93. package/dist/core/edits/apply-patch-layer-e.js +189 -0
  94. package/dist/core/edits/dispatch.js +293 -7
  95. package/dist/core/edits/format-matrix.js +26 -0
  96. package/dist/core/edits/fuzzy-ladder.js +650 -0
  97. package/dist/core/edits/index.js +3 -1
  98. package/dist/core/edits/journal.js +199 -0
  99. package/dist/core/edits/layer-a-apply.js +15 -15
  100. package/dist/core/edits/layer-a-fuzzy-apply.js +198 -0
  101. package/dist/core/edits/layer-b-apply.js +9 -9
  102. package/dist/core/edits/layer-c-apply.js +6 -6
  103. package/dist/core/edits/layer-d-ast.js +557 -14
  104. package/dist/core/edits/marker-parser.js +12 -12
  105. package/dist/core/edits/security-gate.js +27 -27
  106. package/dist/core/edits/verify-hook.js +273 -0
  107. package/dist/core/edits/worktree.js +322 -0
  108. package/dist/core/engine/anvil-client.js +151 -26
  109. package/dist/core/engine/auto-compact.js +179 -0
  110. package/dist/core/engine/budgets.js +186 -0
  111. package/dist/core/engine/context-prefix.js +155 -0
  112. package/dist/core/engine/index.js +1 -1
  113. package/dist/core/engine/intensity.js +158 -0
  114. package/dist/core/engine/intent.js +260 -0
  115. package/dist/core/engine/native-pugi.js +1295 -227
  116. package/dist/core/engine/prompts.js +134 -16
  117. package/dist/core/engine/strip-internal-fields.js +124 -0
  118. package/dist/core/engine/tool-bridge.js +1295 -59
  119. package/dist/core/evaluation/golden-dataset.js +293 -0
  120. package/dist/core/feedback/queue.js +177 -0
  121. package/dist/core/feedback/submitter.js +145 -0
  122. package/dist/core/file-cache.js +113 -1
  123. package/dist/core/flatten/flatten-repo.js +439 -0
  124. package/dist/core/format/osc8-link.js +28 -0
  125. package/dist/core/hook-chains.js +392 -0
  126. package/dist/core/hooks/citation-verify-hook.js +138 -0
  127. package/dist/core/hooks/citation-verify.js +112 -0
  128. package/dist/core/hooks/events.js +44 -0
  129. package/dist/core/hooks/index.js +15 -0
  130. package/dist/core/hooks/registry.js +213 -0
  131. package/dist/core/hooks/runner.js +236 -0
  132. package/dist/core/hooks/v2/event-emitter.js +115 -0
  133. package/dist/core/hooks/v2/executor.js +282 -0
  134. package/dist/core/hooks/v2/index.js +25 -0
  135. package/dist/core/hooks/v2/lifecycle.js +104 -0
  136. package/dist/core/hooks/v2/loader.js +216 -0
  137. package/dist/core/hooks/v2/matcher.js +125 -0
  138. package/dist/core/hooks/v2/trust.js +143 -0
  139. package/dist/core/hooks/v2/types.js +86 -0
  140. package/dist/core/image/renderer.js +71 -0
  141. package/dist/core/init/detector.js +582 -0
  142. package/dist/core/init/template-renderer.js +242 -0
  143. package/dist/core/jobs/registry.js +18 -18
  144. package/dist/core/ledger/results-tsv.js +142 -0
  145. package/dist/core/log-discipline/stdout-redirect.js +51 -0
  146. package/dist/core/lsp/cache.js +105 -0
  147. package/dist/core/lsp/client.js +776 -0
  148. package/dist/core/lsp/language-detect.js +66 -0
  149. package/dist/core/lsp/post-edit-diagnostics.js +171 -0
  150. package/dist/core/lsp/symbol-tools.js +372 -0
  151. package/dist/core/mcp/client.js +97 -28
  152. package/dist/core/mcp/http-server.js +553 -0
  153. package/dist/core/mcp/orchestrator-tools.js +662 -0
  154. package/dist/core/mcp/permission.js +190 -0
  155. package/dist/core/mcp/registry.js +39 -17
  156. package/dist/core/mcp/server-tools.js +219 -0
  157. package/dist/core/mcp/server.js +397 -0
  158. package/dist/core/mcp/trust.js +10 -10
  159. package/dist/core/memory/dual-write.js +416 -0
  160. package/dist/core/memory/passive-extract.js +130 -0
  161. package/dist/core/memory/phase1-kinds.js +20 -0
  162. package/dist/core/memory/secret-scanner.js +304 -0
  163. package/dist/core/memory-sync/queue.js +170 -0
  164. package/dist/core/metrics/extract.js +113 -0
  165. package/dist/core/modes/roo-modes.js +68 -0
  166. package/dist/core/onboarding/ensure-initialized.js +133 -0
  167. package/dist/core/onboarding/marker.js +111 -0
  168. package/dist/core/onboarding/telemetry-state.js +108 -0
  169. package/dist/core/output-style/presets.js +176 -0
  170. package/dist/core/output-style/state.js +185 -0
  171. package/dist/core/path-security.js +287 -5
  172. package/dist/core/permission.js +82 -22
  173. package/dist/core/permissions/auto-classifier.js +124 -0
  174. package/dist/core/permissions/bash-parser.js +371 -0
  175. package/dist/core/permissions/circuit-breaker.js +83 -0
  176. package/dist/core/permissions/constrained-edit.js +91 -0
  177. package/dist/core/permissions/gate.js +278 -0
  178. package/dist/core/permissions/index.js +20 -0
  179. package/dist/core/permissions/mode.js +174 -0
  180. package/dist/core/permissions/network-egress.js +137 -0
  181. package/dist/core/permissions/state.js +241 -0
  182. package/dist/core/permissions/tool-class.js +93 -0
  183. package/dist/core/plan-mode/ui-state.js +51 -0
  184. package/dist/core/plans/plan-artifact.js +721 -0
  185. package/dist/core/policy-limits/etag-store.js +122 -0
  186. package/dist/core/prd-check/parser.js +215 -0
  187. package/dist/core/prd-check/reporter.js +127 -0
  188. package/dist/core/prd-check/session-review.js +557 -0
  189. package/dist/core/prd-check/verifiers.js +223 -0
  190. package/dist/core/prompt-cache/client-cache.js +99 -0
  191. package/dist/core/prompts/assembly.js +29 -0
  192. package/dist/core/prompts/registry.js +364 -0
  193. package/dist/core/pugi-md/cc-compat-rules.js +735 -0
  194. package/dist/core/pugi-md/context-injector.js +76 -0
  195. package/dist/core/pugi-md/walk-up.js +207 -0
  196. package/dist/core/python/uv-installer.js +270 -0
  197. package/dist/core/python/uv-resolver.js +83 -0
  198. package/dist/core/rate-limit/narrator.js +146 -0
  199. package/dist/core/recipes/cli-types.js +20 -0
  200. package/dist/core/recipes/loader.js +103 -0
  201. package/dist/core/recipes/runner.js +345 -0
  202. package/dist/core/recipes/schema.js +587 -0
  203. package/dist/core/release-notes/parser.js +241 -0
  204. package/dist/core/release-notes/state.js +116 -0
  205. package/dist/core/repl/ask.js +37 -37
  206. package/dist/core/repl/cancellation.js +26 -26
  207. package/dist/core/repl/cap-warning.js +4 -4
  208. package/dist/core/repl/clipboard-read.js +11 -11
  209. package/dist/core/repl/dispatch-fsm.js +12 -12
  210. package/dist/core/repl/history-search.js +15 -15
  211. package/dist/core/repl/history.js +28 -18
  212. package/dist/core/repl/kill-ring.js +5 -5
  213. package/dist/core/repl/model-pricing.js +135 -0
  214. package/dist/core/repl/privacy-banner.js +22 -22
  215. package/dist/core/repl/session.js +2157 -214
  216. package/dist/core/repl/slash-commands.js +533 -40
  217. package/dist/core/repl/store/index.js +1 -1
  218. package/dist/core/repl/store/jsonl-log.js +22 -22
  219. package/dist/core/repl/store/lockfile.js +10 -10
  220. package/dist/core/repl/store/session-store.js +136 -107
  221. package/dist/core/repl/store/types.js +15 -15
  222. package/dist/core/repl/store/uuid-v7.js +12 -12
  223. package/dist/core/repl/workspace-context.js +43 -21
  224. package/dist/core/repo-map/build.js +125 -0
  225. package/dist/core/repo-map/cache.js +185 -0
  226. package/dist/core/repo-map/extractor.js +254 -0
  227. package/dist/core/repo-map/formatter.js +145 -0
  228. package/dist/core/repo-map/page-rank.js +105 -0
  229. package/dist/core/repo-map/scanner.js +211 -0
  230. package/dist/core/retry-budget/budget.js +284 -0
  231. package/dist/core/retry-budget/index.js +5 -0
  232. package/dist/core/retry-budget/retry-cap.js +74 -0
  233. package/dist/core/routing/lead-worker.js +43 -0
  234. package/dist/core/routing/pre-flight-estimator.js +108 -0
  235. package/dist/core/runs/run-tree.js +103 -0
  236. package/dist/core/security/injection-scanner.js +367 -0
  237. package/dist/core/security/output-filter.js +418 -0
  238. package/dist/core/session/env-file.js +105 -0
  239. package/dist/core/session/section-budgets.js +140 -0
  240. package/dist/core/session.js +92 -0
  241. package/dist/core/settings.js +298 -5
  242. package/dist/core/share/formatter.js +271 -0
  243. package/dist/core/share/redactor.js +221 -0
  244. package/dist/core/share/uploader.js +267 -0
  245. package/dist/core/skills/defaults.js +457 -0
  246. package/dist/core/skills/loader.js +22 -22
  247. package/dist/core/skills/sources.js +27 -27
  248. package/dist/core/smoke/headless-driver.js +174 -0
  249. package/dist/core/smoke/orchestrator.js +194 -0
  250. package/dist/core/smoke/runner.js +238 -0
  251. package/dist/core/smoke/scenario-parser.js +316 -0
  252. package/dist/core/statusline.js +99 -0
  253. package/dist/core/subagents/dispatcher-real.js +600 -0
  254. package/dist/core/subagents/dispatcher.js +132 -43
  255. package/dist/core/subagents/index.js +19 -6
  256. package/dist/core/subagents/isolation-matrix.js +213 -0
  257. package/dist/core/subagents/spawn.js +19 -4
  258. package/dist/core/telemetry/emitter.js +229 -0
  259. package/dist/core/telemetry/queue.js +251 -0
  260. package/dist/core/theme/context.js +91 -0
  261. package/dist/core/theme/presets.js +228 -0
  262. package/dist/core/theme/state.js +181 -0
  263. package/dist/core/todos/invariant.js +10 -0
  264. package/dist/core/todos/state.js +177 -0
  265. package/dist/core/tool-schema/compressor.js +89 -0
  266. package/dist/core/transport/version-interceptor.js +166 -0
  267. package/dist/core/trust.js +2 -2
  268. package/dist/core/tui/thinking-block.js +64 -0
  269. package/dist/core/vim/keymap.js +288 -0
  270. package/dist/core/vim/state.js +92 -0
  271. package/dist/core/watch-markers/marker-watcher.js +133 -0
  272. package/dist/core/worktree-manager/cleanup.js +123 -0
  273. package/dist/core/worktree-manager/manager.js +303 -0
  274. package/dist/index.js +36 -0
  275. package/dist/runtime/bootstrap.js +190 -0
  276. package/dist/runtime/cli.js +4203 -493
  277. package/dist/runtime/commands/agents.js +30 -30
  278. package/dist/runtime/commands/budget.js +5 -5
  279. package/dist/runtime/commands/cancel.js +231 -0
  280. package/dist/runtime/commands/chain.js +489 -0
  281. package/dist/runtime/commands/codegraph-status.js +227 -0
  282. package/dist/runtime/commands/compact.js +297 -0
  283. package/dist/runtime/commands/config.js +73 -39
  284. package/dist/runtime/commands/cost.js +199 -0
  285. package/dist/runtime/commands/delegate.js +244 -13
  286. package/dist/runtime/commands/dispatch.js +126 -0
  287. package/dist/runtime/commands/doctor.js +579 -0
  288. package/dist/runtime/commands/feedback.js +184 -0
  289. package/dist/runtime/commands/hooks.js +184 -0
  290. package/dist/runtime/commands/init.js +254 -0
  291. package/dist/runtime/commands/lsp.js +368 -0
  292. package/dist/runtime/commands/mcp.js +879 -0
  293. package/dist/runtime/commands/memory.js +582 -0
  294. package/dist/runtime/commands/model.js +237 -0
  295. package/dist/runtime/commands/onboarding.js +275 -0
  296. package/dist/runtime/commands/patch.js +128 -0
  297. package/dist/runtime/commands/permissions.js +112 -0
  298. package/dist/runtime/commands/plan.js +143 -0
  299. package/dist/runtime/commands/prd-check.js +285 -0
  300. package/dist/runtime/commands/privacy.js +17 -17
  301. package/dist/runtime/commands/recipe.js +325 -0
  302. package/dist/runtime/commands/redo-blob-store.js +92 -0
  303. package/dist/runtime/commands/redo.js +361 -0
  304. package/dist/runtime/commands/release-notes.js +229 -0
  305. package/dist/runtime/commands/repo-map.js +95 -0
  306. package/dist/runtime/commands/report.js +299 -0
  307. package/dist/runtime/commands/resume.js +118 -0
  308. package/dist/runtime/commands/review-consensus.js +68 -53
  309. package/dist/runtime/commands/rewind.js +333 -0
  310. package/dist/runtime/commands/roster.js +14 -14
  311. package/dist/runtime/commands/sessions.js +163 -0
  312. package/dist/runtime/commands/share.js +316 -0
  313. package/dist/runtime/commands/skills.js +31 -31
  314. package/dist/runtime/commands/status.js +186 -0
  315. package/dist/runtime/commands/stickers.js +82 -0
  316. package/dist/runtime/commands/style.js +194 -0
  317. package/dist/runtime/commands/theme.js +196 -0
  318. package/dist/runtime/commands/undo.js +54 -22
  319. package/dist/runtime/commands/update.js +289 -0
  320. package/dist/runtime/commands/vim.js +140 -0
  321. package/dist/runtime/commands/worktree.js +177 -0
  322. package/dist/runtime/commands/worktrees.js +155 -0
  323. package/dist/runtime/headless-repl.js +195 -0
  324. package/dist/runtime/headless.js +543 -0
  325. package/dist/runtime/load-hooks-or-exit.js +71 -0
  326. package/dist/runtime/plan-decompose.js +531 -0
  327. package/dist/runtime/sigint-guard.js +272 -0
  328. package/dist/runtime/update-check.js +28 -28
  329. package/dist/runtime/version.js +65 -0
  330. package/dist/skills/bundled/batch.js +617 -0
  331. package/dist/skills/bundled/index.js +45 -0
  332. package/dist/skills/bundled/loop.js +358 -0
  333. package/dist/skills/bundled/remember.js +383 -0
  334. package/dist/skills/bundled/simplify.js +289 -0
  335. package/dist/skills/bundled/skillify.js +373 -0
  336. package/dist/skills/bundled/stuck.js +558 -0
  337. package/dist/skills/bundled/verify.js +439 -0
  338. package/dist/testing/vcr.js +486 -0
  339. package/dist/tools/agent-tool.js +229 -0
  340. package/dist/tools/apply-patch.js +556 -0
  341. package/dist/tools/ask-user-question.js +288 -0
  342. package/dist/tools/ask-user.js +115 -0
  343. package/dist/tools/bash.js +624 -46
  344. package/dist/tools/brief.js +224 -0
  345. package/dist/tools/enter-worktree.js +250 -0
  346. package/dist/tools/exit-worktree.js +147 -0
  347. package/dist/tools/file-tools.js +161 -44
  348. package/dist/tools/lsp-tools.js +189 -0
  349. package/dist/tools/mcp-tool.js +260 -0
  350. package/dist/tools/multi-edit.js +361 -0
  351. package/dist/tools/powershell.js +268 -0
  352. package/dist/tools/registry.js +85 -0
  353. package/dist/tools/skill-tool.js +96 -0
  354. package/dist/tools/sleep.js +99 -0
  355. package/dist/tools/synthetic-output.js +133 -0
  356. package/dist/tools/tasks.js +208 -0
  357. package/dist/tools/todo-write.js +184 -0
  358. package/dist/tools/verify-plan-execution.js +295 -0
  359. package/dist/tools/web-fetch-injection-scanner.js +207 -0
  360. package/dist/tools/web-fetch.js +195 -10
  361. package/dist/tools/web-search.js +458 -0
  362. package/dist/tui/agent-progress-card.js +111 -0
  363. package/dist/tui/agent-tree.js +11 -1
  364. package/dist/tui/ask-modal.js +14 -14
  365. package/dist/tui/ask-user-question-chips.js +257 -0
  366. package/dist/tui/ask-user-question-prompt.js +203 -0
  367. package/dist/tui/compact-banner.js +81 -0
  368. package/dist/tui/conversation-pane.js +85 -11
  369. package/dist/tui/cost-table.js +111 -0
  370. package/dist/tui/device-flow.js +2 -2
  371. package/dist/tui/doctor-table.js +46 -0
  372. package/dist/tui/feedback-prompt.js +156 -0
  373. package/dist/tui/input-box.js +247 -32
  374. package/dist/tui/login-picker.js +3 -3
  375. package/dist/tui/markdown-render.js +6 -6
  376. package/dist/tui/onboarding-wizard.js +240 -0
  377. package/dist/tui/permissions-picker.js +86 -0
  378. package/dist/tui/render.js +35 -0
  379. package/dist/tui/repl-render.js +332 -54
  380. package/dist/tui/repl-splash-art.js +16 -16
  381. package/dist/tui/repl-splash-mascot.js +48 -24
  382. package/dist/tui/repl-splash.js +22 -22
  383. package/dist/tui/repl.js +124 -44
  384. package/dist/tui/slash-palette.js +6 -6
  385. package/dist/tui/splash.js +2 -2
  386. package/dist/tui/status-bar.js +109 -31
  387. package/dist/tui/status-table.js +7 -0
  388. package/dist/tui/stickers-art.js +136 -0
  389. package/dist/tui/style-table.js +28 -0
  390. package/dist/tui/theme-table.js +29 -0
  391. package/dist/tui/thinking-spinner.js +123 -0
  392. package/dist/tui/tool-stream-pane.js +53 -4
  393. package/dist/tui/update-banner.js +27 -2
  394. package/dist/tui/vim-input.js +267 -0
  395. package/dist/tui/welcome-banner.js +107 -0
  396. package/dist/tui/welcome-data.js +293 -0
  397. package/dist/tui/workspace-context.js +2 -2
  398. package/docs/examples/codegraph.mcp.json +10 -0
  399. package/package.json +25 -7
  400. package/test/scenarios/codegen-create-file.scenario.txt +13 -0
  401. package/test/scenarios/compact-force.scenario.txt +11 -0
  402. package/test/scenarios/identity.scenario.txt +11 -0
  403. package/test/scenarios/persona-handoff.scenario.txt +11 -0
  404. package/test/scenarios/walkback.scenario.txt +12 -0
  405. package/dist/core/engine/compaction-hook.js +0 -154
@@ -0,0 +1,295 @@
1
+ /**
2
+ * verify_plan_execution tool — anti-fake-dispatch gate (backlog #5 P0).
3
+ *
4
+ * Gives the engine loop a way to ASSERT that a previously-stated plan's
5
+ * promised steps actually executed. When the model says "Step 1: read
6
+ * file A. Step 2: edit file B. Step 3: run tests" and then emits a
7
+ * "done" final text, this tool lets the engine loop verify the session's
8
+ * recorded tool calls and file mutations cover every requirement.
9
+ *
10
+ * If any gap is found the engine loop continues another turn so the
11
+ * model can either fill the gap or explicitly explain why the step was
12
+ * skipped. Closes the fake-dispatch failure mode documented in
13
+ * memory `feedback_no_fake_dispatch_promises.md`.
14
+ */
15
+ import { existsSync, readFileSync } from 'node:fs';
16
+ export const VERIFY_PLAN_INVALID_ARGS = 'VERIFY_PLAN_INVALID_ARGS';
17
+ export function parseVerifyPlanArgs(raw) {
18
+ if (typeof raw !== 'object' || raw === null || Array.isArray(raw)) {
19
+ return `${VERIFY_PLAN_INVALID_ARGS}: arguments must be a JSON object`;
20
+ }
21
+ const obj = raw;
22
+ if (!Object.prototype.hasOwnProperty.call(obj, 'steps')) {
23
+ return `${VERIFY_PLAN_INVALID_ARGS}: steps is required`;
24
+ }
25
+ const rawSteps = obj['steps'];
26
+ if (!Array.isArray(rawSteps)) {
27
+ return `${VERIFY_PLAN_INVALID_ARGS}: steps must be an array`;
28
+ }
29
+ if (rawSteps.length > 200) {
30
+ return `${VERIFY_PLAN_INVALID_ARGS}: steps must have <= 200 entries`;
31
+ }
32
+ const steps = [];
33
+ const issues = [];
34
+ for (let i = 0; i < rawSteps.length; i++) {
35
+ const s = rawSteps[i];
36
+ if (typeof s !== 'object' || s === null || Array.isArray(s)) {
37
+ issues.push(`steps[${i}]: must be an object`);
38
+ continue;
39
+ }
40
+ const step = s;
41
+ const id = step['id'];
42
+ if (typeof id !== 'string' || id.trim().length === 0) {
43
+ issues.push(`steps[${i}].id: must be a non-empty string`);
44
+ continue;
45
+ }
46
+ const intent = step['intent'];
47
+ if (typeof intent !== 'string') {
48
+ issues.push(`steps[${i}].intent: must be a string`);
49
+ continue;
50
+ }
51
+ const toolCallsRaw = step['requiredToolCalls'];
52
+ let requiredToolCalls;
53
+ if (toolCallsRaw !== undefined && toolCallsRaw !== null) {
54
+ if (!Array.isArray(toolCallsRaw)) {
55
+ issues.push(`steps[${i}].requiredToolCalls: must be an array when present`);
56
+ continue;
57
+ }
58
+ requiredToolCalls = [];
59
+ for (let j = 0; j < toolCallsRaw.length; j++) {
60
+ const tc = toolCallsRaw[j];
61
+ if (typeof tc !== 'string' || tc.trim().length === 0) {
62
+ issues.push(`steps[${i}].requiredToolCalls[${j}]: must be a non-empty string`);
63
+ }
64
+ else {
65
+ requiredToolCalls.push(tc);
66
+ }
67
+ }
68
+ }
69
+ const fileChangesRaw = step['requiredFileChanges'];
70
+ let requiredFileChanges;
71
+ if (fileChangesRaw !== undefined && fileChangesRaw !== null) {
72
+ if (!Array.isArray(fileChangesRaw)) {
73
+ issues.push(`steps[${i}].requiredFileChanges: must be an array when present`);
74
+ continue;
75
+ }
76
+ requiredFileChanges = [];
77
+ for (let j = 0; j < fileChangesRaw.length; j++) {
78
+ const fc = fileChangesRaw[j];
79
+ if (typeof fc !== 'string' || fc.trim().length === 0) {
80
+ issues.push(`steps[${i}].requiredFileChanges[${j}]: must be a non-empty string`);
81
+ }
82
+ else {
83
+ requiredFileChanges.push(fc);
84
+ }
85
+ }
86
+ }
87
+ const built = {
88
+ id: id.trim(),
89
+ intent,
90
+ ...(requiredToolCalls !== undefined && requiredToolCalls.length > 0
91
+ ? { requiredToolCalls }
92
+ : {}),
93
+ ...(requiredFileChanges !== undefined && requiredFileChanges.length > 0
94
+ ? { requiredFileChanges }
95
+ : {}),
96
+ };
97
+ steps.push(built);
98
+ }
99
+ if (issues.length > 0) {
100
+ return `${VERIFY_PLAN_INVALID_ARGS}: ${issues.join('; ')}`;
101
+ }
102
+ return { steps };
103
+ }
104
+ export function readRelevantEvents(session) {
105
+ if (!session.enabled)
106
+ return [];
107
+ if (!existsSync(session.eventsPath))
108
+ return [];
109
+ const raw = readFileSync(session.eventsPath, 'utf8');
110
+ const events = [];
111
+ for (const line of raw.split('\n')) {
112
+ const trimmed = line.trim();
113
+ if (trimmed.length === 0)
114
+ continue;
115
+ let parsed;
116
+ try {
117
+ parsed = JSON.parse(trimmed);
118
+ }
119
+ catch {
120
+ continue;
121
+ }
122
+ if (typeof parsed !== 'object' || parsed === null || Array.isArray(parsed)) {
123
+ continue;
124
+ }
125
+ const obj = parsed;
126
+ if (obj['type'] === 'tool_call' && typeof obj['tool'] === 'string') {
127
+ events.push({ type: 'tool_call', tool: obj['tool'] });
128
+ }
129
+ else if (obj['type'] === 'file_mutation' && typeof obj['path'] === 'string') {
130
+ events.push({ type: 'file_mutation', path: obj['path'] });
131
+ }
132
+ }
133
+ return events;
134
+ }
135
+ export function verifyPlan(steps, events) {
136
+ if (steps.length === 0) {
137
+ return { status: 'verified', gaps: [] };
138
+ }
139
+ // Per-step consumption queues. The previous Set<string> shared across
140
+ // all steps allowed two steps requiring `edit` к be satisfied by a
141
+ // single edit call — defeating the per-step verification contract.
142
+ // We track per-tool counts of remaining (unconsumed) events; each step
143
+ // consumes one event per requiredToolCall it lists. Same approach for
144
+ // file mutations: each path-substring requirement consumes one matching
145
+ // mutation event, so two steps each requiring `foo.ts` need TWO foo.ts
146
+ // mutations к verify.
147
+ const toolCallRemaining = new Map();
148
+ const mutationRemaining = [];
149
+ for (const event of events) {
150
+ if (event.type === 'tool_call') {
151
+ toolCallRemaining.set(event.tool, (toolCallRemaining.get(event.tool) ?? 0) + 1);
152
+ }
153
+ else {
154
+ mutationRemaining.push(event.path);
155
+ }
156
+ }
157
+ const gaps = [];
158
+ for (const step of steps) {
159
+ if (step.requiredToolCalls !== undefined) {
160
+ for (const toolName of step.requiredToolCalls) {
161
+ const left = toolCallRemaining.get(toolName) ?? 0;
162
+ if (left <= 0) {
163
+ gaps.push({
164
+ stepId: step.id,
165
+ intent: step.intent,
166
+ missing: { kind: 'tool_call', toolName },
167
+ });
168
+ }
169
+ else {
170
+ toolCallRemaining.set(toolName, left - 1);
171
+ }
172
+ }
173
+ }
174
+ if (step.requiredFileChanges !== undefined) {
175
+ for (const pathSub of step.requiredFileChanges) {
176
+ const idx = mutationRemaining.findIndex((p) => pathMatches(p, pathSub));
177
+ if (idx === -1) {
178
+ gaps.push({
179
+ stepId: step.id,
180
+ intent: step.intent,
181
+ missing: { kind: 'file_change', pathSubstring: pathSub },
182
+ });
183
+ }
184
+ else {
185
+ mutationRemaining.splice(idx, 1);
186
+ }
187
+ }
188
+ }
189
+ }
190
+ return {
191
+ status: gaps.length === 0 ? 'verified' : 'gap',
192
+ gaps,
193
+ };
194
+ }
195
+ /**
196
+ * Path requirement matcher. Replaces the previous `String.includes`
197
+ * which falsely matched `foo.ts` against `foo.tsbackup` или `notfoo.ts`.
198
+ *
199
+ * Accepts:
200
+ * - Exact match (`a/b/foo.ts` === `a/b/foo.ts`).
201
+ * - Suffix match anchored on path separator (`foo.ts` matches
202
+ * `a/b/foo.ts` but NOT `bar/notfoo.ts`).
203
+ * - Bare basename (`foo.ts` matches mutation `foo.ts` at any depth).
204
+ * Path separator normalised — `\\` к `/` so Windows mutation paths
205
+ * still match POSIX-style requirements operators write.
206
+ */
207
+ function pathMatches(mutationPath, requirement) {
208
+ const m = mutationPath.replace(/\\/g, '/');
209
+ const req = requirement.replace(/\\/g, '/');
210
+ if (m === req)
211
+ return true;
212
+ if (req.startsWith('/')) {
213
+ return m === req || m.endsWith(req);
214
+ }
215
+ return m.endsWith('/' + req);
216
+ }
217
+ export function verifyPlanExecution(session, steps) {
218
+ // Fail-CLOSED on disabled session audit. The previous vacuous-verified
219
+ // return turned the entire anti-fake-dispatch gate into a no-op the
220
+ // moment session.enabled flipped к false — an operator (or runaway
221
+ // model that learned к disable audit) could silently bypass every
222
+ // verification. The gate must surface an explicit `session_audit_disabled`
223
+ // gap so the engine loop forces acknowledgement instead of accepting
224
+ // silent success. Empty plans still trivially verify.
225
+ if (steps.length === 0) {
226
+ return { status: 'verified', gaps: [] };
227
+ }
228
+ if (!session.enabled) {
229
+ return {
230
+ status: 'gap',
231
+ gaps: [
232
+ {
233
+ stepId: '__session__',
234
+ intent: 'session audit must be enabled к verify plan execution',
235
+ missing: { kind: 'session_audit_disabled' },
236
+ },
237
+ ],
238
+ };
239
+ }
240
+ const events = readRelevantEvents(session);
241
+ return verifyPlan(steps, events);
242
+ }
243
+ export function dispatchVerifyPlanExecution(session, raw) {
244
+ const parsed = parseVerifyPlanArgs(raw);
245
+ if (typeof parsed === 'string') {
246
+ return parsed;
247
+ }
248
+ const result = verifyPlanExecution(session, parsed.steps);
249
+ return JSON.stringify(result);
250
+ }
251
+ export const verifyPlanExecutionJsonSchema = {
252
+ type: 'object',
253
+ additionalProperties: false,
254
+ required: ['steps'],
255
+ properties: {
256
+ steps: {
257
+ type: 'array',
258
+ maxItems: 200,
259
+ description: 'Ordered list of plan steps to verify. Each step declares what tool calls ' +
260
+ 'and file mutations must have occurred in this session for the step to be ' +
261
+ 'considered executed. An empty array returns status=verified immediately.',
262
+ items: {
263
+ type: 'object',
264
+ additionalProperties: false,
265
+ required: ['id', 'intent'],
266
+ properties: {
267
+ id: {
268
+ type: 'string',
269
+ minLength: 1,
270
+ description: 'Stable opaque step identifier. Used in gap reports.',
271
+ },
272
+ intent: {
273
+ type: 'string',
274
+ description: 'Human-readable description of what the step accomplishes.',
275
+ },
276
+ requiredToolCalls: {
277
+ type: 'array',
278
+ items: { type: 'string', minLength: 1 },
279
+ description: 'Tool names (e.g. "read", "write", "edit", "bash") that must appear ' +
280
+ 'as tool_call events in the session audit log. Each entry must match ' +
281
+ 'at least once. Absent or empty means no tool-call requirement.',
282
+ },
283
+ requiredFileChanges: {
284
+ type: 'array',
285
+ items: { type: 'string', minLength: 1 },
286
+ description: 'File path substrings that must appear as file_mutation events. ' +
287
+ 'Each entry must be a substring of at least one mutated path. ' +
288
+ 'Absent or empty means no file-change requirement.',
289
+ },
290
+ },
291
+ },
292
+ },
293
+ },
294
+ };
295
+ //# sourceMappingURL=verify-plan-execution.js.map
@@ -0,0 +1,207 @@
1
+ /**
2
+ * web_fetch injection scanner — task, P1 security follow-up.
3
+ *
4
+ * Threat model: a fetched HTTP body (HTML/text) can be authored by a
5
+ * hostile origin attempting prompt injection against the agent that
6
+ * consumes the markdown downstream. The third-party prompt-injection corpus
7
+ * README incident surfaced three forged `<system-reminder>` blocks in
8
+ * a freshly fetched README — date suppression, fake MCP tool listing,
9
+ * and an instruction-override block. The agents on session correctly
10
+ * ignored them, but that is luck, not guarantee.
11
+ *
12
+ * This scanner is the deterministic guard at the WebFetch return path.
13
+ * It runs BEFORE the model ever sees the body. High-severity findings
14
+ * trigger a defense-in-depth wrap (HTML escape + warning prepend) on
15
+ * top of the existing `<untrusted-content-NONCE>` sentinel. Medium/low
16
+ * findings are recorded but the body is passed through; the call site
17
+ * decides what to do with them (current policy: prepend one-line note
18
+ * for med, no-op for low).
19
+ *
20
+ * Pure function, no IO. Regex-driven so we ship zero new deps.
21
+ */
22
+ /**
23
+ * Zero-width / invisible characters that have been used in prompt
24
+ * injection PoCs to hide instructions inside otherwise plain text.
25
+ * Stripped from `clean` so the model never sees the smuggled bytes.
26
+ *
27
+ * U+200B zero-width space
28
+ * U+200C zero-width non-joiner
29
+ * U+200D zero-width joiner
30
+ * U+2060 word joiner
31
+ * U+FEFF zero-width no-break space (BOM)
32
+ * U+180E mongolian vowel separator
33
+ */
34
+ const ZERO_WIDTH_RE = /[​‌‍⁠᠎]/g;
35
+ const HIGH_RULES = [
36
+ // Forged system-reminder envelopes — exactly the vector.
37
+ { pattern: '<system-reminder>', severity: 'high', re: /<system-reminder\b[^>]*>/i },
38
+ { pattern: '</system-reminder>', severity: 'high', re: /<\/system-reminder\s*>/i },
39
+ // Other impostor wrappers seen across published PoCs.
40
+ { pattern: '<important_instructions>', severity: 'high', re: /<important[_\s-]?instructions\b[^>]*>/i },
41
+ { pattern: '<critical_security_rules>', severity: 'high', re: /<critical[_\s-]?security[_\s-]?rules\b[^>]*>/i },
42
+ { pattern: '<EXTREMELY_IMPORTANT>', severity: 'high', re: /<extremely[_\s-]?important\b[^>]*>/i },
43
+ // Instruction-override copy with "IMPORTANT: you MUST | override | ignore previous".
44
+ {
45
+ pattern: 'IMPORTANT: instruction override',
46
+ severity: 'high',
47
+ re: /important\s*:.*?(you\s+must|override|ignore\s+previous|disregard\s+previous|ignore\s+all\s+prior)/i,
48
+ },
49
+ // Date manipulation — observed in the external prompt-injection patterns.
50
+ { pattern: "Today's date is now ...", severity: 'high', re: /today'?s?\s+date\s+is\s+now\b/i },
51
+ // Mimics the system-prompt language for tool execution semantics.
52
+ { pattern: 'Tools are executed in ...', severity: 'high', re: /tools?\s+are\s+executed\s+in\b/i },
53
+ // Embedded model-name instructions ("You are claude-opus-4-... and you must").
54
+ {
55
+ pattern: 'embedded model-name directive',
56
+ severity: 'high',
57
+ re: /\b(claude-opus-4-|claude-sonnet-4-)[a-z0-9.\-]*/i,
58
+ },
59
+ // Raw ANSI escape — only ever cursor manipulation in fetched markdown.
60
+ { pattern: 'ANSI escape sequence', severity: 'high', re: /\x1b\[/ },
61
+ ];
62
+ const MED_RULES = [
63
+ // Skill-invocation mimicry.
64
+ { pattern: 'BLOCKING REQUIREMENT', severity: 'med', re: /blocking\s+requirement/i },
65
+ { pattern: 'you MUST invoke', severity: 'med', re: /you\s+must\s+invoke/i },
66
+ { pattern: 'Skill tool', severity: 'med', re: /\bskill\s+tool\b/i },
67
+ { pattern: 'MCP tool', severity: 'med', re: /\bmcp\s+tool\b/i },
68
+ // Tool-name mimicry — bare phrasing without obvious code-block
69
+ // context. These are common English so the rule is intentionally
70
+ // narrow: word-boundary + literal tool name + word "tool".
71
+ { pattern: 'Bash tool', severity: 'med', re: /\bbash\s+tool\b/i },
72
+ { pattern: 'Read tool', severity: 'med', re: /\bread\s+tool\b/i },
73
+ { pattern: 'Edit tool', severity: 'med', re: /\bedit\s+tool\b/i },
74
+ ];
75
+ const LOW_RULES = [
76
+ { pattern: 'system prompt mention', severity: 'low', re: /\bsystem\s+prompt\b/i },
77
+ { pattern: 'instructions mention', severity: 'low', re: /\binstructions\b/i },
78
+ { pattern: 'pre-authorized mention', severity: 'low', re: /\bpre[-\s]?authori[sz]ed\b/i },
79
+ ];
80
+ /**
81
+ * Detect a suspicious base64 block: >200 contiguous base64 chars on a
82
+ * single line. Base64 is the standard smuggling format for embedded
83
+ * binary blobs in prompt-injection PoCs (hidden tool definitions,
84
+ * obfuscated instruction sets). Below 200 chars we accept the false
85
+ * positives (commit hashes, JWTs, asset URLs); above 200 the signal
86
+ * dominates.
87
+ */
88
+ const BASE64_BLOCK_RE = /[A-Za-z0-9+/]{200,}={0,2}/;
89
+ /**
90
+ * HTML-escape the five characters that can break out of an element
91
+ * body. Mirrors `escapeForSentinelBody` in web-fetch.ts but applied
92
+ * selectively to flagged tags — we do NOT escape the entire body,
93
+ * only the high-severity matches, so the model still sees readable
94
+ * markdown.
95
+ */
96
+ function escapeHtml(input) {
97
+ return input
98
+ .replace(/&/g, '&amp;')
99
+ .replace(/</g, '&lt;')
100
+ .replace(/>/g, '&gt;')
101
+ .replace(/"/g, '&quot;')
102
+ .replace(/'/g, '&#39;');
103
+ }
104
+ /**
105
+ * Tags that, when matched at HIGH severity, get HTML-escaped in the
106
+ * cleaned output. The list is intentionally narrow: any `<…>` element
107
+ * whose name matches one of these gets `<` and `>` swapped for
108
+ * entities, so a downstream consumer reads the text literally rather
109
+ * than parsing it as structure.
110
+ */
111
+ const TAG_NAMES_TO_ESCAPE = [
112
+ 'system-reminder',
113
+ 'important_instructions',
114
+ 'important-instructions',
115
+ 'critical_security_rules',
116
+ 'critical-security-rules',
117
+ 'extremely_important',
118
+ 'extremely-important',
119
+ ];
120
+ /**
121
+ * Build a single regex that captures any opening/closing tag whose
122
+ * name is in `TAG_NAMES_TO_ESCAPE`. Used by `clean` to escape only
123
+ * the dangerous tags, leaving the rest of the body untouched.
124
+ */
125
+ const TAG_ESCAPE_RE = new RegExp(`</?(?:${TAG_NAMES_TO_ESCAPE.join('|')})\\b[^>]*>`, 'gi');
126
+ /**
127
+ * Run the rule dictionaries against a body of text and return the
128
+ * scrubbed clean output plus the list of findings.
129
+ *
130
+ * Line numbers are 1-indexed and reference the ORIGINAL body. The
131
+ * caller can rely on them to point at the same line in `clean`
132
+ * because the only structural changes are (1) zero-width strips and
133
+ * (2) HTML escaping of specific tag tokens — neither alters line
134
+ * counts.
135
+ */
136
+ export function scanForInjection(body) {
137
+ if (!body)
138
+ return { clean: '', findings: [] };
139
+ const findings = [];
140
+ const lines = body.split(/\r?\n/);
141
+ for (let i = 0; i < lines.length; i++) {
142
+ const line = lines[i] ?? '';
143
+ const lineNumber = i + 1;
144
+ for (const rule of HIGH_RULES) {
145
+ if (rule.re.test(line)) {
146
+ findings.push({ pattern: rule.pattern, line: lineNumber, severity: 'high' });
147
+ }
148
+ }
149
+ for (const rule of MED_RULES) {
150
+ if (rule.re.test(line)) {
151
+ findings.push({ pattern: rule.pattern, line: lineNumber, severity: 'med' });
152
+ }
153
+ }
154
+ for (const rule of LOW_RULES) {
155
+ if (rule.re.test(line)) {
156
+ findings.push({ pattern: rule.pattern, line: lineNumber, severity: 'low' });
157
+ }
158
+ }
159
+ if (BASE64_BLOCK_RE.test(line)) {
160
+ findings.push({ pattern: 'long base64 block (>200 chars)', line: lineNumber, severity: 'med' });
161
+ }
162
+ }
163
+ // Always strip zero-width chars from the cleaned output, even when
164
+ // no rule explicitly flagged them. They have no legitimate use in
165
+ // fetched markdown content the model is meant to read.
166
+ let clean = body.replace(ZERO_WIDTH_RE, (match) => {
167
+ findings.push({
168
+ pattern: `zero-width char U+${match.charCodeAt(0).toString(16).toUpperCase().padStart(4, '0')}`,
169
+ line: 0, // multi-line; surfaced separately
170
+ severity: 'high',
171
+ });
172
+ return '';
173
+ });
174
+ // HTML-escape the high-severity impostor tags so a downstream parser
175
+ // (or another LLM) sees text, not structure.
176
+ clean = clean.replace(TAG_ESCAPE_RE, (match) => escapeHtml(match));
177
+ return { clean, findings };
178
+ }
179
+ /**
180
+ * Convenience: return the highest severity present in a findings
181
+ * list, or `null` if the list is empty. `high` > `med` > `low`.
182
+ */
183
+ export function topSeverity(findings) {
184
+ if (findings.some((f) => f.severity === 'high'))
185
+ return 'high';
186
+ if (findings.some((f) => f.severity === 'med'))
187
+ return 'med';
188
+ if (findings.some((f) => f.severity === 'low'))
189
+ return 'low';
190
+ return null;
191
+ }
192
+ /**
193
+ * Render a one-line summary of high-severity findings for the safety
194
+ * envelope. Stable ordering: by line, then by pattern.
195
+ */
196
+ export function formatHighFindings(findings) {
197
+ const high = findings.filter((f) => f.severity === 'high');
198
+ if (high.length === 0)
199
+ return '';
200
+ const sorted = [...high].sort((a, b) => {
201
+ if (a.line !== b.line)
202
+ return a.line - b.line;
203
+ return a.pattern.localeCompare(b.pattern);
204
+ });
205
+ return sorted.map((f) => `[${f.severity}] ${f.pattern} @ line ${f.line}`).join('; ');
206
+ }
207
+ //# sourceMappingURL=web-fetch-injection-scanner.js.map