@pugi/cli 0.1.0-beta.99 → 1.0.0-alpha.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +1 -1
- package/README.md +11 -191
- package/bin/pugi +8 -0
- package/package.json +15 -71
- package/postinstall.mjs +31 -0
- package/CHANGELOG.md +0 -132
- package/THIRD_PARTY_NOTICES.md +0 -40
- package/assets/pugi-mascot.ansi +0 -16
- package/assets/pugi-prozr2-mascot.ansi +0 -9
- package/bin/run.js +0 -34
- package/dist/commands/deploy.js +0 -439
- package/dist/commands/flatten.js +0 -191
- package/dist/commands/jobs-watch.js +0 -201
- package/dist/commands/jobs.js +0 -260
- package/dist/commands/retro.js +0 -210
- package/dist/commands/smoke.js +0 -133
- package/dist/core/agent-progress/cleanup.js +0 -134
- package/dist/core/agent-progress/schema.js +0 -144
- package/dist/core/agent-progress/writer.js +0 -101
- package/dist/core/agents/adaptive-router.js +0 -330
- package/dist/core/agents/loader.js +0 -104
- package/dist/core/agents/query-decomposer.js +0 -297
- package/dist/core/agents/registry.js +0 -69
- package/dist/core/approvals/shortcut-resolver.js +0 -98
- package/dist/core/artifact-chain/dispatcher.js +0 -148
- package/dist/core/artifact-chain/exporter.js +0 -164
- package/dist/core/artifact-chain/state.js +0 -243
- package/dist/core/artifact-chain/steps.js +0 -169
- package/dist/core/ask-user/question.js +0 -92
- package/dist/core/audit/audit-trail.js +0 -275
- package/dist/core/auth/ensure-authenticated.js +0 -129
- package/dist/core/auth/env-provider.js +0 -238
- package/dist/core/auto-open-browser.js +0 -128
- package/dist/core/auto-update/channels.js +0 -122
- package/dist/core/auto-update/checker.js +0 -241
- package/dist/core/auto-update/state.js +0 -235
- package/dist/core/bare-mode/index.js +0 -107
- package/dist/core/bash/redirect.js +0 -281
- package/dist/core/bash-classifier.js +0 -1397
- package/dist/core/checkpoint/resumer.js +0 -149
- package/dist/core/checkpoint/rewinder.js +0 -291
- package/dist/core/checkpoints/shadow-git.js +0 -670
- package/dist/core/citations/parser.js +0 -109
- package/dist/core/classifier/yolo-classifier.js +0 -88
- package/dist/core/clipboard.js +0 -70
- package/dist/core/codegraph/decision-store.js +0 -248
- package/dist/core/codegraph/detect-repo.js +0 -459
- package/dist/core/codegraph/install.js +0 -134
- package/dist/core/codegraph/offer-hook.js +0 -220
- package/dist/core/compact/auto-trigger.js +0 -96
- package/dist/core/compact/buffer-rewriter.js +0 -115
- package/dist/core/compact/summarizer.js +0 -208
- package/dist/core/compact/token-counter.js +0 -108
- package/dist/core/consensus/anvil-fanout.js +0 -276
- package/dist/core/consensus/diff-capture.js +0 -491
- package/dist/core/consensus/rubric.js +0 -233
- package/dist/core/context/builder.js +0 -114
- package/dist/core/context/compaction-events.js +0 -99
- package/dist/core/context/compaction.js +0 -602
- package/dist/core/context/index.js +0 -28
- package/dist/core/context/invariants.js +0 -250
- package/dist/core/context/markdown-loader.js +0 -288
- package/dist/core/context/markdown-traverse.js +0 -255
- package/dist/core/context/pugiignore.js +0 -316
- package/dist/core/context/repo-skeleton.js +0 -533
- package/dist/core/context/tool-eviction.js +0 -55
- package/dist/core/context/watcher.js +0 -342
- package/dist/core/context/working-set.js +0 -165
- package/dist/core/coordinator/agent-tools.js +0 -77
- package/dist/core/coordinator/agent-toolset.js +0 -65
- package/dist/core/coordinator/fsm.js +0 -73
- package/dist/core/coordinator/mode-fsm.js +0 -70
- package/dist/core/cost/rate-card.js +0 -129
- package/dist/core/cost/tracker.js +0 -221
- package/dist/core/credentials.js +0 -355
- package/dist/core/cron/scheduler.js +0 -138
- package/dist/core/denial-tracking/index.js +0 -8
- package/dist/core/denial-tracking/state.js +0 -264
- package/dist/core/diagnostics/probe-runner.js +0 -93
- package/dist/core/diagnostics/probes/api.js +0 -46
- package/dist/core/diagnostics/probes/auth.js +0 -93
- package/dist/core/diagnostics/probes/bare-mode.js +0 -42
- package/dist/core/diagnostics/probes/cli-version.js +0 -127
- package/dist/core/diagnostics/probes/config.js +0 -72
- package/dist/core/diagnostics/probes/denial-tracking.js +0 -57
- package/dist/core/diagnostics/probes/disk.js +0 -81
- package/dist/core/diagnostics/probes/engine-live.js +0 -46
- package/dist/core/diagnostics/probes/git.js +0 -65
- package/dist/core/diagnostics/probes/hooks.js +0 -118
- package/dist/core/diagnostics/probes/mcp.js +0 -75
- package/dist/core/diagnostics/probes/node.js +0 -59
- package/dist/core/diagnostics/probes/pnpm.js +0 -36
- package/dist/core/diagnostics/probes/pugi-md.js +0 -89
- package/dist/core/diagnostics/probes/sandbox.js +0 -72
- package/dist/core/diagnostics/probes/session.js +0 -74
- package/dist/core/diagnostics/probes/status-snapshot.js +0 -488
- package/dist/core/diagnostics/probes/workspace.js +0 -63
- package/dist/core/diagnostics/types.js +0 -70
- package/dist/core/dispatch/cache-cleanup.js +0 -197
- package/dist/core/dispatch/cache-handoff.js +0 -295
- package/dist/core/edits/apply-patch-layer-e.js +0 -189
- package/dist/core/edits/dispatch.js +0 -511
- package/dist/core/edits/format-detector.js +0 -260
- package/dist/core/edits/format-matrix.js +0 -26
- package/dist/core/edits/fuzzy-ladder.js +0 -650
- package/dist/core/edits/index.js +0 -19
- package/dist/core/edits/journal.js +0 -199
- package/dist/core/edits/layer-a-apply.js +0 -217
- package/dist/core/edits/layer-a-fuzzy-apply.js +0 -198
- package/dist/core/edits/layer-b-apply.js +0 -211
- package/dist/core/edits/layer-c-apply.js +0 -160
- package/dist/core/edits/layer-d-ast.js +0 -572
- package/dist/core/edits/marker-parser.js +0 -401
- package/dist/core/edits/security-gate.js +0 -223
- package/dist/core/edits/verify-hook.js +0 -273
- package/dist/core/edits/worktree.js +0 -322
- package/dist/core/engine/adapter-runner.js +0 -8
- package/dist/core/engine/anvil-client.js +0 -344
- package/dist/core/engine/auto-compact.js +0 -179
- package/dist/core/engine/budgets.js +0 -195
- package/dist/core/engine/context-prefix.js +0 -155
- package/dist/core/engine/index.js +0 -12
- package/dist/core/engine/intensity.js +0 -163
- package/dist/core/engine/intent.js +0 -260
- package/dist/core/engine/native-pugi.js +0 -1616
- package/dist/core/engine/noop.js +0 -27
- package/dist/core/engine/prompts.js +0 -236
- package/dist/core/engine/strip-internal-fields.js +0 -124
- package/dist/core/engine/tool-bridge.js +0 -2173
- package/dist/core/engine/verification-patterns.js +0 -195
- package/dist/core/evaluation/golden-dataset.js +0 -293
- package/dist/core/feedback/queue.js +0 -177
- package/dist/core/feedback/submitter.js +0 -145
- package/dist/core/file-cache.js +0 -141
- package/dist/core/flatten/flatten-repo.js +0 -439
- package/dist/core/format/osc8-link.js +0 -28
- package/dist/core/hook-chains.js +0 -392
- package/dist/core/hooks/citation-verify-hook.js +0 -138
- package/dist/core/hooks/citation-verify.js +0 -112
- package/dist/core/hooks/events.js +0 -46
- package/dist/core/hooks/index.js +0 -15
- package/dist/core/hooks/registry.js +0 -216
- package/dist/core/hooks/runner.js +0 -236
- package/dist/core/hooks/v2/event-emitter.js +0 -115
- package/dist/core/hooks/v2/executor.js +0 -282
- package/dist/core/hooks/v2/index.js +0 -25
- package/dist/core/hooks/v2/lifecycle.js +0 -104
- package/dist/core/hooks/v2/loader.js +0 -216
- package/dist/core/hooks/v2/matcher.js +0 -125
- package/dist/core/hooks/v2/trust.js +0 -143
- package/dist/core/hooks/v2/types.js +0 -86
- package/dist/core/hooks/worktree-events.js +0 -158
- package/dist/core/hooks.js +0 -415
- package/dist/core/image/renderer.js +0 -71
- package/dist/core/index-store.js +0 -260
- package/dist/core/init/detector.js +0 -582
- package/dist/core/init/template-renderer.js +0 -242
- package/dist/core/jobs/registry.js +0 -462
- package/dist/core/ledger/results-tsv.js +0 -142
- package/dist/core/log-discipline/stdout-redirect.js +0 -51
- package/dist/core/lsp/cache.js +0 -105
- package/dist/core/lsp/client.js +0 -1229
- package/dist/core/lsp/language-detect.js +0 -66
- package/dist/core/lsp/post-edit-diagnostics.js +0 -171
- package/dist/core/lsp/server-detect.js +0 -173
- package/dist/core/lsp/symbol-cache.js +0 -162
- package/dist/core/lsp/symbol-tools.js +0 -664
- package/dist/core/mcp/client.js +0 -385
- package/dist/core/mcp/http-server.js +0 -553
- package/dist/core/mcp/orchestrator-config.js +0 -192
- package/dist/core/mcp/orchestrator-tools.js +0 -806
- package/dist/core/mcp/permission.js +0 -190
- package/dist/core/mcp/registry.js +0 -193
- package/dist/core/mcp/server-tools.js +0 -219
- package/dist/core/mcp/server.js +0 -397
- package/dist/core/mcp/trust.js +0 -91
- package/dist/core/memory/dual-write.js +0 -416
- package/dist/core/memory/passive-extract.js +0 -130
- package/dist/core/memory/phase1-kinds.js +0 -20
- package/dist/core/memory/secret-scanner.js +0 -304
- package/dist/core/memory-sync/queue.js +0 -170
- package/dist/core/metrics/extract.js +0 -113
- package/dist/core/modes/roo-modes.js +0 -68
- package/dist/core/onboarding/ensure-initialized.js +0 -133
- package/dist/core/onboarding/marker.js +0 -111
- package/dist/core/onboarding/telemetry-state.js +0 -108
- package/dist/core/output-style/presets.js +0 -176
- package/dist/core/output-style/state.js +0 -185
- package/dist/core/path-security.js +0 -345
- package/dist/core/permission.js +0 -369
- package/dist/core/permissions/auto-classifier.js +0 -124
- package/dist/core/permissions/bash-parser.js +0 -371
- package/dist/core/permissions/circuit-breaker.js +0 -83
- package/dist/core/permissions/constrained-edit.js +0 -91
- package/dist/core/permissions/gate.js +0 -278
- package/dist/core/permissions/index.js +0 -20
- package/dist/core/permissions/mode.js +0 -174
- package/dist/core/permissions/network-egress.js +0 -137
- package/dist/core/permissions/state.js +0 -241
- package/dist/core/permissions/tool-class.js +0 -107
- package/dist/core/plan-mode/ui-state.js +0 -51
- package/dist/core/plans/plan-artifact.js +0 -721
- package/dist/core/policy-limits/etag-store.js +0 -122
- package/dist/core/prd-check/parser.js +0 -215
- package/dist/core/prd-check/reporter.js +0 -127
- package/dist/core/prd-check/session-review.js +0 -557
- package/dist/core/prd-check/verifiers.js +0 -223
- package/dist/core/prompt-cache/client-cache.js +0 -99
- package/dist/core/prompts/assembly.js +0 -29
- package/dist/core/prompts/registry.js +0 -364
- package/dist/core/pugi-gitignore.js +0 -52
- package/dist/core/pugi-md/cc-compat-rules.js +0 -735
- package/dist/core/pugi-md/context-injector.js +0 -76
- package/dist/core/pugi-md/walk-up.js +0 -207
- package/dist/core/python/uv-installer.js +0 -270
- package/dist/core/python/uv-resolver.js +0 -83
- package/dist/core/rate-limit/narrator.js +0 -146
- package/dist/core/recipes/cli-types.js +0 -20
- package/dist/core/recipes/loader.js +0 -103
- package/dist/core/recipes/runner.js +0 -345
- package/dist/core/recipes/schema.js +0 -587
- package/dist/core/release-notes/parser.js +0 -241
- package/dist/core/release-notes/state.js +0 -116
- package/dist/core/repl/ask.js +0 -512
- package/dist/core/repl/cancellation.js +0 -98
- package/dist/core/repl/cap-warning.js +0 -91
- package/dist/core/repl/clipboard-read.js +0 -174
- package/dist/core/repl/dispatch-fsm.js +0 -220
- package/dist/core/repl/engine-bridge.js +0 -303
- package/dist/core/repl/history-search.js +0 -175
- package/dist/core/repl/history.js +0 -182
- package/dist/core/repl/kill-ring.js +0 -138
- package/dist/core/repl/model-pricing.js +0 -135
- package/dist/core/repl/privacy-banner.js +0 -71
- package/dist/core/repl/session.js +0 -4962
- package/dist/core/repl/slash-commands.js +0 -747
- package/dist/core/repl/store/index.js +0 -12
- package/dist/core/repl/store/jsonl-log.js +0 -321
- package/dist/core/repl/store/lockfile.js +0 -155
- package/dist/core/repl/store/session-store.js +0 -821
- package/dist/core/repl/store/types.js +0 -44
- package/dist/core/repl/store/uuid-v7.js +0 -68
- package/dist/core/repl/tool-route.js +0 -382
- package/dist/core/repl/workspace-context.js +0 -206
- package/dist/core/repo-map/build.js +0 -125
- package/dist/core/repo-map/cache.js +0 -185
- package/dist/core/repo-map/extractor.js +0 -254
- package/dist/core/repo-map/formatter.js +0 -145
- package/dist/core/repo-map/page-rank.js +0 -105
- package/dist/core/repo-map/scanner.js +0 -211
- package/dist/core/retro/git-collector.js +0 -251
- package/dist/core/retro/health-card.js +0 -25
- package/dist/core/retro/metrics.js +0 -342
- package/dist/core/retro/narrative.js +0 -249
- package/dist/core/retro/plane-collector.js +0 -274
- package/dist/core/retro/pr-issue-link.js +0 -65
- package/dist/core/retro/types.js +0 -16
- package/dist/core/retry-budget/budget.js +0 -284
- package/dist/core/retry-budget/index.js +0 -5
- package/dist/core/retry-budget/retry-cap.js +0 -74
- package/dist/core/routing/lead-worker.js +0 -43
- package/dist/core/routing/pre-flight-estimator.js +0 -108
- package/dist/core/runs/run-tree.js +0 -103
- package/dist/core/sandboxing/adapter.js +0 -29
- package/dist/core/sandboxing/index.js +0 -49
- package/dist/core/sandboxing/none.js +0 -19
- package/dist/core/sandboxing/seatbelt.js +0 -183
- package/dist/core/security/injection-scanner.js +0 -367
- package/dist/core/security/output-filter.js +0 -418
- package/dist/core/session/env-file.js +0 -105
- package/dist/core/session/section-budgets.js +0 -140
- package/dist/core/session.js +0 -377
- package/dist/core/settings.js +0 -400
- package/dist/core/share/formatter.js +0 -271
- package/dist/core/share/redactor.js +0 -221
- package/dist/core/share/uploader.js +0 -267
- package/dist/core/skills/defaults.js +0 -457
- package/dist/core/skills/loader.js +0 -454
- package/dist/core/skills/sources.js +0 -480
- package/dist/core/skills/trust.js +0 -172
- package/dist/core/smoke/headless-driver.js +0 -174
- package/dist/core/smoke/orchestrator.js +0 -194
- package/dist/core/smoke/runner.js +0 -238
- package/dist/core/smoke/scenario-parser.js +0 -316
- package/dist/core/statusline.js +0 -99
- package/dist/core/subagents/dispatcher-real.js +0 -600
- package/dist/core/subagents/dispatcher.js +0 -352
- package/dist/core/subagents/index.js +0 -39
- package/dist/core/subagents/isolation-matrix.js +0 -213
- package/dist/core/subagents/spawn.js +0 -101
- package/dist/core/telemetry/emitter.js +0 -229
- package/dist/core/telemetry/queue.js +0 -251
- package/dist/core/theme/context.js +0 -91
- package/dist/core/theme/presets.js +0 -228
- package/dist/core/theme/state.js +0 -181
- package/dist/core/todos/invariant.js +0 -10
- package/dist/core/todos/state.js +0 -177
- package/dist/core/tool-schema/compressor.js +0 -89
- package/dist/core/transport/version-interceptor.js +0 -166
- package/dist/core/trust.js +0 -109
- package/dist/core/tui/thinking-block.js +0 -64
- package/dist/core/vim/keymap.js +0 -288
- package/dist/core/vim/state.js +0 -92
- package/dist/core/watch-markers/marker-watcher.js +0 -133
- package/dist/core/worktree/include-parser.js +0 -249
- package/dist/core/worktree-manager/cleanup.js +0 -123
- package/dist/core/worktree-manager/manager.js +0 -303
- package/dist/index.js +0 -44
- package/dist/runtime/bootstrap.js +0 -190
- package/dist/runtime/cli.js +0 -8121
- package/dist/runtime/commands/agents.js +0 -385
- package/dist/runtime/commands/budget.js +0 -192
- package/dist/runtime/commands/cancel.js +0 -231
- package/dist/runtime/commands/chain.js +0 -489
- package/dist/runtime/commands/codegraph-status.js +0 -227
- package/dist/runtime/commands/compact.js +0 -297
- package/dist/runtime/commands/config.js +0 -595
- package/dist/runtime/commands/cost.js +0 -199
- package/dist/runtime/commands/delegate.js +0 -312
- package/dist/runtime/commands/dispatch.js +0 -126
- package/dist/runtime/commands/doctor.js +0 -579
- package/dist/runtime/commands/feedback.js +0 -184
- package/dist/runtime/commands/hooks.js +0 -187
- package/dist/runtime/commands/init.js +0 -254
- package/dist/runtime/commands/lsp.js +0 -368
- package/dist/runtime/commands/mcp.js +0 -935
- package/dist/runtime/commands/memory.js +0 -582
- package/dist/runtime/commands/model.js +0 -237
- package/dist/runtime/commands/onboarding.js +0 -275
- package/dist/runtime/commands/patch.js +0 -128
- package/dist/runtime/commands/permissions.js +0 -112
- package/dist/runtime/commands/plan.js +0 -143
- package/dist/runtime/commands/prd-check.js +0 -285
- package/dist/runtime/commands/privacy.js +0 -107
- package/dist/runtime/commands/recipe.js +0 -325
- package/dist/runtime/commands/redo-blob-store.js +0 -92
- package/dist/runtime/commands/redo.js +0 -361
- package/dist/runtime/commands/release-notes.js +0 -229
- package/dist/runtime/commands/repo-map.js +0 -95
- package/dist/runtime/commands/report.js +0 -299
- package/dist/runtime/commands/resume.js +0 -118
- package/dist/runtime/commands/review-consensus.js +0 -414
- package/dist/runtime/commands/rewind.js +0 -333
- package/dist/runtime/commands/roster.js +0 -117
- package/dist/runtime/commands/sessions.js +0 -163
- package/dist/runtime/commands/share.js +0 -316
- package/dist/runtime/commands/skills.js +0 -401
- package/dist/runtime/commands/status.js +0 -186
- package/dist/runtime/commands/stickers.js +0 -82
- package/dist/runtime/commands/style.js +0 -194
- package/dist/runtime/commands/theme.js +0 -196
- package/dist/runtime/commands/undo.js +0 -361
- package/dist/runtime/commands/update.js +0 -289
- package/dist/runtime/commands/vim.js +0 -140
- package/dist/runtime/commands/worktree.js +0 -177
- package/dist/runtime/commands/worktrees.js +0 -155
- package/dist/runtime/deprecation-warning.js +0 -69
- package/dist/runtime/engine-exit-code.js +0 -50
- package/dist/runtime/headless-repl.js +0 -195
- package/dist/runtime/headless.js +0 -548
- package/dist/runtime/load-hooks-or-exit.js +0 -71
- package/dist/runtime/plan-decompose.js +0 -531
- package/dist/runtime/sigint-guard.js +0 -272
- package/dist/runtime/stream-renderer.js +0 -195
- package/dist/runtime/update-check.js +0 -294
- package/dist/runtime/version.js +0 -65
- package/dist/runtime/worktree-bootstrap.js +0 -579
- package/dist/skills/bundled/batch.js +0 -617
- package/dist/skills/bundled/index.js +0 -45
- package/dist/skills/bundled/loop.js +0 -358
- package/dist/skills/bundled/remember.js +0 -383
- package/dist/skills/bundled/simplify.js +0 -289
- package/dist/skills/bundled/skillify.js +0 -373
- package/dist/skills/bundled/stuck.js +0 -558
- package/dist/skills/bundled/verify.js +0 -439
- package/dist/testing/vcr.js +0 -486
- package/dist/tools/agent-tool.js +0 -229
- package/dist/tools/apply-patch.js +0 -556
- package/dist/tools/ask-user-question.js +0 -337
- package/dist/tools/ask-user.js +0 -115
- package/dist/tools/bash.js +0 -1238
- package/dist/tools/brief.js +0 -224
- package/dist/tools/cron.js +0 -433
- package/dist/tools/enter-worktree.js +0 -250
- package/dist/tools/exit-worktree.js +0 -147
- package/dist/tools/file-tools.js +0 -553
- package/dist/tools/http-request.js +0 -336
- package/dist/tools/lsp-tools.js +0 -565
- package/dist/tools/mcp-tool.js +0 -260
- package/dist/tools/multi-edit.js +0 -361
- package/dist/tools/powershell.js +0 -268
- package/dist/tools/registry.js +0 -166
- package/dist/tools/server-tools.js +0 -892
- package/dist/tools/skill-tool.js +0 -96
- package/dist/tools/sleep.js +0 -99
- package/dist/tools/synthetic-output.js +0 -133
- package/dist/tools/tasks.js +0 -208
- package/dist/tools/todo-write.js +0 -184
- package/dist/tools/verify-plan-execution.js +0 -295
- package/dist/tools/web-fetch-injection-scanner.js +0 -207
- package/dist/tools/web-fetch.js +0 -720
- package/dist/tools/web-search.js +0 -458
- package/dist/tui/agent-progress-card.js +0 -111
- package/dist/tui/agent-tree-pane.js +0 -9
- package/dist/tui/agent-tree.js +0 -87
- package/dist/tui/ask-cli.js +0 -52
- package/dist/tui/ask-modal.js +0 -211
- package/dist/tui/ask-user-question-chips.js +0 -315
- package/dist/tui/ask-user-question-prompt.js +0 -203
- package/dist/tui/compact-banner.js +0 -81
- package/dist/tui/conversation-pane.js +0 -164
- package/dist/tui/cost-table.js +0 -111
- package/dist/tui/device-flow.js +0 -142
- package/dist/tui/doctor-table.js +0 -46
- package/dist/tui/feedback-prompt.js +0 -156
- package/dist/tui/input-box.js +0 -732
- package/dist/tui/login-picker.js +0 -69
- package/dist/tui/markdown-render.js +0 -266
- package/dist/tui/multi-file-diff-approval.js +0 -375
- package/dist/tui/onboarding-wizard.js +0 -240
- package/dist/tui/permissions-picker.js +0 -86
- package/dist/tui/render.js +0 -160
- package/dist/tui/repl-render.js +0 -770
- package/dist/tui/repl-splash-art.js +0 -64
- package/dist/tui/repl-splash-mascot.js +0 -154
- package/dist/tui/repl-splash.js +0 -117
- package/dist/tui/repl.js +0 -378
- package/dist/tui/slash-palette.js +0 -106
- package/dist/tui/splash-data.js +0 -61
- package/dist/tui/splash.js +0 -31
- package/dist/tui/status-bar.js +0 -209
- package/dist/tui/status-table.js +0 -7
- package/dist/tui/stickers-art.js +0 -136
- package/dist/tui/style-table.js +0 -28
- package/dist/tui/theme-table.js +0 -29
- package/dist/tui/thinking-spinner.js +0 -123
- package/dist/tui/tool-stream-pane.js +0 -140
- package/dist/tui/update-banner.js +0 -33
- package/dist/tui/vim-input.js +0 -267
- package/dist/tui/welcome-banner.js +0 -107
- package/dist/tui/welcome-data.js +0 -293
- package/dist/tui/workspace-context.js +0 -105
- package/docs/examples/codegraph.mcp.json +0 -10
- package/test/scenarios/codegen-create-file.scenario.txt +0 -13
- package/test/scenarios/compact-force.scenario.txt +0 -12
- package/test/scenarios/identity.scenario.txt +0 -11
- package/test/scenarios/persona-handoff.scenario.txt +0 -12
- package/test/scenarios/walkback.scenario.txt +0 -12
package/dist/tools/todo-write.js
DELETED
|
@@ -1,184 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* todo_write tool — .
|
|
3
|
-
*
|
|
4
|
-
* Mirrors the standard tool's `TodoWrite` tool 1:1 so a model trained on the
|
|
5
|
-
* upstream grammar speaks Pugi's variant verbatim. The tool dispatches
|
|
6
|
-
* a BATCH replace of the workspace todo board (not an incremental
|
|
7
|
-
* mutation — the model emits the FULL list every call). At most ONE
|
|
8
|
-
* todo may carry `status: 'in_progress'` at any time; violations
|
|
9
|
-
* reject with the `TODO_INVARIANT_VIOLATED` sentinel and the board on
|
|
10
|
-
* disk is left unchanged.
|
|
11
|
-
*
|
|
12
|
-
* Relationship to `task_*` (β1 T1/T6, tools/tasks.ts):
|
|
13
|
-
* - `task_*` is GRANULAR (create/get/list/update one task at a
|
|
14
|
-
* time) with an append-only JSONL journal scoped to the SESSION.
|
|
15
|
-
* - `todo_write` is BATCH (snapshot the whole board) with an atomic
|
|
16
|
-
* JSON snapshot scoped to the WORKSPACE.
|
|
17
|
-
* They are complementary surfaces: agents that prefer the upstream
|
|
18
|
-
* TodoWrite grammar use `todo_write`; agents that want a fine-grained
|
|
19
|
-
* audit trail use `task_*`.
|
|
20
|
-
*
|
|
21
|
-
* Hard rules (enforced by Zod + dispatcher):
|
|
22
|
-
* - `todos.length` ≤ 50 (board overload guard).
|
|
23
|
-
* - Every item: id (≥1 char, ≤128), content (≥1 char), status enum.
|
|
24
|
-
* - At most ONE item with `status === 'in_progress'`.
|
|
25
|
-
* - All ids unique within the batch.
|
|
26
|
-
*
|
|
27
|
-
* Dispatch returns the persisted board as JSON; callers can read
|
|
28
|
-
* `todos: [...]` directly. Errors return the sentinel-prefixed message
|
|
29
|
-
* so the engine adapter can pattern-match.
|
|
30
|
-
*/
|
|
31
|
-
import { z } from 'zod';
|
|
32
|
-
import { saveTodoBoard } from '../core/todos/state.js';
|
|
33
|
-
/** Cap matches the `task_*` family's title cap for parity. */
|
|
34
|
-
export const TODO_CONTENT_MAX = 2_000;
|
|
35
|
-
/** id is opaque to us but must be slug-safe so file paths could embed it. */
|
|
36
|
-
export const TODO_ID_MIN = 1;
|
|
37
|
-
export const TODO_ID_MAX = 128;
|
|
38
|
-
/** Hard cap on board size. Beyond this the operator should split work. */
|
|
39
|
-
export const TODO_BATCH_MAX = 50;
|
|
40
|
-
export const todoItemSchema = z
|
|
41
|
-
.strictObject({
|
|
42
|
-
id: z
|
|
43
|
-
.string()
|
|
44
|
-
.min(TODO_ID_MIN)
|
|
45
|
-
.max(TODO_ID_MAX)
|
|
46
|
-
.describe('Stable id for this todo. Opaque, ≤128 chars.'),
|
|
47
|
-
content: z
|
|
48
|
-
.string()
|
|
49
|
-
.min(1)
|
|
50
|
-
.max(TODO_CONTENT_MAX)
|
|
51
|
-
.describe('Imperative task description. E.g. "Add invariant check".'),
|
|
52
|
-
status: z
|
|
53
|
-
.enum(['pending', 'in_progress', 'completed'])
|
|
54
|
-
.describe('Lifecycle status. At most ONE in_progress per board.'),
|
|
55
|
-
activeForm: z
|
|
56
|
-
.string()
|
|
57
|
-
.min(1)
|
|
58
|
-
.max(TODO_CONTENT_MAX)
|
|
59
|
-
.optional()
|
|
60
|
-
.describe('Present-continuous form. E.g. "Adding invariant check".'),
|
|
61
|
-
});
|
|
62
|
-
export const todoWriteArgsSchema = z.strictObject({
|
|
63
|
-
todos: z
|
|
64
|
-
.array(todoItemSchema)
|
|
65
|
-
.max(TODO_BATCH_MAX)
|
|
66
|
-
.describe(`Full todo board (batch replace, not incremental). Max ${TODO_BATCH_MAX} items. ` +
|
|
67
|
-
`At most ONE item may carry status="in_progress".`),
|
|
68
|
-
});
|
|
69
|
-
/**
|
|
70
|
-
* JSON-Schema fragment surfaced to the model via the tool-bridge
|
|
71
|
-
* `parameters` field. Mirrors the Zod schema 1:1 — kept hand-written
|
|
72
|
-
* (same convention as ask_user_question) because the runtime engine
|
|
73
|
-
* wires OpenAI-compatible JSON Schema and we have not greenlit the
|
|
74
|
-
* zod-to-json-schema transitive dep. Keep both in lockstep.
|
|
75
|
-
*/
|
|
76
|
-
export const todoWriteJsonSchema = {
|
|
77
|
-
type: 'object',
|
|
78
|
-
additionalProperties: false,
|
|
79
|
-
required: ['todos'],
|
|
80
|
-
properties: {
|
|
81
|
-
todos: {
|
|
82
|
-
type: 'array',
|
|
83
|
-
maxItems: TODO_BATCH_MAX,
|
|
84
|
-
description: `Full todo board (batch replace, not incremental). Max ${TODO_BATCH_MAX} items. ` +
|
|
85
|
-
`At most ONE item may carry status="in_progress".`,
|
|
86
|
-
items: {
|
|
87
|
-
type: 'object',
|
|
88
|
-
additionalProperties: false,
|
|
89
|
-
required: ['id', 'content', 'status'],
|
|
90
|
-
properties: {
|
|
91
|
-
id: {
|
|
92
|
-
type: 'string',
|
|
93
|
-
minLength: TODO_ID_MIN,
|
|
94
|
-
maxLength: TODO_ID_MAX,
|
|
95
|
-
description: 'Stable id for this todo. Opaque, ≤128 chars.',
|
|
96
|
-
},
|
|
97
|
-
content: {
|
|
98
|
-
type: 'string',
|
|
99
|
-
minLength: 1,
|
|
100
|
-
maxLength: TODO_CONTENT_MAX,
|
|
101
|
-
description: 'Imperative task description.',
|
|
102
|
-
},
|
|
103
|
-
status: {
|
|
104
|
-
type: 'string',
|
|
105
|
-
enum: ['pending', 'in_progress', 'completed'],
|
|
106
|
-
description: 'Lifecycle status. At most ONE in_progress per board.',
|
|
107
|
-
},
|
|
108
|
-
activeForm: {
|
|
109
|
-
type: 'string',
|
|
110
|
-
minLength: 1,
|
|
111
|
-
maxLength: TODO_CONTENT_MAX,
|
|
112
|
-
description: 'Present-continuous form.',
|
|
113
|
-
},
|
|
114
|
-
},
|
|
115
|
-
},
|
|
116
|
-
},
|
|
117
|
-
},
|
|
118
|
-
};
|
|
119
|
-
/**
|
|
120
|
-
* Sentinel prefix the dispatcher returns when Zod schema validation
|
|
121
|
-
* rejects the raw arguments. Distinct from `TODO_INVARIANT_VIOLATED`
|
|
122
|
-
* (>1 in_progress) and `TODO_DUPLICATE_ID` (collision within batch),
|
|
123
|
-
* which are emitted from `saveTodoBoard` AFTER schema parsing.
|
|
124
|
-
*
|
|
125
|
-
* Surfaced as a return string (not a throw) so the engine adapter sees
|
|
126
|
-
* a recoverable tool error and the model can self-correct its args,
|
|
127
|
-
* instead of the engine loop tearing down on an uncaught ZodError.
|
|
128
|
-
*/
|
|
129
|
-
export const TODO_INVALID_ARGS = 'INVALID_ARGS';
|
|
130
|
-
/**
|
|
131
|
-
* Render a ZodError into a deterministic `INVALID_ARGS: ...` sentinel
|
|
132
|
-
* the model can pattern-match. Each issue contributes one
|
|
133
|
-
* `path: message` clause; clauses are joined with `; ` so the model
|
|
134
|
-
* sees every offence in a single line. Path with the root scope is
|
|
135
|
-
* rendered as `<root>` to avoid an empty colon.
|
|
136
|
-
*/
|
|
137
|
-
function renderZodIssues(error) {
|
|
138
|
-
const parts = error.issues.map((issue) => {
|
|
139
|
-
const path = issue.path.length === 0 ? '<root>' : issue.path.join('.');
|
|
140
|
-
return `${path}: ${issue.message}`;
|
|
141
|
-
});
|
|
142
|
-
return `${TODO_INVALID_ARGS}: ${parts.join('; ')}`;
|
|
143
|
-
}
|
|
144
|
-
/**
|
|
145
|
-
* Validate via Zod + persist atomically. Surfaces three sentinel
|
|
146
|
-
* families the dispatcher pattern-matches on:
|
|
147
|
-
* - `INVALID_ARGS: <path>: <issue>; ...` — Zod schema rejected
|
|
148
|
-
* the raw arguments (returned as STRING, not thrown).
|
|
149
|
-
* - `TODO_INVARIANT_VIOLATED: ...` — >1 in_progress
|
|
150
|
-
* (thrown by `saveTodoBoard`).
|
|
151
|
-
* - `TODO_DUPLICATE_ID: ...` — collision within batch
|
|
152
|
-
* (thrown by `saveTodoBoard`).
|
|
153
|
-
*
|
|
154
|
-
* Why the asymmetry: schema rejection means the model emitted malformed
|
|
155
|
-
* structure (missing field, wrong type) and CAN self-correct given a
|
|
156
|
-
* clear breakdown of the offending path. The invariant + duplicate-id
|
|
157
|
-
* paths mean the model emitted structurally-valid but semantically
|
|
158
|
-
* conflicting state — those still throw so the engine loop's tool-error
|
|
159
|
-
* hook can surface them through `PostToolUseFailure` for observability,
|
|
160
|
-
* mirroring how the file-tools layer surfaces `STALE_READ` / `PermissionDenied`.
|
|
161
|
-
*/
|
|
162
|
-
export function dispatchTodoWrite(ctx, rawArgs) {
|
|
163
|
-
// L16 P1 fix : `.parse` throws a `ZodError` on validation
|
|
164
|
-
// failure. The previous implementation let that throw bubble through
|
|
165
|
-
// the engine adapter's catch arm as a free-form `error.message`,
|
|
166
|
-
// which (a) loses the issue-by-issue structure the model needs to
|
|
167
|
-
// self-correct, and (b) tears down the tool-call as a hard failure
|
|
168
|
-
// rather than a recoverable tool result. Switch to `safeParse` and
|
|
169
|
-
// emit a structured `INVALID_ARGS: <path>: <issue>; ...` sentinel
|
|
170
|
-
// string instead — the engine sees a successful tool call, the model
|
|
171
|
-
// sees the offending paths, and the dispatcher's catch arm reserves
|
|
172
|
-
// throws for the genuine semantic conflicts emitted by `saveTodoBoard`.
|
|
173
|
-
const parsed = todoWriteArgsSchema.safeParse(rawArgs);
|
|
174
|
-
if (!parsed.success) {
|
|
175
|
-
return renderZodIssues(parsed.error);
|
|
176
|
-
}
|
|
177
|
-
const stateCtx = {
|
|
178
|
-
workspaceRoot: ctx.workspaceRoot,
|
|
179
|
-
...(ctx.now ? { now: ctx.now } : {}),
|
|
180
|
-
};
|
|
181
|
-
const board = saveTodoBoard(stateCtx, parsed.data.todos);
|
|
182
|
-
return JSON.stringify(board);
|
|
183
|
-
}
|
|
184
|
-
//# sourceMappingURL=todo-write.js.map
|
|
@@ -1,295 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* verify_plan_execution tool — anti-fake-dispatch gate (backlog #5 P0).
|
|
3
|
-
*
|
|
4
|
-
* Gives the engine loop a way to ASSERT that a previously-stated plan's
|
|
5
|
-
* promised steps actually executed. When the model says "Step 1: read
|
|
6
|
-
* file A. Step 2: edit file B. Step 3: run tests" and then emits a
|
|
7
|
-
* "done" final text, this tool lets the engine loop verify the session's
|
|
8
|
-
* recorded tool calls and file mutations cover every requirement.
|
|
9
|
-
*
|
|
10
|
-
* If any gap is found the engine loop continues another turn so the
|
|
11
|
-
* model can either fill the gap or explicitly explain why the step was
|
|
12
|
-
* skipped. Closes the fake-dispatch failure mode documented in
|
|
13
|
-
* memory `feedback_no_fake_dispatch_promises.md`.
|
|
14
|
-
*/
|
|
15
|
-
import { existsSync, readFileSync } from 'node:fs';
|
|
16
|
-
export const VERIFY_PLAN_INVALID_ARGS = 'VERIFY_PLAN_INVALID_ARGS';
|
|
17
|
-
export function parseVerifyPlanArgs(raw) {
|
|
18
|
-
if (typeof raw !== 'object' || raw === null || Array.isArray(raw)) {
|
|
19
|
-
return `${VERIFY_PLAN_INVALID_ARGS}: arguments must be a JSON object`;
|
|
20
|
-
}
|
|
21
|
-
const obj = raw;
|
|
22
|
-
if (!Object.prototype.hasOwnProperty.call(obj, 'steps')) {
|
|
23
|
-
return `${VERIFY_PLAN_INVALID_ARGS}: steps is required`;
|
|
24
|
-
}
|
|
25
|
-
const rawSteps = obj['steps'];
|
|
26
|
-
if (!Array.isArray(rawSteps)) {
|
|
27
|
-
return `${VERIFY_PLAN_INVALID_ARGS}: steps must be an array`;
|
|
28
|
-
}
|
|
29
|
-
if (rawSteps.length > 200) {
|
|
30
|
-
return `${VERIFY_PLAN_INVALID_ARGS}: steps must have <= 200 entries`;
|
|
31
|
-
}
|
|
32
|
-
const steps = [];
|
|
33
|
-
const issues = [];
|
|
34
|
-
for (let i = 0; i < rawSteps.length; i++) {
|
|
35
|
-
const s = rawSteps[i];
|
|
36
|
-
if (typeof s !== 'object' || s === null || Array.isArray(s)) {
|
|
37
|
-
issues.push(`steps[${i}]: must be an object`);
|
|
38
|
-
continue;
|
|
39
|
-
}
|
|
40
|
-
const step = s;
|
|
41
|
-
const id = step['id'];
|
|
42
|
-
if (typeof id !== 'string' || id.trim().length === 0) {
|
|
43
|
-
issues.push(`steps[${i}].id: must be a non-empty string`);
|
|
44
|
-
continue;
|
|
45
|
-
}
|
|
46
|
-
const intent = step['intent'];
|
|
47
|
-
if (typeof intent !== 'string') {
|
|
48
|
-
issues.push(`steps[${i}].intent: must be a string`);
|
|
49
|
-
continue;
|
|
50
|
-
}
|
|
51
|
-
const toolCallsRaw = step['requiredToolCalls'];
|
|
52
|
-
let requiredToolCalls;
|
|
53
|
-
if (toolCallsRaw !== undefined && toolCallsRaw !== null) {
|
|
54
|
-
if (!Array.isArray(toolCallsRaw)) {
|
|
55
|
-
issues.push(`steps[${i}].requiredToolCalls: must be an array when present`);
|
|
56
|
-
continue;
|
|
57
|
-
}
|
|
58
|
-
requiredToolCalls = [];
|
|
59
|
-
for (let j = 0; j < toolCallsRaw.length; j++) {
|
|
60
|
-
const tc = toolCallsRaw[j];
|
|
61
|
-
if (typeof tc !== 'string' || tc.trim().length === 0) {
|
|
62
|
-
issues.push(`steps[${i}].requiredToolCalls[${j}]: must be a non-empty string`);
|
|
63
|
-
}
|
|
64
|
-
else {
|
|
65
|
-
requiredToolCalls.push(tc);
|
|
66
|
-
}
|
|
67
|
-
}
|
|
68
|
-
}
|
|
69
|
-
const fileChangesRaw = step['requiredFileChanges'];
|
|
70
|
-
let requiredFileChanges;
|
|
71
|
-
if (fileChangesRaw !== undefined && fileChangesRaw !== null) {
|
|
72
|
-
if (!Array.isArray(fileChangesRaw)) {
|
|
73
|
-
issues.push(`steps[${i}].requiredFileChanges: must be an array when present`);
|
|
74
|
-
continue;
|
|
75
|
-
}
|
|
76
|
-
requiredFileChanges = [];
|
|
77
|
-
for (let j = 0; j < fileChangesRaw.length; j++) {
|
|
78
|
-
const fc = fileChangesRaw[j];
|
|
79
|
-
if (typeof fc !== 'string' || fc.trim().length === 0) {
|
|
80
|
-
issues.push(`steps[${i}].requiredFileChanges[${j}]: must be a non-empty string`);
|
|
81
|
-
}
|
|
82
|
-
else {
|
|
83
|
-
requiredFileChanges.push(fc);
|
|
84
|
-
}
|
|
85
|
-
}
|
|
86
|
-
}
|
|
87
|
-
const built = {
|
|
88
|
-
id: id.trim(),
|
|
89
|
-
intent,
|
|
90
|
-
...(requiredToolCalls !== undefined && requiredToolCalls.length > 0
|
|
91
|
-
? { requiredToolCalls }
|
|
92
|
-
: {}),
|
|
93
|
-
...(requiredFileChanges !== undefined && requiredFileChanges.length > 0
|
|
94
|
-
? { requiredFileChanges }
|
|
95
|
-
: {}),
|
|
96
|
-
};
|
|
97
|
-
steps.push(built);
|
|
98
|
-
}
|
|
99
|
-
if (issues.length > 0) {
|
|
100
|
-
return `${VERIFY_PLAN_INVALID_ARGS}: ${issues.join('; ')}`;
|
|
101
|
-
}
|
|
102
|
-
return { steps };
|
|
103
|
-
}
|
|
104
|
-
export function readRelevantEvents(session) {
|
|
105
|
-
if (!session.enabled)
|
|
106
|
-
return [];
|
|
107
|
-
if (!existsSync(session.eventsPath))
|
|
108
|
-
return [];
|
|
109
|
-
const raw = readFileSync(session.eventsPath, 'utf8');
|
|
110
|
-
const events = [];
|
|
111
|
-
for (const line of raw.split('\n')) {
|
|
112
|
-
const trimmed = line.trim();
|
|
113
|
-
if (trimmed.length === 0)
|
|
114
|
-
continue;
|
|
115
|
-
let parsed;
|
|
116
|
-
try {
|
|
117
|
-
parsed = JSON.parse(trimmed);
|
|
118
|
-
}
|
|
119
|
-
catch {
|
|
120
|
-
continue;
|
|
121
|
-
}
|
|
122
|
-
if (typeof parsed !== 'object' || parsed === null || Array.isArray(parsed)) {
|
|
123
|
-
continue;
|
|
124
|
-
}
|
|
125
|
-
const obj = parsed;
|
|
126
|
-
if (obj['type'] === 'tool_call' && typeof obj['tool'] === 'string') {
|
|
127
|
-
events.push({ type: 'tool_call', tool: obj['tool'] });
|
|
128
|
-
}
|
|
129
|
-
else if (obj['type'] === 'file_mutation' && typeof obj['path'] === 'string') {
|
|
130
|
-
events.push({ type: 'file_mutation', path: obj['path'] });
|
|
131
|
-
}
|
|
132
|
-
}
|
|
133
|
-
return events;
|
|
134
|
-
}
|
|
135
|
-
export function verifyPlan(steps, events) {
|
|
136
|
-
if (steps.length === 0) {
|
|
137
|
-
return { status: 'verified', gaps: [] };
|
|
138
|
-
}
|
|
139
|
-
// Per-step consumption queues. The previous Set<string> shared across
|
|
140
|
-
// all steps allowed two steps requiring `edit` к be satisfied by a
|
|
141
|
-
// single edit call — defeating the per-step verification contract.
|
|
142
|
-
// We track per-tool counts of remaining (unconsumed) events; each step
|
|
143
|
-
// consumes one event per requiredToolCall it lists. Same approach for
|
|
144
|
-
// file mutations: each path-substring requirement consumes one matching
|
|
145
|
-
// mutation event, so two steps each requiring `foo.ts` need TWO foo.ts
|
|
146
|
-
// mutations к verify.
|
|
147
|
-
const toolCallRemaining = new Map();
|
|
148
|
-
const mutationRemaining = [];
|
|
149
|
-
for (const event of events) {
|
|
150
|
-
if (event.type === 'tool_call') {
|
|
151
|
-
toolCallRemaining.set(event.tool, (toolCallRemaining.get(event.tool) ?? 0) + 1);
|
|
152
|
-
}
|
|
153
|
-
else {
|
|
154
|
-
mutationRemaining.push(event.path);
|
|
155
|
-
}
|
|
156
|
-
}
|
|
157
|
-
const gaps = [];
|
|
158
|
-
for (const step of steps) {
|
|
159
|
-
if (step.requiredToolCalls !== undefined) {
|
|
160
|
-
for (const toolName of step.requiredToolCalls) {
|
|
161
|
-
const left = toolCallRemaining.get(toolName) ?? 0;
|
|
162
|
-
if (left <= 0) {
|
|
163
|
-
gaps.push({
|
|
164
|
-
stepId: step.id,
|
|
165
|
-
intent: step.intent,
|
|
166
|
-
missing: { kind: 'tool_call', toolName },
|
|
167
|
-
});
|
|
168
|
-
}
|
|
169
|
-
else {
|
|
170
|
-
toolCallRemaining.set(toolName, left - 1);
|
|
171
|
-
}
|
|
172
|
-
}
|
|
173
|
-
}
|
|
174
|
-
if (step.requiredFileChanges !== undefined) {
|
|
175
|
-
for (const pathSub of step.requiredFileChanges) {
|
|
176
|
-
const idx = mutationRemaining.findIndex((p) => pathMatches(p, pathSub));
|
|
177
|
-
if (idx === -1) {
|
|
178
|
-
gaps.push({
|
|
179
|
-
stepId: step.id,
|
|
180
|
-
intent: step.intent,
|
|
181
|
-
missing: { kind: 'file_change', pathSubstring: pathSub },
|
|
182
|
-
});
|
|
183
|
-
}
|
|
184
|
-
else {
|
|
185
|
-
mutationRemaining.splice(idx, 1);
|
|
186
|
-
}
|
|
187
|
-
}
|
|
188
|
-
}
|
|
189
|
-
}
|
|
190
|
-
return {
|
|
191
|
-
status: gaps.length === 0 ? 'verified' : 'gap',
|
|
192
|
-
gaps,
|
|
193
|
-
};
|
|
194
|
-
}
|
|
195
|
-
/**
|
|
196
|
-
* Path requirement matcher. Replaces the previous `String.includes`
|
|
197
|
-
* which falsely matched `foo.ts` against `foo.tsbackup` или `notfoo.ts`.
|
|
198
|
-
*
|
|
199
|
-
* Accepts:
|
|
200
|
-
* - Exact match (`a/b/foo.ts` === `a/b/foo.ts`).
|
|
201
|
-
* - Suffix match anchored on path separator (`foo.ts` matches
|
|
202
|
-
* `a/b/foo.ts` but NOT `bar/notfoo.ts`).
|
|
203
|
-
* - Bare basename (`foo.ts` matches mutation `foo.ts` at any depth).
|
|
204
|
-
* Path separator normalised — `\\` к `/` so Windows mutation paths
|
|
205
|
-
* still match POSIX-style requirements operators write.
|
|
206
|
-
*/
|
|
207
|
-
function pathMatches(mutationPath, requirement) {
|
|
208
|
-
const m = mutationPath.replace(/\\/g, '/');
|
|
209
|
-
const req = requirement.replace(/\\/g, '/');
|
|
210
|
-
if (m === req)
|
|
211
|
-
return true;
|
|
212
|
-
if (req.startsWith('/')) {
|
|
213
|
-
return m === req || m.endsWith(req);
|
|
214
|
-
}
|
|
215
|
-
return m.endsWith('/' + req);
|
|
216
|
-
}
|
|
217
|
-
export function verifyPlanExecution(session, steps) {
|
|
218
|
-
// Fail-CLOSED on disabled session audit. The previous vacuous-verified
|
|
219
|
-
// return turned the entire anti-fake-dispatch gate into a no-op the
|
|
220
|
-
// moment session.enabled flipped к false — an operator (or runaway
|
|
221
|
-
// model that learned к disable audit) could silently bypass every
|
|
222
|
-
// verification. The gate must surface an explicit `session_audit_disabled`
|
|
223
|
-
// gap so the engine loop forces acknowledgement instead of accepting
|
|
224
|
-
// silent success. Empty plans still trivially verify.
|
|
225
|
-
if (steps.length === 0) {
|
|
226
|
-
return { status: 'verified', gaps: [] };
|
|
227
|
-
}
|
|
228
|
-
if (!session.enabled) {
|
|
229
|
-
return {
|
|
230
|
-
status: 'gap',
|
|
231
|
-
gaps: [
|
|
232
|
-
{
|
|
233
|
-
stepId: '__session__',
|
|
234
|
-
intent: 'session audit must be enabled к verify plan execution',
|
|
235
|
-
missing: { kind: 'session_audit_disabled' },
|
|
236
|
-
},
|
|
237
|
-
],
|
|
238
|
-
};
|
|
239
|
-
}
|
|
240
|
-
const events = readRelevantEvents(session);
|
|
241
|
-
return verifyPlan(steps, events);
|
|
242
|
-
}
|
|
243
|
-
export function dispatchVerifyPlanExecution(session, raw) {
|
|
244
|
-
const parsed = parseVerifyPlanArgs(raw);
|
|
245
|
-
if (typeof parsed === 'string') {
|
|
246
|
-
return parsed;
|
|
247
|
-
}
|
|
248
|
-
const result = verifyPlanExecution(session, parsed.steps);
|
|
249
|
-
return JSON.stringify(result);
|
|
250
|
-
}
|
|
251
|
-
export const verifyPlanExecutionJsonSchema = {
|
|
252
|
-
type: 'object',
|
|
253
|
-
additionalProperties: false,
|
|
254
|
-
required: ['steps'],
|
|
255
|
-
properties: {
|
|
256
|
-
steps: {
|
|
257
|
-
type: 'array',
|
|
258
|
-
maxItems: 200,
|
|
259
|
-
description: 'Ordered list of plan steps to verify. Each step declares what tool calls ' +
|
|
260
|
-
'and file mutations must have occurred in this session for the step to be ' +
|
|
261
|
-
'considered executed. An empty array returns status=verified immediately.',
|
|
262
|
-
items: {
|
|
263
|
-
type: 'object',
|
|
264
|
-
additionalProperties: false,
|
|
265
|
-
required: ['id', 'intent'],
|
|
266
|
-
properties: {
|
|
267
|
-
id: {
|
|
268
|
-
type: 'string',
|
|
269
|
-
minLength: 1,
|
|
270
|
-
description: 'Stable opaque step identifier. Used in gap reports.',
|
|
271
|
-
},
|
|
272
|
-
intent: {
|
|
273
|
-
type: 'string',
|
|
274
|
-
description: 'Human-readable description of what the step accomplishes.',
|
|
275
|
-
},
|
|
276
|
-
requiredToolCalls: {
|
|
277
|
-
type: 'array',
|
|
278
|
-
items: { type: 'string', minLength: 1 },
|
|
279
|
-
description: 'Tool names (e.g. "read", "write", "edit", "bash") that must appear ' +
|
|
280
|
-
'as tool_call events in the session audit log. Each entry must match ' +
|
|
281
|
-
'at least once. Absent or empty means no tool-call requirement.',
|
|
282
|
-
},
|
|
283
|
-
requiredFileChanges: {
|
|
284
|
-
type: 'array',
|
|
285
|
-
items: { type: 'string', minLength: 1 },
|
|
286
|
-
description: 'File path substrings that must appear as file_mutation events. ' +
|
|
287
|
-
'Each entry must be a substring of at least one mutated path. ' +
|
|
288
|
-
'Absent or empty means no file-change requirement.',
|
|
289
|
-
},
|
|
290
|
-
},
|
|
291
|
-
},
|
|
292
|
-
},
|
|
293
|
-
},
|
|
294
|
-
};
|
|
295
|
-
//# sourceMappingURL=verify-plan-execution.js.map
|
|
@@ -1,207 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* web_fetch injection scanner — task, P1 security follow-up.
|
|
3
|
-
*
|
|
4
|
-
* Threat model: a fetched HTTP body (HTML/text) can be authored by a
|
|
5
|
-
* hostile origin attempting prompt injection against the agent that
|
|
6
|
-
* consumes the markdown downstream. The third-party prompt-injection corpus
|
|
7
|
-
* README incident surfaced three forged `<system-reminder>` blocks in
|
|
8
|
-
* a freshly fetched README — date suppression, fake MCP tool listing,
|
|
9
|
-
* and an instruction-override block. The agents on session correctly
|
|
10
|
-
* ignored them, but that is luck, not guarantee.
|
|
11
|
-
*
|
|
12
|
-
* This scanner is the deterministic guard at the WebFetch return path.
|
|
13
|
-
* It runs BEFORE the model ever sees the body. High-severity findings
|
|
14
|
-
* trigger a defense-in-depth wrap (HTML escape + warning prepend) on
|
|
15
|
-
* top of the existing `<untrusted-content-NONCE>` sentinel. Medium/low
|
|
16
|
-
* findings are recorded but the body is passed through; the call site
|
|
17
|
-
* decides what to do with them (current policy: prepend one-line note
|
|
18
|
-
* for med, no-op for low).
|
|
19
|
-
*
|
|
20
|
-
* Pure function, no IO. Regex-driven so we ship zero new deps.
|
|
21
|
-
*/
|
|
22
|
-
/**
|
|
23
|
-
* Zero-width / invisible characters that have been used in prompt
|
|
24
|
-
* injection PoCs to hide instructions inside otherwise plain text.
|
|
25
|
-
* Stripped from `clean` so the model never sees the smuggled bytes.
|
|
26
|
-
*
|
|
27
|
-
* U+200B zero-width space
|
|
28
|
-
* U+200C zero-width non-joiner
|
|
29
|
-
* U+200D zero-width joiner
|
|
30
|
-
* U+2060 word joiner
|
|
31
|
-
* U+FEFF zero-width no-break space (BOM)
|
|
32
|
-
* U+180E mongolian vowel separator
|
|
33
|
-
*/
|
|
34
|
-
const ZERO_WIDTH_RE = /[]/g;
|
|
35
|
-
const HIGH_RULES = [
|
|
36
|
-
// Forged system-reminder envelopes — exactly the vector.
|
|
37
|
-
{ pattern: '<system-reminder>', severity: 'high', re: /<system-reminder\b[^>]*>/i },
|
|
38
|
-
{ pattern: '</system-reminder>', severity: 'high', re: /<\/system-reminder\s*>/i },
|
|
39
|
-
// Other impostor wrappers seen across published PoCs.
|
|
40
|
-
{ pattern: '<important_instructions>', severity: 'high', re: /<important[_\s-]?instructions\b[^>]*>/i },
|
|
41
|
-
{ pattern: '<critical_security_rules>', severity: 'high', re: /<critical[_\s-]?security[_\s-]?rules\b[^>]*>/i },
|
|
42
|
-
{ pattern: '<EXTREMELY_IMPORTANT>', severity: 'high', re: /<extremely[_\s-]?important\b[^>]*>/i },
|
|
43
|
-
// Instruction-override copy with "IMPORTANT: you MUST | override | ignore previous".
|
|
44
|
-
{
|
|
45
|
-
pattern: 'IMPORTANT: instruction override',
|
|
46
|
-
severity: 'high',
|
|
47
|
-
re: /important\s*:.*?(you\s+must|override|ignore\s+previous|disregard\s+previous|ignore\s+all\s+prior)/i,
|
|
48
|
-
},
|
|
49
|
-
// Date manipulation — observed in the external prompt-injection patterns.
|
|
50
|
-
{ pattern: "Today's date is now ...", severity: 'high', re: /today'?s?\s+date\s+is\s+now\b/i },
|
|
51
|
-
// Mimics the system-prompt language for tool execution semantics.
|
|
52
|
-
{ pattern: 'Tools are executed in ...', severity: 'high', re: /tools?\s+are\s+executed\s+in\b/i },
|
|
53
|
-
// Embedded model-name instructions ("You are claude-opus-4-... and you must").
|
|
54
|
-
{
|
|
55
|
-
pattern: 'embedded model-name directive',
|
|
56
|
-
severity: 'high',
|
|
57
|
-
re: /\b(claude-opus-4-|claude-sonnet-4-)[a-z0-9.\-]*/i,
|
|
58
|
-
},
|
|
59
|
-
// Raw ANSI escape — only ever cursor manipulation in fetched markdown.
|
|
60
|
-
{ pattern: 'ANSI escape sequence', severity: 'high', re: /\x1b\[/ },
|
|
61
|
-
];
|
|
62
|
-
const MED_RULES = [
|
|
63
|
-
// Skill-invocation mimicry.
|
|
64
|
-
{ pattern: 'BLOCKING REQUIREMENT', severity: 'med', re: /blocking\s+requirement/i },
|
|
65
|
-
{ pattern: 'you MUST invoke', severity: 'med', re: /you\s+must\s+invoke/i },
|
|
66
|
-
{ pattern: 'Skill tool', severity: 'med', re: /\bskill\s+tool\b/i },
|
|
67
|
-
{ pattern: 'MCP tool', severity: 'med', re: /\bmcp\s+tool\b/i },
|
|
68
|
-
// Tool-name mimicry — bare phrasing without obvious code-block
|
|
69
|
-
// context. These are common English so the rule is intentionally
|
|
70
|
-
// narrow: word-boundary + literal tool name + word "tool".
|
|
71
|
-
{ pattern: 'Bash tool', severity: 'med', re: /\bbash\s+tool\b/i },
|
|
72
|
-
{ pattern: 'Read tool', severity: 'med', re: /\bread\s+tool\b/i },
|
|
73
|
-
{ pattern: 'Edit tool', severity: 'med', re: /\bedit\s+tool\b/i },
|
|
74
|
-
];
|
|
75
|
-
const LOW_RULES = [
|
|
76
|
-
{ pattern: 'system prompt mention', severity: 'low', re: /\bsystem\s+prompt\b/i },
|
|
77
|
-
{ pattern: 'instructions mention', severity: 'low', re: /\binstructions\b/i },
|
|
78
|
-
{ pattern: 'pre-authorized mention', severity: 'low', re: /\bpre[-\s]?authori[sz]ed\b/i },
|
|
79
|
-
];
|
|
80
|
-
/**
|
|
81
|
-
* Detect a suspicious base64 block: >200 contiguous base64 chars on a
|
|
82
|
-
* single line. Base64 is the standard smuggling format for embedded
|
|
83
|
-
* binary blobs in prompt-injection PoCs (hidden tool definitions,
|
|
84
|
-
* obfuscated instruction sets). Below 200 chars we accept the false
|
|
85
|
-
* positives (commit hashes, JWTs, asset URLs); above 200 the signal
|
|
86
|
-
* dominates.
|
|
87
|
-
*/
|
|
88
|
-
const BASE64_BLOCK_RE = /[A-Za-z0-9+/]{200,}={0,2}/;
|
|
89
|
-
/**
|
|
90
|
-
* HTML-escape the five characters that can break out of an element
|
|
91
|
-
* body. Mirrors `escapeForSentinelBody` in web-fetch.ts but applied
|
|
92
|
-
* selectively to flagged tags — we do NOT escape the entire body,
|
|
93
|
-
* only the high-severity matches, so the model still sees readable
|
|
94
|
-
* markdown.
|
|
95
|
-
*/
|
|
96
|
-
function escapeHtml(input) {
|
|
97
|
-
return input
|
|
98
|
-
.replace(/&/g, '&')
|
|
99
|
-
.replace(/</g, '<')
|
|
100
|
-
.replace(/>/g, '>')
|
|
101
|
-
.replace(/"/g, '"')
|
|
102
|
-
.replace(/'/g, ''');
|
|
103
|
-
}
|
|
104
|
-
/**
|
|
105
|
-
* Tags that, when matched at HIGH severity, get HTML-escaped in the
|
|
106
|
-
* cleaned output. The list is intentionally narrow: any `<…>` element
|
|
107
|
-
* whose name matches one of these gets `<` and `>` swapped for
|
|
108
|
-
* entities, so a downstream consumer reads the text literally rather
|
|
109
|
-
* than parsing it as structure.
|
|
110
|
-
*/
|
|
111
|
-
const TAG_NAMES_TO_ESCAPE = [
|
|
112
|
-
'system-reminder',
|
|
113
|
-
'important_instructions',
|
|
114
|
-
'important-instructions',
|
|
115
|
-
'critical_security_rules',
|
|
116
|
-
'critical-security-rules',
|
|
117
|
-
'extremely_important',
|
|
118
|
-
'extremely-important',
|
|
119
|
-
];
|
|
120
|
-
/**
|
|
121
|
-
* Build a single regex that captures any opening/closing tag whose
|
|
122
|
-
* name is in `TAG_NAMES_TO_ESCAPE`. Used by `clean` to escape only
|
|
123
|
-
* the dangerous tags, leaving the rest of the body untouched.
|
|
124
|
-
*/
|
|
125
|
-
const TAG_ESCAPE_RE = new RegExp(`</?(?:${TAG_NAMES_TO_ESCAPE.join('|')})\\b[^>]*>`, 'gi');
|
|
126
|
-
/**
|
|
127
|
-
* Run the rule dictionaries against a body of text and return the
|
|
128
|
-
* scrubbed clean output plus the list of findings.
|
|
129
|
-
*
|
|
130
|
-
* Line numbers are 1-indexed and reference the ORIGINAL body. The
|
|
131
|
-
* caller can rely on them to point at the same line in `clean`
|
|
132
|
-
* because the only structural changes are (1) zero-width strips and
|
|
133
|
-
* (2) HTML escaping of specific tag tokens — neither alters line
|
|
134
|
-
* counts.
|
|
135
|
-
*/
|
|
136
|
-
export function scanForInjection(body) {
|
|
137
|
-
if (!body)
|
|
138
|
-
return { clean: '', findings: [] };
|
|
139
|
-
const findings = [];
|
|
140
|
-
const lines = body.split(/\r?\n/);
|
|
141
|
-
for (let i = 0; i < lines.length; i++) {
|
|
142
|
-
const line = lines[i] ?? '';
|
|
143
|
-
const lineNumber = i + 1;
|
|
144
|
-
for (const rule of HIGH_RULES) {
|
|
145
|
-
if (rule.re.test(line)) {
|
|
146
|
-
findings.push({ pattern: rule.pattern, line: lineNumber, severity: 'high' });
|
|
147
|
-
}
|
|
148
|
-
}
|
|
149
|
-
for (const rule of MED_RULES) {
|
|
150
|
-
if (rule.re.test(line)) {
|
|
151
|
-
findings.push({ pattern: rule.pattern, line: lineNumber, severity: 'med' });
|
|
152
|
-
}
|
|
153
|
-
}
|
|
154
|
-
for (const rule of LOW_RULES) {
|
|
155
|
-
if (rule.re.test(line)) {
|
|
156
|
-
findings.push({ pattern: rule.pattern, line: lineNumber, severity: 'low' });
|
|
157
|
-
}
|
|
158
|
-
}
|
|
159
|
-
if (BASE64_BLOCK_RE.test(line)) {
|
|
160
|
-
findings.push({ pattern: 'long base64 block (>200 chars)', line: lineNumber, severity: 'med' });
|
|
161
|
-
}
|
|
162
|
-
}
|
|
163
|
-
// Always strip zero-width chars from the cleaned output, even when
|
|
164
|
-
// no rule explicitly flagged them. They have no legitimate use in
|
|
165
|
-
// fetched markdown content the model is meant to read.
|
|
166
|
-
let clean = body.replace(ZERO_WIDTH_RE, (match) => {
|
|
167
|
-
findings.push({
|
|
168
|
-
pattern: `zero-width char U+${match.charCodeAt(0).toString(16).toUpperCase().padStart(4, '0')}`,
|
|
169
|
-
line: 0, // multi-line; surfaced separately
|
|
170
|
-
severity: 'high',
|
|
171
|
-
});
|
|
172
|
-
return '';
|
|
173
|
-
});
|
|
174
|
-
// HTML-escape the high-severity impostor tags so a downstream parser
|
|
175
|
-
// (or another LLM) sees text, not structure.
|
|
176
|
-
clean = clean.replace(TAG_ESCAPE_RE, (match) => escapeHtml(match));
|
|
177
|
-
return { clean, findings };
|
|
178
|
-
}
|
|
179
|
-
/**
|
|
180
|
-
* Convenience: return the highest severity present in a findings
|
|
181
|
-
* list, or `null` if the list is empty. `high` > `med` > `low`.
|
|
182
|
-
*/
|
|
183
|
-
export function topSeverity(findings) {
|
|
184
|
-
if (findings.some((f) => f.severity === 'high'))
|
|
185
|
-
return 'high';
|
|
186
|
-
if (findings.some((f) => f.severity === 'med'))
|
|
187
|
-
return 'med';
|
|
188
|
-
if (findings.some((f) => f.severity === 'low'))
|
|
189
|
-
return 'low';
|
|
190
|
-
return null;
|
|
191
|
-
}
|
|
192
|
-
/**
|
|
193
|
-
* Render a one-line summary of high-severity findings for the safety
|
|
194
|
-
* envelope. Stable ordering: by line, then by pattern.
|
|
195
|
-
*/
|
|
196
|
-
export function formatHighFindings(findings) {
|
|
197
|
-
const high = findings.filter((f) => f.severity === 'high');
|
|
198
|
-
if (high.length === 0)
|
|
199
|
-
return '';
|
|
200
|
-
const sorted = [...high].sort((a, b) => {
|
|
201
|
-
if (a.line !== b.line)
|
|
202
|
-
return a.line - b.line;
|
|
203
|
-
return a.pattern.localeCompare(b.pattern);
|
|
204
|
-
});
|
|
205
|
-
return sorted.map((f) => `[${f.severity}] ${f.pattern} @ line ${f.line}`).join('; ');
|
|
206
|
-
}
|
|
207
|
-
//# sourceMappingURL=web-fetch-injection-scanner.js.map
|