npm - @pugi/cli - Versions diffs - 0.1.0-beta.9 → 0.1.0-beta.91 - Mend

@pugi/cli 0.1.0-beta.9 → 0.1.0-beta.91

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (411) hide show

package/CHANGELOG.md +132 -0
package/LICENSE +1 -1
package/assets/pugi-prozr2-mascot.ansi +9 -0
package/bin/run.js +33 -1
package/dist/commands/deploy.js +40 -40
package/dist/commands/flatten.js +191 -0
package/dist/commands/jobs-watch.js +201 -0
package/dist/commands/jobs.js +42 -27
package/dist/commands/smoke.js +133 -0
package/dist/core/agent-progress/cleanup.js +134 -0
package/dist/core/agent-progress/schema.js +144 -0
package/dist/core/agent-progress/writer.js +101 -0
package/dist/core/agents/adaptive-router.js +330 -0
package/dist/core/agents/query-decomposer.js +297 -0
package/dist/core/agents/registry.js +3 -3
package/dist/core/approvals/shortcut-resolver.js +98 -0
package/dist/core/artifact-chain/dispatcher.js +148 -0
package/dist/core/artifact-chain/exporter.js +164 -0
package/dist/core/artifact-chain/state.js +243 -0
package/dist/core/artifact-chain/steps.js +169 -0
package/dist/core/ask-user/question.js +92 -0
package/dist/core/audit/audit-trail.js +275 -0
package/dist/core/auth/ensure-authenticated.js +129 -0
package/dist/core/auth/env-provider.js +238 -0
package/dist/core/auto-open-browser.js +4 -4
package/dist/core/auto-update/channels.js +122 -0
package/dist/core/auto-update/checker.js +241 -0
package/dist/core/auto-update/state.js +235 -0
package/dist/core/bare-mode/index.js +107 -0
package/dist/core/bash/redirect.js +281 -0
package/dist/core/bash-classifier.js +436 -40
package/dist/core/checkpoint/resumer.js +149 -0
package/dist/core/checkpoint/rewinder.js +291 -0
package/dist/core/checkpoints/shadow-git.js +670 -0
package/dist/core/citations/parser.js +109 -0
package/dist/core/classifier/yolo-classifier.js +88 -0
package/dist/core/codegraph/decision-store.js +248 -0
package/dist/core/codegraph/detect-repo.js +459 -0
package/dist/core/codegraph/install.js +134 -0
package/dist/core/codegraph/offer-hook.js +220 -0
package/dist/core/compact/auto-trigger.js +96 -0
package/dist/core/compact/buffer-rewriter.js +115 -0
package/dist/core/compact/summarizer.js +208 -0
package/dist/core/compact/token-counter.js +108 -0
package/dist/core/consensus/anvil-fanout.js +25 -25
package/dist/core/consensus/diff-capture.js +121 -12
package/dist/core/consensus/rubric.js +21 -21
package/dist/core/context/builder.js +6 -6
package/dist/core/context/compaction-events.js +8 -8
package/dist/core/context/compaction.js +31 -31
package/dist/core/context/index.js +15 -8
package/dist/core/context/invariants.js +51 -51
package/dist/core/context/markdown-loader.js +28 -10
package/dist/core/context/markdown-traverse.js +255 -0
package/dist/core/context/pugiignore.js +41 -41
package/dist/core/context/repo-skeleton.js +37 -37
package/dist/core/context/tool-eviction.js +55 -0
package/dist/core/context/watcher.js +32 -32
package/dist/core/context/working-set.js +23 -23
package/dist/core/coordinator/agent-tools.js +77 -0
package/dist/core/coordinator/agent-toolset.js +65 -0
package/dist/core/coordinator/fsm.js +73 -0
package/dist/core/coordinator/mode-fsm.js +70 -0
package/dist/core/cost/rate-card.js +129 -0
package/dist/core/cost/tracker.js +221 -0
package/dist/core/credentials.js +13 -13
package/dist/core/cron/scheduler.js +138 -0
package/dist/core/denial-tracking/index.js +8 -0
package/dist/core/denial-tracking/state.js +264 -0
package/dist/core/diagnostics/probe-runner.js +93 -0
package/dist/core/diagnostics/probes/api.js +46 -0
package/dist/core/diagnostics/probes/auth.js +93 -0
package/dist/core/diagnostics/probes/bare-mode.js +42 -0
package/dist/core/diagnostics/probes/cli-version.js +127 -0
package/dist/core/diagnostics/probes/config.js +72 -0
package/dist/core/diagnostics/probes/denial-tracking.js +57 -0
package/dist/core/diagnostics/probes/disk.js +81 -0
package/dist/core/diagnostics/probes/engine-live.js +46 -0
package/dist/core/diagnostics/probes/git.js +65 -0
package/dist/core/diagnostics/probes/hooks.js +118 -0
package/dist/core/diagnostics/probes/mcp.js +75 -0
package/dist/core/diagnostics/probes/node.js +59 -0
package/dist/core/diagnostics/probes/pnpm.js +36 -0
package/dist/core/diagnostics/probes/pugi-md.js +89 -0
package/dist/core/diagnostics/probes/sandbox.js +40 -0
package/dist/core/diagnostics/probes/session.js +74 -0
package/dist/core/diagnostics/probes/status-snapshot.js +488 -0
package/dist/core/diagnostics/probes/workspace.js +63 -0
package/dist/core/diagnostics/types.js +70 -0
package/dist/core/dispatch/cache-cleanup.js +197 -0
package/dist/core/dispatch/cache-handoff.js +295 -0
package/dist/core/edits/apply-patch-layer-e.js +189 -0
package/dist/core/edits/dispatch.js +333 -7
package/dist/core/edits/format-detector.js +260 -0
package/dist/core/edits/format-matrix.js +26 -0
package/dist/core/edits/fuzzy-ladder.js +650 -0
package/dist/core/edits/index.js +5 -1
package/dist/core/edits/journal.js +199 -0
package/dist/core/edits/layer-a-apply.js +15 -15
package/dist/core/edits/layer-a-fuzzy-apply.js +198 -0
package/dist/core/edits/layer-b-apply.js +9 -9
package/dist/core/edits/layer-c-apply.js +6 -6
package/dist/core/edits/layer-d-ast.js +557 -14
package/dist/core/edits/marker-parser.js +12 -12
package/dist/core/edits/security-gate.js +27 -27
package/dist/core/edits/verify-hook.js +273 -0
package/dist/core/edits/worktree.js +29 -29
package/dist/core/engine/anvil-client.js +214 -26
package/dist/core/engine/auto-compact.js +179 -0
package/dist/core/engine/budgets.js +186 -0
package/dist/core/engine/context-prefix.js +155 -0
package/dist/core/engine/index.js +1 -1
package/dist/core/engine/intensity.js +158 -0
package/dist/core/engine/intent.js +260 -0
package/dist/core/engine/native-pugi.js +1295 -227
package/dist/core/engine/prompts.js +129 -19
package/dist/core/engine/strip-internal-fields.js +124 -0
package/dist/core/engine/tool-bridge.js +1792 -59
package/dist/core/evaluation/golden-dataset.js +293 -0
package/dist/core/feedback/queue.js +177 -0
package/dist/core/feedback/submitter.js +145 -0
package/dist/core/file-cache.js +113 -1
package/dist/core/flatten/flatten-repo.js +439 -0
package/dist/core/format/osc8-link.js +28 -0
package/dist/core/hook-chains.js +392 -0
package/dist/core/hooks/citation-verify-hook.js +138 -0
package/dist/core/hooks/citation-verify.js +112 -0
package/dist/core/hooks/events.js +46 -0
package/dist/core/hooks/index.js +15 -0
package/dist/core/hooks/registry.js +216 -0
package/dist/core/hooks/runner.js +236 -0
package/dist/core/hooks/v2/event-emitter.js +115 -0
package/dist/core/hooks/v2/executor.js +282 -0
package/dist/core/hooks/v2/index.js +25 -0
package/dist/core/hooks/v2/lifecycle.js +104 -0
package/dist/core/hooks/v2/loader.js +216 -0
package/dist/core/hooks/v2/matcher.js +125 -0
package/dist/core/hooks/v2/trust.js +143 -0
package/dist/core/hooks/v2/types.js +86 -0
package/dist/core/hooks/worktree-events.js +158 -0
package/dist/core/image/renderer.js +71 -0
package/dist/core/init/detector.js +582 -0
package/dist/core/init/template-renderer.js +242 -0
package/dist/core/jobs/registry.js +18 -18
package/dist/core/ledger/results-tsv.js +142 -0
package/dist/core/log-discipline/stdout-redirect.js +51 -0
package/dist/core/lsp/cache.js +105 -0
package/dist/core/lsp/client.js +551 -41
package/dist/core/lsp/language-detect.js +66 -0
package/dist/core/lsp/post-edit-diagnostics.js +171 -0
package/dist/core/lsp/server-detect.js +173 -0
package/dist/core/lsp/symbol-cache.js +162 -0
package/dist/core/lsp/symbol-tools.js +664 -0
package/dist/core/mcp/client.js +97 -28
package/dist/core/mcp/http-server.js +553 -0
package/dist/core/mcp/orchestrator-tools.js +662 -0
package/dist/core/mcp/permission.js +190 -0
package/dist/core/mcp/registry.js +39 -17
package/dist/core/mcp/server-tools.js +219 -0
package/dist/core/mcp/server.js +397 -0
package/dist/core/mcp/trust.js +10 -10
package/dist/core/memory/dual-write.js +416 -0
package/dist/core/memory/passive-extract.js +130 -0
package/dist/core/memory/phase1-kinds.js +20 -0
package/dist/core/memory/secret-scanner.js +304 -0
package/dist/core/memory-sync/queue.js +170 -0
package/dist/core/metrics/extract.js +113 -0
package/dist/core/modes/roo-modes.js +68 -0
package/dist/core/onboarding/ensure-initialized.js +133 -0
package/dist/core/onboarding/marker.js +111 -0
package/dist/core/onboarding/telemetry-state.js +108 -0
package/dist/core/output-style/presets.js +176 -0
package/dist/core/output-style/state.js +185 -0
package/dist/core/path-security.js +287 -5
package/dist/core/permission.js +82 -22
package/dist/core/permissions/auto-classifier.js +124 -0
package/dist/core/permissions/bash-parser.js +371 -0
package/dist/core/permissions/circuit-breaker.js +83 -0
package/dist/core/permissions/constrained-edit.js +91 -0
package/dist/core/permissions/gate.js +278 -0
package/dist/core/permissions/index.js +20 -0
package/dist/core/permissions/mode.js +174 -0
package/dist/core/permissions/network-egress.js +137 -0
package/dist/core/permissions/state.js +241 -0
package/dist/core/permissions/tool-class.js +93 -0
package/dist/core/plan-mode/ui-state.js +51 -0
package/dist/core/plans/plan-artifact.js +721 -0
package/dist/core/policy-limits/etag-store.js +122 -0
package/dist/core/prd-check/parser.js +215 -0
package/dist/core/prd-check/reporter.js +127 -0
package/dist/core/prd-check/session-review.js +557 -0
package/dist/core/prd-check/verifiers.js +223 -0
package/dist/core/prompt-cache/client-cache.js +99 -0
package/dist/core/prompts/assembly.js +29 -0
package/dist/core/prompts/registry.js +364 -0
package/dist/core/pugi-md/cc-compat-rules.js +735 -0
package/dist/core/pugi-md/context-injector.js +76 -0
package/dist/core/pugi-md/walk-up.js +207 -0
package/dist/core/python/uv-installer.js +270 -0
package/dist/core/python/uv-resolver.js +83 -0
package/dist/core/rate-limit/narrator.js +146 -0
package/dist/core/recipes/cli-types.js +20 -0
package/dist/core/recipes/loader.js +103 -0
package/dist/core/recipes/runner.js +345 -0
package/dist/core/recipes/schema.js +587 -0
package/dist/core/release-notes/parser.js +241 -0
package/dist/core/release-notes/state.js +116 -0
package/dist/core/repl/ask.js +37 -37
package/dist/core/repl/cancellation.js +26 -26
package/dist/core/repl/cap-warning.js +4 -4
package/dist/core/repl/clipboard-read.js +11 -11
package/dist/core/repl/dispatch-fsm.js +12 -12
package/dist/core/repl/history-search.js +15 -15
package/dist/core/repl/history.js +28 -18
package/dist/core/repl/kill-ring.js +5 -5
package/dist/core/repl/model-pricing.js +135 -0
package/dist/core/repl/privacy-banner.js +22 -22
package/dist/core/repl/session.js +2148 -217
package/dist/core/repl/slash-commands.js +501 -41
package/dist/core/repl/store/index.js +1 -1
package/dist/core/repl/store/jsonl-log.js +22 -22
package/dist/core/repl/store/lockfile.js +10 -10
package/dist/core/repl/store/session-store.js +136 -107
package/dist/core/repl/store/types.js +15 -15
package/dist/core/repl/store/uuid-v7.js +12 -12
package/dist/core/repl/workspace-context.js +43 -21
package/dist/core/repo-map/build.js +125 -0
package/dist/core/repo-map/cache.js +185 -0
package/dist/core/repo-map/extractor.js +254 -0
package/dist/core/repo-map/formatter.js +145 -0
package/dist/core/repo-map/page-rank.js +105 -0
package/dist/core/repo-map/scanner.js +211 -0
package/dist/core/retry-budget/budget.js +284 -0
package/dist/core/retry-budget/index.js +5 -0
package/dist/core/retry-budget/retry-cap.js +74 -0
package/dist/core/routing/lead-worker.js +43 -0
package/dist/core/routing/pre-flight-estimator.js +108 -0
package/dist/core/runs/run-tree.js +103 -0
package/dist/core/security/injection-scanner.js +367 -0
package/dist/core/security/output-filter.js +418 -0
package/dist/core/session/env-file.js +105 -0
package/dist/core/session/section-budgets.js +140 -0
package/dist/core/session.js +92 -0
package/dist/core/settings.js +324 -5
package/dist/core/share/formatter.js +271 -0
package/dist/core/share/redactor.js +221 -0
package/dist/core/share/uploader.js +267 -0
package/dist/core/skills/defaults.js +30 -30
package/dist/core/skills/loader.js +22 -22
package/dist/core/skills/sources.js +27 -27
package/dist/core/smoke/headless-driver.js +174 -0
package/dist/core/smoke/orchestrator.js +194 -0
package/dist/core/smoke/runner.js +238 -0
package/dist/core/smoke/scenario-parser.js +316 -0
package/dist/core/statusline.js +99 -0
package/dist/core/subagents/dispatcher-real.js +600 -0
package/dist/core/subagents/dispatcher.js +132 -43
package/dist/core/subagents/index.js +19 -6
package/dist/core/subagents/isolation-matrix.js +213 -0
package/dist/core/subagents/spawn.js +19 -4
package/dist/core/telemetry/emitter.js +229 -0
package/dist/core/telemetry/queue.js +251 -0
package/dist/core/theme/context.js +91 -0
package/dist/core/theme/presets.js +228 -0
package/dist/core/theme/state.js +181 -0
package/dist/core/todos/invariant.js +10 -0
package/dist/core/todos/state.js +177 -0
package/dist/core/tool-schema/compressor.js +89 -0
package/dist/core/transport/version-interceptor.js +166 -0
package/dist/core/trust.js +2 -2
package/dist/core/tui/thinking-block.js +64 -0
package/dist/core/vim/keymap.js +288 -0
package/dist/core/vim/state.js +92 -0
package/dist/core/watch-markers/marker-watcher.js +133 -0
package/dist/core/worktree/include-parser.js +249 -0
package/dist/core/worktree-manager/cleanup.js +123 -0
package/dist/core/worktree-manager/manager.js +303 -0
package/dist/index.js +36 -0
package/dist/runtime/bootstrap.js +190 -0
package/dist/runtime/cli.js +4185 -549
package/dist/runtime/commands/agents.js +31 -31
package/dist/runtime/commands/budget.js +5 -5
package/dist/runtime/commands/cancel.js +231 -0
package/dist/runtime/commands/chain.js +489 -0
package/dist/runtime/commands/codegraph-status.js +227 -0
package/dist/runtime/commands/compact.js +297 -0
package/dist/runtime/commands/config.js +73 -39
package/dist/runtime/commands/cost.js +199 -0
package/dist/runtime/commands/delegate.js +27 -4
package/dist/runtime/commands/dispatch.js +126 -0
package/dist/runtime/commands/doctor.js +579 -0
package/dist/runtime/commands/feedback.js +184 -0
package/dist/runtime/commands/hooks.js +187 -0
package/dist/runtime/commands/init.js +254 -0
package/dist/runtime/commands/lsp.js +200 -38
package/dist/runtime/commands/mcp.js +879 -0
package/dist/runtime/commands/memory.js +582 -0
package/dist/runtime/commands/model.js +237 -0
package/dist/runtime/commands/onboarding.js +275 -0
package/dist/runtime/commands/patch.js +12 -12
package/dist/runtime/commands/permissions.js +112 -0
package/dist/runtime/commands/plan.js +143 -0
package/dist/runtime/commands/prd-check.js +285 -0
package/dist/runtime/commands/privacy.js +17 -17
package/dist/runtime/commands/recipe.js +325 -0
package/dist/runtime/commands/redo-blob-store.js +92 -0
package/dist/runtime/commands/redo.js +361 -0
package/dist/runtime/commands/release-notes.js +229 -0
package/dist/runtime/commands/repo-map.js +95 -0
package/dist/runtime/commands/report.js +299 -0
package/dist/runtime/commands/resume.js +118 -0
package/dist/runtime/commands/review-consensus.js +68 -53
package/dist/runtime/commands/rewind.js +333 -0
package/dist/runtime/commands/roster.js +14 -14
package/dist/runtime/commands/sessions.js +163 -0
package/dist/runtime/commands/share.js +316 -0
package/dist/runtime/commands/skills.js +31 -31
package/dist/runtime/commands/status.js +186 -0
package/dist/runtime/commands/stickers.js +82 -0
package/dist/runtime/commands/style.js +194 -0
package/dist/runtime/commands/theme.js +196 -0
package/dist/runtime/commands/undo.js +54 -22
package/dist/runtime/commands/update.js +289 -0
package/dist/runtime/commands/vim.js +140 -0
package/dist/runtime/commands/worktree.js +8 -8
package/dist/runtime/commands/worktrees.js +155 -0
package/dist/runtime/headless-repl.js +195 -0
package/dist/runtime/headless.js +543 -0
package/dist/runtime/load-hooks-or-exit.js +71 -0
package/dist/runtime/plan-decompose.js +22 -22
package/dist/runtime/sigint-guard.js +272 -0
package/dist/runtime/update-check.js +28 -28
package/dist/runtime/version.js +65 -0
package/dist/runtime/worktree-bootstrap.js +579 -0
package/dist/skills/bundled/batch.js +617 -0
package/dist/skills/bundled/index.js +45 -0
package/dist/skills/bundled/loop.js +358 -0
package/dist/skills/bundled/remember.js +383 -0
package/dist/skills/bundled/simplify.js +289 -0
package/dist/skills/bundled/skillify.js +373 -0
package/dist/skills/bundled/stuck.js +558 -0
package/dist/skills/bundled/verify.js +439 -0
package/dist/testing/vcr.js +486 -0
package/dist/tools/agent-tool.js +229 -0
package/dist/tools/apply-patch.js +89 -28
package/dist/tools/ask-user-question.js +337 -0
package/dist/tools/ask-user.js +115 -0
package/dist/tools/bash.js +624 -46
package/dist/tools/brief.js +224 -0
package/dist/tools/cron.js +433 -0
package/dist/tools/enter-worktree.js +250 -0
package/dist/tools/exit-worktree.js +147 -0
package/dist/tools/file-tools.js +161 -44
package/dist/tools/lsp-tools.js +377 -1
package/dist/tools/mcp-tool.js +260 -0
package/dist/tools/multi-edit.js +361 -0
package/dist/tools/powershell.js +268 -0
package/dist/tools/registry.js +99 -4
package/dist/tools/skill-tool.js +96 -0
package/dist/tools/sleep.js +99 -0
package/dist/tools/synthetic-output.js +133 -0
package/dist/tools/tasks.js +208 -0
package/dist/tools/todo-write.js +184 -0
package/dist/tools/verify-plan-execution.js +295 -0
package/dist/tools/web-fetch-injection-scanner.js +207 -0
package/dist/tools/web-fetch.js +195 -10
package/dist/tools/web-search.js +458 -0
package/dist/tui/agent-progress-card.js +111 -0
package/dist/tui/agent-tree.js +11 -1
package/dist/tui/ask-modal.js +14 -14
package/dist/tui/ask-user-question-chips.js +315 -0
package/dist/tui/ask-user-question-prompt.js +203 -0
package/dist/tui/compact-banner.js +81 -0
package/dist/tui/conversation-pane.js +85 -11
package/dist/tui/cost-table.js +111 -0
package/dist/tui/device-flow.js +2 -2
package/dist/tui/doctor-table.js +46 -0
package/dist/tui/feedback-prompt.js +156 -0
package/dist/tui/input-box.js +247 -32
package/dist/tui/login-picker.js +3 -3
package/dist/tui/markdown-render.js +6 -6
package/dist/tui/multi-file-diff-approval.js +375 -0
package/dist/tui/onboarding-wizard.js +240 -0
package/dist/tui/permissions-picker.js +86 -0
package/dist/tui/render.js +36 -1
package/dist/tui/repl-render.js +176 -25
package/dist/tui/repl-splash-art.js +16 -16
package/dist/tui/repl-splash-mascot.js +48 -24
package/dist/tui/repl-splash.js +22 -22
package/dist/tui/repl.js +125 -45
package/dist/tui/slash-palette.js +6 -6
package/dist/tui/splash.js +2 -2
package/dist/tui/status-bar.js +109 -31
package/dist/tui/status-table.js +7 -0
package/dist/tui/stickers-art.js +136 -0
package/dist/tui/style-table.js +28 -0
package/dist/tui/theme-table.js +29 -0
package/dist/tui/thinking-spinner.js +123 -0
package/dist/tui/tool-stream-pane.js +53 -4
package/dist/tui/update-banner.js +27 -2
package/dist/tui/vim-input.js +267 -0
package/dist/tui/welcome-banner.js +107 -0
package/dist/tui/welcome-data.js +293 -0
package/dist/tui/workspace-context.js +2 -2
package/package.json +31 -16
package/test/scenarios/codegen-create-file.scenario.txt +13 -0
package/test/scenarios/compact-force.scenario.txt +12 -0
package/test/scenarios/identity.scenario.txt +12 -0
package/test/scenarios/persona-handoff.scenario.txt +12 -0
package/test/scenarios/walkback.scenario.txt +12 -0
package/dist/core/engine/compaction-hook.js +0 -154

package/dist/core/evaluation/golden-dataset.js ADDED Viewed

@@ -0,0 +1,293 @@
+/**
+ * Golden dataset primitive — pugi-eval-v1 foundation.
+ *
+ * Formalizes a frozen set of representative CLI tasks that we replay
+ * against the agent loop to detect quality regressions. This module is
+ * the pure data layer:
+ *
+ *  1. `GoldenTask` — typed contract for one evaluation case (id, query,
+ *     expected file touches, expected output substrings, exit-code
+ *     gate, soft budgets, tags).
+ *  2. `loadGoldenDataset(path)` — reads a JSON file from disk, asserts
+ *     the top-level value is an array, runs `validateGoldenTask` on
+ *     every element, and rejects duplicate ids. Throws on the first
+ *     malformed entry so the eval harness cannot silently drop a task.
+ *  3. `validateGoldenTask(raw)` — schema validator. Enforces kebab-case
+ *     ids, non-empty query, optional arrays whose elements are
+ *     well-formed, and rejects parent-traversal `..` segments inside
+ *     `expectedFiles`. Throws `TypeError` with a specific field message.
+ *  4. `diffAgainstBaseline(current, baseline)` — turns two `TaskResult`
+ *     maps into a `DriftReport` that lists regressed / improved / new /
+ *     removed tasks. A regression is a task that PASSED in baseline and
+ *     FAILED in current; an improvement is the inverse. The report is
+ *     what the future CI gate consumes — a positive `regressed.length`
+ *     blocks the merge.
+ *
+ * Out of scope here: actually running tasks against the engine. The
+ * follow-up `runOfflineEval()` consumer reads a dataset via
+ * `loadGoldenDataset`, executes each task through `pugi code/explain/
+ * plan/fix/build`, collects pass/fail/latency/tokens into a
+ * `TaskResult[]`, and feeds the previous run's results into
+ * `diffAgainstBaseline` for the drift gate.
+ *
+ * Pure functions only. No file I/O beyond `fs/promises.readFile` inside
+ * `loadGoldenDataset` so the module composes cleanly with in-memory test
+ * fixtures and engine-side consumers that already hold dataset bytes.
+ */
+import { readFile } from 'node:fs/promises';
+const ID_PATTERN = /^[a-z][a-z0-9-]*$/;
+/**
+ * Validate one raw value as a `GoldenTask`. Throws `TypeError` with a
+ * field-specific message on any violation. Returns the typed task on
+ * success.
+ *
+ * The validator is intentionally hand-rolled — the shape is small, and
+ * adding zod here would obscure the per-field error contract that the
+ * eval harness logs at load time.
+ *
+ * Field rules as implemented below:
+ *  - `id`: required non-empty string matching `ID_PATTERN`.
+ *  - `query`: required non-empty string.
+ *  - `expectedFiles` / `expectedSubstrings`: optional; when present they
+ *    must be non-empty arrays of non-empty strings. `expectedFiles`
+ *    entries must not start with `/` and must not contain a `..`
+ *    segment when split on `/` (backslash separators are not
+ *    inspected).
+ *  - `expectedExitCode`: optional integer (any sign).
+ *  - `maxTokens` / `maxLatencyMs`: optional integers greater than zero.
+ *  - `tags`: optional array of non-empty strings; unlike the other
+ *    array fields, an empty array is accepted.
+ *
+ * Properties on `raw` other than the ones listed above are not copied
+ * onto the returned task.
+ *
+ * @param raw - Candidate value, e.g. one element of a parsed JSON array.
+ * @returns A new object holding `id`, `query`, and only those optional
+ *   fields that were present on `raw`; array fields are fresh copies.
+ * @throws {TypeError} On the first rule violated, in the order the
+ *   fields are checked below.
+ */
+export function validateGoldenTask(raw) {
+    if (typeof raw !== 'object' || raw === null || Array.isArray(raw)) {
+        throw new TypeError('golden task must be a JSON object');
+    }
+    const r = raw;
+    // id — required, kebab-case.
+    if (typeof r.id !== 'string' || r.id.length === 0) {
+        throw new TypeError('golden task: `id` required (non-empty string)');
+    }
+    if (!ID_PATTERN.test(r.id)) {
+        throw new TypeError(`golden task ${JSON.stringify(r.id)}: \`id\` must match ${ID_PATTERN.source} (kebab-case, leading letter)`);
+    }
+    const id = r.id;
+    // query — required.
+    if (typeof r.query !== 'string' || r.query.length === 0) {
+        throw new TypeError(`golden task ${id}: \`query\` required (non-empty string)`);
+    }
+    const query = r.query;
+    // expectedFiles — optional, when present must be non-empty array of
+    // relative paths without traversal.
+    let expectedFiles;
+    if (r.expectedFiles !== undefined) {
+        if (!Array.isArray(r.expectedFiles)) {
+            throw new TypeError(`golden task ${id}: \`expectedFiles\` must be an array`);
+        }
+        if (r.expectedFiles.length === 0) {
+            throw new TypeError(`golden task ${id}: \`expectedFiles\` must be non-empty (omit field instead of passing [])`);
+        }
+        expectedFiles = r.expectedFiles.map((entry, idx) => {
+            if (typeof entry !== 'string' || entry.length === 0) {
+                throw new TypeError(`golden task ${id}: \`expectedFiles[${idx}]\` must be a non-empty string`);
+            }
+            if (entry.startsWith('/')) {
+                throw new TypeError(`golden task ${id}: \`expectedFiles[${idx}]\` must be relative (no leading /)`);
+            }
+            const segments = entry.split('/');
+            if (segments.some((s) => s === '..')) {
+                throw new TypeError(`golden task ${id}: \`expectedFiles[${idx}]\` contains \`..\` traversal`);
+            }
+            return entry;
+        });
+    }
+    // expectedSubstrings — optional array of non-empty strings.
+    let expectedSubstrings;
+    if (r.expectedSubstrings !== undefined) {
+        if (!Array.isArray(r.expectedSubstrings)) {
+            throw new TypeError(`golden task ${id}: \`expectedSubstrings\` must be an array`);
+        }
+        if (r.expectedSubstrings.length === 0) {
+            throw new TypeError(`golden task ${id}: \`expectedSubstrings\` must be non-empty (omit field instead of passing [])`);
+        }
+        expectedSubstrings = r.expectedSubstrings.map((entry, idx) => {
+            if (typeof entry !== 'string' || entry.length === 0) {
+                throw new TypeError(`golden task ${id}: \`expectedSubstrings[${idx}]\` must be a non-empty string`);
+            }
+            return entry;
+        });
+    }
+    // expectedExitCode — optional integer.
+    let expectedExitCode;
+    if (r.expectedExitCode !== undefined) {
+        if (typeof r.expectedExitCode !== 'number' ||
+            !Number.isInteger(r.expectedExitCode)) {
+            throw new TypeError(`golden task ${id}: \`expectedExitCode\` must be an integer`);
+        }
+        expectedExitCode = r.expectedExitCode;
+    }
+    // maxTokens — optional positive integer.
+    let maxTokens;
+    if (r.maxTokens !== undefined) {
+        if (typeof r.maxTokens !== 'number' ||
+            !Number.isInteger(r.maxTokens) ||
+            r.maxTokens <= 0) {
+            throw new TypeError(`golden task ${id}: \`maxTokens\` must be a positive integer`);
+        }
+        maxTokens = r.maxTokens;
+    }
+    // maxLatencyMs — optional positive integer.
+    let maxLatencyMs;
+    if (r.maxLatencyMs !== undefined) {
+        if (typeof r.maxLatencyMs !== 'number' ||
+            !Number.isInteger(r.maxLatencyMs) ||
+            r.maxLatencyMs <= 0) {
+            throw new TypeError(`golden task ${id}: \`maxLatencyMs\` must be a positive integer`);
+        }
+        maxLatencyMs = r.maxLatencyMs;
+    }
+    // tags — optional array of non-empty strings.
+    let tags;
+    if (r.tags !== undefined) {
+        if (!Array.isArray(r.tags)) {
+            throw new TypeError(`golden task ${id}: \`tags\` must be an array`);
+        }
+        tags = r.tags.map((entry, idx) => {
+            if (typeof entry !== 'string' || entry.length === 0) {
+                throw new TypeError(`golden task ${id}: \`tags[${idx}]\` must be a non-empty string`);
+            }
+            return entry;
+        });
+    }
+    const task = { id, query };
+    if (expectedFiles !== undefined)
+        task.expectedFiles = expectedFiles;
+    if (expectedSubstrings !== undefined)
+        task.expectedSubstrings = expectedSubstrings;
+    if (expectedExitCode !== undefined)
+        task.expectedExitCode = expectedExitCode;
+    if (maxTokens !== undefined)
+        task.maxTokens = maxTokens;
+    if (maxLatencyMs !== undefined)
+        task.maxLatencyMs = maxLatencyMs;
+    if (tags !== undefined)
+        task.tags = tags;
+    return task;
+}
+/**
+ * Load and validate a golden dataset JSON file. The file must parse as
+ * a JSON array of objects, each one a valid `GoldenTask`. Duplicate
+ * ids are rejected — drift comparisons key by id and a duplicate would
+ * silently mask one row.
+ *
+ * An empty array passes every check here and yields `[]`. Underlying
+ * read / parse / validation failures are re-thrown as `TypeError` with
+ * the original message embedded in the new message; the original error
+ * object itself is not attached.
+ *
+ * @param filePath - Path handed to `readFile` (decoded as UTF-8); also
+ *   interpolated into every error message.
+ * @returns Promise resolving to the validated tasks, in file order.
+ * @throws {TypeError} When the file cannot be read, is not valid JSON,
+ *   is not a top-level array, contains an entry rejected by
+ *   `validateGoldenTask` (message includes the entry index), or
+ *   repeats a task id.
+ */
+export async function loadGoldenDataset(filePath) {
+    let raw;
+    try {
+        raw = await readFile(filePath, 'utf8');
+    }
+    catch (err) {
+        const message = err instanceof Error ? err.message : String(err);
+        throw new TypeError(`golden dataset: cannot read ${filePath}: ${message}`);
+    }
+    let parsed;
+    try {
+        parsed = JSON.parse(raw);
+    }
+    catch (err) {
+        const message = err instanceof Error ? err.message : String(err);
+        throw new TypeError(`golden dataset ${filePath}: invalid JSON (${message})`);
+    }
+    if (!Array.isArray(parsed)) {
+        throw new TypeError(`golden dataset ${filePath}: top-level value must be a JSON array`);
+    }
+    const tasks = [];
+    const seen = new Set();
+    for (let i = 0; i < parsed.length; i += 1) {
+        let task;
+        try {
+            task = validateGoldenTask(parsed[i]);
+        }
+        catch (err) {
+            const message = err instanceof Error ? err.message : String(err);
+            throw new TypeError(`golden dataset ${filePath}: entry [${i}]: ${message}`);
+        }
+        if (seen.has(task.id)) {
+            throw new TypeError(`golden dataset ${filePath}: duplicate task id ${JSON.stringify(task.id)} at entry [${i}]`);
+        }
+        seen.add(task.id);
+        tasks.push(task);
+    }
+    return tasks;
+}
+/**
+ * Compare a current run against a baseline run and return a drift
+ * report. Pure function — no I/O, no clock, deterministic ordering
+ * (regressed/improved sorted by id).
+ *
+ * Either input may be empty. An empty baseline produces an
+ * all-newTasks report without crashing — useful for the very first
+ * eval run when no previous artifact exists yet.
+ *
+ * Rows whose `id` is not a non-empty string are skipped. When an id
+ * repeats within one input, the last row wins. `passed` is read by
+ * truthiness. Tasks present in both runs whose pass state did not
+ * change appear in none of the four lists.
+ *
+ * @param currentResults - Iterable of result rows (`id`, `passed`,
+ *   optional `reason`) for the current run.
+ * @param baselineResults - Iterable of result rows for the baseline run.
+ * @param [options] - `includeReason` (default `true`): copy the current
+ *   row's `reason` onto regressed / improved entries when it is defined.
+ * @returns Report with `totalTasks` (count of distinct current ids),
+ *   `passedNow`, `passedBaseline`, `regressed`, `improved`, `newTasks`
+ *   and `removedTasks`. `regressed` / `improved` are ordered with
+ *   `localeCompare` on id; `newTasks` / `removedTasks` use the default
+ *   `Array.prototype.sort` ordering.
+ */
+export function diffAgainstBaseline(currentResults, baselineResults, options) {
+    const includeReason = options?.includeReason ?? true;
+    const currentById = new Map();
+    for (const r of currentResults) {
+        if (typeof r.id !== 'string' || r.id.length === 0)
+            continue;
+        currentById.set(r.id, r);
+    }
+    const baselineById = new Map();
+    for (const r of baselineResults) {
+        if (typeof r.id !== 'string' || r.id.length === 0)
+            continue;
+        baselineById.set(r.id, r);
+    }
+    const regressed = [];
+    const improved = [];
+    const newTasks = [];
+    const removedTasks = [];
+    for (const [id, currentRow] of currentById) {
+        const baselineRow = baselineById.get(id);
+        if (!baselineRow) {
+            newTasks.push(id);
+            continue;
+        }
+        if (baselineRow.passed && !currentRow.passed) {
+            const diff = {
+                id,
+                baselinePassed: true,
+                currentPassed: false,
+            };
+            if (includeReason && currentRow.reason !== undefined) {
+                diff.reason = currentRow.reason;
+            }
+            regressed.push(diff);
+        }
+        else if (!baselineRow.passed && currentRow.passed) {
+            const diff = {
+                id,
+                baselinePassed: false,
+                currentPassed: true,
+            };
+            if (includeReason && currentRow.reason !== undefined) {
+                diff.reason = currentRow.reason;
+            }
+            improved.push(diff);
+        }
+    }
+    for (const id of baselineById.keys()) {
+        if (!currentById.has(id)) {
+            removedTasks.push(id);
+        }
+    }
+    regressed.sort((a, b) => a.id.localeCompare(b.id));
+    improved.sort((a, b) => a.id.localeCompare(b.id));
+    newTasks.sort();
+    removedTasks.sort();
+    let passedNow = 0;
+    for (const r of currentById.values()) {
+        if (r.passed)
+            passedNow += 1;
+    }
+    let passedBaseline = 0;
+    for (const r of baselineById.values()) {
+        if (r.passed)
+            passedBaseline += 1;
+    }
+    return {
+        totalTasks: currentById.size,
+        passedNow,
+        passedBaseline,
+        regressed,
+        improved,
+        newTasks,
+        removedTasks,
+    };
+}
+//# sourceMappingURL=golden-dataset.js.map

package/dist/core/feedback/queue.js ADDED Viewed

@@ -0,0 +1,177 @@
+/**
+ * Local feedback queue.
+ *
+ * `pugi feedback` POSTs collected operator feedback to the admin-api
+ * `/api/pugi/feedback` route. When that round-trip fails (endpoint
+ * missing, network down, server 5xx), the submitter falls back to
+ * appending the envelope to `<cwd>/.pugi/feedback-queue.jsonl`. On the
+ * next online session the flusher drains the queue silently in the
+ * background.
+ *
+ * # Module contract
+ *
+ *  - Per-workspace storage. The queue file lives at
+ *    `<cwd>/.pugi/feedback-queue.jsonl` so the operator-visible state
+ *    stays alongside the project's other Pugi metadata. Multi-repo
+ *    operators get one queue per repo — matches the rest of `.pugi/`.
+ *
+ *  - JSONL append-only format. One envelope per line. Newlines inside
+ *    the comment field are escaped as `\n` by `JSON.stringify`. The
+ *    enqueue path uses an atomic `O_APPEND` write so concurrent
+ *    `pugi feedback` invocations from a split-screen REPL + shell do
+ *    not interleave half-records.
+ *
+ *  - The flusher is best-effort. It returns counts but never throws —
+ *    a failed flush leaves the queue untouched and a successful flush
+ *    atomically rewrites the file with the remaining (unsubmitted)
+ *    envelopes. Partial-success is the normal path when the server
+ *    accepts the first N but 5xx's the (N+1)th.
+ *
+ *  - The queue file is intentionally NOT readable by anything beyond
+ *    the flusher. The operator's free-text comments are confidential
+ *    — we do not surface them in `/status` / `/doctor` / telemetry.
+ *
+ *  - All filesystem writes go through `mkdirSync({recursive: true})`
+ *    so the first-ever enqueue on a fresh workspace lazily creates
+ *    `.pugi/` without depending on an earlier `pugi init`.
+ */
+import { appendFileSync, existsSync, mkdirSync, readFileSync, renameSync, writeFileSync, } from 'node:fs';
+import { dirname, resolve } from 'node:path';
+/**
+ * Resolve the queue file path for a workspace. Centralised so the
+ * submitter + flusher + tests agree on a single canonical location.
+ */
+export function feedbackQueuePath(cwd) {
+    return resolve(cwd, '.pugi', 'feedback-queue.jsonl');
+}
+/**
+ * Append one envelope atomically. Uses `O_APPEND` semantics via
+ * `appendFileSync` so concurrent invocations from a split-screen
+ * REPL + shell cannot interleave bytes mid-line.
+ *
+ * Returns the absolute path written so callers can surface it in the
+ * "Feedback queued locally" toast.
+ */
+export function enqueueFeedback(env, cwd) {
+    const path = feedbackQueuePath(cwd);
+    mkdirSync(dirname(path), { recursive: true });
+    // JSON.stringify of an object never emits raw newlines; the trailing
+    // '\n' is the line separator. JSONL parsers split on '\n' so the
+    // separator survives round-trips.
+    const line = `${JSON.stringify(env)}\n`;
+    appendFileSync(path, line, { encoding: 'utf8' });
+    return path;
+}
+export function readFeedbackQueue(cwd) {
+    const path = feedbackQueuePath(cwd);
+    if (!existsSync(path)) {
+        return { envelopes: [], parseErrors: [] };
+    }
+    const contents = readFileSync(path, 'utf8');
+    const lines = contents.split('\n');
+    const envelopes = [];
+    const parseErrors = [];
+    for (let i = 0; i < lines.length; i += 1) {
+        const raw = lines[i]?.trim();
+        if (!raw)
+            continue;
+        try {
+            const parsed = JSON.parse(raw);
+            // Minimal shape check — we don't full-validate here because the
+            // server is the trust boundary. Just guard against obvious
+            // corruption that would make the line un-submittable.
+            if (typeof parsed.category === 'string'
+                && typeof parsed.rating === 'number'
+                && typeof parsed.comment === 'string'
+                && typeof parsed.ts === 'string'
+                && typeof parsed.cliVersion === 'string') {
+                envelopes.push(parsed);
+            }
+            else {
+                parseErrors.push(i + 1);
+            }
+        }
+        catch {
+            parseErrors.push(i + 1);
+        }
+    }
+    return { envelopes, parseErrors };
+}
+/**
+ * Rewrite the queue file atomically with the remaining (unsubmitted)
+ * envelopes. Called by the flusher after a partial-success drain.
+ *
+ * Atomicity: write to a sibling `.tmp` then rename. On a crash mid-
+ * rewrite the original file is preserved (rename is atomic on POSIX
+ * + on NTFS via `MoveFileEx`).
+ */
+export function rewriteFeedbackQueue(remaining, cwd) {
+    const path = feedbackQueuePath(cwd);
+    if (remaining.length === 0) {
+        // Clear the file by truncating to empty. Done in-place — we still
+        // want the file to exist (presence signals an active workspace)
+        // but with zero bytes so the next read returns no envelopes.
+        if (existsSync(path)) {
+            writeFileSync(path, '', { encoding: 'utf8' });
+        }
+        return;
+    }
+    mkdirSync(dirname(path), { recursive: true });
+    const tmp = `${path}.tmp`;
+    const body = remaining.map((env) => JSON.stringify(env)).join('\n') + '\n';
+    writeFileSync(tmp, body, { encoding: 'utf8' });
+    // Use writeFileSync's atomic-replace semantics by going through
+    // tmp + rename. Node's `fs.renameSync` is the atomic primitive
+    // on POSIX. We avoid `fs.writeFileSync` directly on `path`
+    // because writeFileSync truncates first which leaves a brief
+    // window of zero-byte state if the process is killed mid-write.
+    renameSync(tmp, path);
+}
+/**
+ * Drain the queue. Best-effort: each envelope is submitted in order;
+ * a `false` return keeps it in the queue for the next attempt; a
+ * `true` return removes it. After all envelopes are processed the
+ * queue file is rewritten with the unsubmitted ones.
+ *
+ * The function NEVER throws — it returns a structured result and
+ * the caller decides whether to log / surface failures. This keeps
+ * the silent-background-drain path on session-start safe.
+ */
+export async function flushFeedbackQueue(cwd, submit) {
+    const { envelopes, parseErrors } = readFeedbackQueue(cwd);
+    if (envelopes.length === 0) {
+        return {
+            attempted: 0,
+            succeeded: 0,
+            failed: 0,
+            failedEnvelopes: [],
+            parseErrors,
+        };
+    }
+    let succeeded = 0;
+    const failedEnvelopes = [];
+    for (const env of envelopes) {
+        let ok = false;
+        try {
+            ok = await submit(env);
+        }
+        catch {
+            ok = false;
+        }
+        if (ok) {
+            succeeded += 1;
+        }
+        else {
+            failedEnvelopes.push(env);
+        }
+    }
+    rewriteFeedbackQueue(failedEnvelopes, cwd);
+    return {
+        attempted: envelopes.length,
+        succeeded,
+        failed: failedEnvelopes.length,
+        failedEnvelopes,
+        parseErrors,
+    };
+}
+//# sourceMappingURL=queue.js.map

package/dist/core/feedback/submitter.js ADDED Viewed

@@ -0,0 +1,145 @@
+/**
+ * Feedback POST submitter.
+ *
+ * Submits one `FeedbackEnvelope` to the admin-api `/api/pugi/feedback`
+ * route. Designed for graceful degradation:
+ *
+ *  - 200/201/204               → success
+ *  - 404 / route not found     → "endpoint missing, fall back to queue"
+ *  - 4xx (other)               → permanent — discard (do NOT requeue)
+ *  - 5xx / network error / abort → transient — caller should enqueue
+ *
+ * The submitter does NOT touch the local queue. The caller wires the
+ * submitter to `enqueueFeedback` on a `transient` result, and to a
+ * silent log on a `permanent` failure. This split keeps the submitter
+ * a pure HTTP wrapper that the flusher (`flushFeedbackQueue`) can
+ * reuse without filesystem side effects.
+ */
+/**
+ * Fallback request timeout in milliseconds. `submitFeedback` aborts
+ * the request after this long when `config.timeoutMs` is not set.
+ */
+const DEFAULT_TIMEOUT_MS = 8000;
+/**
+ * Build the absolute submit URL from the base API URL. Centralised so
+ * the spec can reference one canonical place when asserting the
+ * outgoing path. The leading slash is normalised so a base URL with
+ * or without trailing slash both produce a well-formed URL.
+ */
+export function feedbackSubmitUrl(apiUrl) {
+    const base = apiUrl.replace(/\/+$/u, '');
+    return `${base}/api/pugi/feedback`;
+}
+/**
+ * Submit one envelope. See `FeedbackSubmitResult` for the contract.
+ *
+ * Never throws — every failure path is mapped to a result variant so
+ * callers do not need a try/catch boundary.
+ */
+export async function submitFeedback(env, config) {
+    const url = feedbackSubmitUrl(config.apiUrl);
+    const fetchImpl = config.fetchImpl ?? fetch;
+    const timeoutMs = config.timeoutMs ?? DEFAULT_TIMEOUT_MS;
+    const controller = new AbortController();
+    const timer = setTimeout(() => controller.abort(), timeoutMs);
+    try {
+        const headers = {
+            'content-type': 'application/json',
+            'user-agent': `pugi-cli/${env.cliVersion}`,
+        };
+        if (config.apiKey) {
+            headers['authorization'] = `Bearer ${config.apiKey}`;
+        }
+        const res = await fetchImpl(url, {
+            method: 'POST',
+            headers,
+            body: JSON.stringify(env),
+            signal: controller.signal,
+        });
+        const status = res.status;
+        if (status >= 200 && status < 300) {
+            return { kind: 'ok', httpStatus: status };
+        }
+        if (status === 404) {
+            // The most common transient cause: admin-api hasn't shipped the
+            // route yet. Treat as retry-worthy so once the controller lands
+            // a future flush picks it up.
+            return {
+                kind: 'transient',
+                reason: 'admin-api /api/pugi/feedback not deployed yet',
+                httpStatus: status,
+            };
+        }
+        if (status >= 500) {
+            return {
+                kind: 'transient',
+                reason: `server error ${status}`,
+                httpStatus: status,
+            };
+        }
+        // Any other 4xx — auth failure, payload rejected, rate-limit
+        // exceeded. None of those will fix themselves on a silent retry,
+        // so we mark them permanent. The operator sees a one-line error
+        // and the envelope is dropped (not queued).
+        return {
+            kind: 'permanent',
+            reason: `client error ${status}`,
+            httpStatus: status,
+        };
+    }
+    catch (err) {
+        const message = err instanceof Error ? err.message : String(err);
+        // AbortController.abort fires when the timeout elapses. We treat
+        // it as transient so the queue picks it up on the next online
+        // session. Same for plain network errors (`fetch failed`, ECONNREFUSED).
+        return { kind: 'transient', reason: `network: ${message}` };
+    }
+    finally {
+        clearTimeout(timer);
+    }
+}
+/**
+ * Bundle the last N turns of the conversation into a redacted
+ * `FeedbackSessionContext`. The redactor:
+ *
+ *  - Caps at 5 turns (most recent). Older context is dropped — the
+ *    submitter never sees it.
+ *  - Truncates each turn to 240 chars + ellipsis. Operator comments
+ *    are the primary signal; raw transcript is just disambiguation.
+ *  - Strips bearer tokens, JWT-like blobs, and `PUGI_API_KEY=`-style
+ *    env-var prefixes. Conservative — we'd rather drop a few
+ *    non-secret characters than leak a key.
+ *
+ * The function is pure + sync so tests can pin its output without a
+ * worktree harness.
+ */
+export function redactSessionContext(turns, options = {}) {
+    const lastFive = turns.slice(-5);
+    const previewed = lastFive.map((turn) => ({
+        role: turn.role,
+        preview: redactPreview(truncate(turn.text, 240)),
+    }));
+    return {
+        turnCount: previewed.length,
+        turns: previewed,
+        ...(options.gitBranch ? { gitBranch: options.gitBranch } : {}),
+    };
+}
+function truncate(s, max) {
+    if (s.length <= max)
+        return s;
+    return `${s.slice(0, max - 1)}…`;
+}
+/**
+ * Conservative secret-blanking. The rules:
+ *  - Bearer tokens: `Bearer <token>` → `Bearer ***REDACTED***`
+ *  - Long base64/JWT-ish blobs (≥ 40 chars of [A-Za-z0-9_-/=+]):
+ *    replace the inner middle with `***`. Keeps a head + tail so the
+ *    operator can still spot which kind of secret it was.
+ *  - `PUGI_API_KEY=...` and similar `*_KEY=`/`*_TOKEN=` lookalikes:
+ *    replace the value with `***REDACTED***`.
+ */
+function redactPreview(s) {
+    let out = s;
+    out = out.replace(/bearer\s+[A-Za-z0-9._-]{20,}/giu, 'Bearer ***REDACTED***');
+    out = out.replace(/([A-Z][A-Z0-9_]*?(?:KEY|TOKEN|SECRET|PASSWORD))\s*=\s*\S+/gu, '$1=***REDACTED***');
+    out = out.replace(/\b([A-Za-z0-9_-]{6})[A-Za-z0-9_/+=-]{30,}([A-Za-z0-9_-]{4})\b/gu, '$1***$2');
+    return out;
+}
+//# sourceMappingURL=submitter.js.map