@pugi/cli 0.1.0-beta.3 → 0.1.0-beta.30

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (218) hide show
  1. package/THIRD_PARTY_NOTICES.md +40 -0
  2. package/assets/pugi-mascot.ansi +15 -40
  3. package/bin/run.js +33 -1
  4. package/dist/commands/jobs-watch.js +201 -0
  5. package/dist/commands/jobs.js +15 -0
  6. package/dist/core/agent-progress/cleanup.js +134 -0
  7. package/dist/core/agent-progress/schema.js +144 -0
  8. package/dist/core/agent-progress/writer.js +101 -0
  9. package/dist/core/artifact-chain/dispatcher.js +148 -0
  10. package/dist/core/artifact-chain/exporter.js +164 -0
  11. package/dist/core/artifact-chain/state.js +243 -0
  12. package/dist/core/artifact-chain/steps.js +169 -0
  13. package/dist/core/auth/env-provider.js +238 -0
  14. package/dist/core/auto-update/channels.js +122 -0
  15. package/dist/core/auto-update/checker.js +241 -0
  16. package/dist/core/auto-update/state.js +235 -0
  17. package/dist/core/bare-mode/index.js +107 -0
  18. package/dist/core/checkpoint/resumer.js +149 -0
  19. package/dist/core/checkpoint/rewinder.js +291 -0
  20. package/dist/core/compact/auto-trigger.js +96 -0
  21. package/dist/core/compact/buffer-rewriter.js +115 -0
  22. package/dist/core/compact/summarizer.js +208 -0
  23. package/dist/core/compact/token-counter.js +108 -0
  24. package/dist/core/consensus/diff-capture.js +73 -0
  25. package/dist/core/context/index.js +7 -0
  26. package/dist/core/context/markdown-traverse.js +255 -0
  27. package/dist/core/cost/rate-card.js +129 -0
  28. package/dist/core/cost/tracker.js +221 -0
  29. package/dist/core/denial-tracking/index.js +8 -0
  30. package/dist/core/denial-tracking/state.js +264 -0
  31. package/dist/core/diagnostics/probe-runner.js +93 -0
  32. package/dist/core/diagnostics/probes/api.js +46 -0
  33. package/dist/core/diagnostics/probes/auth.js +86 -0
  34. package/dist/core/diagnostics/probes/bare-mode.js +42 -0
  35. package/dist/core/diagnostics/probes/cli-version.js +127 -0
  36. package/dist/core/diagnostics/probes/config.js +72 -0
  37. package/dist/core/diagnostics/probes/denial-tracking.js +57 -0
  38. package/dist/core/diagnostics/probes/disk.js +81 -0
  39. package/dist/core/diagnostics/probes/git.js +65 -0
  40. package/dist/core/diagnostics/probes/mcp.js +75 -0
  41. package/dist/core/diagnostics/probes/node.js +59 -0
  42. package/dist/core/diagnostics/probes/pnpm.js +36 -0
  43. package/dist/core/diagnostics/probes/pugi-md.js +89 -0
  44. package/dist/core/diagnostics/probes/session.js +74 -0
  45. package/dist/core/diagnostics/probes/status-snapshot.js +442 -0
  46. package/dist/core/diagnostics/probes/workspace.js +63 -0
  47. package/dist/core/diagnostics/types.js +70 -0
  48. package/dist/core/dispatch/cache-cleanup.js +197 -0
  49. package/dist/core/dispatch/cache-handoff.js +295 -0
  50. package/dist/core/edits/dispatch.js +218 -2
  51. package/dist/core/edits/journal.js +199 -0
  52. package/dist/core/edits/layer-d-ast.js +557 -14
  53. package/dist/core/edits/verify-hook.js +273 -0
  54. package/dist/core/edits/worktree.js +111 -18
  55. package/dist/core/engine/anvil-client.js +115 -5
  56. package/dist/core/engine/budgets.js +89 -0
  57. package/dist/core/engine/context-prefix.js +155 -0
  58. package/dist/core/engine/intent.js +260 -0
  59. package/dist/core/engine/native-pugi.js +852 -210
  60. package/dist/core/engine/prompts.js +89 -6
  61. package/dist/core/engine/strip-internal-fields.js +124 -0
  62. package/dist/core/engine/tool-bridge.js +972 -33
  63. package/dist/core/feedback/queue.js +177 -0
  64. package/dist/core/feedback/submitter.js +145 -0
  65. package/dist/core/file-cache.js +113 -1
  66. package/dist/core/hooks/events.js +44 -0
  67. package/dist/core/hooks/index.js +15 -0
  68. package/dist/core/hooks/registry.js +213 -0
  69. package/dist/core/hooks/runner.js +236 -0
  70. package/dist/core/init/scaffold.js +195 -0
  71. package/dist/core/lsp/cache.js +105 -0
  72. package/dist/core/lsp/client.js +174 -29
  73. package/dist/core/lsp/language-detect.js +66 -0
  74. package/dist/core/lsp/post-edit-diagnostics.js +171 -0
  75. package/dist/core/mcp/client.js +75 -6
  76. package/dist/core/mcp/http-server.js +553 -0
  77. package/dist/core/mcp/permission.js +190 -0
  78. package/dist/core/mcp/registry.js +24 -2
  79. package/dist/core/mcp/server-tools.js +219 -0
  80. package/dist/core/mcp/server.js +397 -0
  81. package/dist/core/memory/dual-write.js +416 -0
  82. package/dist/core/memory/dual-write.spec.js +297 -0
  83. package/dist/core/memory/phase1-kinds.js +20 -0
  84. package/dist/core/memory-sync/queue.js +158 -0
  85. package/dist/core/memory-sync/queue.spec.js +105 -0
  86. package/dist/core/onboarding/marker.js +111 -0
  87. package/dist/core/onboarding/telemetry-state.js +108 -0
  88. package/dist/core/output-style/presets.js +176 -0
  89. package/dist/core/output-style/state.js +185 -0
  90. package/dist/core/permissions/gate.js +187 -0
  91. package/dist/core/permissions/index.js +18 -0
  92. package/dist/core/permissions/mode.js +102 -0
  93. package/dist/core/permissions/state.js +215 -0
  94. package/dist/core/permissions/tool-class.js +93 -0
  95. package/dist/core/prd-check/parser.js +215 -0
  96. package/dist/core/prd-check/reporter.js +127 -0
  97. package/dist/core/prd-check/verifiers.js +223 -0
  98. package/dist/core/pugi-md/context-injector.js +76 -0
  99. package/dist/core/pugi-md/walk-up.js +207 -0
  100. package/dist/core/release-notes/parser.js +241 -0
  101. package/dist/core/release-notes/state.js +116 -0
  102. package/dist/core/repl/codebase-survey.js +308 -0
  103. package/dist/core/repl/history.js +11 -1
  104. package/dist/core/repl/init-interview.js +457 -0
  105. package/dist/core/repl/model-pricing.js +135 -0
  106. package/dist/core/repl/onboarding-state.js +297 -0
  107. package/dist/core/repl/session.js +1486 -30
  108. package/dist/core/repl/slash-commands.js +345 -9
  109. package/dist/core/repl/store/session-store.js +31 -2
  110. package/dist/core/repl/workspace-context.js +22 -0
  111. package/dist/core/repo-map/build.js +125 -0
  112. package/dist/core/repo-map/cache.js +185 -0
  113. package/dist/core/repo-map/extractor.js +254 -0
  114. package/dist/core/repo-map/formatter.js +145 -0
  115. package/dist/core/repo-map/scanner.js +211 -0
  116. package/dist/core/retry-budget/budget.js +284 -0
  117. package/dist/core/retry-budget/index.js +5 -0
  118. package/dist/core/session.js +44 -0
  119. package/dist/core/settings.js +80 -0
  120. package/dist/core/share/formatter.js +271 -0
  121. package/dist/core/share/redactor.js +221 -0
  122. package/dist/core/share/uploader.js +267 -0
  123. package/dist/core/skills/defaults.js +457 -0
  124. package/dist/core/subagents/dispatcher-real.js +600 -0
  125. package/dist/core/subagents/dispatcher.js +113 -24
  126. package/dist/core/subagents/index.js +18 -5
  127. package/dist/core/subagents/isolation-matrix.js +213 -0
  128. package/dist/core/subagents/spawn.js +19 -4
  129. package/dist/core/telemetry/emitter.js +229 -0
  130. package/dist/core/telemetry/queue.js +251 -0
  131. package/dist/core/theme/context.js +91 -0
  132. package/dist/core/theme/presets.js +228 -0
  133. package/dist/core/theme/state.js +181 -0
  134. package/dist/core/todos/invariant.js +10 -0
  135. package/dist/core/todos/state.js +177 -0
  136. package/dist/core/transport/version-interceptor.js +166 -0
  137. package/dist/core/vim/keymap.js +288 -0
  138. package/dist/core/vim/state.js +92 -0
  139. package/dist/index.js +28 -0
  140. package/dist/runtime/bootstrap.js +190 -0
  141. package/dist/runtime/cli.js +2595 -278
  142. package/dist/runtime/commands/chain.js +489 -0
  143. package/dist/runtime/commands/compact.js +297 -0
  144. package/dist/runtime/commands/cost.js +199 -0
  145. package/dist/runtime/commands/delegate.js +312 -0
  146. package/dist/runtime/commands/dispatch.js +126 -0
  147. package/dist/runtime/commands/doctor.js +390 -0
  148. package/dist/runtime/commands/feedback.js +184 -0
  149. package/dist/runtime/commands/hooks.js +184 -0
  150. package/dist/runtime/commands/lsp.js +212 -28
  151. package/dist/runtime/commands/mcp.js +824 -0
  152. package/dist/runtime/commands/memory.js +508 -0
  153. package/dist/runtime/commands/memory.spec.js +174 -0
  154. package/dist/runtime/commands/model.js +237 -0
  155. package/dist/runtime/commands/onboarding.js +275 -0
  156. package/dist/runtime/commands/patch.js +17 -0
  157. package/dist/runtime/commands/permissions.js +87 -0
  158. package/dist/runtime/commands/plan.js +143 -0
  159. package/dist/runtime/commands/prd-check.js +235 -0
  160. package/dist/runtime/commands/release-notes.js +229 -0
  161. package/dist/runtime/commands/repo-map.js +95 -0
  162. package/dist/runtime/commands/report.js +299 -0
  163. package/dist/runtime/commands/resume.js +118 -0
  164. package/dist/runtime/commands/review-consensus.js +17 -2
  165. package/dist/runtime/commands/rewind.js +333 -0
  166. package/dist/runtime/commands/roster.js +117 -0
  167. package/dist/runtime/commands/sessions.js +163 -0
  168. package/dist/runtime/commands/share.js +316 -0
  169. package/dist/runtime/commands/status.js +178 -0
  170. package/dist/runtime/commands/stickers.js +82 -0
  171. package/dist/runtime/commands/style.js +194 -0
  172. package/dist/runtime/commands/theme.js +196 -0
  173. package/dist/runtime/commands/update.js +289 -0
  174. package/dist/runtime/commands/vim.js +140 -0
  175. package/dist/runtime/commands/worktree.js +50 -6
  176. package/dist/runtime/headless.js +543 -0
  177. package/dist/runtime/load-hooks-or-exit.js +71 -0
  178. package/dist/runtime/plan-decompose.js +531 -0
  179. package/dist/runtime/version.js +65 -0
  180. package/dist/tools/agent-tool.js +229 -0
  181. package/dist/tools/apply-patch.js +281 -39
  182. package/dist/tools/ask-user-question.js +213 -0
  183. package/dist/tools/ask-user.js +115 -0
  184. package/dist/tools/file-tools.js +85 -14
  185. package/dist/tools/mcp-tool.js +260 -0
  186. package/dist/tools/multi-edit.js +361 -0
  187. package/dist/tools/registry.js +30 -2
  188. package/dist/tools/skill-tool.js +96 -0
  189. package/dist/tools/tasks.js +208 -0
  190. package/dist/tools/todo-write.js +184 -0
  191. package/dist/tools/web-fetch.js +147 -2
  192. package/dist/tools/web-search.js +458 -0
  193. package/dist/tui/agent-progress-card.js +111 -0
  194. package/dist/tui/agent-tree.js +10 -0
  195. package/dist/tui/ask-modal.js +2 -2
  196. package/dist/tui/ask-user-question-prompt.js +192 -0
  197. package/dist/tui/compact-banner.js +81 -0
  198. package/dist/tui/conversation-pane.js +82 -8
  199. package/dist/tui/cost-table.js +111 -0
  200. package/dist/tui/doctor-table.js +46 -0
  201. package/dist/tui/feedback-prompt.js +156 -0
  202. package/dist/tui/input-box.js +46 -2
  203. package/dist/tui/markdown-render.js +4 -4
  204. package/dist/tui/onboarding-wizard.js +240 -0
  205. package/dist/tui/repl-render.js +293 -35
  206. package/dist/tui/repl-splash.js +2 -2
  207. package/dist/tui/repl.js +45 -13
  208. package/dist/tui/splash.js +1 -1
  209. package/dist/tui/status-bar.js +94 -16
  210. package/dist/tui/status-table.js +7 -0
  211. package/dist/tui/stickers-art.js +136 -0
  212. package/dist/tui/style-table.js +28 -0
  213. package/dist/tui/theme-table.js +29 -0
  214. package/dist/tui/tool-stream-pane.js +7 -0
  215. package/dist/tui/update-banner.js +20 -2
  216. package/dist/tui/vim-input.js +267 -0
  217. package/docs/examples/codegraph.mcp.json +10 -0
  218. package/package.json +9 -6
@@ -0,0 +1,115 @@
1
+ /**
2
+ * Type guard: discriminate a SessionEvent against the `compaction`
3
+ * kind. Used by replay code so the boundary marker drives a different
4
+ * code path than `user`/`persona`/`system` transcript rows.
5
+ */
6
+ export function isCompactBoundary(event) {
7
+ if (event.kind !== 'compaction')
8
+ return false;
9
+ const p = event.payload;
10
+ if (p === null || typeof p !== 'object')
11
+ return false;
12
+ if (p.version !== 1)
13
+ return false;
14
+ if (p.trigger !== 'manual' && p.trigger !== 'auto')
15
+ return false;
16
+ if (typeof p.summary !== 'string' || p.summary.length === 0)
17
+ return false;
18
+ if (typeof p.summaryTokenCount !== 'number')
19
+ return false;
20
+ if (typeof p.summaryTurnsBefore !== 'number')
21
+ return false;
22
+ if (typeof p.keptTailTurns !== 'number')
23
+ return false;
24
+ if (typeof p.coversUntilOffset !== 'number')
25
+ return false;
26
+ return true;
27
+ }
28
+ /**
29
+ * Append one `compaction` boundary marker to the SessionStore. Returns
30
+ * the SessionEvent we wrote so the caller can echo it into the in-
31
+ * memory transcript without a re-read. Throws on store error so the
32
+ * caller surfaces the failure inline.
33
+ */
34
+ export async function appendCompactBoundary(input) {
35
+ const ts = (input.now ?? (() => Date.now()))();
36
+ const payload = {
37
+ version: 1,
38
+ trigger: input.trigger,
39
+ summary: input.summary,
40
+ summaryTokenCount: input.summaryTokenCount,
41
+ summaryTurnsBefore: input.summaryTurnsBefore,
42
+ keptTailTurns: input.keptTailTurns,
43
+ coversUntilOffset: input.coversUntilOffset,
44
+ };
45
+ const event = {
46
+ t: ts,
47
+ kind: 'compaction',
48
+ payload,
49
+ };
50
+ await input.store.appendEvent(event);
51
+ return event;
52
+ }
53
+ /**
54
+ * Apply replay masking to a chronological event list. Given the full
55
+ * ordered events.jsonl content, return only the events the caller
56
+ * should render: every event AFTER the latest `compaction` boundary,
57
+ * plus the boundary itself (so the renderer can show the banner +
58
+ * summary), and the K kept-tail events that landed BEFORE the boundary
59
+ * but were preserved per the marker's `keptTailTurns`.
60
+ *
61
+ * Mask logic:
62
+ * 1. Walk events. Find the LATEST boundary by offset.
63
+ * 2. Index 0 .. coversUntilOffset-1 are masked, EXCEPT the last
64
+ * `keptTailTurns` of that range (which are the verbatim tail).
65
+ * 3. The boundary event itself + everything after it stays.
66
+ *
67
+ * Why we expose this here (and not in session.ts): keeping the mask
68
+ * logic next to the writer means the wire format is owned by one
69
+ * module. session.ts depends on this; this depends on nothing in
70
+ * session.ts. Unidirectional.
71
+ */
72
+ export function applyCompactMask(events) {
73
+ // Find latest compaction event.
74
+ let latestIdx = -1;
75
+ let latestPayload = null;
76
+ for (let i = events.length - 1; i >= 0; i -= 1) {
77
+ const ev = events[i];
78
+ if (isCompactBoundary(ev)) {
79
+ latestIdx = i;
80
+ latestPayload = ev.payload;
81
+ break;
82
+ }
83
+ }
84
+ if (latestIdx === -1 || latestPayload === null) {
85
+ return events;
86
+ }
87
+ // `coversUntilOffset` is the count of events that existed in the
88
+ // store immediately before the marker append. Events 0 ..
89
+ // coversUntilOffset-1 are summarised; events keptTailTurns of them
90
+ // are surfaced anyway as the verbatim tail.
91
+ const cap = Math.max(0, Math.min(latestPayload.coversUntilOffset, latestIdx));
92
+ const tailKeepCount = Math.max(0, Math.min(latestPayload.keptTailTurns, cap));
93
+ // Take the LAST tailKeepCount events from the masked range, but only
94
+ // those that represent renderable turns (user/persona/system).
95
+ // Boundary markers and tool stream events are NOT counted as turns
96
+ // for the tail-keep window — using them would let the keptTailTurns
97
+ // budget be consumed by infra events and the operator would lose
98
+ // the last K real turns. The spec is about "last K human-visible
99
+ // turns", not "last K events".
100
+ const tailSlice = [];
101
+ for (let i = cap - 1; i >= 0 && tailSlice.length < tailKeepCount; i -= 1) {
102
+ const ev = events[i];
103
+ if (ev.kind === 'user' || ev.kind === 'persona' || ev.kind === 'system') {
104
+ tailSlice.push(ev);
105
+ }
106
+ }
107
+ tailSlice.reverse();
108
+ // After the marker: everything that landed AFTER the boundary
109
+ // append. These are post-compaction events the user has not yet
110
+ // seen folded into a summary; they pass through verbatim.
111
+ const afterMarker = events.slice(latestIdx + 1);
112
+ const markerEvent = events[latestIdx];
113
+ return [...tailSlice, markerEvent, ...afterMarker];
114
+ }
115
+ //# sourceMappingURL=buffer-rewriter.js.map
@@ -0,0 +1,208 @@
1
+ import { estimateTokens } from './token-counter.js';
2
+ /**
3
+ * System prompt for the summarizer. Six closed sections + brand
4
+ * voice clamp + "no tool calls" sentinel. The headings are stable
5
+ * markdown so a downstream renderer can split + reformat without
6
+ * re-parsing the model output.
7
+ *
8
+ * Why the explicit `If a section has no content` rule: empty sections
9
+ * cost zero tokens but their absence is meaningful — the second model
10
+ * reading the memo learns "no decisions were made yet" from the empty
11
+ * `## Decisions` header. Without the rule we observed models silently
12
+ * dropping empty sections and the reader could not distinguish "no
13
+ * decisions" from "summarizer forgot the section".
14
+ */
15
+ const SUMMARIZE_SYSTEM_PROMPT = [
16
+ 'You are the Pugi conversation summarizer. Compress the supplied',
17
+ 'transcript into a six-section memo. Operator picks the work back up',
18
+ 'from this memo — accuracy and completeness matter more than brevity.',
19
+ '',
20
+ 'OUTPUT FORMAT (verbatim section headings, in this order):',
21
+ '',
22
+ "## Intent",
23
+ '(What the operator is trying to accomplish, in one paragraph.)',
24
+ '',
25
+ "## Decisions",
26
+ '(Bullet list of decisions made + the reasoning. Empty section means',
27
+ 'no decisions yet — render the heading anyway.)',
28
+ '',
29
+ "## Files",
30
+ '(Bullet list of file paths touched, with one-line "why".)',
31
+ '',
32
+ "## Errors",
33
+ '(Bullet list of errors encountered + how each was resolved. Empty',
34
+ 'means no errors — still render the heading.)',
35
+ '',
36
+ "## Tools",
37
+ '(Bullet list of notable tool calls and their outcomes. Group similar',
38
+ 'calls; the goal is to surface meaningful state changes, not log',
39
+ 'every Read.)',
40
+ '',
41
+ "## Next",
42
+ '(One paragraph: the immediate next planned action.)',
43
+ '',
44
+ 'RULES:',
45
+ '- Do not invent state. Only summarise what is in the transcript.',
46
+ '- Preserve file paths verbatim.',
47
+ '- Do not call any tools (you have none).',
48
+ '- Do not address the operator. Write in third person.',
49
+ '- No emoji. No em dashes.',
50
+ ].join('\n');
51
+ /**
52
+ * Convert a slice of session events into the user message body the
53
+ * summarizer ingests. We keep the format simple: one event per line,
54
+ * prefixed with the kind, so the model can see role boundaries. Tool
55
+ * outputs are length-capped at 4 KB each so a single 200 KB grep result
56
+ * does not blow the summarizer's own context budget.
57
+ */
58
+ const TOOL_PAYLOAD_CAP_BYTES = 4096;
59
+ export function renderEventsForSummary(events) {
60
+ const lines = [];
61
+ for (const event of events) {
62
+ const rendered = renderOneEvent(event);
63
+ if (rendered !== null)
64
+ lines.push(rendered);
65
+ }
66
+ return lines.join('\n');
67
+ }
68
+ function renderOneEvent(event) {
69
+ const payload = (event.payload ?? null);
70
+ switch (event.kind) {
71
+ case 'user': {
72
+ const text = stringField(payload, 'brief') ?? stringField(payload, 'text') ?? '';
73
+ if (text.length === 0)
74
+ return null;
75
+ return `[operator] ${text}`;
76
+ }
77
+ case 'persona': {
78
+ const text = stringField(payload, 'text') ?? '';
79
+ if (text.length === 0)
80
+ return null;
81
+ const slug = stringField(payload, 'personaSlug') ?? 'persona';
82
+ return `[${slug}] ${text}`;
83
+ }
84
+ case 'system': {
85
+ const text = stringField(payload, 'text') ?? '';
86
+ if (text.length === 0)
87
+ return null;
88
+ return `[system] ${text}`;
89
+ }
90
+ case 'tool.start': {
91
+ const toolName = stringField(payload, 'toolName') ?? 'unknown';
92
+ const args = stringField(payload, 'args') ?? '';
93
+ return `[tool.start ${toolName}] ${truncate(args, TOOL_PAYLOAD_CAP_BYTES)}`;
94
+ }
95
+ case 'tool.result': {
96
+ const toolName = stringField(payload, 'toolName') ?? 'unknown';
97
+ const result = stringField(payload, 'result') ?? '';
98
+ return `[tool.result ${toolName}] ${truncate(result, TOOL_PAYLOAD_CAP_BYTES)}`;
99
+ }
100
+ case 'agent.spawned': {
101
+ const slug = stringField(payload, 'personaSlug') ?? 'unknown';
102
+ return `[agent.spawned ${slug}]`;
103
+ }
104
+ case 'agent.completed': {
105
+ const slug = stringField(payload, 'personaSlug') ?? 'unknown';
106
+ return `[agent.completed ${slug}]`;
107
+ }
108
+ case 'compaction': {
109
+ // Pre-existing compact marker — its `summary` payload IS the
110
+ // condensed form of older history. We pass it through verbatim so
111
+ // the summarizer treats it as already-summarised state and folds
112
+ // it into the new memo (rather than re-summarising garbage).
113
+ const summary = stringField(payload, 'summary') ?? '';
114
+ if (summary.length === 0)
115
+ return null;
116
+ return `[prior compaction]\n${summary}`;
117
+ }
118
+ case 'rewind-marker': {
119
+ // L9 (2026-05-27): rewind tombstones are infrastructure rows that
120
+ // describe a transcript edit, not conversation content. They
121
+ // never carry user-visible prose; the summariser drops them so
122
+ // the produced memo focuses on actual operator/persona turns.
123
+ // The masked range (events the marker covers) is already elided
124
+ // by `applyRewindMask` before this function is reached, so the
125
+ // summariser only sees a marker when it sits OUTSIDE every active
126
+ // rewind range — in which case the marker has already been
127
+ // cancelled by an undo-rewind and contributes nothing.
128
+ return null;
129
+ }
130
+ default: {
131
+ // Forward-compat: unknown kinds get a structural fingerprint so
132
+ // the summarizer can still represent them.
133
+ const exhaustive = event.kind;
134
+ void exhaustive;
135
+ return null;
136
+ }
137
+ }
138
+ }
139
+ function stringField(payload, key) {
140
+ if (!payload)
141
+ return undefined;
142
+ const value = payload[key];
143
+ return typeof value === 'string' ? value : undefined;
144
+ }
145
+ function truncate(s, capBytes) {
146
+ if (Buffer.byteLength(s, 'utf8') <= capBytes)
147
+ return s;
148
+ // Naive cut on UTF-16 chars — good enough for the summarizer; we
149
+ // append a marker so the model knows content was elided.
150
+ return `${s.slice(0, Math.floor(capBytes / 2))}\n... [truncated]`;
151
+ }
152
+ /**
153
+ * Run one summarisation round. Throws on transport error (the caller
154
+ * surfaces a one-line message to the operator and aborts the compact).
155
+ * Returns the structured result on success.
156
+ */
157
+ export async function summarizeEvents(input) {
158
+ if (input.events.length === 0) {
159
+ throw new SummarizerError('refusing-to-summarize-empty-slice', 'No events to summarize.');
160
+ }
161
+ const userBody = renderEventsForSummary(input.events);
162
+ if (userBody.length === 0) {
163
+ throw new SummarizerError('refusing-to-summarize-empty-slice', 'All events rendered as empty.');
164
+ }
165
+ const messages = [
166
+ { role: 'system', content: SUMMARIZE_SYSTEM_PROMPT },
167
+ { role: 'user', content: userBody },
168
+ ];
169
+ const response = await input.client.send(messages, [], {
170
+ personaSlug: input.personaSlug,
171
+ tag: { tag: 'summarize' },
172
+ maxTokens: 2048,
173
+ temperature: 0.1,
174
+ ...(input.model !== undefined ? { model: input.model } : {}),
175
+ ...(input.signal !== undefined ? { signal: input.signal } : {}),
176
+ });
177
+ if (response.stop === 'error') {
178
+ throw new SummarizerError(response.code, `Summarizer transport failed: ${response.message}`);
179
+ }
180
+ if (response.stop === 'tool_use') {
181
+ // Sanity guard. We pass tools: [] so the model should not be able
182
+ // to invoke any; if Anvil's prompt template ever leaks tool defs
183
+ // we want a hard failure rather than a silent dropped summary.
184
+ throw new SummarizerError('unexpected-tool-call', 'Summarizer returned tool_use despite tools: []. Treating as failure.');
185
+ }
186
+ const summary = response.content.trim();
187
+ if (summary.length === 0) {
188
+ throw new SummarizerError('empty-summary', 'Summarizer returned an empty body.');
189
+ }
190
+ return {
191
+ summary,
192
+ tokensSummarised: estimateTokens(userBody),
193
+ eventsSummarised: input.events.length,
194
+ };
195
+ }
196
+ /**
197
+ * Error class so the caller can branch on `error instanceof
198
+ * SummarizerError` and surface `error.code` to the operator.
199
+ */
200
+ export class SummarizerError extends Error {
201
+ code;
202
+ constructor(code, message) {
203
+ super(message);
204
+ this.name = 'SummarizerError';
205
+ this.code = code;
206
+ }
207
+ }
208
+ //# sourceMappingURL=summarizer.js.map
@@ -0,0 +1,108 @@
1
+ /**
2
+ * Approximate token counter for the `/compact` auto-trigger gate.
3
+ *
4
+ * Pugi does not bundle tiktoken — adding a 3 MB native module for a
5
+ * single heuristic check after every turn is the wrong trade. We instead
6
+ * use the OpenAI rule-of-thumb that 1 token ≈ 4 characters of English
7
+ * (≈ ¾ of a word). For mixed-language conversations the approximation
8
+ * skews high by 10-20% which is the safe direction — the auto-compact
9
+ * threshold trips slightly EARLY, never LATE. A late trigger would
10
+ * exceed the model's actual context window and crash the next turn.
11
+ *
12
+ * Per-model context windows are exported from `MODEL_CONTEXT_WINDOW` so
13
+ * the caller can resolve the budget from the active model slug without
14
+ * round-tripping to the server. New models added in Anvil should grow
15
+ * this table in lockstep; the fall-back is the conservative 32k window.
16
+ *
17
+ * Override hook: when `PUGI_TOKEN_COUNTER_OVERRIDE` is set the function
18
+ * parses it as a JSON object `{"text": <n>}` (number of tokens to claim
19
+ * per char). Used only by the integration spec — never by production.
20
+ */
21
+ /** Default chars-per-token ratio for the OpenAI rule-of-thumb. */
22
+ const DEFAULT_CHARS_PER_TOKEN = 4;
23
+ /**
24
+ * Conservative fallback window when the model slug is unknown. 32k is
25
+ * the smallest window any current Anvil-served model exposes; using it
26
+ * as a fall-back guarantees we never overestimate budget and skip a
27
+ * compaction that should have fired.
28
+ */
29
+ const FALLBACK_WINDOW = 32_000;
30
+ /**
31
+ * Known context windows for models Anvil exposes today. Keep in sync
32
+ * with `apps/admin-api/src/pugi/model-registry.ts` — when a new model
33
+ * lands there, add it here. The table is intentionally narrow: only
34
+ * models we have actually validated.
35
+ */
36
+ export const MODEL_CONTEXT_WINDOW = Object.freeze({
37
+ 'sonnet-4.6': 200_000,
38
+ 'sonnet-4.5': 200_000,
39
+ 'opus-4.7': 1_000_000,
40
+ 'opus-4.6': 200_000,
41
+ 'haiku-4.5': 200_000,
42
+ 'deepseek-chat-v3.1': 128_000,
43
+ 'gpt-5': 200_000,
44
+ 'gemini-2.5-pro': 1_000_000,
45
+ });
46
+ /**
47
+ * Estimate the token count of a single string. Returns a positive
48
+ * integer for non-empty input and zero for empty input. The function is
49
+ * pure — same input always yields the same output.
50
+ *
51
+ * The approximation is `ceil(byteLength / chars-per-token)`. We use
52
+ * `Buffer.byteLength` so multi-byte UTF-8 sequences count proportionally
53
+ * to their on-the-wire size, not their char count — this matches the
54
+ * tokenizer's behaviour on CJK / cyrillic / emoji where one char often
55
+ * eats 3-4 tokens.
56
+ */
57
+ export function estimateTokens(text) {
58
+ if (text.length === 0)
59
+ return 0;
60
+ const ratio = readCharsPerTokenOverride() ?? DEFAULT_CHARS_PER_TOKEN;
61
+ const bytes = Buffer.byteLength(text, 'utf8');
62
+ return Math.max(1, Math.ceil(bytes / ratio));
63
+ }
64
+ /**
65
+ * Resolve the context window in tokens for the given model slug. Falls
66
+ * back to the conservative 32k window when the slug is unknown.
67
+ */
68
+ export function contextWindowForModel(model) {
69
+ if (!model)
70
+ return FALLBACK_WINDOW;
71
+ const known = MODEL_CONTEXT_WINDOW[model];
72
+ return known ?? FALLBACK_WINDOW;
73
+ }
74
+ /**
75
+ * Sum the token estimates of an arbitrary list of strings. Convenience
76
+ * for the auto-trigger which has to count across N transcript turns.
77
+ */
78
+ export function estimateTokensInMany(parts) {
79
+ let total = 0;
80
+ for (const part of parts) {
81
+ total += estimateTokens(part);
82
+ }
83
+ return total;
84
+ }
85
+ /**
86
+ * Read the test override env. Returns the parsed chars-per-token ratio
87
+ * when set, or undefined when absent / malformed. Never throws.
88
+ */
89
+ function readCharsPerTokenOverride() {
90
+ const raw = process.env['PUGI_TOKEN_COUNTER_OVERRIDE'];
91
+ if (!raw)
92
+ return undefined;
93
+ try {
94
+ const parsed = JSON.parse(raw);
95
+ if (typeof parsed === 'object'
96
+ && parsed !== null
97
+ && typeof parsed.charsPerToken === 'number') {
98
+ const ratio = parsed.charsPerToken;
99
+ if (Number.isFinite(ratio) && ratio > 0)
100
+ return ratio;
101
+ }
102
+ }
103
+ catch {
104
+ /* malformed env, fall through */
105
+ }
106
+ return undefined;
107
+ }
108
+ //# sourceMappingURL=token-counter.js.map
@@ -6,6 +6,10 @@
6
6
  *
7
7
  * 1. `--pr <number>` — uses `gh pr diff <num>` (gh CLI required).
8
8
  * 2. `--commit <sha>` — diff of that commit vs its first parent.
9
+ * When `--base <ref>` is ALSO provided, the
10
+ * diff is the range `<base>..<commit>` instead
11
+ * (mirrors `git diff base..commit` — covers the
12
+ * full PR-style payload, not just the tip).
9
13
  * 3. `--branch <name>` — diff of HEAD vs `origin/<name>` merge-base.
10
14
  * 4. (default) — diff of HEAD vs `origin/main` merge-base
11
15
  * covering BOTH committed-since-base AND
@@ -95,6 +99,16 @@ export function captureDiff(spec) {
95
99
  return captureFromPr(cwd, spec.pr);
96
100
  }
97
101
  if (typeof spec.commit === 'string' && spec.commit.length > 0) {
102
+ // When `--base` is supplied alongside `--commit`, callers want the
103
+ // full PR-style range diff (`base..commit`), not just the tip
104
+ // commit's parent diff. This matches the convention used by
105
+ // `git diff <base>..<commit>` everywhere else in the toolchain and
106
+ // is the verified-correct mode for reviewing a PR head ref. Without
107
+ // this branch, `--base` was silently ignored when `--commit` was
108
+ // present — see feedback_pugi_review_use_range_diff_not_worktree.
109
+ if (typeof spec.baseRef === 'string' && spec.baseRef.length > 0) {
110
+ return captureFromRange(cwd, spec.baseRef, spec.commit);
111
+ }
98
112
  return captureFromCommit(cwd, spec.commit);
99
113
  }
100
114
  if (typeof spec.branch === 'string' && spec.branch.length > 0) {
@@ -192,6 +206,65 @@ function captureFromCommit(cwd, commit) {
192
206
  },
193
207
  };
194
208
  }
209
+ /**
210
+ * Range capture for `--commit <X> --base <Y>` — diff equivalent to
211
+ * `git diff <base>..<commit>`. Used when the operator names BOTH endpoints
212
+ * (typical PR review against a remote head SHA).
213
+ *
214
+ * Critical: this MUST be a pure read-only range diff against named refs.
215
+ * The previous behavior fell through to `captureFromCommit` which only
216
+ * showed the tip commit (`commit~1..commit`) — fine for single-commit
217
+ * review, wrong for multi-commit PRs. Worse, a stale fallback path was
218
+ * sending the working tree diff (`git diff` with no args), which caused
219
+ * every review on 2026-05-27 to surface identical noise from uncommitted
220
+ * `.gitignore` edits instead of the actual PR contents.
221
+ *
222
+ * Working tree integrity: only `git diff <ref>..<ref>` and metadata
223
+ * `log` / `rev-parse` / `name-rev` are used — none of these touch the
224
+ * index, working tree, or HEAD.
225
+ */
226
+ function captureFromRange(cwd, baseRef, commit) {
227
+ // Resolve both endpoints up front so an unknown ref errors with a
228
+ // clear message before the diff invocation. `rev-parse` is read-only.
229
+ const fullCommit = safeExec(cwd, 'git', ['rev-parse', commit]).trim();
230
+ if (!fullCommit)
231
+ throw new Error(`Unknown commit ref: ${commit}`);
232
+ // Resolve the base: accept already-qualified refs (`origin/main`,
233
+ // `refs/heads/foo`) and bare branch names. If the bare name isn't
234
+ // locally resolvable, retry against `origin/<name>` — the common
235
+ // CI shape where local main is absent but the remote tracking ref is.
236
+ let resolvedBase = safeExecOptional(cwd, 'git', ['rev-parse', baseRef]).trim();
237
+ let effectiveBase = baseRef;
238
+ if (!resolvedBase && !baseRef.includes('/')) {
239
+ const remoteBase = `origin/${baseRef}`;
240
+ resolvedBase = safeExecOptional(cwd, 'git', ['rev-parse', remoteBase]).trim();
241
+ if (resolvedBase)
242
+ effectiveBase = remoteBase;
243
+ }
244
+ if (!resolvedBase)
245
+ throw new Error(`Unknown base ref: ${baseRef}`);
246
+ const diff = safeExec(cwd, 'git', [
247
+ 'diff',
248
+ `${resolvedBase}..${fullCommit}`,
249
+ '--',
250
+ '.',
251
+ ...PROTECTED_PATHSPEC_EXCLUDES,
252
+ ]);
253
+ const cappedDiff = capDiff(diff);
254
+ const subject = safeExec(cwd, 'git', ['log', '-1', '--pretty=%s', fullCommit]).trim();
255
+ const branch = safeExec(cwd, 'git', ['name-rev', '--name-only', fullCommit]).trim() || 'detached';
256
+ const stats = computeStats(cappedDiff);
257
+ return {
258
+ diff: cappedDiff,
259
+ context: {
260
+ branch,
261
+ commit: shortSha(fullCommit),
262
+ title: subject || `commit ${shortSha(fullCommit)}`,
263
+ ref: `range:${effectiveBase}..${shortSha(fullCommit)}`,
264
+ stats,
265
+ },
266
+ };
267
+ }
195
268
  function captureFromBranch(cwd, branch, baseRef) {
196
269
  const remoteRef = branch.includes('/') ? branch : `origin/${branch}`;
197
270
  const mergeBase = safeExec(cwd, 'git', ['merge-base', baseRef, remoteRef]).trim();
@@ -18,4 +18,11 @@ export { BASELINE_IGNORE_PATTERNS, SECRET_IGNORE_PATTERNS, globalPugiIgnorePath,
18
18
  export { COLLAPSE_DIR_ENTRIES, MAX_README_LINES, MAX_SKELETON_BYTES, MAX_TREE_DEPTH, MAX_WALK_NODES, TOP_LANGUAGES, buildRepoSkeleton, detectPackageManager, languageForExtension, readGitBranch, readPackageJson, readReadme, renderSkeleton, topLanguages, } from './repo-skeleton.js';
19
19
  export { DEFAULT_WORKING_SET_CAPACITY, WorkingSet, } from './working-set.js';
20
20
  export { MAX_WATCHED_PATHS, PugiWatcher, THROTTLE_WINDOW_MS, } from './watcher.js';
21
+ /**
22
+ * β5a R4+P5 — per-directory PUGI.md / AGENTS.md / CLAUDE.md / GEMINI.md
23
+ * traverse-up. Loads agent-context markdown at every directory between
24
+ * `cwd` and `workspaceRoot` (workspace root file is owned by
25
+ * `loadMarkdownContext` in `markdown-loader.ts` — no double-load).
26
+ */
27
+ export { MAX_TRAVERSE_BYTES, MAX_TRAVERSE_PER_FILE_BYTES, MAX_TRAVERSE_DEPTH, TRAVERSE_SOURCES, loadTraversedMarkdown, } from './markdown-traverse.js';
21
28
  //# sourceMappingURL=index.js.map