npm - @dreki-gg/pi-code-reviewer - Versions diffs - 0.6.0 → 0.6.2 - Mend

@dreki-gg/pi-code-reviewer 0.6.0 → 0.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/extensions/code-reviewer/commands/review-tool.ts +49 -61
package/extensions/code-reviewer/reviewer.ts +222 -1
package/package.json +1 -1

package/extensions/code-reviewer/commands/review-tool.ts CHANGED Viewed

@@ -1,3 +1,6 @@
+import { writeFile } from 'node:fs/promises';
+import { tmpdir } from 'node:os';
+import { join } from 'node:path';
 import type { ExtensionAPI } from '@earendil-works/pi-coding-agent';
 import { Type } from 'typebox';
@@ -7,16 +10,34 @@ import { discoverLenses, getLensContent } from '../lenses';
 import { resolveModelPlan } from '../model-plan';
 import { runPipeline } from '../passes';
 import {
-  buildDiffSection,
   buildLensResult,
+  buildPipelineResult,
   buildReviewBasePrompt,
+  buildSinglePassResult,
   pickLensToolOutputs,
-  renderPipelineReport,
   runTools,
 } from '../reviewer';
-import type { DiffSource } from '../diff';
+import type { ReviewPointer } from '../reviewer';
 import type { LensResult, ReviewConfig } from '../types';
+/**
+ * Spill the full review context to a temp Markdown file and return a pointer
+ * (path + byte size + line count). Both pi's tool-output and `read` caps are
+ * ~50KB / 2000 lines, so large reviews would otherwise be truncated and lost
+ * on compaction. The on-disk file survives compaction and can be paged.
+ *
+ * The file name combines the timestamp, the process id and a random suffix so
+ * two reviews started in the same millisecond do not share a path. The file is
+ * created exclusively (`wx`) with owner-only permissions, so an existing file
+ * (or a pre-planted symlink) in the shared temp dir is never overwritten.
+ *
+ * Node-only IO (no Bun) per the extension runtime constraint.
+ *
+ * @param content - Full Markdown review context to persist.
+ * @returns The file path plus the UTF-8 byte size and the number of
+ *   `\n`-separated lines of `content`.
+ * @throws If the file cannot be created or written (including the rare case
+ *   where the generated path already exists).
+ */
+async function writeReviewTempFile(content: string): Promise<ReviewPointer> {
+  const unique = `${Date.now()}-${process.pid}-${Math.random().toString(36).slice(2, 10)}`;
+  const path = join(tmpdir(), `pi-code-review-${unique}.md`);
+  // 'wx' fails instead of clobbering a path that already exists.
+  await writeFile(path, content, { encoding: 'utf8', flag: 'wx', mode: 0o600 });
+  return {
+    path,
+    bytes: Buffer.byteLength(content, 'utf8'),
+    lines: content.split('\n').length,
+  };
+}
 export function registerReviewTool(pi: ExtensionAPI) {
   pi.registerTool({
     name: 'code_review',
@@ -155,17 +176,18 @@ export function registerReviewTool(pi: ExtensionAPI) {
           const allPassesFailed =
             config.review.passes > 0 && pipeline.telemetry.failedPasses >= config.review.passes;
           if (!allPassesFailed) {
-            return {
-              content: [{ type: 'text', text: renderPipelineReport(pipeline, diff) }],
-              details: {
-                mode: 'pipeline',
-                lensCount: lensNames.length,
+            return buildPipelineResult(
+              {
+                pipeline,
+                diff,
+                basePrompt,
+                lensNames,
                 availableLenses: [...available.keys()],
                 changedFiles,
-                findings: pipeline.findings,
-                telemetry: pipeline.telemetry,
               },
-            };
+              writeReviewTempFile,
+              onUpdate,
+            );
           }
           onUpdate?.({
             content: [{ type: 'text', text: 'all review passes failed — single-pass fallback' }],
@@ -187,20 +209,25 @@ export function registerReviewTool(pi: ExtensionAPI) {
       ctx.ui.setStatus('code-review', undefined);
-      // Fallback: return the review task for a single downstream pass (the
-      // agent produces findings in its follow-up message). Used when no model
-      // is available (e.g. print mode) or passes are disabled in config.
-      const text = buildToolContext(results, diff);
-      return {
-        content: [{ type: 'text', text }],
-        details: {
-          mode: 'single-pass',
-          lensCount: lensNames.length,
+      // Fallback: spill the full single-pass review context to a temp file and
+      // return a compact summary + pointer (degrades gracefully on empty
+      // context or a write failure). Used when no model is available (e.g.
+      // print mode) or passes are disabled in config.
+      //
+      // This is the PRIMARY truncation culprit: the full context embeds the
+      // diff (up to 50KB) plus every lens's tool outputs (20KB each), which
+      // easily blows past pi's 50KB tool-output cap.
+      return buildSinglePassResult(
+        {
+          results,
+          diff,
+          lensNames,
           availableLenses: [...available.keys()],
           changedFiles,
         },
-      };
+        writeReviewTempFile,
+        onUpdate,
+      );
     },
   });
 }
@@ -219,42 +246,3 @@ function resolveLensNames(
   return [...available.keys()];
 }
-/**
- * Build the agent-facing review instructions appended to the report. The diff
- * is embedded ONCE (not per lens) followed by each lens's section — large
- * diffs would otherwise be repeated for every lens, bloating the tool output.
- */
-function buildToolContext(results: LensResult[], diff: DiffSource): string {
-  const sections = results.map((r) => r._lensSection).filter(Boolean) as string[];
-  if (sections.length === 0) return '';
-  return [
-    `# Code Review — ${new Date().toISOString().slice(0, 10)}`,
-    '',
-    '## Changes',
-    '```',
-    diff.stat.trim() || '(no diffstat)',
-    '```',
-    '',
-    'Evaluate the diff through each lens below; the tool outputs are automated analysis.',
-    '',
-    buildDiffSection(diff),
-    '',
-    '## Lenses',
-    '',
-    ...sections,
-    '',
-    '## Instructions',
-    '',
-    'For each lens above, review the diff against its criteria and output a JSON array of findings:',
-    '',
-    '```json',
-    '[',
-    '  { "file": "path/to/file.ts", "line": 42, "severity": "warning", "message": "Description" }',
-    ']',
-    '```',
-    '',
-    'After each lens JSON array, write a 2-3 sentence summary.',
-    'If a lens has no findings, return an empty array `[]` and note the code looks good.',
-  ].join('\n');
-}

package/extensions/code-reviewer/reviewer.ts CHANGED Viewed

@@ -1,5 +1,9 @@
 import { platform } from 'node:os';
-import type { ExtensionAPI } from '@earendil-works/pi-coding-agent';
+import type {
+  AgentToolResult,
+  AgentToolUpdateCallback,
+  ExtensionAPI,
+} from '@earendil-works/pi-coding-agent';
 import { Effect } from 'effect';
 import type { DiffSource } from './diff';
@@ -118,6 +122,71 @@ export function buildReviewBasePrompt(lensSections: string[], diff: DiffSource):
   ].join('\n');
 }
+/**
+ * Pointer to the temp file holding the full review context.
+ *
+ * - `path`: location of the file; `buildPointer` prints it verbatim.
+ * - `bytes`: size of the content; `buildPointer` prints it rounded to whole KB.
+ * - `lines`: line count of the content; `buildPointer` prints it as-is.
+ */
+export type ReviewPointer = { path: string; bytes: number; lines: number };
+/**
+ * Round bytes to whole KB for a human-readable size (min 1KB).
+ *
+ * Divides by 1024, rounds to the nearest integer, then clamps to at least 1,
+ * so a zero-byte or sub-512-byte payload still reports 1.
+ */
+function toKb(bytes: number): number {
+  return Math.max(1, Math.round(bytes / 1024));
+}
+/**
+ * Condense a git `--stat` block into a one-line "N files, +ins -del" summary.
+ * Returns '' when the diffstat has no recognizable summary line.
+ *
+ * Only the last line of the trimmed input is inspected. It must contain
+ * "<n> file(s) changed"; the insertion and deletion counts are each appended
+ * only when present on that line. Parts are joined with ", ", e.g. a last line
+ * of "3 files changed, 10 insertions(+), 2 deletions(-)" yields
+ * "3 files, +10, -2".
+ */
+function summarizeDiffStat(stat: string): string {
+  const lastLine = stat.trim().split('\n').pop()?.trim() ?? '';
+  const files = lastLine.match(/(\d+) files? changed/)?.[1];
+  if (!files) return '';
+  const insertions = lastLine.match(/(\d+) insertions?\(\+\)/)?.[1];
+  const deletions = lastLine.match(/(\d+) deletions?\(-\)/)?.[1];
+  const parts = [`${files} file${files === '1' ? '' : 's'}`];
+  if (insertions) parts.push(`+${insertions}`);
+  if (deletions) parts.push(`-${deletions}`);
+  return parts.join(', ');
+}
+/**
+ * Compact inline header for the single-pass fallback. The full review context
+ * (diff, lenses, instructions) lives in a temp file — see {@link buildPointer} —
+ * so this only names the lenses and the diff scope. Pure (no IO).
+ *
+ * The lens bullet lists `lensNames` comma-separated, or "(none)" when the list
+ * is empty. The diff bullet shows `diff.label`, followed by the condensed
+ * diffstat in parentheses when `diff.stat` has a recognizable summary line.
+ *
+ * @param lensNames - Names of the lenses to list in the header.
+ * @param diff - Diff source; only its `label` and `stat` are read here.
+ * @returns A three-line Markdown block (heading plus two bullets).
+ */
+export function buildInlineSummary(lensNames: string[], diff: DiffSource): string {
+  const stat = summarizeDiffStat(diff.stat);
+  const diffLine = stat ? `${diff.label} (${stat})` : diff.label;
+  return [
+    '# Code Review Summary',
+    `- **Lenses**: ${lensNames.join(', ') || '(none)'}`,
+    `- **Diff**: ${diffLine}`,
+  ].join('\n');
+}
+/**
+ * Inline pointer to the temp file holding the full review context. pi's tool
+ * output / `read` caps are both ~50KB / 2000 lines, so the directive tells the
+ * agent to page large content with `read` offset/limit. Pure (no IO).
+ *
+ * `mode` switches the action sentence: single-pass needs the agent to perform
+ * the whole review from the file; pipeline only needs it to drill into the diff
+ * behind an already-rendered finding.
+ *
+ * Both variants embed the file path in backticks and a size note of the form
+ * "(<lines> lines, <KB>KB)". The pipeline variant starts with a `---` rule so
+ * it reads as a footer when appended after other text.
+ *
+ * @param pointer - Path, byte size and line count of the saved context file.
+ * @param mode - Which wording to emit: 'single-pass' or 'pipeline'.
+ * @returns Newline-joined Markdown text pointing at the file.
+ */
+export function buildPointer(pointer: ReviewPointer, mode: 'single-pass' | 'pipeline'): string {
+  const size = `(${pointer.lines} lines, ${toKb(pointer.bytes)}KB)`;
+  if (mode === 'single-pass') {
+    return [
+      '📄 Full review context (diff, lens definitions, tool outputs, instructions)',
+      `saved to: \`${pointer.path}\``,
+      `${size}. **Read that file** to perform the review — page large content with`,
+      '`read` offset/limit.',
+    ].join('\n');
+  }
+  return [
+    '---',
+    `📄 Full diff + lens context saved to: \`${pointer.path}\``,
+    `${size}. Use \`read\` (offset/limit) to inspect the diff behind a finding.`,
+  ].join('\n');
+}
 const SEVERITY_EMOJI: Record<ValidatedFinding['severity'], string> = {
   blocker: '🔴',
   warning: '🟡',
@@ -263,6 +332,158 @@ export function buildLensResult(
   };
 }
+/**
+ * Build the agent-facing review instructions for the single-pass fallback. The
+ * diff is embedded ONCE (not per lens) followed by each lens's section — large
+ * diffs would otherwise be repeated for every lens, bloating the tool output.
+ * Returns '' when no lens produced a section (nothing to review).
+ *
+ * Layout of the returned Markdown: a dated title (the date part of
+ * `toISOString()`), a "Changes" block holding the trimmed diffstat or the
+ * placeholder "(no diffstat)", the diff section, every non-empty
+ * `_lensSection` under "Lenses", and finally the output-format instructions.
+ *
+ * @param results - Lens results; entries with a falsy `_lensSection` are dropped.
+ * @param diff - Diff source supplying the diffstat and the diff section.
+ * @returns The newline-joined review context, or '' when no sections remain.
+ */
+export function buildToolContext(results: LensResult[], diff: DiffSource): string {
+  const sections = results.map((r) => r._lensSection).filter(Boolean) as string[];
+  if (sections.length === 0) return '';
+  return [
+    `# Code Review — ${new Date().toISOString().slice(0, 10)}`,
+    '',
+    '## Changes',
+    '```',
+    diff.stat.trim() || '(no diffstat)',
+    '```',
+    '',
+    'Evaluate the diff through each lens below; the tool outputs are automated analysis.',
+    '',
+    buildDiffSection(diff),
+    '',
+    '## Lenses',
+    '',
+    ...sections,
+    '',
+    '## Instructions',
+    '',
+    'For each lens above, review the diff against its criteria and output a JSON array of findings:',
+    '',
+    '```json',
+    '[',
+    '  { "file": "path/to/file.ts", "line": 42, "severity": "warning", "message": "Description" }',
+    ']',
+    '```',
+    '',
+    'After each lens JSON array, write a 2-3 sentence summary.',
+    'If a lens has no findings, return an empty array `[]` and note the code looks good.',
+  ].join('\n');
+}
+/**
+ * Persist the full review context somewhere durable, returning a pointer.
+ *
+ * Injected into the result builders so they perform no file IO themselves.
+ * A rejected promise is treated by both builders as "no pointer available"
+ * rather than as a fatal error.
+ */
+export type ReviewTempWriter = (content: string) => Promise<ReviewPointer>;
+type ReviewToolResult = AgentToolResult<Record<string, unknown>>; // tool result whose `details` is an open record
+/**
+ * Assemble the single-pass fallback result. The full review context is spilled
+ * to a temp file (via the injected {@link ReviewTempWriter}) so it survives
+ * pi's tool-output cap; the inline payload is just a summary + pointer.
+ * Degrades gracefully: an empty context yields a "no applicable lenses" notice,
+ * and a temp-write failure falls back to the (truncation-prone) inline context
+ * rather than throwing out of the tool.
+ *
+ * @param args - `results` and `diff` feed the full context; `lensNames`,
+ *   `availableLenses` and `changedFiles` are reported back in `details`
+ *   (`lensNames` as a count).
+ * @param writeTemp - Writer used to persist the full context.
+ * @param onUpdate - Optional progress callback; invoked only when the temp
+ *   write fails, carrying the error message in `details.writeError`.
+ * @returns A tool result with `details.mode === 'single-pass'`.
+ *   `details.contextFile` is set only when the temp write succeeded.
+ */
+export async function buildSinglePassResult(
+  args: {
+    results: LensResult[];
+    diff: DiffSource;
+    lensNames: string[];
+    availableLenses: string[];
+    changedFiles: string[];
+  },
+  writeTemp: ReviewTempWriter,
+  onUpdate?: AgentToolUpdateCallback,
+): Promise<ReviewToolResult> {
+  const fullContext = buildToolContext(args.results, args.diff);
+  const baseDetails: Record<string, unknown> = {
+    mode: 'single-pass',
+    lensCount: args.lensNames.length,
+    availableLenses: args.availableLenses,
+    changedFiles: args.changedFiles,
+  };
+  // No lens produced any context (e.g. the requested lenses matched none of the
+  // available ones) — there is nothing to review, so don't point the agent at
+  // an empty temp file.
+  if (!fullContext.trim()) {
+    return {
+      content: [
+        {
+          type: 'text',
+          text: `No applicable lenses for this review. Available: ${args.availableLenses.join(', ') || '(none)'}.`,
+        },
+      ],
+      details: baseDetails,
+    };
+  }
+  try {
+    const pointer = await writeTemp(fullContext);
+    const summary = `${buildInlineSummary(args.lensNames, args.diff)}\n\n${buildPointer(pointer, 'single-pass')}`;
+    return {
+      content: [{ type: 'text', text: summary }],
+      details: { ...baseDetails, contextFile: pointer.path },
+    };
+  } catch (cause) {
+    onUpdate?.({
+      content: [{ type: 'text', text: 'temp-file write failed — returning inline context' }],
+      details: { writeError: cause instanceof Error ? cause.message : String(cause) },
+    });
+    return { content: [{ type: 'text', text: fullContext }], details: baseDetails };
+  }
+}
+/**
+ * Assemble the pipeline result. The validated findings are the valuable output
+ * and stay inline; the diff + lens context is spilled to a temp file (via the
+ * injected {@link ReviewTempWriter}) purely so the agent can drill into the
+ * diff behind a finding. A write failure must NOT discard a completed pipeline,
+ * so on failure the findings are returned WITHOUT a pointer.
+ *
+ * The content handed to the writer is `args.basePrompt`; the inline text is the
+ * rendered pipeline report, with the pointer footer appended when the write
+ * succeeds.
+ *
+ * @param args - `pipeline` and `diff` are rendered into the report;
+ *   `basePrompt` is what gets persisted; `lensNames`, `availableLenses` and
+ *   `changedFiles` are reported back in `details` (`lensNames` as a count).
+ * @param writeTemp - Writer used to persist the diff + lens context.
+ * @param onUpdate - Optional progress callback; invoked only when the temp
+ *   write fails, carrying the error message in `details.writeError`.
+ * @returns A tool result with `details.mode === 'pipeline'` plus the pipeline's
+ *   findings and telemetry. `details.contextFile` is present only when the
+ *   temp write succeeded.
+ */
+export async function buildPipelineResult(
+  args: {
+    pipeline: PipelineResult;
+    diff: DiffSource;
+    basePrompt: string;
+    lensNames: string[];
+    availableLenses: string[];
+    changedFiles: string[];
+  },
+  writeTemp: ReviewTempWriter,
+  onUpdate?: AgentToolUpdateCallback,
+): Promise<ReviewToolResult> {
+  const report = renderPipelineReport(args.pipeline, args.diff);
+  let text = report;
+  let contextFile: string | undefined;
+  try {
+    const pointer = await writeTemp(args.basePrompt);
+    text = `${report}\n\n${buildPointer(pointer, 'pipeline')}`;
+    contextFile = pointer.path;
+  } catch (cause) {
+    onUpdate?.({
+      content: [
+        { type: 'text', text: 'temp-file write failed — findings returned without diff pointer' },
+      ],
+      details: { writeError: cause instanceof Error ? cause.message : String(cause) },
+    });
+  }
+  return {
+    content: [{ type: 'text', text }],
+    details: {
+      mode: 'pipeline',
+      lensCount: args.lensNames.length,
+      availableLenses: args.availableLenses,
+      changedFiles: args.changedFiles,
+      findings: args.pipeline.findings,
+      telemetry: args.pipeline.telemetry,
+      ...(contextFile ? { contextFile } : {}),
+    },
+  };
+}
 /** Promise wrapper: run a deduped tool set once, building a live Executor from `pi`. */
 export function runTools(
   pi: Pick<ExtensionAPI, 'exec'>,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@dreki-gg/pi-code-reviewer",
-  "version": "0.6.0",
+  "version": "0.6.2",
   "description": "Multi-lens code review extension for pi — configurable review criteria per project",
   "keywords": [
     "pi-package"