npm - @chappibunny/repolens - Versions diffs - 1.7.0 → 1.7.1 - Mend

@chappibunny/repolens 1.7.0 → 1.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

package/CHANGELOG.md +10 -0
package/package.json +1 -1
package/src/ai/generate-sections.js +23 -2
package/src/ai/prompts.js +28 -7

package/CHANGELOG.md CHANGED Viewed

@@ -2,6 +2,16 @@
 All notable changes to RepoLens will be documented in this file.
+## 1.7.1
+### 🛡️ AI Output Guardrails
+- **System prompt hardening**: Added anti-conversational rules — AI now instructed to never offer additional work, never ask questions, never use second-person address (except onboarding), and to back every claim with context evidence.
+- **Evidence-only constraints**: Architecture weaknesses, exec summary risks, and onboarding complexity hotspots now require concrete evidence from context data (cycle counts, coupling metrics, orphan files). No speculation.
+- **Output sanitizer**: New `sanitizeAIOutput()` strips conversational patterns (`"If you want"`, `"I can produce"`, `"Shall I"`, `"Let me know"`) from both structured JSON and plain-text AI responses before they reach documents.
+- **Structured renderer sanitization**: `renderArchitectureOverviewJSON` now sanitizes weakness bullet items, removing conversational lines even if they survive prompt-level constraints.
+- **Dual-path coverage**: Sanitization applies to both structured JSON mode (Path A) and plain-text fallback (Path B), closing all AI output paths.
 ## 1.7.0
 ### ✨ Features

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@chappibunny/repolens",
-  "version": "1.7.0",
+  "version": "1.7.1",
   "description": "AI-assisted documentation intelligence system for technical and non-technical audiences",
   "license": "MIT",
   "type": "module",

package/src/ai/generate-sections.js CHANGED Viewed

@@ -18,6 +18,27 @@ import {
 import { identifyFlowDependencies } from "../analyzers/flow-inference.js";
 import { info, warn } from "../utils/logger.js";
+// Strip conversational patterns that LLMs sometimes inject into documentation
+const CONVERSATIONAL_PATTERNS = [
+  /^(?:[-*]\s*)?if you (?:want|need|would like|prefer)[^.\n]*[.\n]/gmi,
+  /^(?:[-*]\s*)?(?:shall|should) I [^.\n]*[.\n]/gmi,
+  /^(?:[-*]\s*)?(?:let me know|feel free)[^.\n]*[.\n]/gmi,
+  /^(?:[-*]\s*)?I can (?:also |additionally )?(?:produce|create|generate|help|provide|suggest|recommend)[^.\n]*[.\n]/gmi,
+  /^(?:[-*]\s*)?(?:would you like|do you want)[^.\n]*[.\n]/gmi,
+  /^(?:[-*]\s*)?(?:here is|here's) (?:a |the )?(?:summary|overview|breakdown)[^.\n]*:\s*$/gmi,
+];
+function sanitizeAIOutput(text) {
+  if (!text || typeof text !== "string") return text;
+  let cleaned = text;
+  for (const pattern of CONVERSATIONAL_PATTERNS) {
+    cleaned = cleaned.replace(pattern, "");
+  }
+  // Collapse multiple blank lines left by removals
+  cleaned = cleaned.replace(/\n{3,}/g, "\n\n").trim();
+  return cleaned;
+}
 /**
  * Try structured JSON mode first, fall back to plain-text AI, then deterministic.
  */
@@ -41,7 +62,7 @@ async function generateWithStructuredFallback(key, promptText, maxTokens, fallba
     if (result.success && result.parsed) {
       const md = renderStructuredToMarkdown(key, result.parsed);
-      if (md) return md;
+      if (md) return sanitizeAIOutput(md);
     }
     // If structured mode failed, fall through to plain-text
     warn(`Structured AI failed for ${key}, trying plain-text mode...`);
@@ -60,7 +81,7 @@ async function generateWithStructuredFallback(key, promptText, maxTokens, fallba
     return fallbackFn();
   }
-  return result.text;
+  return sanitizeAIOutput(result.text);
 }
 export async function generateExecutiveSummary(context, enrichment = {}) {

package/src/ai/prompts.js CHANGED Viewed

@@ -57,7 +57,12 @@ Rules:
 - Do not mention AI, LLMs, or that you are an assistant.
 - No markdown tables unless specifically requested.
 - Use simple formatting: headings, paragraphs, lists.
-- Maximum 2 heading levels deep within sections.`;
+- Maximum 2 heading levels deep within sections.
+- You are producing a static document, not participating in a conversation.
+- Never offer to do additional work (no "If you want", "I can also", "Let me know", "Shall I").
+- Never ask the reader questions or invite follow-up.
+- Never address the reader in second person ("you") unless the document type requires it (e.g. onboarding).
+- Every claim must be supported by concrete evidence from the supplied context data.`;
 export function createExecutiveSummaryPrompt(context) {
   return `Write an executive summary for a mixed audience of technical and non-technical readers.
@@ -70,7 +75,7 @@ Requirements:
 - Explain the main system areas using the domain information.
 - Explain the business capabilities implied by the codebase structure.
 - Mention key external dependencies only if they are present in the context.
-- Mention architectural or operational risks if they are strongly supported by the context.
+- Mention architectural or operational risks only if they are directly supported by concrete data in the context (e.g. cycle counts, orphan files, coupling metrics).
 - Do not mention file counts more than once.
 - Maximum 500 words.
 - Use this structure:
@@ -89,7 +94,9 @@ Requirements:
 ## Operational and architectural risks
-## Recommended focus areas`;
+## Recommended focus areas
+IMPORTANT: Only list risks and focus areas that are directly evidenced by the context data. Do not speculate.`;
 }
 export function createSystemOverviewPrompt(context) {
@@ -183,7 +190,9 @@ Requirements:
 ## Architectural strengths
-## Architectural weaknesses`;
+## Architectural weaknesses
+IMPORTANT: Only list weaknesses that are directly evidenced by the context data (e.g. cycle counts, orphan files, high coupling metrics, missing layers). Do not speculate about what the system lacks.`;
 }
 export function createDataFlowsPrompt(flows, context) {
@@ -249,7 +258,9 @@ Requirements:
 ## What to understand first
-## Known complexity hotspots`;
+## Known complexity hotspots
+IMPORTANT: Only cite complexity hotspots that are supported by concrete evidence in the context (e.g. high import counts, circular dependencies, large file counts). Do not speculate about what might be complex.`;
 }
 export function createModuleSummaryPrompt(module, context) {
@@ -520,12 +531,22 @@ function renderBusinessDomainsJSON(d) {
   return md;
 }
+function sanitizeBulletList(val) {
+  const raw = toBulletList(val);
+  if (!raw) return raw;
+  // Strip conversational lines from bullet lists
+  return raw.split("\n").filter(line => {
+    const lower = line.toLowerCase();
+    return !/(^|\s)(if you (?:want|need|would)|shall i |let me know|i can (?:also )?(?:produce|create|generate|help)|would you like|do you want|feel free)/i.test(lower);
+  }).join("\n");
+}
 function renderArchitectureOverviewJSON(d) {
   let md = `# Architecture Overview\n\n`;
   md += `## Architecture Style\n\n${safeStr(d.style)}\n\n`;
   md += `## Layers\n\n${toHeadingSections(d.layers)}\n\n`;
-  md += `## Architectural Strengths\n\n${toBulletList(d.strengths)}\n\n`;
-  md += `## Architectural Weaknesses\n\n${toBulletList(d.weaknesses)}\n`;
+  md += `## Architectural Strengths\n\n${sanitizeBulletList(d.strengths)}\n\n`;
+  md += `## Architectural Weaknesses\n\n${sanitizeBulletList(d.weaknesses)}\n`;
   return md;
 }