jstar-reviewer 2.1.3 → 2.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -5,12 +5,15 @@ import * as path from "path";
5
5
  import * as fs from "fs";
6
6
  import chalk from "chalk";
7
7
  import simpleGit from "simple-git";
8
+ import { Logger } from "./utils/logger";
8
9
  import { Config } from "./config";
9
10
  import { Detective } from "./detective";
10
11
  import { GeminiEmbedding } from "./gemini-embedding";
11
12
  import { MockLLM } from "./mock-llm";
12
13
  import { FileFinding, DashboardReport, LLMReviewResponse, EMPTY_REVIEW } from "./types";
13
14
  import { renderDashboard, determineStatus, generateRecommendation } from "./dashboard";
15
+ import { startInteractiveSession } from "./session";
16
+ import { critiqueFindings } from "./core/critique";
14
17
  import {
15
18
  VectorStoreIndex,
16
19
  storageContextFromDefaults,
@@ -18,7 +21,8 @@ import {
18
21
  serviceContextFromDefaults
19
22
  } from "llamaindex";
20
23
 
21
- const google = createGoogleGenerativeAI({ apiKey: process.env.GOOGLE_API_KEY });
24
+ const geminiKey = process.env.GEMINI_API_KEY || process.env.GOOGLE_API_KEY || process.env.GOOGLE_GENERATIVE_AI_API_KEY;
25
+ const google = createGoogleGenerativeAI({ apiKey: geminiKey });
22
26
  const groq = createGroq({ apiKey: process.env.GROQ_API_KEY });
23
27
 
24
28
  const embedModel = new GeminiEmbedding();
@@ -65,6 +69,38 @@ function sleep(ms: number): Promise<void> {
65
69
  return new Promise(resolve => setTimeout(resolve, ms));
66
70
  }
67
71
 
72
+ /**
73
+ * Filter issues by confidence threshold and log what was removed
74
+ */
75
+ function filterByConfidence(findings: FileFinding[]): FileFinding[] {
76
+ const threshold = Config.CONFIDENCE_THRESHOLD;
77
+ let removedCount = 0;
78
+
79
+ const filtered = findings.map(finding => {
80
+ const validIssues = finding.issues.filter(issue => {
81
+ const confidence = issue.confidenceScore ?? 5; // Default to high if not specified
82
+ if (confidence < threshold) {
83
+ removedCount++;
84
+ Logger.info(chalk.dim(` ⚡ Low confidence (${confidence}): "${issue.title}" - filtered out`));
85
+ return false;
86
+ }
87
+ return true;
88
+ });
89
+
90
+ return {
91
+ ...finding,
92
+ issues: validIssues,
93
+ severity: validIssues.length === 0 ? 'LGTM' as const : finding.severity
94
+ };
95
+ });
96
+
97
+ if (removedCount > 0) {
98
+ Logger.info(chalk.blue(`\n 📊 Confidence Filter: ${removedCount} low-confidence issue(s) removed\n`));
99
+ }
100
+
101
+ return filtered;
102
+ }
103
+
68
104
  function parseReviewResponse(text: string): LLMReviewResponse {
69
105
  try {
70
106
  // Try to extract JSON from the response
@@ -107,20 +143,23 @@ function parseReviewResponse(text: string): LLMReviewResponse {
107
143
 
108
144
  // --- Main ---
109
145
  async function main() {
110
- console.log(chalk.blue("🕵️ J-Star Reviewer: Analyzing your changes...\n"));
146
+ // Initialize logger mode based on CLI flags
147
+ Logger.init();
148
+
149
+ Logger.info(chalk.blue("🕵️ J-Star Reviewer: Analyzing your changes...\n"));
111
150
 
112
151
  // 0. Environment Validation
113
- if (!process.env.GOOGLE_API_KEY || !process.env.GROQ_API_KEY) {
114
- console.error(chalk.red("❌ Missing API Keys!"));
115
- console.log(chalk.yellow("\nPlease ensure you have a .env.local file with:"));
116
- console.log(chalk.white("- GOOGLE_API_KEY"));
117
- console.log(chalk.white("- GROQ_API_KEY"));
118
- console.log(chalk.white("\nCheck .env.example for a template.\n"));
152
+ if (!geminiKey || !process.env.GROQ_API_KEY) {
153
+ Logger.error(chalk.red("❌ Missing API Keys!"));
154
+ Logger.info(chalk.yellow("\nPlease ensure you have a .env.local file with:"));
155
+ Logger.info(chalk.white("- GEMINI_API_KEY (or GOOGLE_API_KEY)"));
156
+ Logger.info(chalk.white("- GROQ_API_KEY"));
157
+ Logger.info(chalk.white("\nCheck .env.example for a template.\n"));
119
158
  return;
120
159
  }
121
160
 
122
161
  // 1. Detective
123
- console.log(chalk.blue("🔎 Running Detective Engine..."));
162
+ Logger.info(chalk.blue("🔎 Running Detective Engine..."));
124
163
 
125
164
  const detective = new Detective(SOURCE_DIR);
126
165
  await detective.scan();
@@ -129,13 +168,13 @@ async function main() {
129
168
  // 1. Get the Diff
130
169
  const diff = await git.diff(["--staged"]);
131
170
  if (!diff) {
132
- console.log(chalk.green("\n✅ No staged changes to review. (Did you 'git add'?)"));
171
+ Logger.info(chalk.green("\n✅ No staged changes to review. (Did you 'git add'?)"));
133
172
  return;
134
173
  }
135
174
 
136
175
  // 2. Load the Brain
137
176
  if (!fs.existsSync(STORAGE_DIR)) {
138
- console.error(chalk.red("❌ Local Brain not found. Run 'pnpm run index:init' first."));
177
+ Logger.error(chalk.red("❌ Local Brain not found. Run 'pnpm run index:init' first."));
139
178
  return;
140
179
  }
141
180
  const storageContext = await storageContextFromDefaults({ persistDir: STORAGE_DIR });
@@ -149,15 +188,15 @@ async function main() {
149
188
  const contextNodes = await retriever.retrieve(keywords);
150
189
  const relatedContext = contextNodes.map(n => n.node.getContent(MetadataMode.NONE).slice(0, 1500)).join("\n");
151
190
 
152
- console.log(chalk.yellow(`\n🧠 Found ${contextNodes.length} context chunk.`));
191
+ Logger.info(chalk.yellow(`\n🧠 Found ${contextNodes.length} context chunk.`));
153
192
 
154
193
  // 4. Chunk the Diff
155
194
  const fileChunks = chunkDiffByFile(diff);
156
195
  const totalTokens = estimateTokens(diff);
157
- console.log(chalk.dim(` Total diff: ~${totalTokens} tokens across ${fileChunks.length} files.`));
196
+ Logger.info(chalk.dim(` Total diff: ~${totalTokens} tokens across ${fileChunks.length} files.`));
158
197
 
159
- // 5. Structured JSON Prompt
160
- const systemPrompt = `You are J-Star, a Senior Code Reviewer. Be direct and professional.
198
+ // 5. Structured JSON Prompt (Conservative)
199
+ const systemPrompt = `You are J-Star, a Senior Code Reviewer. Be CONSERVATIVE and PRECISE.
161
200
 
162
201
  Analyze the Git Diff and return a JSON response with this EXACT structure:
163
202
  {
@@ -167,7 +206,8 @@ Analyze the Git Diff and return a JSON response with this EXACT structure:
167
206
  "title": "Short issue title",
168
207
  "description": "Detailed description of the problem",
169
208
  "line": 42,
170
- "fixPrompt": "A specific prompt an AI can use to fix this issue"
209
+ "fixPrompt": "A specific prompt an AI can use to fix this issue",
210
+ "confidenceScore": 5
171
211
  }
172
212
  ]
173
213
  }
@@ -178,10 +218,20 @@ SEVERITY GUIDE:
178
218
  - P2_MEDIUM: Code quality, missing types, cleanup needed
179
219
  - LGTM: No issues found (return empty issues array)
180
220
 
181
- IMPORTANT:
182
- - Return ONLY valid JSON, no markdown or explanation
183
- - Each issue MUST have a fixPrompt that explains exactly how to fix it
184
- - If the file is clean, return {"severity": "LGTM", "issues": []}
221
+ CONFIDENCE SCORE (1-5) - BE HONEST:
222
+ - 5: Absolutely certain. The bug is obvious in the diff.
223
+ - 4: Very likely. Clear code smell or anti-pattern.
224
+ - 3: Probable issue, might be missing context.
225
+ - 2: Unsure, could be intentional.
226
+ - 1: Speculation, likely false positive.
227
+
228
+ CRITICAL RULES:
229
+ 1. Only flag issues you are HIGHLY confident about (4-5).
230
+ 2. Test mocks, stubs, and intentional patterns are NOT bugs.
231
+ 3. If the code looks intentional or well-handled, it's probably fine.
232
+ 4. When in doubt, lean towards LGTM.
233
+ 5. Return ONLY valid JSON, no markdown.
234
+ 6. If the file is clean: {"severity": "LGTM", "issues": []}
185
235
 
186
236
  Context: ${relatedContext.slice(0, 800)}`;
187
237
 
@@ -189,7 +239,7 @@ Context: ${relatedContext.slice(0, 800)}`;
189
239
  let chunkIndex = 0;
190
240
  let skippedCount = 0;
191
241
 
192
- console.log(chalk.blue("\n⚖️ Sending to Judge...\n"));
242
+ Logger.info(chalk.blue("\n⚖️ Sending to Judge...\n"));
193
243
 
194
244
  for (const chunk of fileChunks) {
195
245
  chunkIndex++;
@@ -197,7 +247,7 @@ Context: ${relatedContext.slice(0, 800)}`;
197
247
 
198
248
  // Skip excluded files
199
249
  if (shouldSkipFile(fileName)) {
200
- console.log(chalk.dim(` ⏭️ Skipping ${fileName} (excluded)`));
250
+ Logger.info(chalk.dim(` ⏭️ Skipping ${fileName} (excluded)`));
201
251
  skippedCount++;
202
252
  continue;
203
253
  }
@@ -206,7 +256,7 @@ Context: ${relatedContext.slice(0, 800)}`;
206
256
 
207
257
  // Skip huge files
208
258
  if (chunkTokens > MAX_TOKENS_PER_REQUEST) {
209
- console.log(chalk.yellow(` ⚠️ Skipping ${fileName} (too large: ~${chunkTokens} tokens)`));
259
+ Logger.info(chalk.yellow(` ⚠️ Skipping ${fileName} (too large: ~${chunkTokens} tokens)`));
210
260
  findings.push({
211
261
  file: fileName,
212
262
  severity: Config.DEFAULT_SEVERITY,
@@ -219,7 +269,7 @@ Context: ${relatedContext.slice(0, 800)}`;
219
269
  continue;
220
270
  }
221
271
 
222
- process.stdout.write(chalk.dim(` 📄 ${fileName}...`));
272
+ Logger.progress(chalk.dim(` 📄 ${fileName}...`));
223
273
 
224
274
  try {
225
275
  const { text } = await generateText({
@@ -239,10 +289,10 @@ Context: ${relatedContext.slice(0, 800)}`;
239
289
  const emoji = response.severity === 'LGTM' ? '✅' :
240
290
  response.severity === 'P0_CRITICAL' ? '🛑' :
241
291
  response.severity === 'P1_HIGH' ? '⚠️' : '📝';
242
- console.log(` ${emoji}`);
292
+ Logger.info(` ${emoji}`);
243
293
 
244
294
  } catch (error: any) {
245
- console.log(chalk.red(` ❌ (${error.message.slice(0, 50)})`));
295
+ Logger.info(chalk.red(` ❌ (${error.message.slice(0, 50)})`));
246
296
  findings.push({
247
297
  file: fileName,
248
298
  severity: Config.DEFAULT_SEVERITY,
@@ -260,15 +310,24 @@ Context: ${relatedContext.slice(0, 800)}`;
260
310
  }
261
311
  }
262
312
 
263
- // 6. Build Dashboard Report
313
+ // 6. Confidence Filtering
314
+ Logger.info(chalk.blue("\n🎯 Filtering by Confidence...\n"));
315
+ let filteredFindings = filterByConfidence(findings);
316
+
317
+ // 7. Self-Critique Pass (if enabled)
318
+ if (Config.ENABLE_SELF_CRITIQUE) {
319
+ filteredFindings = await critiqueFindings(filteredFindings, diff);
320
+ }
321
+
322
+ // 8. Build Dashboard Report
264
323
  const metrics = {
265
324
  filesScanned: fileChunks.length - skippedCount,
266
325
  totalTokens,
267
- violations: findings.reduce((sum, f) => sum + f.issues.length, 0),
268
- critical: findings.filter(f => f.severity === 'P0_CRITICAL').length,
269
- high: findings.filter(f => f.severity === 'P1_HIGH').length,
270
- medium: findings.filter(f => f.severity === 'P2_MEDIUM').length,
271
- lgtm: findings.filter(f => f.severity === 'LGTM').length,
326
+ violations: filteredFindings.reduce((sum, f) => sum + f.issues.length, 0),
327
+ critical: filteredFindings.filter(f => f.severity === 'P0_CRITICAL').length,
328
+ high: filteredFindings.filter(f => f.severity === 'P1_HIGH').length,
329
+ medium: filteredFindings.filter(f => f.severity === 'P2_MEDIUM').length,
330
+ lgtm: filteredFindings.filter(f => f.severity === 'LGTM').length,
272
331
  };
273
332
 
274
333
  const report: DashboardReport = {
@@ -276,7 +335,7 @@ Context: ${relatedContext.slice(0, 800)}`;
276
335
  reviewer: 'Detective Engine & Judge',
277
336
  status: determineStatus(metrics),
278
337
  metrics,
279
- findings,
338
+ findings: filteredFindings,
280
339
  recommendedAction: generateRecommendation(metrics)
281
340
  };
282
341
 
@@ -287,20 +346,72 @@ Context: ${relatedContext.slice(0, 800)}`;
287
346
  fs.mkdirSync(path.dirname(OUTPUT_FILE), { recursive: true });
288
347
  fs.writeFileSync(OUTPUT_FILE, dashboard);
289
348
 
290
- console.log("\n" + chalk.bold.green("📊 DASHBOARD GENERATED"));
291
- console.log(chalk.dim(` Saved to: ${OUTPUT_FILE}`));
292
- console.log("\n" + chalk.bold.white("─".repeat(50)));
349
+ // Save Session State for "jstar chat"
350
+ const SESSION_FILE = path.join(process.cwd(), ".jstar", "session.json");
351
+ fs.writeFileSync(SESSION_FILE, JSON.stringify({
352
+ date: report.date,
353
+ findings: report.findings,
354
+ metrics: report.metrics
355
+ }, null, 2));
356
+
357
+ Logger.info("\n" + chalk.bold.green("📊 DASHBOARD GENERATED"));
358
+ Logger.info(chalk.dim(` Saved to: ${OUTPUT_FILE}`));
359
+ Logger.info("\n" + chalk.bold.white("─".repeat(50)));
293
360
 
294
361
  // Print summary to console
295
362
  const statusEmoji = report.status === 'APPROVED' ? '🟢' :
296
363
  report.status === 'NEEDS_REVIEW' ? '🟡' : '🔴';
297
- console.log(`\n${statusEmoji} Status: ${report.status.replace('_', ' ')}`);
298
- console.log(` 🛑 Critical: ${metrics.critical}`);
299
- console.log(` ⚠️ High: ${metrics.high}`);
300
- console.log(` 📝 Medium: ${metrics.medium}`);
301
- console.log(` ✅ LGTM: ${metrics.lgtm}`);
302
- console.log(`\n💡 ${report.recommendedAction}`);
303
- console.log(chalk.dim(`\n📄 Full report: ${OUTPUT_FILE}`));
364
+ Logger.info(`\n${statusEmoji} Status: ${report.status.replace('_', ' ')}`);
365
+ Logger.info(` 🛑 Critical: ${metrics.critical}`);
366
+ Logger.info(` ⚠️ High: ${metrics.high}`);
367
+ Logger.info(` 📝 Medium: ${metrics.medium}`);
368
+ Logger.info(` ✅ LGTM: ${metrics.lgtm}`);
369
+ Logger.info(`\n💡 ${report.recommendedAction}`);
370
+ Logger.info(chalk.dim(`\n📄 Full report: ${OUTPUT_FILE}`));
371
+
372
+ // 8. Interactive Session OR JSON Output
373
+ if (Logger.isHeadless()) {
374
+ // In JSON mode: output report to stdout and skip interactive session
375
+ Logger.json(report);
376
+ } else {
377
+ // Normal TUI mode: start interactive session
378
+ const { updatedFindings, hasUpdates } = await startInteractiveSession(findings, index);
379
+
380
+ if (hasUpdates) {
381
+ Logger.info(chalk.blue("\n🔄 Updating Dashboard with session changes..."));
382
+
383
+ // Recalculate metrics
384
+ const newMetrics = {
385
+ filesScanned: fileChunks.length - skippedCount,
386
+ totalTokens,
387
+ violations: updatedFindings.reduce((sum, f) => sum + f.issues.length, 0),
388
+ critical: updatedFindings.filter(f => f.severity === 'P0_CRITICAL').length,
389
+ high: updatedFindings.filter(f => f.severity === 'P1_HIGH').length,
390
+ medium: updatedFindings.filter(f => f.severity === 'P2_MEDIUM').length,
391
+ lgtm: updatedFindings.filter(f => f.severity === 'LGTM').length,
392
+ };
393
+
394
+ const newReport: DashboardReport = {
395
+ ...report, // Keep date/reviewer
396
+ metrics: newMetrics,
397
+ findings: updatedFindings,
398
+ status: determineStatus(newMetrics),
399
+ recommendedAction: generateRecommendation(newMetrics)
400
+ };
401
+
402
+ const newDashboard = renderDashboard(newReport);
403
+ fs.writeFileSync(OUTPUT_FILE, newDashboard);
404
+
405
+ // Also update session file with new findings
406
+ fs.writeFileSync(SESSION_FILE, JSON.stringify({
407
+ date: newReport.date,
408
+ findings: newReport.findings,
409
+ metrics: newReport.metrics
410
+ }, null, 2));
411
+
412
+ Logger.info(chalk.bold.green("📊 DASHBOARD UPDATED"));
413
+ }
414
+ }
304
415
  }
305
416
 
306
417
  main().catch(console.error);
@@ -0,0 +1,312 @@
1
+ import { FileFinding, ReviewIssue } from "./types";
2
+ import { showActionMenu, askForArgument } from "./ui/interaction";
3
+ import { debateIssue } from "./core/debate";
4
+ import { VectorStoreIndex } from "llamaindex";
5
+ import { Logger } from "./utils/logger";
6
+ import chalk from "chalk";
7
+ import prompts from "prompts";
8
+ import * as readline from "readline";
9
+
10
+ export async function startInteractiveSession(
11
+ findings: FileFinding[],
12
+ index: VectorStoreIndex
13
+ ): Promise<{ updatedFindings: FileFinding[], hasUpdates: boolean }> {
14
+
15
+ // Deep clone to track local state without mutating original immediately (though we return updated findings)
16
+ const interactiveFindings: FileFinding[] = JSON.parse(JSON.stringify(findings));
17
+ let hasUpdates = false;
18
+ let active = true;
19
+
20
+ if (interactiveFindings.length === 0 || interactiveFindings.every(f => f.issues.length === 0)) {
21
+ return { updatedFindings: interactiveFindings, hasUpdates: false };
22
+ }
23
+
24
+ console.log(chalk.bold.magenta("\n🗣️ Interactive Review Session"));
25
+ console.log(chalk.dim(" Use arrow keys to navigate. Select an issue to debate."));
26
+
27
+ while (active) {
28
+ // Re-calculate choices every loop to reflect status changes
29
+ // Flatten
30
+ const flatIssues: {
31
+ issue: ReviewIssue,
32
+ fileIndex: number,
33
+ issueIndex: number,
34
+ file: string
35
+ }[] = [];
36
+
37
+ interactiveFindings.forEach((f, fIdx) => {
38
+ f.issues.forEach((i, iIdx) => {
39
+ flatIssues.push({
40
+ issue: i,
41
+ fileIndex: fIdx,
42
+ issueIndex: iIdx,
43
+ file: f.file
44
+ });
45
+ });
46
+ });
47
+
48
+ const choices = flatIssues.map((item, idx) => {
49
+ const i = item.issue;
50
+ const statusIcon = i.status === 'resolved' ? '✅ ' : i.status === 'ignored' ? '🗑️ ' : '';
51
+ return {
52
+ title: `${statusIcon}${i.confidenceScore ? `[${i.confidenceScore}/5] ` : ''}${i.title} ${chalk.dim(`(${item.file})`)}`,
53
+ value: idx,
54
+ description: i.status ? `Marked as ${i.status}` : i.description.slice(0, 80)
55
+ };
56
+ });
57
+
58
+ choices.push({ title: '🚪 Finish Review', value: -1, description: 'Exit and save report' });
59
+
60
+ const { selectedIdx } = await prompts({
61
+ type: 'select',
62
+ name: 'selectedIdx',
63
+ message: 'Select an issue:',
64
+ choices: choices,
65
+ initial: 0
66
+ });
67
+
68
+ if (selectedIdx === undefined || selectedIdx === -1) {
69
+ active = false;
70
+ break;
71
+ }
72
+
73
+ const selected = flatIssues[selectedIdx];
74
+ const { issue, file } = selected;
75
+
76
+ // Show Details
77
+ console.log(chalk.cyan(`\nTitle: ${issue.title}`));
78
+ console.log(chalk.white(issue.description));
79
+ console.log(chalk.dim(`File: ${file}`));
80
+ if (issue.confidenceScore) console.log(chalk.yellow(`Confidence: ${issue.confidenceScore}/5`));
81
+ if (issue.status) console.log(chalk.green(`Status: ${issue.status}`));
82
+
83
+ // Action Menu
84
+ const action = await showActionMenu(issue.title);
85
+
86
+ if (action === 'discuss') {
87
+ const argument = await askForArgument();
88
+ const result = await debateIssue(
89
+ issue.title,
90
+ issue.description,
91
+ file,
92
+ argument,
93
+ index
94
+ );
95
+
96
+ console.log(chalk.yellow(`\n🤖 Bot: ${result.text}`));
97
+
98
+ if (result.severity === 'LGTM') {
99
+ console.log(chalk.green("✅ Issue withdrawn by AI!"));
100
+ // Direct update to our state
101
+ interactiveFindings[selected.fileIndex].issues[selected.issueIndex].status = 'resolved';
102
+ hasUpdates = true;
103
+ }
104
+
105
+ } else if (action === 'ignore') {
106
+ console.log(chalk.dim('Issue ignored locally.'));
107
+ interactiveFindings[selected.fileIndex].issues[selected.issueIndex].status = 'ignored';
108
+ hasUpdates = true;
109
+ } else if (action === 'accept') {
110
+ console.log(chalk.green('Issue accepted.'));
111
+ } else if (action === 'exit') {
112
+ active = false;
113
+ }
114
+ }
115
+
116
+ // Filter out resolved/ignored issues for the final report
117
+ const finalFindings: FileFinding[] = interactiveFindings.map(f => ({
118
+ ...f,
119
+ issues: f.issues.filter(i => i.status !== 'resolved' && i.status !== 'ignored')
120
+ })).filter(f => f.issues.length > 0);
121
+
122
+ return { updatedFindings: finalFindings, hasUpdates };
123
+ }
124
+
125
/**
 * One review issue flattened out of the nested FileFinding structure,
 * addressable by a stable numeric id in headless mode.
 */
interface FlatIssue {
  id: number;            // position in the flattened list (0-based, assigned at flatten time)
  title: string;
  description: string;
  file: string;          // file the issue belongs to (copied from the parent FileFinding)
  confidenceScore?: number;
  status?: 'resolved' | 'ignored';
  fileIndex: number;     // index into the findings array
  issueIndex: number;    // index into findings[fileIndex].issues
}

/**
 * One stdin command in the headless (machine-readable) protocol.
 * `issueId` and `argument` are only required by some actions
 * (see startHeadlessSession for the protocol details).
 */
interface HeadlessCommand {
  action: 'list' | 'debate' | 'ignore' | 'accept' | 'exit';
  issueId?: number;
  argument?: string;
}
147
+
148
+ /**
149
+ * Flatten findings into a simple array for headless mode
150
+ */
151
+ function flattenIssues(findings: FileFinding[]): FlatIssue[] {
152
+ const flat: FlatIssue[] = [];
153
+ findings.forEach((f, fIdx) => {
154
+ f.issues.forEach((i, iIdx) => {
155
+ flat.push({
156
+ id: flat.length,
157
+ title: i.title,
158
+ description: i.description,
159
+ file: f.file,
160
+ confidenceScore: i.confidenceScore,
161
+ status: i.status,
162
+ fileIndex: fIdx,
163
+ issueIndex: iIdx
164
+ });
165
+ });
166
+ });
167
+ return flat;
168
+ }
169
+
170
+ /**
171
+ * Headless session for AI agents and CI/CD.
172
+ *
173
+ * Protocol:
174
+ * - Input (stdin): JSON commands, one per line
175
+ * { "action": "list" }
176
+ * { "action": "debate", "issueId": 0, "argument": "This is intentional" }
177
+ * { "action": "ignore", "issueId": 0 }
178
+ * { "action": "accept", "issueId": 0 }
179
+ * { "action": "exit" }
180
+ *
181
+ * - Output (stdout): JSON events, one per line
182
+ * { "type": "ready", "issues": [...] }
183
+ * { "type": "list", "issues": [...] }
184
+ * { "type": "response", "issueId": 0, "text": "...", "verdict": "LGTM" | "STANDS" }
185
+ * { "type": "update", "issueId": 0, "status": "ignored" | "resolved" | "accepted" }
186
+ * { "type": "error", "message": "..." }
187
+ * { "type": "done", "hasUpdates": true, "updatedFindings": [...] }
188
+ */
189
+ export async function startHeadlessSession(
190
+ findings: FileFinding[],
191
+ index: VectorStoreIndex
192
+ ): Promise<{ updatedFindings: FileFinding[], hasUpdates: boolean }> {
193
+
194
+ // Deep clone to track state
195
+ const sessionFindings: FileFinding[] = JSON.parse(JSON.stringify(findings));
196
+ let hasUpdates = false;
197
+
198
+ // Emit ready event with all issues
199
+ const issues = flattenIssues(sessionFindings);
200
+ Logger.json({ type: 'ready', issues });
201
+
202
+ // Create readline interface for stdin
203
+ const rl = readline.createInterface({
204
+ input: process.stdin,
205
+ output: process.stdout,
206
+ terminal: false
207
+ });
208
+
209
+ // Process commands
210
+ for await (const line of rl) {
211
+ if (!line.trim()) continue;
212
+
213
+ let cmd: HeadlessCommand;
214
+ try {
215
+ cmd = JSON.parse(line);
216
+ } catch (e) {
217
+ Logger.json({ type: 'error', message: 'Invalid JSON command' });
218
+ continue;
219
+ }
220
+
221
+ const currentIssues = flattenIssues(sessionFindings);
222
+
223
+ switch (cmd.action) {
224
+ case 'list':
225
+ Logger.json({ type: 'list', issues: currentIssues });
226
+ break;
227
+
228
+ case 'debate':
229
+ if (cmd.issueId === undefined || !cmd.argument) {
230
+ Logger.json({ type: 'error', message: 'debate requires issueId and argument' });
231
+ break;
232
+ }
233
+ const debateTarget = currentIssues.find(i => i.id === cmd.issueId);
234
+ if (!debateTarget) {
235
+ Logger.json({ type: 'error', message: `Issue ${cmd.issueId} not found` });
236
+ break;
237
+ }
238
+
239
+ try {
240
+ const result = await debateIssue(
241
+ debateTarget.title,
242
+ debateTarget.description,
243
+ debateTarget.file,
244
+ cmd.argument,
245
+ index
246
+ );
247
+
248
+ const verdict = result.severity === 'LGTM' ? 'LGTM' : 'STANDS';
249
+ Logger.json({
250
+ type: 'response',
251
+ issueId: cmd.issueId,
252
+ text: result.text,
253
+ verdict
254
+ });
255
+
256
+ if (result.severity === 'LGTM') {
257
+ sessionFindings[debateTarget.fileIndex].issues[debateTarget.issueIndex].status = 'resolved';
258
+ hasUpdates = true;
259
+ Logger.json({ type: 'update', issueId: cmd.issueId, status: 'resolved' });
260
+ }
261
+ } catch (e: any) {
262
+ Logger.json({ type: 'error', message: e.message });
263
+ }
264
+ break;
265
+
266
+ case 'ignore':
267
+ if (cmd.issueId === undefined) {
268
+ Logger.json({ type: 'error', message: 'ignore requires issueId' });
269
+ break;
270
+ }
271
+ const ignoreTarget = currentIssues.find(i => i.id === cmd.issueId);
272
+ if (!ignoreTarget) {
273
+ Logger.json({ type: 'error', message: `Issue ${cmd.issueId} not found` });
274
+ break;
275
+ }
276
+ sessionFindings[ignoreTarget.fileIndex].issues[ignoreTarget.issueIndex].status = 'ignored';
277
+ hasUpdates = true;
278
+ Logger.json({ type: 'update', issueId: cmd.issueId, status: 'ignored' });
279
+ break;
280
+
281
+ case 'accept':
282
+ if (cmd.issueId === undefined) {
283
+ Logger.json({ type: 'error', message: 'accept requires issueId' });
284
+ break;
285
+ }
286
+ Logger.json({ type: 'update', issueId: cmd.issueId, status: 'accepted' });
287
+ break;
288
+
289
+ case 'exit':
290
+ // Filter out resolved/ignored for final report
291
+ const finalFindings: FileFinding[] = sessionFindings.map(f => ({
292
+ ...f,
293
+ issues: f.issues.filter(i => i.status !== 'resolved' && i.status !== 'ignored')
294
+ })).filter(f => f.issues.length > 0);
295
+
296
+ Logger.json({ type: 'done', hasUpdates, updatedFindings: finalFindings });
297
+ rl.close();
298
+ return { updatedFindings: finalFindings, hasUpdates };
299
+
300
+ default:
301
+ Logger.json({ type: 'error', message: `Unknown action: ${(cmd as any).action}` });
302
+ }
303
+ }
304
+
305
+ // If stdin closes without exit command, still return
306
+ const finalFindings: FileFinding[] = sessionFindings.map(f => ({
307
+ ...f,
308
+ issues: f.issues.filter(i => i.status !== 'resolved' && i.status !== 'ignored')
309
+ })).filter(f => f.issues.length > 0);
310
+
311
+ return { updatedFindings: finalFindings, hasUpdates };
312
+ }
package/scripts/types.ts CHANGED
@@ -10,6 +10,8 @@ export interface ReviewIssue {
10
10
  description: string;
11
11
  line?: number;
12
12
  fixPrompt: string;
13
+ confidenceScore?: number;
14
+ status?: 'resolved' | 'ignored';
13
15
  }
14
16
 
15
17
  export interface FileFinding {
@@ -35,6 +37,12 @@ export interface DashboardReport {
35
37
  recommendedAction: string;
36
38
  }
37
39
 
40
/**
 * Snapshot persisted to disk after a review run (the reviewer writes it to
 * .jstar/session.json, labelled "Save Session State for 'jstar chat'"),
 * so a later invocation can pick up the review where it left off.
 */
export interface SessionState {
  date: string;                         // report date the snapshot was taken from
  findings: FileFinding[];              // findings as rendered into the dashboard
  metrics: DashboardReport['metrics'];  // summary counters matching the findings
}
45
+
38
46
  /**
39
47
  * Schema for LLM response (per-file review)
40
48
  */
@@ -45,6 +53,7 @@ export interface LLMReviewResponse {
45
53
  description: string;
46
54
  line?: number;
47
55
  fixPrompt: string;
56
+ confidenceScore?: number; // 1-5 confidence rating
48
57
  }[];
49
58
  }
50
59