npm - @kevinrabun/judges - Versions diffs - 3.115.4 → 3.117.0 - Mend

@kevinrabun/judges 3.115.4 → 3.117.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (114) hide show

package/agents/accessibility.judge.md +7 -0
package/agents/agent-instructions.judge.md +7 -0
package/agents/ai-code-safety.judge.md +7 -0
package/agents/api-contract.judge.md +7 -0
package/agents/api-design.judge.md +7 -0
package/agents/authentication.judge.md +7 -0
package/agents/backwards-compatibility.judge.md +7 -0
package/agents/caching.judge.md +7 -0
package/agents/ci-cd.judge.md +7 -0
package/agents/cloud-readiness.judge.md +7 -0
package/agents/concurrency.judge.md +7 -0
package/agents/configuration-management.judge.md +7 -0
package/agents/cybersecurity.judge.md +7 -0
package/agents/data-security.judge.md +7 -0
package/agents/dependency-health.judge.md +7 -0
package/agents/documentation.judge.md +7 -0
package/agents/error-handling.judge.md +7 -0
package/agents/ethics-bias.judge.md +7 -0
package/agents/false-positive-review.judge.md +12 -0
package/agents/framework-safety.judge.md +7 -0
package/agents/hallucination-detection.judge.md +13 -0
package/agents/iac-security.judge.md +7 -0
package/agents/intent-alignment.judge.md +13 -0
package/agents/logging-privacy.judge.md +7 -0
package/agents/maintainability.judge.md +7 -0
package/agents/multi-turn-coherence.judge.md +7 -0
package/agents/observability.judge.md +7 -0
package/agents/portability.judge.md +7 -0
package/agents/rate-limiting.judge.md +7 -0
package/agents/reliability.judge.md +7 -0
package/agents/security.judge.md +13 -0
package/agents/testing.judge.md +7 -0
package/agents/ux.judge.md +7 -0
package/dist/a2a-protocol.d.ts +136 -0
package/dist/a2a-protocol.js +218 -0
package/dist/api.d.ts +21 -3
package/dist/api.js +21 -1
package/dist/audit-trail.d.ts +245 -0
package/dist/audit-trail.js +257 -0
package/dist/commands/benchmark-advanced.js +51 -51
package/dist/commands/benchmark-ai-agents.js +16 -16
package/dist/commands/benchmark-compliance-ethics.js +12 -12
package/dist/commands/benchmark-expanded-2.js +2 -2
package/dist/commands/benchmark-expanded.js +2 -2
package/dist/commands/benchmark-infrastructure.js +12 -12
package/dist/commands/benchmark-languages.js +11 -11
package/dist/commands/benchmark-quality-ops.js +7 -7
package/dist/commands/benchmark-security-deep.js +9 -9
package/dist/commands/benchmark.js +1 -1
package/dist/commands/llm-benchmark-optimizer.d.ts +78 -0
package/dist/commands/llm-benchmark-optimizer.js +241 -0
package/dist/commands/llm-benchmark.d.ts +4 -2
package/dist/commands/llm-benchmark.js +40 -12
package/dist/escalation.d.ts +100 -0
package/dist/escalation.js +292 -0
package/dist/evaluation-session.d.ts +74 -0
package/dist/evaluation-session.js +152 -0
package/dist/evaluators/index.d.ts +23 -1
package/dist/evaluators/index.js +192 -3
package/dist/evaluators/judge-selector.d.ts +19 -0
package/dist/evaluators/judge-selector.js +141 -0
package/dist/evaluators/recall-boost.d.ts +27 -0
package/dist/evaluators/recall-boost.js +409 -0
package/dist/feedback-loop.d.ts +62 -0
package/dist/feedback-loop.js +179 -0
package/dist/index.js +2 -0
package/dist/judges/accessibility.js +7 -0
package/dist/judges/agent-instructions.js +7 -0
package/dist/judges/ai-code-safety.js +7 -0
package/dist/judges/api-contract.js +7 -0
package/dist/judges/api-design.js +7 -0
package/dist/judges/authentication.js +7 -0
package/dist/judges/backwards-compatibility.js +7 -0
package/dist/judges/caching.js +7 -0
package/dist/judges/ci-cd.js +7 -0
package/dist/judges/cloud-readiness.js +7 -0
package/dist/judges/concurrency.js +7 -0
package/dist/judges/configuration-management.js +7 -0
package/dist/judges/cybersecurity.js +7 -0
package/dist/judges/data-security.js +7 -0
package/dist/judges/dependency-health.js +7 -0
package/dist/judges/documentation.js +7 -0
package/dist/judges/error-handling.js +7 -0
package/dist/judges/ethics-bias.js +7 -0
package/dist/judges/false-positive-review.js +13 -1
package/dist/judges/framework-safety.js +7 -0
package/dist/judges/hallucination-detection.js +14 -1
package/dist/judges/iac-security.js +7 -0
package/dist/judges/intent-alignment.js +14 -1
package/dist/judges/logging-privacy.js +7 -0
package/dist/judges/maintainability.js +7 -0
package/dist/judges/multi-turn-coherence.js +7 -0
package/dist/judges/observability.js +7 -0
package/dist/judges/portability.js +7 -0
package/dist/judges/rate-limiting.js +7 -0
package/dist/judges/reliability.js +7 -0
package/dist/judges/security.js +14 -1
package/dist/judges/testing.js +7 -0
package/dist/judges/ux.js +7 -0
package/dist/review-conversation.d.ts +87 -0
package/dist/review-conversation.js +307 -0
package/dist/sast-integration.d.ts +112 -0
package/dist/sast-integration.js +215 -0
package/dist/tools/register-evaluation.js +208 -8
package/dist/tools/register-fix.js +24 -1
package/dist/tools/register-resources.d.ts +6 -0
package/dist/tools/register-resources.js +177 -0
package/dist/tools/register-review.js +26 -1
package/dist/tools/register-workflow.js +384 -11
package/dist/tools/validation.d.ts +13 -0
package/dist/tools/validation.js +77 -0
package/dist/types.d.ts +122 -0
package/package.json +25 -12
package/server.json +2 -2

package/dist/tools/register-evaluation.js CHANGED Viewed

@@ -5,10 +5,12 @@ import { z } from "zod";
 import { readFileSync, existsSync } from "fs";
 import { extname } from "path";
 import { JUDGES, getJudge, getJudgeSummaries } from "../judges/index.js";
-import { evaluateWithJudge, evaluateWithTribunal, formatVerdictAsMarkdown, formatEvaluationAsMarkdown, } from "../evaluators/index.js";
+import { evaluateWithJudge, evaluateWithTribunal, evaluateWithTribunalStreaming, formatVerdictAsMarkdown, formatEvaluationAsMarkdown, } from "../evaluators/index.js";
 import { evaluateCodeV2, evaluateProjectV2, getSupportedPolicyProfiles } from "../evaluators/v2.js";
 import { detectProjectContext } from "../evaluators/shared.js";
+import { getGlobalSession } from "../evaluation-session.js";
 import { configSchema, toJudgesConfig } from "./schemas.js";
+import { validateCodeSize } from "./validation.js";
 import { buildSingleJudgeDeepReviewSection, buildTribunalDeepReviewSection } from "./deep-review.js";
 /**
  * Register evaluation-focused tools: get_judges, evaluate_code,
@@ -20,6 +22,7 @@ export function registerEvaluationTools(server) {
     registerEvaluateSingleJudge(server);
     registerEvaluateV2(server);
     registerEvaluateFile(server);
+    registerEvaluateCodeStreaming(server);
 }
 // ─── get_judges ──────────────────────────────────────────────────────────────
 function registerGetJudges(server) {
@@ -34,6 +37,15 @@ function registerGetJudges(server) {
                     type: "text",
                     text: `# Judges Panel\n\n${text}`,
                 },
+                {
+                    type: "text",
+                    text: "```json\n" +
+                        JSON.stringify({
+                            judgeCount: judges.length,
+                            judges: judges.map((j) => ({ id: j.id, name: j.name, domain: j.domain })),
+                        }, null, 2) +
+                        "\n```",
+                },
             ],
         };
     });
@@ -70,20 +82,52 @@ function registerEvaluateCode(server) {
         config: configSchema,
     }, async ({ code, language, context, includeAstFindings, minConfidence, relatedFiles, config }) => {
         try {
+            const sizeError = validateCodeSize(code);
+            if (sizeError) {
+                return { content: [{ type: "text", text: `Error: ${sizeError}` }], isError: true };
+            }
+            const session = getGlobalSession();
             const verdict = evaluateWithTribunal(code, language, context, {
                 includeAstFindings,
                 minConfidence,
                 config: toJudgesConfig(config),
+                adaptiveSelection: true,
+                filePath: context,
             });
+            // Track evaluation in session
+            session.recordEvaluation(context ?? `<inline:${language}>`, code, verdict);
             const projectContext = detectProjectContext(code, language);
             const patternResults = formatVerdictAsMarkdown(verdict);
             const deepReview = buildTribunalDeepReviewSection(JUDGES, language, context, relatedFiles, projectContext);
+            // Structured JSON content block for programmatic consumption
+            const structuredData = {
+                score: verdict.overallScore,
+                verdict: verdict.overallVerdict,
+                findingCount: verdict.findings.length,
+                criticalCount: verdict.findings.filter((f) => f.severity === "critical").length,
+                highCount: verdict.findings.filter((f) => f.severity === "high").length,
+                judgesRun: verdict.evaluations.length,
+                findings: verdict.findings.map((f) => ({
+                    ruleId: f.ruleId,
+                    severity: f.severity,
+                    title: f.title,
+                    lineNumbers: f.lineNumbers,
+                    confidence: f.confidence,
+                })),
+                sessionStats: {
+                    evaluationCount: session.evaluationCount,
+                },
+            };
             return {
                 content: [
                     {
                         type: "text",
                         text: patternResults + deepReview,
                     },
+                    {
+                        type: "text",
+                        text: "```json\n" + JSON.stringify(structuredData, null, 2) + "\n```",
+                    },
                 ],
             };
         }
@@ -130,6 +174,10 @@ function registerEvaluateSingleJudge(server) {
         config: configSchema,
     }, async ({ code, language, judgeId, context, minConfidence, relatedFiles, config }) => {
         try {
+            const sizeError = validateCodeSize(code);
+            if (sizeError) {
+                return { content: [{ type: "text", text: `Error: ${sizeError}` }], isError: true };
+            }
             const judge = getJudge(judgeId);
             if (!judge) {
                 return {
@@ -149,12 +197,25 @@ function registerEvaluateSingleJudge(server) {
             const projectContext = detectProjectContext(code, language);
             const patternResults = formatEvaluationAsMarkdown(evaluation);
             const deepReview = buildSingleJudgeDeepReviewSection(judge, language, context, relatedFiles, projectContext);
+            const structured = {
+                judgeId,
+                judgeName: judge.name,
+                domain: judge.domain,
+                score: evaluation.score,
+                verdict: evaluation.verdict,
+                findingCount: evaluation.findings.length,
+                findings: evaluation.findings.map((f) => ({
+                    ruleId: f.ruleId,
+                    severity: f.severity,
+                    title: f.title,
+                    lineNumbers: f.lineNumbers,
+                    confidence: f.confidence,
+                })),
+            };
             return {
                 content: [
-                    {
-                        type: "text",
-                        text: patternResults + deepReview,
-                    },
+                    { type: "text", text: patternResults + deepReview },
+                    { type: "text", text: "```json\n" + JSON.stringify(structured, null, 2) + "\n```" },
                 ],
             };
         }
@@ -173,7 +234,7 @@ function registerEvaluateSingleJudge(server) {
 }
 // ─── evaluate_v2 ─────────────────────────────────────────────────────────────
 function registerEvaluateV2(server) {
-    server.tool("evaluate_v2", "Run V2 context-aware tribunal evaluation with policy profiles, evidence calibration, specialty feedback, confidence scoring, and uncertainty reporting.", {
+    server.tool("evaluate_policy_aware", "Run policy-aware tribunal evaluation with named policy profiles (startup, regulated, healthcare, fintech, public-sector), evidence calibration from runtime metrics, specialty-per-judge feedback, confidence scoring, and uncertainty reporting. Use this when code must meet specific compliance or vertical requirements.", {
         code: z.string().optional().describe("Source code for single-file mode"),
         language: z.string().optional().describe("Language for single-file mode"),
         files: z
@@ -263,7 +324,7 @@ function registerEvaluateV2(server) {
                     evaluationContext,
                     evidence,
                 });
-            let md = `# V2 Tribunal Evaluation\n\n`;
+            let md = `# Policy-Aware Tribunal Evaluation\n\n`;
             md += `**Policy Profile:** ${result.policyProfile}\n`;
             md += `**Calibrated Verdict:** ${result.calibratedVerdict.toUpperCase()} (${result.calibratedScore}/100)\n`;
             md += `**Base Verdict:** ${result.baseVerdict.overallVerdict.toUpperCase()} (${result.baseVerdict.overallScore}/100)\n`;
@@ -310,7 +371,28 @@ function registerEvaluateV2(server) {
             md += `\n## Supported Policy Profiles\n\n`;
             md += supportedProfiles.map((profile) => `- ${profile}`).join("\n");
             md += "\n";
-            return { content: [{ type: "text", text: md }] };
+            const structured = {
+                policyProfile: result.policyProfile,
+                calibratedScore: result.calibratedScore,
+                calibratedVerdict: result.calibratedVerdict,
+                baseScore: result.baseVerdict.overallScore,
+                baseVerdict: result.baseVerdict.overallVerdict,
+                confidence: result.confidence,
+                findingCount: result.findings.length,
+                findings: result.findings.map((f) => ({
+                    ruleId: f.ruleId,
+                    severity: f.severity,
+                    title: f.title,
+                    confidence: f.confidence,
+                })),
+                uncertainty: result.uncertainty,
+            };
+            return {
+                content: [
+                    { type: "text", text: md },
+                    { type: "text", text: "```json\n" + JSON.stringify(structured, null, 2) + "\n```" },
+                ],
+            };
         }
         catch (error) {
             return {
@@ -382,20 +464,60 @@ function registerEvaluateFile(server) {
             }
             const code = readFileSync(filePath, "utf-8");
             const detectedLang = language || detectLanguageFromPath(filePath);
+            const session = getGlobalSession();
+            // Skip re-evaluation if verdict is stable for this file
+            if (session.isVerdictStable(filePath)) {
+                const history = session.getVerdictHistory(filePath);
+                return {
+                    content: [
+                        {
+                            type: "text",
+                            text: `# Evaluation: ${filePath}\n\n` +
+                                `> ⚡ **Verdict stable** — score has converged at **${history[0]?.score ?? 0}/100** ` +
+                                `across last evaluations. Skipping redundant re-evaluation.\n\n` +
+                                `Use \`evaluate_code\` with the code directly to force a fresh evaluation.`,
+                        },
+                    ],
+                };
+            }
             const verdict = evaluateWithTribunal(code, detectedLang, context, {
                 includeAstFindings,
                 minConfidence,
                 config: toJudgesConfig(config),
+                adaptiveSelection: true,
+                filePath,
             });
+            session.recordEvaluation(filePath, code, verdict);
             const projectContext = detectProjectContext(code, detectedLang, filePath);
             const patternResults = formatVerdictAsMarkdown(verdict);
             const deepReview = buildTribunalDeepReviewSection(JUDGES, detectedLang, context, undefined, projectContext);
+            const structuredData = {
+                filePath,
+                language: detectedLang,
+                score: verdict.overallScore,
+                verdict: verdict.overallVerdict,
+                findingCount: verdict.findings.length,
+                criticalCount: verdict.findings.filter((f) => f.severity === "critical").length,
+                highCount: verdict.findings.filter((f) => f.severity === "high").length,
+                judgesRun: verdict.evaluations.length,
+                findings: verdict.findings.map((f) => ({
+                    ruleId: f.ruleId,
+                    severity: f.severity,
+                    title: f.title,
+                    lineNumbers: f.lineNumbers,
+                    confidence: f.confidence,
+                })),
+            };
             return {
                 content: [
                     {
                         type: "text",
                         text: `# Evaluation: ${filePath}\n\n` + patternResults + deepReview,
                     },
+                    {
+                        type: "text",
+                        text: "```json\n" + JSON.stringify(structuredData, null, 2) + "\n```",
+                    },
                 ],
             };
         }
@@ -412,3 +534,81 @@ function registerEvaluateFile(server) {
         }
     });
 }
+// ─── evaluate_code_streaming ─────────────────────────────────────────────────
+function registerEvaluateCodeStreaming(server) {
+    server.tool("evaluate_code_streaming", `Submit code for streaming evaluation — returns per-judge results as each judge completes, with running aggregate scores. Ideal for long evaluations where you want progressive feedback. All ${JUDGES.length} judges run sequentially with per-judge results accumulated into a single structured response.`, {
+        code: z.string().describe("The source code to evaluate."),
+        language: z.string().describe("The programming language (e.g., 'typescript', 'python', 'javascript')."),
+        context: z.string().optional().describe("Optional context about the code."),
+        includeAstFindings: z.boolean().optional().describe("Include AST/code-structure findings (default: true)"),
+        minConfidence: z
+            .number()
+            .min(0)
+            .max(1)
+            .optional()
+            .describe("Minimum finding confidence to include (0-1, default: 0)"),
+        config: configSchema,
+    }, async ({ code, language, context, includeAstFindings, minConfidence, config }) => {
+        try {
+            const session = getGlobalSession();
+            const batches = [];
+            let finalBatch;
+            for await (const batch of evaluateWithTribunalStreaming(code, language, context, {
+                includeAstFindings,
+                minConfidence,
+                config: toJudgesConfig(config),
+                adaptiveSelection: true,
+            })) {
+                batches.push({
+                    judgeId: batch.judgeId,
+                    judgeName: batch.judgeName,
+                    findingCount: batch.evaluation.findings.length,
+                    durationMs: batch.evaluation.durationMs ?? 0,
+                    runningScore: batch.aggregate.currentScore,
+                    runningVerdict: batch.aggregate.currentVerdict,
+                });
+                finalBatch = batch;
+            }
+            // Build progressive markdown
+            let md = `# Streaming Evaluation Results\n\n`;
+            md += `**Final Score:** ${finalBatch?.aggregate.currentScore ?? 0}/100\n`;
+            md += `**Verdict:** ${(finalBatch?.aggregate.currentVerdict ?? "pass").toUpperCase()}\n`;
+            md += `**Judges Run:** ${finalBatch?.aggregate.completedJudges ?? 0}/${finalBatch?.aggregate.totalJudges ?? 0}\n`;
+            md += `**Total Findings:** ${finalBatch?.aggregate.findingsSoFar ?? 0}\n\n`;
+            md += `## Per-Judge Breakdown\n\n`;
+            md += `| Judge | Findings | Time (ms) | Running Score |\n`;
+            md += `|-------|----------|-----------|---------------|\n`;
+            for (const b of batches) {
+                md += `| ${b.judgeName} | ${b.findingCount} | ${b.durationMs} | ${b.runningScore}/100 |\n`;
+            }
+            const structuredData = {
+                score: finalBatch?.aggregate.currentScore ?? 0,
+                verdict: finalBatch?.aggregate.currentVerdict ?? "pass",
+                totalFindings: finalBatch?.aggregate.findingsSoFar ?? 0,
+                criticalFindings: finalBatch?.aggregate.criticalSoFar ?? 0,
+                highFindings: finalBatch?.aggregate.highSoFar ?? 0,
+                judgesRun: finalBatch?.aggregate.completedJudges ?? 0,
+                totalJudges: finalBatch?.aggregate.totalJudges ?? 0,
+                perJudge: batches,
+                sessionEvaluationCount: session.evaluationCount,
+            };
+            return {
+                content: [
+                    { type: "text", text: md },
+                    { type: "text", text: "```json\n" + JSON.stringify(structuredData, null, 2) + "\n```" },
+                ],
+            };
+        }
+        catch (error) {
+            return {
+                content: [
+                    {
+                        type: "text",
+                        text: error instanceof Error ? `Error: ${error.message}` : "Error: Streaming evaluation failed",
+                    },
+                ],
+                isError: true,
+            };
+        }
+    });
+}

package/dist/tools/register-fix.js CHANGED Viewed

@@ -7,6 +7,7 @@ import { evaluateWithTribunal, evaluateWithJudge } from "../evaluators/index.js"
 import { getJudge, JUDGES } from "../judges/index.js";
 import { applyPatches } from "../commands/fix.js";
 import { configSchema, toJudgesConfig } from "./schemas.js";
+import { validateCodeSize } from "./validation.js";
 /**
  * Register the fix_code tool for one-shot code evaluation + auto-fix.
  */
@@ -38,6 +39,10 @@ function registerFixCode(server) {
         config: configSchema,
     }, async ({ code, language, judgeId, context, minConfidence, config }) => {
         try {
+            const sizeError = validateCodeSize(code);
+            if (sizeError) {
+                return { content: [{ type: "text", text: `Error: ${sizeError}` }], isError: true };
+            }
             const effectiveMinConfidence = minConfidence ?? 0.5;
             // ── Evaluate ────────────────────────────────────────────────
             let allFindings;
@@ -133,8 +138,26 @@ function registerFixCode(server) {
                 text += `\n`;
             }
             text += `### Fixed Code\n\n\`\`\`${language}\n${fixedCode}\n\`\`\`\n`;
+            const structured = {
+                totalFindings: allFindings.length,
+                autoFixable: fixable.length,
+                applied,
+                skipped,
+                remaining: remaining.length,
+                patches: fixable.map((p) => ({
+                    ruleId: p.ruleId,
+                    severity: p.severity,
+                    title: p.title,
+                    line: p.patch.startLine,
+                    oldText: p.patch.oldText,
+                    newText: p.patch.newText,
+                })),
+            };
             return {
-                content: [{ type: "text", text }],
+                content: [
+                    { type: "text", text },
+                    { type: "text", text: "```json\n" + JSON.stringify(structured, null, 2) + "\n```" },
+                ],
             };
         }
         catch (error) {

package/dist/tools/register-resources.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+import type { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
+/**
+ * Register MCP resources: judges catalog, presets, session state,
+ * and parameterized templates for single-judge / single-preset lookups.
+ *
+ * @param server - The MCP server instance the resources are registered on.
+ */
+export declare function registerResources(server: McpServer): void;

package/dist/tools/register-resources.js ADDED Viewed

@@ -0,0 +1,177 @@
+// ─── MCP Resource Registration ───────────────────────────────────────────────
+// Expose judges metadata, presets, and session state as MCP resources.
+// Includes both static resources and parameterized resource templates for
+// efficient single-item lookups (judges://judge/{id}, judges://preset/{key}).
+// ──────────────────────────────────────────────────────────────────────────────
+import { ResourceTemplate } from "@modelcontextprotocol/sdk/server/mcp.js";
+import { getJudge, getJudgeSummaries, JUDGES } from "../judges/index.js";
+import { getPreset, PRESETS } from "../presets.js";
+import { getGlobalSession } from "../evaluation-session.js";
+/**
+ * Register MCP resources: judges catalog, presets, session state,
+ * and parameterized templates for single-judge / single-preset lookups.
+ */
+export function registerResources(server) {
+    registerJudgesCatalog(server);
+    registerPresetsResource(server);
+    registerSessionResource(server);
+    registerJudgeTemplate(server);
+    registerPresetTemplate(server);
+}
+// ─── judges://catalog ────────────────────────────────────────────────────────
+function registerJudgesCatalog(server) {
+    server.resource("judges-catalog", "judges://catalog", { description: "Full catalog of all judges on the panel — IDs, names, domains, and descriptions." }, async (uri) => {
+        const judges = getJudgeSummaries();
+        const data = judges.map((j) => ({
+            id: j.id,
+            name: j.name,
+            domain: j.domain,
+            description: j.description,
+        }));
+        return {
+            contents: [
+                {
+                    uri: uri.href,
+                    mimeType: "application/json",
+                    text: JSON.stringify(data, null, 2),
+                },
+            ],
+        };
+    });
+}
+// ─── judges://presets ────────────────────────────────────────────────────────
+function registerPresetsResource(server) {
+    server.resource("presets", "judges://presets", { description: "Available evaluation presets with names, descriptions, and configuration overrides." }, async (uri) => {
+        const data = Object.entries(PRESETS).map(([key, preset]) => ({
+            key,
+            name: preset.name,
+            description: preset.description,
+            config: preset.config,
+        }));
+        return {
+            contents: [
+                {
+                    uri: uri.href,
+                    mimeType: "application/json",
+                    text: JSON.stringify(data, null, 2),
+                },
+            ],
+        };
+    });
+}
+// ─── judges://session ────────────────────────────────────────────────────────
+function registerSessionResource(server) {
+    server.resource("session", "judges://session", {
+        description: "Current evaluation session state — evaluation count, detected frameworks, verdict history, and stability indicators.",
+    }, async (uri) => {
+        const session = getGlobalSession();
+        const ctx = session.getContext();
+        const filesEvaluated = [...ctx.verdictHistory.entries()].map(([file, history]) => ({
+            file,
+            evaluations: history.length,
+            latestScore: history[history.length - 1]?.score ?? 0,
+            stable: session.isVerdictStable(file),
+        }));
+        const data = {
+            evaluationCount: ctx.evaluationCount,
+            startedAt: ctx.startedAt,
+            frameworks: ctx.frameworks,
+            capabilities: [...ctx.capabilities],
+            filesEvaluated,
+        };
+        return {
+            contents: [
+                {
+                    uri: uri.href,
+                    mimeType: "application/json",
+                    text: JSON.stringify(data, null, 2),
+                },
+            ],
+        };
+    });
+}
+// ─── judges://judge/{id} (template) ─────────────────────────────────────────
+function registerJudgeTemplate(server) {
+    const judgeIds = JUDGES.map((j) => j.id);
+    server.resource("judge-detail", new ResourceTemplate("judges://judge/{id}", {
+        list: async () => ({
+            resources: judgeIds.map((id) => ({
+                uri: `judges://judge/${id}`,
+                name: id,
+            })),
+        }),
+        complete: {
+            id: (value) => judgeIds.filter((id) => id.startsWith(value)),
+        },
+    }), { description: "Detailed info for a single judge — rules, domain, system prompt summary." }, async (uri, { id }) => {
+        const judgeId = Array.isArray(id) ? id[0] : id;
+        const judge = getJudge(judgeId);
+        if (!judge) {
+            return {
+                contents: [
+                    {
+                        uri: uri.href,
+                        mimeType: "application/json",
+                        text: JSON.stringify({ error: `Judge '${judgeId}' not found` }),
+                    },
+                ],
+            };
+        }
+        const data = {
+            id: judge.id,
+            name: judge.name,
+            domain: judge.domain,
+            description: judge.description,
+            rulePrefix: judge.rulePrefix,
+            tableDescription: judge.tableDescription,
+            promptDescription: judge.promptDescription,
+        };
+        return {
+            contents: [
+                {
+                    uri: uri.href,
+                    mimeType: "application/json",
+                    text: JSON.stringify(data, null, 2),
+                },
+            ],
+        };
+    });
+}
+// ─── judges://preset/{key} (template) ───────────────────────────────────────
+function registerPresetTemplate(server) {
+    const presetKeys = Object.keys(PRESETS);
+    server.resource("preset-detail", new ResourceTemplate("judges://preset/{key}", {
+        list: async () => ({
+            resources: presetKeys.map((key) => ({
+                uri: `judges://preset/${key}`,
+                name: key,
+            })),
+        }),
+        complete: {
+            key: (value) => presetKeys.filter((k) => k.startsWith(value)),
+        },
+    }), { description: "Detailed configuration for a single evaluation preset." }, async (uri, { key }) => {
+        const presetKey = Array.isArray(key) ? key[0] : key;
+        const preset = getPreset(presetKey);
+        if (!preset) {
+            return {
+                contents: [
+                    {
+                        uri: uri.href,
+                        mimeType: "application/json",
+                        text: JSON.stringify({ error: `Preset '${presetKey}' not found` }),
+                    },
+                ],
+            };
+        }
+        return {
+            contents: [
+                {
+                    uri: uri.href,
+                    mimeType: "application/json",
+                    text: JSON.stringify({ key: presetKey, ...preset }, null, 2),
+                },
+            ],
+        };
+    });
+}

package/dist/tools/register-review.js CHANGED Viewed

@@ -115,8 +115,21 @@ function registerExplainFinding(server) {
             sections.push(`\n## Remediation\n${remediation}`);
         }
         sections.push(`\n## Next steps\n- Use \`triage_finding\` to accept, defer, or dismiss this finding\n- Use \`fix_code\` to auto-fix if a patch is available\n- Use \`evaluate_code\` to re-evaluate after fixing`);
+        const structured = {
+            ruleId,
+            prefix,
+            title: title ?? null,
+            severity: severity ?? null,
+            owasp: ctx?.owasp ?? null,
+            cwe: ctx?.cwe ?? null,
+            learn: ctx?.learn ?? null,
+            remediation: getRemediationGuidance(prefix) ?? null,
+        };
         return {
-            content: [{ type: "text", text: sections.join("\n") }],
+            content: [
+                { type: "text", text: sections.join("\n") },
+                { type: "text", text: "```json\n" + JSON.stringify(structured, null, 2) + "\n```" },
+            ],
         };
     });
 }
@@ -173,6 +186,18 @@ function registerTriageFinding(server) {
                         type: "text",
                         text: `✓ Triaged finding \`${result.ruleId}\` in ${result.filePath} as **${status}**${reason ? `\n\nReason: ${reason}` : ""}${triagedBy ? `\nTriaged by: ${triagedBy}` : ""}`,
                     },
+                    {
+                        type: "text",
+                        text: "```json\n" +
+                            JSON.stringify({
+                                ruleId: result.ruleId,
+                                filePath: result.filePath,
+                                status,
+                                reason: reason ?? null,
+                                triagedBy: triagedBy ?? null,
+                            }, null, 2) +
+                            "\n```",
+                    },
                 ],
             };
         }