npm - @sanity/ailf - Versions diffs - 4.6.0 → 6.0.0 - Mend

@sanity/ailf 4.6.0 → 6.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (185) hide show

package/dist/adapters/task-sources/repo-schemas.d.ts CHANGED Viewed

@@ -32,6 +32,40 @@ export type CuratedAssertionType = (typeof CURATED_ASSERTION_TYPES)[number];
  */
 export declare const RUBRIC_TEMPLATE_NAMES: readonly ["task-completion", "code-correctness", "doc-coverage", "mcp-input-validation", "mcp-output-correctness", "mcp-error-handling", "mcp-security", "factual-correctness", "completeness", "currency", "process-quality", "agent-output", "agent-tool-usage"];
 export type RubricTemplateName = (typeof RUBRIC_TEMPLATE_NAMES)[number];
+/**
+ * Zod object schema for a single criterion within an llm-rubric assertion: a stable pair of string `id` and string `text`.
+ */
+export declare const CriterionRefSchema: z.ZodObject<{
+    id: z.ZodString;
+    text: z.ZodString;
+}, z.core.$strip>;
+/**
+ * A templated LLM-rubric assertion — one of the predefined rubric templates
+ * plus author-supplied `{ id, text }` criteria and an optional numeric `weight`.
+ */
+export declare const TemplatedAssertionSchema: z.ZodObject<{
+    type: z.ZodLiteral<"llm-rubric">;
+    template: z.ZodEnum<{
+        "task-completion": "task-completion";
+        "code-correctness": "code-correctness";
+        "doc-coverage": "doc-coverage";
+        "mcp-input-validation": "mcp-input-validation";
+        "mcp-output-correctness": "mcp-output-correctness";
+        "mcp-error-handling": "mcp-error-handling";
+        "mcp-security": "mcp-security";
+        "factual-correctness": "factual-correctness";
+        completeness: "completeness";
+        currency: "currency";
+        "process-quality": "process-quality";
+        "agent-output": "agent-output";
+        "agent-tool-usage": "agent-tool-usage";
+    }>;
+    criteria: z.ZodArray<z.ZodObject<{
+        id: z.ZodString;
+        text: z.ZodString;
+    }, z.core.$strip>>;
+    weight: z.ZodOptional<z.ZodNumber>;
+}, z.core.$strip>;
 /**
  * Zod schema for a single task definition — a mode-discriminated union
  * mirroring `GeneralizedTaskDefinition`.
@@ -73,7 +107,10 @@ export declare const CanonicalTaskSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -187,7 +224,10 @@ export declare const CanonicalTaskSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -341,7 +381,10 @@ export declare const CanonicalTaskSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -472,7 +515,10 @@ export declare const CanonicalTaskSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -591,7 +637,10 @@ export declare const CanonicalTaskSchema: z.ZodDiscriminatedUnion<[z.ZodObject<{
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -699,7 +748,10 @@ export declare const ContentLakeAuthorableTaskSchema: z.ZodObject<{
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -819,7 +871,10 @@ export declare const CanonicalTaskFileSchema: z.ZodArray<z.ZodDiscriminatedUnion
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -933,7 +988,10 @@ export declare const CanonicalTaskFileSchema: z.ZodArray<z.ZodDiscriminatedUnion
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -1087,7 +1145,10 @@ export declare const CanonicalTaskFileSchema: z.ZodArray<z.ZodDiscriminatedUnion
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -1218,7 +1279,10 @@ export declare const CanonicalTaskFileSchema: z.ZodArray<z.ZodDiscriminatedUnion
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -1337,7 +1401,10 @@ export declare const CanonicalTaskFileSchema: z.ZodArray<z.ZodDiscriminatedUnion
             "agent-output": "agent-output";
             "agent-tool-usage": "agent-tool-usage";
         }>;
-        criteria: z.ZodArray<z.ZodString>;
+        criteria: z.ZodArray<z.ZodObject<{
+            id: z.ZodString;
+            text: z.ZodString;
+        }, z.core.$strip>>;
         weight: z.ZodOptional<z.ZodNumber>;
     }, z.core.$strip>, z.ZodObject<{
         type: z.ZodEnum<{
@@ -1468,6 +1535,7 @@ export declare const RepoConfigSchema: z.ZodObject<{
     execution: z.ZodOptional<z.ZodObject<{
         concurrency: z.ZodOptional<z.ZodNumber>;
         graderReplications: z.ZodOptional<z.ZodNumber>;
+        borderlineReplications: z.ZodOptional<z.ZodNumber>;
         gapAnalysis: z.ZodOptional<z.ZodBoolean>;
         apiUrl: z.ZodOptional<z.ZodString>;
     }, z.core.$strip>>;

package/dist/adapters/task-sources/repo-schemas.js CHANGED Viewed

@@ -111,14 +111,26 @@ const CanonicalDocRefSchema = z.union([
 // ---------------------------------------------------------------------------
 // Assertion schemas
 // ---------------------------------------------------------------------------
+/**
+ * A single criterion within an llm-rubric assertion. Stable id-text pair: `id` is non-empty, made of lowercase letters, digits and hyphens, and must not start with a hyphen; `text` is non-empty.
+ */
+export const CriterionRefSchema = z.object({
+    id: z
+        .string()
+        .min(1)
+        .regex(/^[a-z0-9][a-z0-9-]*$/, {
+        message: "criterion id must be lowercase alphanumeric with hyphens",
+    }),
+    text: z.string().min(1),
+});
 /**
  * A templated LLM-rubric assertion — uses one of the predefined rubric
  * templates with author-supplied criteria.
  */
-const TemplatedAssertionSchema = z.object({
+export const TemplatedAssertionSchema = z.object({
     type: z.literal("llm-rubric"),
     template: z.enum(RUBRIC_TEMPLATE_NAMES),
-    criteria: z.array(z.string().min(1)).min(1),
+    criteria: z.array(CriterionRefSchema).min(1),
     weight: z.number().optional(),
 });
 /**
@@ -562,6 +574,11 @@ const ExecutionConfigSchema = z
     .object({
     concurrency: z.number().int().positive().optional(),
     graderReplications: z.number().int().positive().optional(),
+    /**
+     * Plan 03-04 GRAD-04 — replications per borderline judgment.
+     * Default 3 (composition-root). Positive integer.
+     */
+    borderlineReplications: z.number().int().positive().optional(),
     gapAnalysis: z.boolean().optional(),
     apiUrl: z.string().url().optional(),
 })

package/dist/cli-program.js CHANGED Viewed

@@ -32,6 +32,7 @@ import { createFetchDocsCommand } from "./commands/fetch-docs.js";
 import { createGenerateConfigsCommand } from "./commands/generate-configs.js";
 import { createGraderCommand } from "./commands/grader/index.js";
 import { createInitCommand } from "./commands/init.js";
+import { createInterpretCommand } from "./commands/interpret.js";
 import { createInteractiveCommand } from "./commands/interactive.js";
 import { createLookupDocCommand } from "./commands/lookup-doc.js";
 import { createMeasureRetrievalCommand } from "./commands/measure-retrieval.js";
@@ -110,6 +111,8 @@ export function buildCliProgram(opts) {
         .addCommand(createWeeklyDigestCommand())
         .addCommand(createCheckStalenessCommand());
     program.addCommand(reportCommand.helpGroup(CommandGroup.AnalysisReports));
+    // `ailf interpret <reportId>` — top-level (not nested under report) per AI-SPEC
+    program.addCommand(createInterpretCommand().helpGroup(CommandGroup.AnalysisReports));
     // ── Grader Reliability ────────────────────────────────────────────────
     program.addCommand(createGraderCommand().helpGroup(CommandGroup.GraderReliability));
     // ── Setup & Configuration ─────────────────────────────────────────────

package/dist/commands/calculate-scores.js CHANGED Viewed

@@ -38,7 +38,7 @@ export function createCalculateScoresCommand() {
                 remote: false,
                 apiUrl: "https://ailf-api.sanity.build",
             });
-            const result = calculateAndWriteScores({
+            const result = await calculateAndWriteScores({
                 resultsPath,
                 rootDir: ctx.config.rootDir,
                 source: opts.source,

package/dist/commands/explain-handler.js CHANGED Viewed

@@ -298,7 +298,7 @@ const EXPLAIN_REGISTRY = {
         ],
     },
     "lookup-doc": {
-        description: "Search Sanity for documentation articles by keyword (find slugs for canonicalDocs)",
+        description: "Search Sanity for documentation articles by keyword (find slugs for contextDocs)",
         steps: [
             {
                 cacheStatus: "miss",

package/dist/commands/interpret.d.ts ADDED Viewed

@@ -0,0 +1,50 @@
+/**
+ * interpret command — generate a Diagnosis for a Report.
+ *
+ * Wraps `getDiagnosisRunner(ctx)` from the composition root in a Commander
+ * command for consistent CLI integration. Closest analog: compare.ts.
+ *
+ * Entry points:
+ *   ailf interpret <reportId>          — one-line-per-card summary
+ *   ailf interpret <reportId> --json   — full Diagnosis JSON
+ *   ailf interpret latest              — most recent report
+ *   ailf interpret <id> --compare <ref>  — DIAG-05 regression comparison
+ *   ailf interpret <id> --refresh      — bypass version-keyed cache
+ *
+ * @see packages/eval/src/commands/compare.ts — CLI factory analog
+ * @see packages/eval/src/composition-root.ts — getDiagnosisRunner
+ * @see .planning/phases/05-diagnosis-engine-cli-llm-cards/05-AI-SPEC.md §6
+ */
+import { Command } from "commander";
+import type { DiagnosisRunner, VersionedInputs } from "../_vendor/ailf-core/index.d.ts";
+interface MinimalReportStore {
+    read(id: string): Promise<unknown | null>;
+    latest(): Promise<unknown | null>;
+}
+export interface InterpretCommandOptions {
+    /**
+     * Override the runner factory for tests. When omitted, the command
+     * imports `getDiagnosisRunner` from the composition root at action time.
+     */
+    readonly runnerFactory?: (ctx: unknown) => DiagnosisRunner;
+    /**
+     * Override the store factory for tests. When omitted, the command
+     * creates the app context and uses `ctx.reportStore` at action time.
+     */
+    readonly storeFactory?: () => MinimalReportStore | null;
+    /**
+     * Override the versions resolver for tests. Receives the stored report
+     * record and returns the `VersionedInputs` needed by the runner.
+     * When omitted, the command derives versions from the report's metadata.
+     */
+    readonly versionsFromReport?: (report: unknown) => VersionedInputs;
+}
+/**
+ * Create the `ailf interpret <reportId>` Commander command.
+ *
+ * Accepts optional `InterpretCommandOptions` for testability — tests can
+ * inject a fake runner factory and store factory without touching module
+ * mocks (preferred per testing.md).
+ */
+export declare function createInterpretCommand(options?: InterpretCommandOptions): Command;
+export {};

package/dist/commands/interpret.js ADDED Viewed

@@ -0,0 +1,212 @@
+/**
+ * interpret command — generate a Diagnosis for a Report.
+ *
+ * Wraps `getDiagnosisRunner(ctx)` from the composition root in a Commander
+ * command for consistent CLI integration. Closest analog: compare.ts.
+ *
+ * Entry points:
+ *   ailf interpret <reportId>          — one-line-per-card summary
+ *   ailf interpret <reportId> --json   — full Diagnosis JSON
+ *   ailf interpret latest              — most recent report
+ *   ailf interpret <id> --compare <ref>  — DIAG-05 regression comparison
+ *   ailf interpret <id> --refresh      — bypass version-keyed cache
+ *
+ * @see packages/eval/src/commands/compare.ts — CLI factory analog
+ * @see packages/eval/src/composition-root.ts — getDiagnosisRunner
+ * @see .planning/phases/05-diagnosis-engine-cli-llm-cards/05-AI-SPEC.md §6
+ */
+import { dirname, resolve } from "path";
+import { fileURLToPath } from "url";
+import { Command } from "commander";
+import { addOutputDirOption } from "./shared/options.js";
+import { resolveOutputDir } from "./shared/resolve-output-dir.js";
+// ---------------------------------------------------------------------------
+// Module-level root constant (same pattern as compare.ts)
+// ---------------------------------------------------------------------------
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const ROOT = resolve(__dirname, "..", "..");
+// ---------------------------------------------------------------------------
+// Card output formatting (AI-SPEC §6 graceful-degradation-visibility)
+// ---------------------------------------------------------------------------
+/**
+ * Visual status markers — locked visual contract per plan Test 7:
+ * ready: "✓", degraded: "⚠", missing: "—"
+ */
+const STATUS_ICONS = {
+    ready: "✓",
+    degraded: "⚠",
+    missing: "—",
+};
+function getCardSummaryText(card) {
+    if (card.status === "ready") {
+        return card.body.summary;
+    }
+    if (card.status === "degraded") {
+        return card.reason;
+    }
+    // Any other status (expected: "missing") falls through and also reports card.reason
+    return card.reason;
+}
+/**
+ * Format a single card as a one-line summary string.
+ *
+ * Format: `<icon> <cardType>: <summary>`
+ * Per AI-SPEC §6: distinct icons for ready / degraded / missing.
+ */
+function formatCardSummaryLine(card) {
+    const icon = STATUS_ICONS[card.status];
+    const text = getCardSummaryText(card);
+    return `${icon} ${card.cardType}: ${text}`;
+}
+// ---------------------------------------------------------------------------
+// Default versions resolver
+// ---------------------------------------------------------------------------
+/**
+ * Derive VersionedInputs from a stored report record.
+ *
+ * Each of the four versions is read from `report.summary.versions` when it
+ * is stored there as a string. Otherwise a hard-coded default is used:
+ * "unknown" for graderJudgmentsVersion and ensembleVersion, "0.1.0" for
+ * diagnosisVersion and cardVersion (e.g. legacy reports without versions).
+ */
+function defaultVersionsFromReport(report) {
+    const rec = report;
+    const summary = rec.summary;
+    const versions = summary?.versions;
+    return {
+        graderJudgmentsVersion: typeof versions?.graderJudgmentsVersion === "string"
+            ? versions.graderJudgmentsVersion
+            : "unknown",
+        ensembleVersion: typeof versions?.ensembleVersion === "string"
+            ? versions.ensembleVersion
+            : "unknown",
+        diagnosisVersion: typeof versions?.diagnosisVersion === "string"
+            ? versions.diagnosisVersion
+            : "0.1.0",
+        cardVersion: typeof versions?.cardVersion === "string"
+            ? versions.cardVersion
+            : "0.1.0",
+    };
+}
+// ---------------------------------------------------------------------------
+// Command factory
+// ---------------------------------------------------------------------------
+/**
+ * Create the `ailf interpret <reportId>` Commander command.
+ *
+ * Accepts optional `InterpretCommandOptions` for testability — tests can
+ * inject a fake runner factory and store factory without touching module
+ * mocks (preferred per testing.md).
+ */
+export function createInterpretCommand(options = {}) {
+    const { runnerFactory, storeFactory, versionsFromReport } = options;
+    const cmd = new Command("interpret")
+        .description("Generate a Diagnosis for a Report — 8 typed cards explaining what's weak and what to do")
+        .argument("<reportId>", "Report ID (or 'latest' for the most recent)")
+        .option("-c, --compare <ref>", "Baseline report ID for regression-vs-baseline comparison")
+        .option("--refresh", "Bypass the version-keyed cache and recompute")
+        .option("--json", "Print full Diagnosis JSON instead of one-line-per-card summary")
+        .action(async (reportId, opts) => {
+        const outputDir = resolveOutputDir(opts.outputDir);
+        // ---------------------------------------------------------------------------
+        // Resolve store: injected factory (tests) or composition root (production)
+        // ---------------------------------------------------------------------------
+        let store;
+        let ctx;
+        if (storeFactory) {
+            store = storeFactory();
+            ctx = null;
+        }
+        else {
+            // Production path — lazy import to keep the module fast in tests
+            // Minimal config: report-read-only, no eval/fetch/publish.
+            const { createAppContext } = await import("../composition-root.js");
+            ctx = createAppContext({
+                compareEnabled: false,
+                gapAnalysisEnabled: false,
+                mode: "literacy",
+                noAutoScope: false,
+                noCache: true,
+                noRemoteCache: true,
+                outputDir,
+                publishEnabled: false,
+                rootDir: ROOT,
+                searchMode: "open",
+                skipEval: true,
+                skipFetch: true,
+                remote: false,
+                apiUrl: "https://ailf-api.sanity.build",
+            });
+            const prodCtx = ctx;
+            store = prodCtx.reportStore;
+        }
+        if (!store) {
+            process.stderr.write("Error: report store is not available\n");
+            process.exit(1);
+        }
+        // ---------------------------------------------------------------------------
+        // Resolve main report
+        // ---------------------------------------------------------------------------
+        const report = reportId === "latest"
+            ? await store.latest()
+            : await store.read(reportId);
+        if (!report) {
+            process.stderr.write(`Error: report not found: ${reportId}\n`);
+            process.exit(1);
+        }
+        // ---------------------------------------------------------------------------
+        // Optionally resolve baseline (DIAG-05)
+        // ---------------------------------------------------------------------------
+        let baseline;
+        if (opts.compare) {
+            baseline = await store.read(opts.compare);
+            if (!baseline) {
+                process.stderr.write(`Error: baseline report not found: ${opts.compare}\n`);
+                process.exit(1);
+            }
+        }
+        // ---------------------------------------------------------------------------
+        // Resolve versions
+        // ---------------------------------------------------------------------------
+        const versions = versionsFromReport
+            ? versionsFromReport(report)
+            : defaultVersionsFromReport(report);
+        // ---------------------------------------------------------------------------
+        // Build runner — NOTE(review): ctx is null when storeFactory was injected; confirm getDiagnosisRunner is never reached with a null ctx (i.e. runnerFactory is always injected alongside storeFactory)
+        // ---------------------------------------------------------------------------
+        let runner;
+        if (runnerFactory) {
+            runner = runnerFactory(ctx);
+        }
+        else {
+            const { getDiagnosisRunner } = await import("../composition-root.js");
+            // eslint-disable-next-line @typescript-eslint/no-explicit-any
+            runner = getDiagnosisRunner(ctx);
+        }
+        // ---------------------------------------------------------------------------
+        // Run diagnosis
+        // ---------------------------------------------------------------------------
+        const diagnosis = await runner.run({
+            // The report here is the eval's ReportStore record, which satisfies
+            // the Report interface for runner.run purposes (both carry id + provenance.runId).
+            // eslint-disable-next-line @typescript-eslint/no-explicit-any
+            report: report,
+            versions,
+            ...(baseline ? { baseline: baseline } : {}),
+            refresh: opts.refresh ?? false,
+        });
+        // ---------------------------------------------------------------------------
+        // Print output
+        // ---------------------------------------------------------------------------
+        if (opts.json) {
+            process.stdout.write(`${JSON.stringify(diagnosis, null, 2)}\n`);
+        }
+        else {
+            for (const card of diagnosis.cards) {
+                process.stdout.write(`${formatCardSummaryLine(card)}\n`);
+            }
+        }
+    });
+    addOutputDirOption(cmd);
+    return cmd;
+}

package/dist/commands/lookup-doc.d.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 /**
  * lookup-doc command — search Sanity for documentation articles by keyword.
  *
- * Helps external contributors find the correct `slug` for canonicalDocs
+ * Helps external contributors find the correct `slug` for contextDocs
  * references without needing to browse the CMS or guess from URLs.
  *
  * Usage:

package/dist/commands/lookup-doc.js CHANGED Viewed

@@ -1,7 +1,7 @@
 /**
  * lookup-doc command — search Sanity for documentation articles by keyword.
  *
- * Helps external contributors find the correct `slug` for canonicalDocs
+ * Helps external contributors find the correct `slug` for contextDocs
  * references without needing to browse the CMS or guess from URLs.
  *
  * Usage:
@@ -14,7 +14,7 @@
 import { Command } from "commander";
 export function createLookupDocCommand() {
     return new Command("lookup-doc")
-        .description("Search Sanity docs by keyword — find slugs for canonicalDocs references")
+        .description("Search Sanity docs by keyword — find slugs for contextDocs references")
         .argument("<keyword>", "Search keyword (matches title and slug)")
         .option("-l, --limit <n>", "Maximum results to show", parseInt, 10)
         .option("-s, --source <name>", "Documentation source (from sources.yaml)")
@@ -73,7 +73,7 @@ export function createLookupDocCommand() {
             console.log(`  ${"".padEnd(maxSlugLen + 6)}  │ Section: ${section}\n`);
         }
         console.log("  Usage in .ailf/tasks/*.yaml:\n");
-        console.log("  canonicalDocs:");
+        console.log("  contextDocs:");
         console.log(`    - slug: ${results[0].slug}`);
         console.log(`      reason: "${results[0].title}"`);
         if (results[0].sectionSlug) {

package/dist/commands/pipeline-action.d.ts CHANGED Viewed

@@ -27,6 +27,12 @@ export interface ResolvedOptions {
     dryRun: boolean;
     gapAnalysisEnabled: boolean;
     graderReplications?: number;
+    /**
+     * Replications per borderline judgment for the GRAD-04 intra-grader
+     * consensus pass. Sourced from `.ailf/config.yaml`'s
+     * `execution.borderlineReplications`.
+     */
+    borderlineReplications?: number;
     /** Grader context policy from `.ailf/config.yaml` `grader.context` */
     graderContext?: "rubric-only" | "with-docs";
     headerArgs: string[];

package/dist/commands/pipeline-action.js CHANGED Viewed

@@ -248,6 +248,7 @@ export function computeResolvedOptions(opts) {
     //   env var (where one exists) > .ailf/config.yaml > built-in default
     const concurrency = repoConfig?.execution?.concurrency;
     const graderReplications = repoConfig?.execution?.graderReplications;
+    const borderlineReplications = repoConfig?.execution?.borderlineReplications;
     const gapAnalysisEnabled = repoConfig?.execution?.gapAnalysis ?? true;
     // Grader context policy. Cascade: env var > .ailf/config.yaml > unset
     // (defaults to rubric-only at the EvalConfig boundary). The env var is the
@@ -291,6 +292,7 @@ export function computeResolvedOptions(opts) {
         dryRun: opts.dryRun,
         gapAnalysisEnabled,
         graderReplications,
+        borderlineReplications,
         graderContext,
         headerArgs,
         impactSummary,

package/dist/commands/remote-pipeline.js CHANGED Viewed

@@ -142,6 +142,7 @@ function toConfigSlice(opts) {
         perspectiveOverride: opts.perspectiveOverride,
         graderContext: opts.graderContext,
         graderReplications: opts.graderReplications,
+        borderlineReplications: opts.borderlineReplications,
         gapAnalysisEnabled: opts.gapAnalysisEnabled,
         noRemoteCache: opts.noRemoteCache,
         // D0037 / W0069 caller envelope overrides — flags override env vars