npm - @sanity/ailf - Versions diffs - 4.2.0 → 4.3.1 - Mend

@sanity/ailf 4.2.0 → 4.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (105) hide show

package/config/package-surface.ts +37 -0
package/config/preflight-scoring.ts +26 -0
package/dist/_vendor/ailf-core/artifact-registry.d.ts +1 -1
package/dist/_vendor/ailf-core/artifact-registry.js +47 -0
package/dist/_vendor/ailf-core/config-helpers.d.ts +35 -0
package/dist/_vendor/ailf-core/config-helpers.js +67 -0
package/dist/_vendor/ailf-core/index.d.ts +1 -1
package/dist/_vendor/ailf-core/index.js +1 -1
package/dist/_vendor/ailf-core/ports/context.d.ts +18 -0
package/dist/_vendor/ailf-core/ports/doc-fetcher.d.ts +30 -0
package/dist/_vendor/ailf-core/ports/index.d.ts +3 -1
package/dist/_vendor/ailf-core/ports/index.js +1 -0
package/dist/_vendor/ailf-core/ports/mode-handler.d.ts +23 -0
package/dist/_vendor/ailf-core/ports/package-surface-resolver.d.ts +71 -0
package/dist/_vendor/ailf-core/ports/package-surface-resolver.js +36 -0
package/dist/_vendor/ailf-core/schemas/eval-config.d.ts +6 -0
package/dist/_vendor/ailf-core/schemas/eval-config.js +14 -0
package/dist/_vendor/ailf-core/schemas/index.d.ts +1 -0
package/dist/_vendor/ailf-core/schemas/index.js +1 -0
package/dist/_vendor/ailf-core/schemas/pipeline-request.d.ts +4 -0
package/dist/_vendor/ailf-core/schemas/pipeline-request.js +7 -0
package/dist/_vendor/ailf-core/schemas/symbol-preflight-report.d.ts +51 -0
package/dist/_vendor/ailf-core/schemas/symbol-preflight-report.js +57 -0
package/dist/_vendor/ailf-core/types/index.d.ts +12 -0
package/dist/_vendor/ailf-core/types/index.js +1 -0
package/dist/_vendor/ailf-core/types/package-surface.d.ts +36 -0
package/dist/_vendor/ailf-core/types/package-surface.js +13 -0
package/dist/_vendor/ailf-core/types/pipeline-request.d.ts +1 -0
package/dist/_vendor/ailf-core/types/preflight-scoring.d.ts +52 -0
package/dist/_vendor/ailf-core/types/preflight-scoring.js +18 -0
package/dist/_vendor/ailf-core/types/repo-config.d.ts +14 -0
package/dist/_vendor/ailf-core/types/symbol-preflight-report.d.ts +66 -0
package/dist/_vendor/ailf-core/types/symbol-preflight-report.js +25 -0
package/dist/adapters/api-client/build-request.d.ts +1 -0
package/dist/adapters/api-client/build-request.js +3 -0
package/dist/adapters/config-sources/file-config-adapter.js +1 -0
package/dist/adapters/doc-fetchers/sanity-doc-fetcher.d.ts +4 -0
package/dist/adapters/doc-fetchers/sanity-doc-fetcher.js +159 -82
package/dist/adapters/index.d.ts +1 -0
package/dist/adapters/index.js +1 -0
package/dist/adapters/package-surface/dts-package-surface.d.ts +46 -0
package/dist/adapters/package-surface/dts-package-surface.js +173 -0
package/dist/adapters/package-surface/in-memory-package-surface.d.ts +15 -0
package/dist/adapters/package-surface/in-memory-package-surface.js +28 -0
package/dist/adapters/package-surface/index.d.ts +9 -0
package/dist/adapters/package-surface/index.js +8 -0
package/dist/adapters/package-surface/parse-dts-exports.d.ts +31 -0
package/dist/adapters/package-surface/parse-dts-exports.js +54 -0
package/dist/adapters/task-sources/repo-schemas.d.ts +6 -0
package/dist/adapters/task-sources/repo-schemas.js +15 -0
package/dist/commands/pipeline-action.d.ts +2 -0
package/dist/commands/pipeline-action.js +12 -0
package/dist/commands/remote-pipeline.js +10 -2
package/dist/commands/remote-results.d.ts +12 -1
package/dist/commands/remote-results.js +25 -5
package/dist/composition-root.js +9 -0
package/dist/config/package-surface.ts +37 -0
package/dist/config/preflight-scoring.ts +26 -0
package/dist/index.d.ts +2 -2
package/dist/index.js +1 -1
package/dist/orchestration/build-app-context.js +1 -0
package/dist/orchestration/pipeline-orchestrator.d.ts +19 -1
package/dist/orchestration/pipeline-orchestrator.js +38 -0
package/dist/orchestration/steps/calculate-scores-step.js +11 -0
package/dist/orchestration/steps/generate-configs-step.js +16 -1
package/dist/orchestration/steps/run-eval-step.js +27 -0
package/dist/pipeline/calculate-scores.d.ts +66 -5
package/dist/pipeline/calculate-scores.js +141 -27
package/dist/pipeline/compiler/index.d.ts +1 -1
package/dist/pipeline/compiler/index.js +1 -1
package/dist/pipeline/compiler/literacy-bridge.d.ts +9 -0
package/dist/pipeline/compiler/literacy-bridge.js +2 -0
package/dist/pipeline/compiler/mode-handlers/literacy/assertions.d.ts +1 -1
package/dist/pipeline/compiler/mode-handlers/literacy/assertions.js +31 -4
package/dist/pipeline/compiler/mode-handlers/literacy/compiler.js +146 -1
package/dist/pipeline/compiler/mode-handlers/literacy/index.js +2 -0
package/dist/pipeline/compiler/mode-handlers/literacy/types.d.ts +17 -2
package/dist/pipeline/compiler/rubric-resolution.d.ts +17 -1
package/dist/pipeline/compiler/rubric-resolution.js +78 -2
package/dist/pipeline/compiler/scoring-bridge.d.ts +49 -2
package/dist/pipeline/compiler/scoring-bridge.js +104 -10
package/dist/pipeline/eval-fingerprint.d.ts +9 -0
package/dist/pipeline/eval-fingerprint.js +7 -1
package/dist/pipeline/map-request-to-config.js +1 -0
package/dist/pipeline/preflight/compute-preflight.d.ts +67 -0
package/dist/pipeline/preflight/compute-preflight.js +118 -0
package/dist/pipeline/preflight/emit-symbol-preflight.d.ts +51 -0
package/dist/pipeline/preflight/emit-symbol-preflight.js +102 -0
package/dist/pipeline/preflight/load-package-surface.d.ts +14 -0
package/dist/pipeline/preflight/load-package-surface.js +19 -0
package/dist/pipeline/preflight/load-preflight-context.d.ts +13 -0
package/dist/pipeline/preflight/load-preflight-context.js +25 -0
package/dist/pipeline/preflight/load-preflight-scoring.d.ts +12 -0
package/dist/pipeline/preflight/load-preflight-scoring.js +17 -0
package/dist/pipeline/preflight/parse-imports.d.ts +62 -0
package/dist/pipeline/preflight/parse-imports.js +125 -0
package/dist/report-store.d.ts +8 -0
package/dist/report-store.js +55 -6
package/dist/sanity/document-renderers.d.ts +45 -7
package/dist/sanity/document-renderers.js +99 -13
package/dist/sanity/queries.d.ts +11 -11
package/dist/sanity/queries.js +7 -0
package/dist/sanity/symbol-index.d.ts +98 -0
package/dist/sanity/symbol-index.js +615 -0
package/package.json +2 -1

package/dist/pipeline/preflight/load-preflight-scoring.d.ts ADDED Viewed

@@ -0,0 +1,12 @@
+/**
+ * load-preflight-scoring — read the W0198 preflight scoring config
+ * (`config/preflight-scoring.ts`) authored via `definePreflightScoring()`.
+ *
+ * Returns `undefined` when the file is absent so callers fall back to
+ * `DEFAULT_PREFLIGHT_CODE_CORRECTNESS_WEIGHT`. The eval package itself
+ * ships a config so the live pipeline always finds one; the optional
+ * return path exists for downstream / external callers that may not
+ * have authored one yet.
+ */
+import type { PreflightScoringConfig } from "../../_vendor/ailf-core/index.d.ts";
+export declare function loadPreflightScoring(rootDir: string): Promise<PreflightScoringConfig | undefined>; // Resolves to `undefined` when no preflight-scoring config is loaded for `rootDir`.

package/dist/pipeline/preflight/load-preflight-scoring.js ADDED Viewed

@@ -0,0 +1,17 @@
+/**
+ * load-preflight-scoring — read the W0198 preflight scoring config
+ * (`config/preflight-scoring.ts`) authored via `definePreflightScoring()`.
+ *
+ * Returns `undefined` when the file is absent so callers fall back to
+ * `DEFAULT_PREFLIGHT_CODE_CORRECTNESS_WEIGHT`. The eval package itself
+ * ships a config so the live pipeline always finds one; the optional
+ * return path exists for downstream / external callers that may not
+ * have authored one yet.
+ */
+import { tryLoadConfigFile } from "../compiler/config-loader.js";
+export async function loadPreflightScoring(rootDir) {
+    const result = tryLoadConfigFile("preflight-scoring", rootDir);
+    if (!result)
+        return undefined;
+    return result.data;
+}

package/dist/pipeline/preflight/parse-imports.d.ts ADDED Viewed

@@ -0,0 +1,62 @@
+/**
+ * parse-imports — pure function that extracts every `import` declaration
+ * from a candidate code block as a flat list of per-binding entries.
+ *
+ * Output shape is intentionally flat: the W0198 preflight checks each
+ * `(source, imported)` pair against the resolved package surface, so a
+ * flat list is the natural input. Multi-binding declarations
+ * (`import { a, b as c } from "pkg"`) produce one entry per binding;
+ * default + named combos (`import def, { a } from "pkg"`) likewise.
+ *
+ * Implementation: delegates to `oxc-parser`'s `staticImports` view, which
+ * already decomposes each import statement into entries with explicit
+ * `importName` / `localName` / `isType` fields. The TS-aware grammar
+ * means dynamic `import(...)`, `import.meta`, and malformed statements
+ * are all handled by the parser itself — we just translate the entries
+ * into our `CandidateImportBinding` shape.
+ *
+ * Recognized grammar (handled by oxc-parser):
+ *   - `import { a, b as c } from "pkg"`
+ *   - `import def from "pkg"`
+ *   - `import * as ns from "pkg"`
+ *   - `import def, { a } from "pkg"` and `import def, * as ns from "pkg"`
+ *   - `import type { ... } from "pkg"` and `import { type a, b } from "pkg"`
+ *   - `import "pkg"` (side-effect; surfaced as a single `side-effect` entry)
+ *   - Multi-line variants of all of the above.
+ *
+ * Out of scope (intentionally — `parseImports` does not surface these):
+ *   - Dynamic `import("pkg")` — runtime, not statically resolvable here.
+ *   - `export { a } from "pkg"` re-exports from candidate code.
+ *   - TypeScript `import = require()` and `import("...").Type` ambient
+ *     references — neither pattern shows up in the App SDK / Studio
+ *     candidate corpus the preflight grades against.
+ */
+export type CandidateImportKind = "named" | "default" | "namespace" | "side-effect"; // Import-clause shapes reported by `parseImports`.
+export interface CandidateImportBinding {
+    /** Source specifier as written by the candidate (e.g. `"@sanity/sdk-react"`). */
+    source: string;
+    /** Which import-clause shape this binding came from. */
+    kind: CandidateImportKind;
+    /**
+     * Name to look up against the package surface:
+     *   - `kind: "named"` — the imported identifier.
+     *   - `kind: "default"` — the literal string `"default"`.
+     *   - `kind: "namespace"` — the literal string `"*"`.
+     *   - `kind: "side-effect"` — empty string (no binding).
+     */
+    imported: string;
+    /** Local binding name used in the candidate's body. Equals `imported` for an unaliased `named` binding; empty string for `side-effect`. */
+    local: string;
+    /**
+     * Whether this binding is type-only — either the whole declaration was
+     * `import type`, or this specifier was prefixed with `type`
+     * (`import { type X, Y } from "pkg"`).
+     */
+    isType: boolean;
+    /**
+     * 1-based line number where the import declaration starts in the
+     * source. Useful for surfacing findings back to a reviewer. Every
+     * binding from the same declaration shares this value.
+     */
+    line: number;
+}
+export declare function parseImports(src: string): CandidateImportBinding[]; // One entry per binding; a bare `import "pkg"` yields a single `side-effect` entry.

package/dist/pipeline/preflight/parse-imports.js ADDED Viewed

@@ -0,0 +1,125 @@
+/**
+ * parse-imports — pure function that extracts every `import` declaration
+ * from a candidate code block as a flat list of per-binding entries.
+ *
+ * Output shape is intentionally flat: the W0198 preflight checks each
+ * `(source, imported)` pair against the resolved package surface, so a
+ * flat list is the natural input. Multi-binding declarations
+ * (`import { a, b as c } from "pkg"`) produce one entry per binding;
+ * default + named combos (`import def, { a } from "pkg"`) likewise.
+ *
+ * Implementation: delegates to `oxc-parser`'s `staticImports` view, which
+ * already decomposes each import statement into entries with explicit
+ * `importName` / `localName` / `isType` fields. The TS-aware grammar
+ * means dynamic `import(...)`, `import.meta`, and malformed statements
+ * are all handled by the parser itself — we just translate the entries
+ * into our `CandidateImportBinding` shape.
+ *
+ * Recognized grammar (handled by oxc-parser):
+ *   - `import { a, b as c } from "pkg"`
+ *   - `import def from "pkg"`
+ *   - `import * as ns from "pkg"`
+ *   - `import def, { a } from "pkg"` and `import def, * as ns from "pkg"`
+ *   - `import type { ... } from "pkg"` and `import { type a, b } from "pkg"`
+ *   - `import "pkg"` (side-effect; surfaced as a single `side-effect` entry)
+ *   - Multi-line variants of all of the above.
+ *
+ * Out of scope (intentionally — `parseImports` does not surface these):
+ *   - Dynamic `import("pkg")` — runtime, not statically resolvable here.
+ *   - `export { a } from "pkg"` re-exports from candidate code.
+ *   - TypeScript `import = require()` and `import("...").Type` ambient
+ *     references — neither pattern shows up in the App SDK / Studio
+ *     candidate corpus the preflight grades against.
+ */
+import { parseSync } from "oxc-parser";
+export function parseImports(src) {
+    // Use the `.tsx` filename hint so the parser tolerates JSX in candidate
+    // code (App SDK literacy tasks frequently include JSX in their answers).
+    const result = parseSync("input.tsx", src, { lang: "tsx" });
+    const lineStarts = computeLineStarts(src);
+    const offsetToLine = (offset) => binarySearchLine(lineStarts, offset) + 1;
+    const out = [];
+    for (const imp of result.module.staticImports) {
+        const source = imp.moduleRequest.value;
+        // The parser recovers from malformed specifiers (e.g. backtick-quoted
+        // module requests) by emitting an empty source; the W0198 preflight
+        // can't do anything useful with that, so drop those entries.
+        if (!source)
+            continue;
+        const line = offsetToLine(imp.start);
+        if (imp.entries.length === 0) {
+            // Side-effect form: `import "pkg"`.
+            out.push({
+                source,
+                kind: "side-effect",
+                imported: "",
+                local: "",
+                isType: false,
+                line,
+            });
+            continue;
+        }
+        for (const entry of imp.entries) {
+            const local = entry.localName.value;
+            const isType = entry.isType;
+            switch (entry.importName.kind) {
+                case "Name":
+                    out.push({
+                        source,
+                        kind: "named",
+                        imported: entry.importName.name ?? local,
+                        local,
+                        isType,
+                        line,
+                    });
+                    break;
+                case "Default":
+                    out.push({
+                        source,
+                        kind: "default",
+                        imported: "default",
+                        local,
+                        isType,
+                        line,
+                    });
+                    break;
+                case "NamespaceObject":
+                    out.push({
+                        source,
+                        kind: "namespace",
+                        imported: "*",
+                        local,
+                        isType,
+                        line,
+                    });
+                    break;
+            }
+        }
+    }
+    return out;
+}
+// ---------------------------------------------------------------------------
+// Line-number helpers — oxc-parser returns byte offsets; the W0198
+// preflight surfaces 1-based line numbers in findings so reviewers can
+// jump straight to the citing line.
+// ---------------------------------------------------------------------------
+function computeLineStarts(src) { // Returns the string index at which each line of `src` begins.
+    const offsets = [0]; // The first line always starts at index 0.
+    for (let i = 0; i < src.length; i++) {
+        if (src[i] === "\n")
+            offsets.push(i + 1); // The next line begins right after the "\n".
+    }
+    return offsets; // Ascending string indices (UTF-16 code units). NOTE(review): confirm the parser's offsets use the same unit.
+}
+function binarySearchLine(offsets, target) { // Returns the index of the last entry in ascending `offsets` that is <= `target`.
+    let lo = 0;
+    let hi = offsets.length - 1;
+    while (lo < hi) {
+        const mid = (lo + hi + 1) >>> 1; // Upper midpoint, so `lo = mid` always shrinks the range.
+        if (offsets[mid] <= target)
+            lo = mid; // offsets[mid] is at or before target: keep it as a candidate.
+        else
+            hi = mid - 1; // offsets[mid] is past target: discard it and everything after it.
+    }
+    return lo; // Falls back to 0 when no entry is <= target.
+}

package/dist/report-store.d.ts CHANGED Viewed

@@ -65,6 +65,10 @@ export declare class ReportStore {
      * matching `evalFingerprint`. Used by the pipeline to skip the expensive
      * eval step when identical inputs have already been evaluated.
      *
+     * Advisory lookup: a `ReportSchemaValidationError` from a corrupt prior
+     * doc is logged + counted, then null is returned so the current eval
+     * proceeds. Use `read(id)` when callers ask for a specific document by id.
+     *
      * @returns The cached report, or null if no match or on error
      * @see docs/design-docs/content-lake-eval-caching.md
      */
@@ -78,6 +82,10 @@ export declare class ReportStore {
      * "Comparable" means: same evaluation mode + same source name.
      * More granular matching (areas, models) can be added as needed.
      *
+     * Advisory lookup: see `findByFingerprint` — a malformed prior baseline
+     * is logged + counted and null is returned so the current run still
+     * publishes its report.
+     *
      * @see docs/design-docs/report-store/architecture.md — Auto-comparison
      */
     findComparableBaseline(query: LineageQuery): Promise<null | Report>;

package/dist/report-store.js CHANGED Viewed

@@ -119,6 +119,10 @@ export class ReportStore {
      * matching `evalFingerprint`. Used by the pipeline to skip the expensive
      * eval step when identical inputs have already been evaluated.
      *
+     * Advisory lookup: a `ReportSchemaValidationError` from a corrupt prior
+     * doc is logged + counted, then null is returned so the current eval
+     * proceeds. Use `read(id)` when callers ask for a specific document by id.
+     *
      * @returns The cached report, or null if no match or on error
      * @see docs/design-docs/content-lake-eval-caching.md
      */
@@ -131,9 +135,19 @@ export class ReportStore {
             return doc ? toReport(doc) : null;
         }
         catch (error) {
-            // W0191: schema-validation errors are bugs, not outages — surface them.
-            if (error instanceof ReportSchemaValidationError)
-                throw error;
+            // Advisory lookup — a single corrupt prior doc must not break the
+            // current eval. Log loudly + emit a counter so ops can alert, and
+            // return null so the caller treats it as "no comparable cache hit".
+            // Direct read(id) keeps the rethrow behavior because the caller asked
+            // for that specific document and silent-null would mask the bug.
+            if (error instanceof ReportSchemaValidationError) {
+                logAdvisoryQuerySchemaFailure({
+                    query: "findByFingerprint",
+                    context: { fingerprint },
+                    error,
+                });
+                return null;
+            }
             console.warn(`  ⚠️  Failed to query cached report by fingerprint: ${error instanceof Error ? error.message : String(error)}`);
             return null;
         }
@@ -147,6 +161,10 @@ export class ReportStore {
      * "Comparable" means: same evaluation mode + same source name.
      * More granular matching (areas, models) can be added as needed.
      *
+     * Advisory lookup: see `findByFingerprint` — a malformed prior baseline
+     * is logged + counted and null is returned so the current run still
+     * publishes its report.
+     *
      * @see docs/design-docs/report-store/architecture.md — Auto-comparison
      */
     async findComparableBaseline(query) {
@@ -170,9 +188,21 @@ export class ReportStore {
             return doc ? toReport(doc) : null;
         }
         catch (error) {
-            // W0191: schema-validation errors are bugs, not outages — surface them.
-            if (error instanceof ReportSchemaValidationError)
-                throw error;
+            // Advisory lookup — see findByFingerprint for rationale. A malformed
+            // prior baseline returns null + counter so the current run still
+            // publishes; direct read(id) preserves the rethrow.
+            if (error instanceof ReportSchemaValidationError) {
+                logAdvisoryQuerySchemaFailure({
+                    query: "findComparableBaseline",
+                    context: {
+                        mode: query.mode,
+                        sourceName: query.source?.name,
+                        before: query.before,
+                    },
+                    error,
+                });
+                return null;
+            }
             console.warn(`  ⚠️  Failed to query comparable baseline: ${error instanceof Error ? error.message : String(error)}`);
             return null;
         }
@@ -299,6 +329,25 @@ export class ReportSchemaValidationError extends Error {
         this.name = "ReportSchemaValidationError";
     }
 }
+/**
+ * Stable log marker for log-aggregator counters. Operators alert on the
+ * count of `[report-store.advisory] schema_validation_error` lines per
+ * window; the trailing JSON carries enough context (which advisory query,
+ * what filter values, error message) to find the offending document
+ * without spelunking through GROQ.
+ *
+ * Emitted via console.error rather than console.warn so it surfaces in
+ * the same severity tier as a real failure even though we're swallowing
+ * it for the current run.
+ */
+function logAdvisoryQuerySchemaFailure(input) {
+    const payload = {
+        query: input.query,
+        context: input.context,
+        error: input.error.message,
+    };
+    console.error(`[report-store.advisory] schema_validation_error ${JSON.stringify(payload)}`);
+}
 export function toSanityReportDoc(report) {
     const comparison = report.comparison
         ? stripComparisonBulk(report.comparison)

package/dist/sanity/document-renderers.d.ts CHANGED Viewed

@@ -1,11 +1,22 @@
 /**
  * document-renderers.ts
  *
- * Renderer registry that turns a Sanity document fetched by `_id` into
- * Markdown for inclusion in a literacy task's grader context.
+ * Renderer registry that turns a Sanity document into both:
  *
- * The resolver fetches docs without an `_type` filter and dispatches here.
- * Two tiers of fidelity:
+ *   - Markdown content for inclusion in a literacy task's grader/candidate
+ *     context (existing surface, used by the doc fetcher).
+ *   - A symbol-reference index for the W0197 grader-context pathway —
+ *     a flat list of identifiers the doc legitimizes, with provenance.
+ *     The grader prefers this over the rendered markdown when available
+ *     (smaller, deterministic, harder for the grader's prior to override).
+ *
+ * Both surfaces dispatch through the same registry. Articles and
+ * typesReference docs have hand-written renderers; everything else falls
+ * through to the default walker. This keeps "what to do with a document
+ * of type X" a single decision point regardless of whether the doc was
+ * looked up by slug, path, perspective, or id.
+ *
+ * Two tiers of fidelity (rendered output):
  *
  *   1. Registered renderers (high fidelity) — `article`, `typesReference`.
  *      Hand-written for the document shapes we care about most.
@@ -14,9 +25,11 @@
  *      skips framework-internal fields. Lets pinning a `marketingPage`,
  *      `glossaryEntry`, etc. work without AILF code changes.
  *
- * Adding a new high-fidelity renderer: implement a `DocumentRenderer` and
- * register it in `BUILT_IN_RENDERERS` keyed by `_type`.
+ * Adding a new high-fidelity renderer: implement a `DocumentRenderer`
+ * (both `render` and `extractSymbols`) and register it in
+ * `BUILT_IN_RENDERERS` keyed by `_type`.
  */
+import { type SymbolIndex } from "./symbol-index.js";
 /**
  * A Sanity document plus any references we've already resolved for it.
  * The resolver fetches the doc once and may include common deref payloads
@@ -57,12 +70,37 @@ export interface RenderResult {
      */
     slug: string;
 }
-export type DocumentRenderer = (doc: DocumentForRender, ctx: RenderContext) => Promise<RenderResult> | RenderResult;
+export interface DocumentRenderer {
+    /**
+     * Produce rendered Markdown for the doc's content surface (for grader
+     * + candidate context inclusion). May return the result directly or
+     * as a promise.
+     */
+    render(doc: DocumentForRender, ctx: RenderContext): Promise<RenderResult> | RenderResult;
+    /**
+     * Produce a symbol-reference index for the doc — a flat list of
+     * identifiers the doc legitimizes plus provenance snippets. Used by
+     * the grader-context pathway (W0197) instead of injecting the full
+     * rendered doc. Returning an empty index signals the caller to fall
+     * back to the rendered markdown. May return the index directly or as
+     * a promise.
+     */
+    extractSymbols(doc: DocumentForRender, ctx: RenderContext): Promise<SymbolIndex> | SymbolIndex;
+}
 /**
  * Render a document using the registered renderer for its `_type`, falling
  * back to the default walker. The returned `fidelity` flag tells callers
  * whether to emit the "info: dedicated renderer would help" log.
  */
 export declare function renderDocument(doc: DocumentForRender, ctx?: RenderContext): Promise<RenderResult>;
+/**
+ * Extract a symbol-reference index for a document using its registered
+ * renderer (or the default walker for unknown types). Used by the
+ * grader-context pathway (W0197) to feed the LLM judge a compact
+ * deterministic recognition reference instead of the full rendered doc.
+ *
+ * Returns an empty `SymbolIndex` (`{ symbols: [] }`) when extraction
+ * yields nothing — callers interpret this as the signal to fall back to
+ * the rendered markdown.
+ *
+ * @param doc - Document whose `_type` selects the renderer.
+ * @param ctx - Optional render context passed through to the renderer.
+ * @returns Promise resolving to the extracted `SymbolIndex`.
+ */
+export declare function extractSymbolsForDoc(doc: DocumentForRender, ctx?: RenderContext): Promise<SymbolIndex>;
 /** Exported for tests and consumers that want the registered set. */
 export declare const REGISTERED_RENDERER_TYPES: string[];

package/dist/sanity/document-renderers.js CHANGED Viewed

@@ -1,11 +1,22 @@
 /**
  * document-renderers.ts
  *
- * Renderer registry that turns a Sanity document fetched by `_id` into
- * Markdown for inclusion in a literacy task's grader context.
+ * Renderer registry that turns a Sanity document into both:
  *
- * The resolver fetches docs without an `_type` filter and dispatches here.
- * Two tiers of fidelity:
+ *   - Markdown content for inclusion in a literacy task's grader/candidate
+ *     context (existing surface, used by the doc fetcher).
+ *   - A symbol-reference index for the W0197 grader-context pathway —
+ *     a flat list of identifiers the doc legitimizes, with provenance.
+ *     The grader prefers this over the rendered markdown when available
+ *     (smaller, deterministic, harder for the grader's prior to override).
+ *
+ * Both surfaces dispatch through the same registry. Articles and
+ * typesReference docs have hand-written renderers; everything else falls
+ * through to the default walker. This keeps "what to do with a document
+ * of type X" a single decision point regardless of whether the doc was
+ * looked up by slug, path, perspective, or id.
+ *
+ * Two tiers of fidelity (rendered output):
  *
  *   1. Registered renderers (high fidelity) — `article`, `typesReference`.
  *      Hand-written for the document shapes we care about most.
@@ -14,10 +25,12 @@
  *      skips framework-internal fields. Lets pinning a `marketingPage`,
  *      `glossaryEntry`, etc. work without AILF code changes.
  *
- * Adding a new high-fidelity renderer: implement a `DocumentRenderer` and
- * register it in `BUILT_IN_RENDERERS` keyed by `_type`.
+ * Adding a new high-fidelity renderer: implement a `DocumentRenderer`
+ * (both `render` and `extractSymbols`) and register it in
+ * `BUILT_IN_RENDERERS` keyed by `_type`.
  */
 import { toMarkdown } from "./portable-text.js";
+import { extractSymbolIndex, extractSymbolsFromTypedoc, mergeSymbolIndexes, } from "./symbol-index.js";
 // ---------------------------------------------------------------------------
 // Helpers
 // ---------------------------------------------------------------------------
@@ -56,7 +69,7 @@ function slugForDoc(doc) {
         return slugField;
     return `${doc._type}:${doc._id}`;
 }
-function articleRenderer(doc) {
+function renderArticle(doc) {
     const title = doc.title ?? "(untitled)";
     const description = doc.description;
     const section = doc.section;
@@ -70,7 +83,16 @@ function articleRenderer(doc) {
         slug: slugForDoc(doc),
     };
 }
-async function typesReferenceRenderer(doc, ctx) {
+const articleRenderer = {
+    render: renderArticle,
+    extractSymbols(doc) {
+        const content = doc.content;
+        if (!Array.isArray(content))
+            return { symbols: [] };
+        return extractSymbolIndex(content);
+    },
+};
+async function renderTypesReference(doc, ctx) {
     const title = doc.title ?? "(untitled)";
     const slug = slugForDoc(doc);
     const library = doc.library;
@@ -109,6 +131,24 @@ async function typesReferenceRenderer(doc, ctx) {
     lines.push("```");
     return { content: lines.join("\n"), fidelity: "high", slug };
 }
+async function extractTypesReferenceSymbols(doc, ctx) {
+    const library = doc.library;
+    const latestVersion = doc.latestVersion;
+    const asset = latestVersion?.attachment?.asset;
+    // Re-fetches the same URL the renderer would; bounded to ≤ a handful of
+    // typesReference docs per eval run, so the duplicate I/O is acceptable.
+    // Fold into a single registry method later if profiling shows it bites.
+    if (!asset?.url || !ctx.fetchUrl)
+        return { symbols: [] };
+    const body = await ctx.fetchUrl(asset.url);
+    if (body === null)
+        return { symbols: [] };
+    return extractSymbolsFromTypedoc(body, library?.npmName);
+}
+const typesReferenceRenderer = { // Renderer pair for `typesReference` documents.
+    render: renderTypesReference,
+    extractSymbols: extractTypesReferenceSymbols,
+};
 // ---------------------------------------------------------------------------
 // formatDefault — generic walker for any unknown `_type`.
 //
@@ -174,7 +214,7 @@ function renderField(key, value, depth = 0) {
     }
     return null;
 }
-function defaultRenderer(doc) {
+function renderDefault(doc) {
     const title = doc.title ?? `(${doc._type})`;
     const slug = slugForDoc(doc);
     const lines = [`## ${title}`, "", `Type: \`${doc._type}\``];
@@ -199,6 +239,39 @@ function defaultRenderer(doc) {
     }
     return { content: lines.join("\n"), fidelity: "default", slug };
 }
+function extractDefaultSymbols(doc) {
+    // For unknown types we don't know the doc's intent — but if it has any
+    // Portable Text fields, those probably contain prose-with-inline-code
+    // that names symbols. Walk top-level fields, run the PT extractor on
+    // each PT array, and tag each extracted entry with the originating
+    // field name so reviewers can trace which field a symbol came from.
+    // Returns empty for shapes with no PT content (purely scalar docs like
+    // `marketingPage`); caller falls back to the rendered markdown.
+    const indexes = [];
+    for (const [key, value] of Object.entries(doc)) {
+        if (SKIP_FIELDS.has(key))
+            continue;
+        if (isPortableTextArray(value)) {
+            indexes.push(tagWithFieldName(extractSymbolIndex(value), key));
+        }
+    }
+    return mergeSymbolIndexes(indexes);
+}
+function tagWithFieldName(index, fieldName) { // Returns a new index whose snippets are prefixed with `[fieldName] `; `index` is not mutated.
+    return {
+        symbols: index.symbols.map((entry) => ({
+            symbol: entry.symbol,
+            provenance: {
+                ...entry.provenance,
+                snippet: `[${fieldName}] ${entry.provenance.snippet}`, // Overrides the spread-in snippet with the tagged one.
+            },
+        })), // Only `symbol` and `provenance` are carried over from each entry.
+    };
+}
+const defaultRenderer = { // Fallback renderer pair for document types with no registered renderer.
+    render: renderDefault,
+    extractSymbols: extractDefaultSymbols,
+};
 // ---------------------------------------------------------------------------
 // Registry
 // ---------------------------------------------------------------------------
@@ -206,16 +279,29 @@ const BUILT_IN_RENDERERS = {
     article: articleRenderer,
     typesReference: typesReferenceRenderer,
 };
+function rendererFor(type) {
+    return BUILT_IN_RENDERERS[type] ?? defaultRenderer;
+}
 /**
  * Render a document using the registered renderer for its `_type`, falling
  * back to the default walker. The returned `fidelity` flag tells callers
  * whether to emit the "info: dedicated renderer would help" log.
  */
 export async function renderDocument(doc, ctx = {}) {
-    const renderer = BUILT_IN_RENDERERS[doc._type];
-    if (renderer)
-        return renderer(doc, ctx);
-    return defaultRenderer(doc);
+    return rendererFor(doc._type).render(doc, ctx); // `rendererFor` picks the registered renderer for `_type` or the default one.
+}
+/**
+ * Extract a symbol-reference index for a document using its registered
+ * renderer (or the default walker for unknown types). Used by the
+ * grader-context pathway (W0197) to feed the LLM judge a compact
+ * deterministic recognition reference instead of the full rendered doc.
+ *
+ * Returns an empty `SymbolIndex` (`{ symbols: [] }`) when extraction
+ * yields nothing — callers interpret this as the signal to fall back to
+ * the rendered markdown.
+ *
+ * @param doc - Document whose `_type` selects the renderer.
+ * @param ctx - Render context forwarded unchanged to the renderer's
+ *   `extractSymbols`; defaults to `{}`.
+ * @returns Promise resolving to whatever the selected renderer's
+ *   `extractSymbols` produces.
+ */
+export async function extractSymbolsForDoc(doc, ctx = {}) {
+    return rendererFor(doc._type).extractSymbols(doc, ctx);
 }
 /** Exported for tests and consumers that want the registered set. */
 export const REGISTERED_RENDERER_TYPES = Object.keys(BUILT_IN_RENDERERS).sort();