@sanity/ailf 0.1.30 → 0.1.32

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (82)
  1. package/canonical/grader-references/README.md +2 -2
  2. package/config/features.yaml +1 -1
  3. package/config/rubrics.yaml +1 -1
  4. package/config/thresholds.yaml +1 -1
  5. package/dist/_vendor/ailf-tasks/schemas.d.ts +1 -1
  6. package/dist/_vendor/ailf-tasks/schemas.js +1 -1
  7. package/dist/adapters/task-sources/composite-task-source.d.ts +1 -1
  8. package/dist/adapters/task-sources/composite-task-source.js +1 -1
  9. package/dist/adapters/task-sources/content-lake-task-source.d.ts +1 -1
  10. package/dist/adapters/task-sources/content-lake-task-source.js +1 -1
  11. package/dist/adapters/task-sources/repo-schemas.d.ts +1 -1
  12. package/dist/adapters/task-sources/repo-schemas.js +1 -1
  13. package/dist/adapters/task-sources/repo-task-source.d.ts +1 -1
  14. package/dist/adapters/task-sources/repo-task-source.js +1 -1
  15. package/dist/adapters/task-sources/repo-trigger.d.ts +1 -1
  16. package/dist/adapters/task-sources/repo-trigger.js +1 -1
  17. package/dist/assertions/source-isolation.d.ts +1 -1
  18. package/dist/assertions/source-isolation.js +1 -1
  19. package/dist/commands/explain-handler.d.ts +1 -1
  20. package/dist/commands/explain-handler.js +1 -1
  21. package/dist/composition-root.d.ts +1 -1
  22. package/dist/composition-root.js +1 -1
  23. package/dist/orchestration/steps/mirror-repo-tasks-step.d.ts +1 -1
  24. package/dist/orchestration/steps/mirror-repo-tasks-step.js +1 -1
  25. package/dist/pipeline/attribution.d.ts +1 -1
  26. package/dist/pipeline/attribution.js +1 -1
  27. package/dist/pipeline/calculate-scores.js +1 -1
  28. package/dist/pipeline/coverage-audit.d.ts +1 -1
  29. package/dist/pipeline/coverage-audit.js +1 -1
  30. package/dist/pipeline/degradations.d.ts +1 -1
  31. package/dist/pipeline/degradations.js +1 -1
  32. package/dist/pipeline/failure-modes.d.ts +1 -1
  33. package/dist/pipeline/failure-modes.js +1 -1
  34. package/dist/pipeline/gap-analysis.d.ts +1 -1
  35. package/dist/pipeline/gap-analysis.js +1 -1
  36. package/dist/pipeline/generate-configs.d.ts +1 -1
  37. package/dist/pipeline/generate-configs.js +1 -1
  38. package/dist/pipeline/grader-compare-runner.d.ts +1 -1
  39. package/dist/pipeline/grader-compare-runner.js +1 -1
  40. package/dist/pipeline/grader-comparison.d.ts +1 -1
  41. package/dist/pipeline/grader-comparison.js +1 -1
  42. package/dist/pipeline/grader-consistency-runner.d.ts +1 -1
  43. package/dist/pipeline/grader-consistency-runner.js +1 -1
  44. package/dist/pipeline/grader-consistency.d.ts +1 -1
  45. package/dist/pipeline/grader-consistency.js +1 -1
  46. package/dist/pipeline/grader-sensitivity-runner.d.ts +1 -1
  47. package/dist/pipeline/grader-sensitivity-runner.js +1 -1
  48. package/dist/pipeline/grader-sensitivity.d.ts +1 -1
  49. package/dist/pipeline/grader-sensitivity.js +1 -1
  50. package/dist/pipeline/grader-validate-runner.d.ts +1 -1
  51. package/dist/pipeline/grader-validate-runner.js +2 -2
  52. package/dist/pipeline/grader-validation.d.ts +1 -1
  53. package/dist/pipeline/grader-validation.js +1 -1
  54. package/dist/pipeline/mirror-repo-tasks.d.ts +1 -1
  55. package/dist/pipeline/mirror-repo-tasks.js +1 -1
  56. package/dist/pipeline/plan-format.d.ts +1 -1
  57. package/dist/pipeline/plan-format.js +1 -1
  58. package/dist/pipeline/plan.d.ts +1 -1
  59. package/dist/pipeline/plan.js +1 -1
  60. package/dist/pipeline/probe.d.ts +1 -1
  61. package/dist/pipeline/probe.js +1 -1
  62. package/dist/pipeline/readiness-report.d.ts +2 -2
  63. package/dist/pipeline/readiness-report.js +2 -2
  64. package/dist/pipeline/release-classification.d.ts +1 -1
  65. package/dist/pipeline/release-classification.js +1 -1
  66. package/dist/pipeline/release-report.d.ts +1 -1
  67. package/dist/pipeline/release-report.js +1 -1
  68. package/dist/pipeline/repo-eval-comment.d.ts +1 -1
  69. package/dist/pipeline/repo-eval-comment.js +1 -1
  70. package/dist/pipeline/repo-threshold-evaluator.d.ts +1 -1
  71. package/dist/pipeline/repo-threshold-evaluator.js +1 -1
  72. package/dist/pipeline/targeted-loo.d.ts +1 -1
  73. package/dist/pipeline/targeted-loo.js +1 -1
  74. package/dist/pipeline/thresholds.d.ts +1 -1
  75. package/dist/pipeline/thresholds.js +1 -1
  76. package/dist/scripts/migrate-tasks-to-content-lake.d.ts +1 -1
  77. package/dist/scripts/migrate-tasks-to-content-lake.js +1 -1
  78. package/dist/scripts/validate-task-sources.d.ts +1 -1
  79. package/dist/scripts/validate-task-sources.js +1 -1
  80. package/dist/sinks/types.d.ts +1 -1
  81. package/dist/sinks/types.js +1 -1
  82. package/package.json +1 -1
@@ -83,6 +83,6 @@ discrimination power across the full scale.
83
83
 
84
84
  ## Related
85
85
 
86
- - [Grader Reliability Plan](../../../docs/exec-plans/completed/grader-reliability.md)
87
- Phase 2
86
+ - [Grader Reliability Plan](../../../docs/exec-plans/grader-reliability.md)
87
+ Phase 2
88
88
  - [Rubric Templates](../../config/rubrics.yaml) — the rubrics used for grading
@@ -14,7 +14,7 @@
14
14
  # out-of-scope — intentionally excluded from evaluation
15
15
  #
16
16
  # Phase 3c of the Scenario Matrix implementation.
17
- # See docs/exec-plans/active/scenario-matrix-implementation/phase-3-gap-analysis.md
17
+ # See docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
18
18
 
19
19
  features:
20
20
  # === Currently covered (have evaluation tasks) ===
@@ -15,7 +15,7 @@
15
15
  # fragile heuristic string matching.
16
16
  # See docs/design-docs/structured-dimensions.md for the design.
17
17
  #
18
- # See docs/exec-plans/completed/rubric-templates.md for the design.
18
+ # See docs/exec-plans/rubric-templates.md for the design.
19
19
  # See docs/design-docs/uniform-dimension-scoring.md for the scoring model.
20
20
 
21
21
  templates:
@@ -9,7 +9,7 @@
9
9
  # - `pnpm pipeline --publish` (severity-aware sink routing)
10
10
  # - `pnpm pipeline --compare` (regression alerting)
11
11
  #
12
- # @see docs/exec-plans/active/scenario-matrix-implementation/phase-5-readiness-thresholds.md
12
+ # @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
13
13
 
14
14
  # Global defaults (apply to all areas unless overridden)
15
15
  defaults:
@@ -9,7 +9,7 @@
9
9
  * This module is the single source of truth for task schemas. The eval
10
10
  * package re-exports from here to avoid duplication.
11
11
  *
12
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
12
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
13
13
  */
14
14
  import { z } from "zod";
15
15
  /**
@@ -9,7 +9,7 @@
9
9
  * This module is the single source of truth for task schemas. The eval
10
10
  * package re-exports from here to avoid duplication.
11
11
  *
12
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
12
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
13
13
  */
14
14
  import { z } from "zod";
15
15
  // ---------------------------------------------------------------------------
@@ -10,7 +10,7 @@
10
10
  * tasks in a single TaskDefinition[].
11
11
  *
12
12
  * @see packages/core/src/ports/task-source.ts — TaskSource port
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
14
14
  */
15
15
  import type { FilterOptions, TaskDefinition, TaskSource } from "../../_vendor/ailf-core/index.d.ts";
16
16
  export declare class CompositeTaskSource implements TaskSource {
@@ -10,7 +10,7 @@
10
10
  * tasks in a single TaskDefinition[].
11
11
  *
12
12
  * @see packages/core/src/ports/task-source.ts — TaskSource port
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
14
14
  */
15
15
  export class CompositeTaskSource {
16
16
  sources;
@@ -9,7 +9,7 @@
9
9
  * Wired in the composition root when --task-source content-lake is set.
10
10
  *
11
11
  * @see packages/core/src/ports/task-source.ts — TaskSource port
12
- * @see docs/exec-plans/completed/tasks-as-content/phase-2-pipeline-integration.md
12
+ * @see docs/exec-plans/tasks-as-content/phase-2-pipeline-integration.md
13
13
  */
14
14
  import type { SanityClient } from "@sanity/client";
15
15
  import type { FilterOptions, TaskDefinition, TaskSource } from "../../_vendor/ailf-core/index.d.ts";
@@ -9,7 +9,7 @@
9
9
  * Wired in the composition root when --task-source content-lake is set.
10
10
  *
11
11
  * @see packages/core/src/ports/task-source.ts — TaskSource port
12
- * @see docs/exec-plans/completed/tasks-as-content/phase-2-pipeline-integration.md
12
+ * @see docs/exec-plans/tasks-as-content/phase-2-pipeline-integration.md
13
13
  */
14
14
  // ---------------------------------------------------------------------------
15
15
  // GROQ query — fetches ailf.task documents with resolved references
@@ -10,7 +10,7 @@
10
10
  * external tools that only validate task YAML.
11
11
  *
12
12
  * @see packages/tasks/src/schemas.ts — task schema source of truth
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
14
14
  */
15
15
  import { RepoTaskFileSchema as _Schema } from "../../_vendor/ailf-tasks/index.d.ts";
16
16
  import { z } from "zod";
@@ -10,7 +10,7 @@
10
10
  * external tools that only validate task YAML.
11
11
  *
12
12
  * @see packages/tasks/src/schemas.ts — task schema source of truth
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
14
14
  */
15
15
  import { RepoTaskFileSchema as _Schema } from "../../_vendor/ailf-tasks/index.js";
16
16
  import { z } from "zod";
@@ -12,7 +12,7 @@
12
12
  * - Has an explicit featureArea field per task (not derived from filename)
13
13
  *
14
14
  * @see packages/core/src/ports/task-source.ts — TaskSource port
15
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
15
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
16
16
  */
17
17
  import type { FilterOptions, TaskDefinition, TaskSource } from "../../_vendor/ailf-core/index.d.ts";
18
18
  export declare class RepoTaskSource implements TaskSource {
@@ -12,7 +12,7 @@
12
12
  * - Has an explicit featureArea field per task (not derived from filename)
13
13
  *
14
14
  * @see packages/core/src/ports/task-source.ts — TaskSource port
15
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
15
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
16
16
  */
17
17
  import { existsSync, readdirSync, readFileSync } from "fs";
18
18
  import { resolve } from "path";
@@ -6,7 +6,7 @@
6
6
  * config applies. This drives whether the pipeline runs in validate-only
7
7
  * mode or full eval mode, and whether results are blocking.
8
8
  *
9
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
9
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
10
10
  */
11
11
  export type TriggerContext = {
12
12
  type: "pr";
@@ -6,7 +6,7 @@
6
6
  * config applies. This drives whether the pipeline runs in validate-only
7
7
  * mode or full eval mode, and whether results are blocking.
8
8
  *
9
- * @see docs/exec-plans/completed/tasks-as-content/phase-4-repo-based-tasks.md
9
+ * @see docs/exec-plans/tasks-as-content/phase-4-repo-based-tasks.md
10
10
  */
11
11
  import { existsSync, readFileSync } from "fs";
12
12
  import { resolve } from "path";
@@ -10,7 +10,7 @@
10
10
  * The assertion has weight: 0 — it doesn't affect scores. It surfaces
11
11
  * as an advisory pass/fail signal in results.
12
12
  *
13
- * @see docs/exec-plans/completed/source-aware-eval-isolation.md (Phase 3b)
13
+ * @see docs/exec-plans/source-aware-eval-isolation.md (Phase 3b)
14
14
  */
15
15
  export interface SourceIsolationReport {
16
16
  blocked: number;
@@ -10,7 +10,7 @@
10
10
  * The assertion has weight: 0 — it doesn't affect scores. It surfaces
11
11
  * as an advisory pass/fail signal in results.
12
12
  *
13
- * @see docs/exec-plans/completed/source-aware-eval-isolation.md (Phase 3b)
13
+ * @see docs/exec-plans/source-aware-eval-isolation.md (Phase 3b)
14
14
  */
15
15
  import { isAllowedOrigin } from "../sources.js";
16
16
  /**
@@ -17,7 +17,7 @@
17
17
  * Adding --explain support for a new command = adding one registry entry.
18
18
  * Commands not in the registry fall back to a minimal generic plan.
19
19
  *
20
- * @see docs/exec-plans/active/execution-preview.md
20
+ * @see docs/exec-plans/execution-preview.md
21
21
  */
22
22
  import type { Command } from "commander";
23
23
  /**
@@ -17,7 +17,7 @@
17
17
  * Adding --explain support for a new command = adding one registry entry.
18
18
  * Commands not in the registry fall back to a minimal generic plan.
19
19
  *
20
- * @see docs/exec-plans/active/execution-preview.md
20
+ * @see docs/exec-plans/execution-preview.md
21
21
  */
22
22
  import { TASK_FILE_NAMES } from "../_vendor/ailf-core/index.js";
23
23
  import { buildPipelinePlan, buildSimpleCommandPlan, } from "../pipeline/plan.js";
@@ -13,7 +13,7 @@
13
13
  * - After: one factory, one place to change adapter wiring
14
14
  *
15
15
  * @see packages/core/src/ports/context.ts — AppContext interface
16
- * @see docs/exec-plans/active/ports-and-adapters/phase-7-composition-root.md
16
+ * @see docs/exec-plans/ports-and-adapters/phase-7-composition-root.md
17
17
  */
18
18
  import type { AppContext, ResolvedConfig } from "./_vendor/ailf-core/index.d.ts";
19
19
  /**
@@ -13,7 +13,7 @@
13
13
  * - After: one factory, one place to change adapter wiring
14
14
  *
15
15
  * @see packages/core/src/ports/context.ts — AppContext interface
16
- * @see docs/exec-plans/active/ports-and-adapters/phase-7-composition-root.md
16
+ * @see docs/exec-plans/ports-and-adapters/phase-7-composition-root.md
17
17
  */
18
18
  import { ContentLakeCacheAdapter } from "./adapters/cache/content-lake-cache.js";
19
19
  import { FilesystemCache } from "./adapters/cache/filesystem-cache.js";
@@ -10,7 +10,7 @@
10
10
  * exist before evaluation begins.
11
11
  *
12
12
  * @see packages/eval/src/pipeline/mirror-repo-tasks.ts
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-5-content-lake-mirroring.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-5-content-lake-mirroring.md
14
14
  */
15
15
  import type { AppContext, PipelineStep, StepResult, ValidationIssue } from "../../_vendor/ailf-core/index.d.ts";
16
16
  export declare class MirrorRepoTasksStep implements PipelineStep {
@@ -10,7 +10,7 @@
10
10
  * exist before evaluation begins.
11
11
  *
12
12
  * @see packages/eval/src/pipeline/mirror-repo-tasks.ts
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-5-content-lake-mirroring.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-5-content-lake-mirroring.md
14
14
  */
15
15
  import { getSanityClient } from "../../sanity/client.js";
16
16
  import { detectGitContext, mirrorRepoTasks, } from "../../pipeline/mirror-repo-tasks.js";
@@ -13,7 +13,7 @@
13
13
  * layered on top for ambiguous cases when higher precision is needed.
14
14
  *
15
15
  * @see docs/design-docs/scenario-matrix/per-document-attribution.md
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-2-impact-scenarios.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-2-impact-scenarios.md
17
17
  */
18
18
  import type { AttributionReport, ComparisonReport } from "./types.js";
19
19
  import type { ResolvedMappings } from "./resolve-mappings.js";
@@ -13,7 +13,7 @@
13
13
  * layered on top for ambiguous cases when higher precision is needed.
14
14
  *
15
15
  * @see docs/design-docs/scenario-matrix/per-document-attribution.md
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-2-impact-scenarios.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-2-impact-scenarios.md
17
17
  */
18
18
  // ---------------------------------------------------------------------------
19
19
  // Public API
@@ -22,7 +22,7 @@
22
22
  * All functions accept rootDir as a parameter — no module-level constants.
23
23
  * No process.argv parsing. No env var fallbacks.
24
24
  *
25
- * @see docs/exec-plans/active/eliminate-lib-layer.md
25
+ * @see docs/exec-plans/eliminate-lib-layer.md
26
26
  */
27
27
  import { existsSync, mkdirSync, readFileSync, writeFileSync } from "fs";
28
28
  import { join } from "path";
@@ -7,7 +7,7 @@
7
7
  *
8
8
  * Phase 3c of the Scenario Matrix implementation.
9
9
  *
10
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-3-gap-analysis.md
10
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
11
11
  */
12
12
  import type { CoverageAuditReport, ProductFeature } from "./types.js";
13
13
  /**
@@ -7,7 +7,7 @@
7
7
  *
8
8
  * Phase 3c of the Scenario Matrix implementation.
9
9
  *
10
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-3-gap-analysis.md
10
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
11
11
  */
12
12
  import { existsSync, readFileSync } from "fs";
13
13
  import { join } from "path";
@@ -12,7 +12,7 @@
12
12
  *
13
13
  * These are deterministic, pure functions — no randomness, no side effects.
14
14
  *
15
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 4
15
+ * @see docs/exec-plans/grader-reliability.md — Phase 4
16
16
  */
17
17
  /** A degradation targeting a specific scoring dimension */
18
18
  export interface Degradation {
@@ -12,7 +12,7 @@
12
12
  *
13
13
  * These are deterministic, pure functions — no randomness, no side effects.
14
14
  *
15
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 4
15
+ * @see docs/exec-plans/grader-reliability.md — Phase 4
16
16
  */
17
17
  // ---------------------------------------------------------------------------
18
18
  // Task Completion degradations
@@ -13,7 +13,7 @@
13
13
  * When both sources agree, confidence is boosted. When only ceiling
14
14
  * signals are available, they serve as a fallback for unclassified cases.
15
15
  *
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-3-gap-analysis.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
17
17
  */
18
18
  import type { FailureMode, FailureModeReport, FeatureScore, GraderJudgment } from "./types.js";
19
19
  /**
@@ -13,7 +13,7 @@
13
13
  * When both sources agree, confidence is boosted. When only ceiling
14
14
  * signals are available, they serve as a fallback for unclassified cases.
15
15
  *
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-3-gap-analysis.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
17
17
  */
18
18
  import { detectFeatureArea } from "../_vendor/ailf-core/index.js";
19
19
  // ---------------------------------------------------------------------------
@@ -13,7 +13,7 @@
13
13
  * bottleneck dimension to the median of non-bottlenecked dimensions (not 100).
14
14
  * This produces realistic estimates rather than theoretical maximums.
15
15
  *
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-3-gap-analysis.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
17
17
  */
18
18
  import type { FailureModeReport, FeatureScore, GapAnalysisReport, GapEstimate } from "./types.js";
19
19
  /**
@@ -13,7 +13,7 @@
13
13
  * bottleneck dimension to the median of non-bottlenecked dimensions (not 100).
14
14
  * This produces realistic estimates rather than theoretical maximums.
15
15
  *
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-3-gap-analysis.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-3-gap-analysis.md
17
17
  */
18
18
  // ---------------------------------------------------------------------------
19
19
  // Constants
@@ -16,7 +16,7 @@
16
16
  * No process.argv parsing. No env var fallbacks. Callers provide typed options.
17
17
  *
18
18
  * @see config/models.yaml — the central model registry
19
- * @see docs/exec-plans/active/eliminate-lib-layer.md
19
+ * @see docs/exec-plans/eliminate-lib-layer.md
20
20
  */
21
21
  import { type TaskDefinition } from "../_vendor/ailf-core/index.d.ts";
22
22
  import type { FilterOptions } from "./types.js";
@@ -16,7 +16,7 @@
16
16
  * No process.argv parsing. No env var fallbacks. Callers provide typed options.
17
17
  *
18
18
  * @see config/models.yaml — the central model registry
19
- * @see docs/exec-plans/active/eliminate-lib-layer.md
19
+ * @see docs/exec-plans/eliminate-lib-layer.md
20
20
  */
21
21
  import { extractModelName, extractProvider, mergeConfig, modelMatchesMode, } from "../_vendor/ailf-core/index.js";
22
22
  import { existsSync, readFileSync, readdirSync, writeFileSync } from "fs";
@@ -10,7 +10,7 @@
10
10
  * Migrated from lib/grader-compare.ts — no process.argv, no process.exit(),
11
11
  * no module-level constants. Accepts rootDir as parameter.
12
12
  *
13
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 3
13
+ * @see docs/exec-plans/grader-reliability.md — Phase 3
14
14
  */
15
15
  import { type GraderComparison } from "./grader-comparison.js";
16
16
  export interface GraderCompareRunnerOptions {
@@ -10,7 +10,7 @@
10
10
  * Migrated from lib/grader-compare.ts — no process.argv, no process.exit(),
11
11
  * no module-level constants. Accepts rootDir as parameter.
12
12
  *
13
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 3
13
+ * @see docs/exec-plans/grader-reliability.md — Phase 3
14
14
  */
15
15
  import { existsSync, mkdirSync, readFileSync, writeFileSync } from "fs";
16
16
  import { join } from "path";
@@ -10,7 +10,7 @@
10
10
  * This module has NO side effects — no file I/O, no API calls.
11
11
  * It operates on pre-collected data only.
12
12
  *
13
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 3
13
+ * @see docs/exec-plans/grader-reliability.md — Phase 3
14
14
  */
15
15
  import type { ComparisonReport, ScoreSummary } from "./types.js";
16
16
  /** Per-dimension comparison between two graders */
@@ -10,7 +10,7 @@
10
10
  * This module has NO side effects — no file I/O, no API calls.
11
11
  * It operates on pre-collected data only.
12
12
  *
13
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 3
13
+ * @see docs/exec-plans/grader-reliability.md — Phase 3
14
14
  */
15
15
  import { compare } from "./compare.js";
16
16
  import { pearsonCorrelation } from "./grader-validation.js";
@@ -12,7 +12,7 @@
12
12
  * Migrated from lib/grader-consistency.ts — no process.argv, no process.exit(),
13
13
  * no module-level constants.
14
14
  *
15
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 1
15
+ * @see docs/exec-plans/grader-reliability.md — Phase 1
16
16
  */
17
17
  import type { RawPromptfooFile } from "./calculate-scores.js";
18
18
  import { type GraderConsistency } from "./grader-consistency.js";
@@ -12,7 +12,7 @@
12
12
  * Migrated from lib/grader-consistency.ts — no process.argv, no process.exit(),
13
13
  * no module-level constants.
14
14
  *
15
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 1
15
+ * @see docs/exec-plans/grader-reliability.md — Phase 1
16
16
  */
17
17
  import { existsSync, mkdirSync, readFileSync, writeFileSync } from "fs";
18
18
  import { join } from "path";
@@ -10,7 +10,7 @@
10
10
  * This module has NO side effects — no file I/O, no API calls.
11
11
  * It operates on pre-collected data only.
12
12
  *
13
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 1
13
+ * @see docs/exec-plans/grader-reliability.md — Phase 1
14
14
  */
15
15
  /** Per-dimension consistency aggregates */
16
16
  export interface DimensionConsistency {
@@ -10,7 +10,7 @@
10
10
  * This module has NO side effects — no file I/O, no API calls.
11
11
  * It operates on pre-collected data only.
12
12
  *
13
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 1
13
+ * @see docs/exec-plans/grader-reliability.md — Phase 1
14
14
  */
15
15
  // ---------------------------------------------------------------------------
16
16
  // Pure computation
@@ -11,7 +11,7 @@
11
11
  * Migrated from lib/grader-sensitivity.ts — no process.argv, no process.exit(),
12
12
  * no module-level constants. Accepts rootDir as parameter.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 4
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 4
15
15
  */
16
16
  import { type GraderSensitivityResult } from "./grader-sensitivity.js";
17
17
  export interface GraderSensitivityRunnerOptions {
@@ -11,7 +11,7 @@
11
11
  * Migrated from lib/grader-sensitivity.ts — no process.argv, no process.exit(),
12
12
  * no module-level constants. Accepts rootDir as parameter.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 4
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 4
15
15
  */
16
16
  import { existsSync, mkdirSync, readdirSync, readFileSync, writeFileSync, } from "fs";
17
17
  import { basename, join } from "path";
@@ -11,7 +11,7 @@
11
11
  *
12
12
  * This module has NO side effects — no file I/O, no API calls.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 4
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 4
15
15
  */
16
16
  /** Sensitivity broken down by degradation type */
17
17
  export interface DegradationSensitivity {
@@ -11,7 +11,7 @@
11
11
  *
12
12
  * This module has NO side effects — no file I/O, no API calls.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 4
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 4
15
15
  */
16
16
  // ---------------------------------------------------------------------------
17
17
  // Pure computation
@@ -11,7 +11,7 @@
11
11
  * Migrated from lib/grader-validate.ts — no process.argv, no process.exit(),
12
12
  * no module-level constants. Accepts rootDir as parameter.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 2
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 2
15
15
  */
16
16
  import { type GraderValidation } from "./grader-validation.js";
17
17
  export interface GraderValidateRunnerOptions {
@@ -11,7 +11,7 @@
11
11
  * Migrated from lib/grader-validate.ts — no process.argv, no process.exit(),
12
12
  * no module-level constants. Accepts rootDir as parameter.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 2
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 2
15
15
  */
16
16
  import { existsSync, mkdirSync, readFileSync, readdirSync, writeFileSync, } from "fs";
17
17
  import { join } from "path";
@@ -42,7 +42,7 @@ function loadReferenceGrades(rootDir) {
42
42
  if (!existsSync(refsDir)) {
43
43
  throw new Error(`Reference grades directory not found: ${refsDir}. ` +
44
44
  "Create canonical/grader-references/ with YAML reference files. " +
45
- "See docs/exec-plans/completed/grader-reliability.md — Phase 2.");
45
+ "See docs/exec-plans/grader-reliability.md — Phase 2.");
46
46
  }
47
47
  const files = readdirSync(refsDir)
48
48
  .filter((f) => f.endsWith(".yaml") || f.endsWith(".yml"))
@@ -11,7 +11,7 @@
11
11
  *
12
12
  * This module has NO side effects — no file I/O, no API calls.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 2
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 2
15
15
  */
16
16
  /** Quality label for a correlation value */
17
17
  export type CorrelationQuality = "excellent" | "good" | "moderate" | "poor" | "very-poor";
@@ -11,7 +11,7 @@
11
11
  *
12
12
  * This module has NO side effects — no file I/O, no API calls.
13
13
  *
14
- * @see docs/exec-plans/completed/grader-reliability.md — Phase 2
14
+ * @see docs/exec-plans/grader-reliability.md — Phase 2
15
15
  */
16
16
  // ---------------------------------------------------------------------------
17
17
  // Pure computation
@@ -10,7 +10,7 @@
10
10
  * means unchanged tasks are skipped. Changed tasks are upserted via
11
11
  * createOrReplace.
12
12
  *
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-5-content-lake-mirroring.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-5-content-lake-mirroring.md
14
14
  */
15
15
  import type { SanityClient } from "@sanity/client";
16
16
  import { type TaskDefinition } from "../_vendor/ailf-core/index.d.ts";
@@ -10,7 +10,7 @@
10
10
  * means unchanged tasks are skipped. Changed tasks are upserted via
11
11
  * createOrReplace.
12
12
  *
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-5-content-lake-mirroring.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-5-content-lake-mirroring.md
14
14
  */
15
15
  import { createHash } from "crypto";
16
16
  import { isSlugRef, } from "../_vendor/ailf-core/index.js";
@@ -7,7 +7,7 @@
7
7
  * emoji markers, alignment, and color-coding (via unicode markers).
8
8
  * The JSON formatter produces machine-readable output for CI/CD.
9
9
  *
10
- * @see docs/exec-plans/active/execution-preview.md
10
+ * @see docs/exec-plans/execution-preview.md
11
11
  */
12
12
  import type { ExecutionPlan } from "./plan.js";
13
13
  /**
@@ -7,7 +7,7 @@
7
7
  * emoji markers, alignment, and color-coding (via unicode markers).
8
8
  * The JSON formatter produces machine-readable output for CI/CD.
9
9
  *
10
- * @see docs/exec-plans/active/execution-preview.md
10
+ * @see docs/exec-plans/execution-preview.md
11
11
  */
12
12
  import { formatCost } from "../agent-observer/pricing.js";
13
13
  // ---------------------------------------------------------------------------
@@ -7,7 +7,7 @@
7
7
  * anything. Calls existing pure functions (task expansion, model loading,
8
8
  * cache hashing, pricing) and composes them into an `ExecutionPlan`.
9
9
  *
10
- * @see docs/exec-plans/active/execution-preview.md
10
+ * @see docs/exec-plans/execution-preview.md
11
11
  */
12
12
  import type { DebugOptions, EvalMode } from "./types.js";
13
13
  /** Comparison plan for --compare flag. */
@@ -7,7 +7,7 @@
7
7
  * anything. Calls existing pure functions (task expansion, model loading,
8
8
  * cache hashing, pricing) and composes them into an `ExecutionPlan`.
9
9
  *
10
- * @see docs/exec-plans/active/execution-preview.md
10
+ * @see docs/exec-plans/execution-preview.md
11
11
  */
12
12
  import { existsSync, readFileSync, readdirSync, statSync } from "fs";
13
13
  import { resolve } from "path";
@@ -14,7 +14,7 @@
14
14
  * not "are these docs good enough?" The output is always labeled as
15
15
  * directional and never displayed on the same scale as scored evaluations.
16
16
  *
17
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
17
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
18
18
  */
19
19
  import type { ProbeResult } from "./types.js";
20
20
  /** Generic probe prompt template */
@@ -14,7 +14,7 @@
14
14
  * not "are these docs good enough?" The output is always labeled as
15
15
  * directional and never displayed on the same scale as scored evaluations.
16
16
  *
17
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
17
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
18
18
  */
19
19
  // ---------------------------------------------------------------------------
20
20
  // Constants
@@ -13,8 +13,8 @@
13
13
  * - generateReadinessReport() — builds the structured report
14
14
  * - formatReadinessMarkdown() — renders the report as markdown
15
15
  *
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-5-readiness-thresholds.md
17
- * @see docs/exec-plans/active/eliminate-lib-layer.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
17
+ * @see docs/exec-plans/eliminate-lib-layer.md
18
18
  */
19
19
  import type { ThresholdConfig } from "./schemas.js";
20
20
  import type { GapAnalysisReport, GapEstimate, ScoreSummary, ThresholdEvaluation, ThresholdViolation } from "./types.js";
@@ -13,8 +13,8 @@
13
13
  * - generateReadinessReport() — builds the structured report
14
14
  * - formatReadinessMarkdown() — renders the report as markdown
15
15
  *
16
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-5-readiness-thresholds.md
17
- * @see docs/exec-plans/active/eliminate-lib-layer.md
16
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
17
+ * @see docs/exec-plans/eliminate-lib-layer.md
18
18
  */
19
19
  import { evaluateThresholds } from "./thresholds.js";
20
20
  // ---------------------------------------------------------------------------
@@ -15,7 +15,7 @@
15
15
  * - **not-applicable**: Updated, removed, or unchanged documents (these
16
16
  * follow the standard before/after comparison flow from Phase 2).
17
17
  *
18
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
18
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
19
19
  */
20
20
  import type { ClassifiedReleaseDocument, ProductFeature, ReleaseClassification } from "./types.js";
21
21
  import type { ReverseMapping } from "./reverse-mapping.js";
@@ -15,7 +15,7 @@
15
15
  * - **not-applicable**: Updated, removed, or unchanged documents (these
16
16
  * follow the standard before/after comparison flow from Phase 2).
17
17
  *
18
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
18
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
19
19
  */
20
20
  // ---------------------------------------------------------------------------
21
21
  // Public API
@@ -10,7 +10,7 @@
10
10
  * attribution (2c), and probe results (4b) into the document × area × task
11
11
  * impact matrix specified by Scenario 2.4.
12
12
  *
13
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
13
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
14
14
  */
15
15
  import type { AttributionReport, ComparisonReport, ProbeResult, ReleaseClassification, ReleaseImpactReport } from "./types.js";
16
16
  /**
@@ -10,7 +10,7 @@
10
10
  * attribution (2c), and probe results (4b) into the document × area × task
11
11
  * impact matrix specified by Scenario 2.4.
12
12
  *
13
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
13
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
14
14
  */
15
15
  // ---------------------------------------------------------------------------
16
16
  // Public API
@@ -12,7 +12,7 @@
12
12
  * - Clear "what does this mean?" context
13
13
  * - skip-ailf bypass instructions
14
14
  *
15
- * @see docs/exec-plans/completed/tasks-as-content/phase-6-pr-quality-gates.md
15
+ * @see docs/exec-plans/tasks-as-content/phase-6-pr-quality-gates.md
16
16
  * @see packages/eval/src/pipeline/repo-threshold-evaluator.ts
17
17
  */
18
18
  import type { ComparisonReport, ScoreSummary } from "./types.js";
@@ -12,7 +12,7 @@
12
12
  * - Clear "what does this mean?" context
13
13
  * - skip-ailf bypass instructions
14
14
  *
15
- * @see docs/exec-plans/completed/tasks-as-content/phase-6-pr-quality-gates.md
15
+ * @see docs/exec-plans/tasks-as-content/phase-6-pr-quality-gates.md
16
16
  * @see packages/eval/src/pipeline/repo-threshold-evaluator.ts
17
17
  */
18
18
  // ---------------------------------------------------------------------------
@@ -10,7 +10,7 @@
10
10
  * thresholds are per-area, defined by the AILF team, and drive
11
11
  * readiness reports.
12
12
  *
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-6-pr-quality-gates.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-6-pr-quality-gates.md
14
14
  * @see packages/eval/src/adapters/task-sources/repo-schemas.ts
15
15
  */
16
16
  import type { ScoreSummary } from "./types.js";
@@ -10,7 +10,7 @@
10
10
  * thresholds are per-area, defined by the AILF team, and drive
11
11
  * readiness reports.
12
12
  *
13
- * @see docs/exec-plans/completed/tasks-as-content/phase-6-pr-quality-gates.md
13
+ * @see docs/exec-plans/tasks-as-content/phase-6-pr-quality-gates.md
14
14
  * @see packages/eval/src/adapters/task-sources/repo-schemas.ts
15
15
  */
16
16
  // ---------------------------------------------------------------------------
@@ -18,7 +18,7 @@
18
18
  * The actual evaluation execution is handled by the pipeline orchestrator —
19
19
  * this module is pure computation on inputs and outputs.
20
20
  *
21
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
21
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
22
22
  * @see docs/design-docs/scenario-matrix/per-document-attribution.md
23
23
  */
24
24
  import type { AttributionReport, LOOCostEstimate, LOOResult, TaskAttribution } from "./types.js";
@@ -18,7 +18,7 @@
18
18
  * The actual evaluation execution is handled by the pipeline orchestrator —
19
19
  * this module is pure computation on inputs and outputs.
20
20
  *
21
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-4-content-release-integration.md
21
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-4-content-release-integration.md
22
22
  * @see docs/design-docs/scenario-matrix/per-document-attribution.md
23
23
  */
24
24
  // ---------------------------------------------------------------------------
@@ -8,7 +8,7 @@
8
8
  * publish-report-step.ts) is responsible for loading the threshold config
9
9
  * and score summary.
10
10
  *
11
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-5-readiness-thresholds.md
11
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
12
12
  */
13
13
  import type { ThresholdConfig } from "./schemas.js";
14
14
  import type { ComparisonReport, ScoreSummary, ThresholdEvaluation, ThresholdViolation } from "./types.js";
@@ -8,7 +8,7 @@
8
8
  * publish-report-step.ts) is responsible for loading the threshold config
9
9
  * and score summary.
10
10
  *
11
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-5-readiness-thresholds.md
11
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
12
12
  */
13
13
  // ---------------------------------------------------------------------------
14
14
  // Severity priority for sorting (higher = more severe)
@@ -19,6 +19,6 @@
19
19
  * - SANITY_API_TOKEN (or AILF_REPORT_SANITY_API_TOKEN) with write access
20
20
  * - SANITY_PROJECT_ID and SANITY_DATASET configured
21
21
  *
22
- * @see docs/exec-plans/completed/tasks-as-content/phase-3-migration.md
22
+ * @see docs/exec-plans/tasks-as-content/phase-3-migration.md
23
23
  */
24
24
  export {};
@@ -19,7 +19,7 @@
19
19
  * - SANITY_API_TOKEN (or AILF_REPORT_SANITY_API_TOKEN) with write access
20
20
  * - SANITY_PROJECT_ID and SANITY_DATASET configured
21
21
  *
22
- * @see docs/exec-plans/completed/tasks-as-content/phase-3-migration.md
22
+ * @see docs/exec-plans/tasks-as-content/phase-3-migration.md
23
23
  */
24
24
  import { config as dotenvConfig } from "dotenv";
25
25
  import { existsSync, readFileSync } from "fs";
@@ -16,6 +16,6 @@
16
16
  * - Migration script has been run (ailf.task documents exist in CL)
17
17
  * - SANITY_API_TOKEN configured for Content Lake reads
18
18
  *
19
- * @see docs/exec-plans/completed/tasks-as-content/phase-3-migration.md
19
+ * @see docs/exec-plans/tasks-as-content/phase-3-migration.md
20
20
  */
21
21
  export {};
@@ -16,7 +16,7 @@
16
16
  * - Migration script has been run (ailf.task documents exist in CL)
17
17
  * - SANITY_API_TOKEN configured for Content Lake reads
18
18
  *
19
- * @see docs/exec-plans/completed/tasks-as-content/phase-3-migration.md
19
+ * @see docs/exec-plans/tasks-as-content/phase-3-migration.md
20
20
  */
21
21
  import { config as dotenvConfig } from "dotenv";
22
22
  import { existsSync } from "fs";
@@ -54,6 +54,6 @@ export interface ReportSink {
54
54
  * - The payload's maxSeverity matches an enabled routing rule
55
55
  * - The payload has regressions and the sink's `regression` rule is enabled
56
56
  *
57
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-5-readiness-thresholds.md
57
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
58
58
  */
59
59
  export declare function shouldDeliver(routing: SinkRouting | undefined, payload: SinkPayload): boolean;
@@ -21,7 +21,7 @@
21
21
  * - The payload's maxSeverity matches an enabled routing rule
22
22
  * - The payload has regressions and the sink's `regression` rule is enabled
23
23
  *
24
- * @see docs/exec-plans/completed/scenario-matrix-implementation/phase-5-readiness-thresholds.md
24
+ * @see docs/exec-plans/scenario-matrix-implementation/phase-5-readiness-thresholds.md
25
25
  */
26
26
  export function shouldDeliver(routing, payload) {
27
27
  // No routing config = deliver everything (backward compatible)
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@sanity/ailf",
3
- "version": "0.1.30",
3
+ "version": "0.1.32",
4
4
  "private": false,
5
5
  "publishConfig": {
6
6
  "access": "restricted"