npm - @sanity/ailf - Versions diffs - 3.3.1 → 3.4.1 - Mend

@sanity/ailf 3.3.1 → 3.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4)

package/dist/_vendor/ailf-core/artifact-registry.js +76 -0
package/dist/adapters/task-sources/repo-validation.js +4 -2
package/dist/commands/init.js +5 -0
package/package.json +1 -1

package/dist/_vendor/ailf-core/artifact-registry.js CHANGED

@@ -320,6 +320,32 @@ const graderPromptPreviewSchema = z.object({
     rubricName: z.string().max(60).optional(),
     snippet: z.string().max(120),
 });
+/**
+ * Preview shape for the run-scoped `pipelineContext` bulk artifact (W0063 /
+ * D0033 M7). Lets the Studio Overview tab render a Pipeline Execution header
+ * row (step count, wall-clock, failed-step badge, quality-gate badge, cache
+ * hit count) without fetching the full context payload — `config` and per-
+ * step detail only land when the panel is expanded.
+ *
+ * Bounds chosen so the worst-case preview fits comfortably under 384 bytes:
+ *   - `failedSteps` is capped at 5 entries with each name ≤ 40 chars. Real
+ *     step names ("fetch-docs", "calculate-scores", "gap-analysis") are 10–
+ *     25 chars; 40 is a defensive ceiling. The array cap exists because
+ *     `fitPreviewToCap` only shortens string fields — an unbounded array
+ *     could push the preview over cap and force it to drop entirely.
+ *     5 is a triage ceiling: the panel shows "showed 5 of N failed steps"
+ *     when `failedSteps.length < stepCount - successCount`, and the full
+ *     per-step list is available in the drilldown payload.
+ *   - `belowCritical` and `cacheHits` are optional — absent on old runs,
+ *     skipped pipelines, or runs without remote-cache telemetry.
+ */
+const pipelineContextPreviewSchema = z.object({
+    stepCount: z.number().int().nonnegative(),
+    totalDurationMs: z.number().nonnegative(),
+    failedSteps: z.array(z.string().max(40)).max(5),
+    belowCritical: z.boolean().optional(),
+    cacheHits: z.number().int().nonnegative().optional(),
+});
 // Aspirational: most payload shapes are still loose. Tightening per-type as
 // consumers stabilize is explicitly a W0050/W0051 concern — W0049 fixes the
 // structural shape around them without changing the payload contracts.
@@ -495,6 +521,56 @@ export const ARTIFACT_REGISTRY = {
         entrySchema: unknownEntry,
         mime: "application/json",
         capBytes: 64_000,
+        manifestPreview: {
+            schema: pipelineContextPreviewSchema,
+            extract: (entry) => {
+                // Producer shape from `capturePipelineContext` in
+                // packages/eval/src/orchestration/pipeline-orchestrator.ts:
+                //   { config, state: { belowCritical, remoteCacheHits, ... },
+                //     steps: [{ name, status: "success"|"failed"|"skipped",
+                //               durationMs? }] }
+                //
+                // `config` and everything else on `state` are drilldown-only and
+                // intentionally absent from the preview — they're what the panel
+                // fetches lazily when expanded.
+                const e = entry;
+                const stepsRaw = Array.isArray(e.steps) ? e.steps : [];
+                let totalDurationMs = 0;
+                const failedSteps = [];
+                let stepCount = 0;
+                for (const raw of stepsRaw) {
+                    if (raw === null || typeof raw !== "object")
+                        continue;
+                    stepCount += 1;
+                    const s = raw;
+                    if (typeof s.durationMs === "number" &&
+                        Number.isFinite(s.durationMs) &&
+                        s.durationMs >= 0) {
+                        totalDurationMs += s.durationMs;
+                    }
+                    if (s.status === "failed" &&
+                        typeof s.name === "string" &&
+                        failedSteps.length < 5) {
+                        failedSteps.push(truncateString(s.name, 40));
+                    }
+                }
+                const belowCritical = typeof e.state?.belowCritical === "boolean"
+                    ? e.state.belowCritical
+                    : undefined;
+                const cacheHitsRaw = e.state?.remoteCacheHits;
+                const cacheHits = Array.isArray(cacheHitsRaw)
+                    ? cacheHitsRaw.length
+                    : undefined;
+                return {
+                    stepCount,
+                    totalDurationMs,
+                    failedSteps,
+                    ...(belowCritical === undefined ? {} : { belowCritical }),
+                    ...(cacheHits === undefined ? {} : { cacheHits }),
+                };
+            },
+            capBytes: 384,
+        },
     }),
     documentManifest: buildDescriptor({
         type: "documentManifest",

package/dist/adapters/task-sources/repo-validation.js CHANGED

@@ -81,9 +81,11 @@ export function validateCanonicalTasks(tasks) {
                 }
             }
         }
-        // Check task has at least one llm-rubric assertion (recommended but not required)
+        // Check task has at least one llm-rubric assertion (recommended but not required).
+        // agent-harness tasks grade side-effects (file-exists, command-succeeds, etc.),
+        // not text output, so an llm-rubric is not expected.
         const hasLlmRubric = assertions.some((a) => a.type === "llm-rubric");
-        if (!hasLlmRubric) {
+        if (!hasLlmRubric && task.mode !== "agent-harness") {
             warnings.push({
                 taskId: task.id,
                 field: "assertions",

package/dist/commands/init.js CHANGED

@@ -258,6 +258,11 @@ async function runInit(opts) {
     console.log(`  1. Edit the example tasks in ${rel(targetDir, tasksDir)}/ — update`);
     console.log("     slugs and prompts for your documentation");
     console.log(`  2. Validate locally: npx @sanity/ailf@latest validate-tasks .ailf/tasks/`);
+    console.log();
+    console.log('     Note: tasks with status: "draft" are skipped on normal runs.');
+    console.log("     To run one anyway, target it explicitly with --task <id>, e.g.:");
+    console.log("       npx @sanity/ailf@latest pipeline --task example-agent-add-schema");
+    console.log();
     console.log("  3. Add a GitHub Actions secret");
     console.log("     (Settings → Secrets and variables → Actions):");
     console.log("     • AILF_API_KEY — your API key");

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@sanity/ailf",
-  "version": "3.3.1",
+  "version": "3.4.1",
   "private": false,
   "publishConfig": {
     "access": "public"