@sanity/ailf-studio 0.1.10 → 0.1.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -222,10 +222,11 @@ The plugin exports building blocks for custom views or extensions.
222
222
 
223
223
  ### Document Actions
224
224
 
225
- | Export | Description |
226
- | --------------------------- | ----------------------------------------------------------------------------------- |
227
- | `GraduateToNativeAction` | Converts a mirrored (read-only) task to a native (editable) task by removing origin |
228
- | `createRunEvaluationAction` | Factory for creating a Studio action that triggers evaluations |
225
+ | Export | Description |
226
+ | --------------------------- | -------------------------------------------------------------------------------------------- |
227
+ | `GraduateToNativeAction` | Converts a mirrored (read-only) task to a native (editable) task by removing origin |
228
+ | `RunTaskEvaluationAction` | Triggers a pipeline evaluation scoped to a single task (registered on `ailf.task` documents) |
229
+ | `createRunEvaluationAction` | Factory for creating a Studio action that triggers release-scoped evaluations |
229
230
 
230
231
  ### Glossary
231
232
 
package/dist/index.d.ts CHANGED
@@ -27,6 +27,45 @@ import { DocumentRef } from './document-ref.js';
27
27
 
28
28
  declare const GraduateToNativeAction: DocumentActionComponent;
29
29
 
30
+ /**
31
+ * actions/RunTaskEvaluationAction.tsx
32
+ *
33
+ * Sanity Studio document action that triggers an AILF evaluation for a
34
+ * single task. Appears in the document action menu on `ailf.task` documents.
35
+ *
36
+ * ## Why this exists
37
+ *
38
+ * The release-level `RunEvaluationAction` answers "did my content changes
39
+ * help or hurt AI agents?". This task-level action answers "does this task
40
+ * definition actually work well?" — a tight authoring feedback loop for
41
+ * task authors iterating on prompts, rubrics, and canonical doc references.
42
+ *
43
+ * ## How it works
44
+ *
45
+ * Like `RunEvaluationAction`, this action does NOT hold any secrets. It
46
+ * creates an `ailf.evalRequest` document scoped to a single task. A
47
+ * server-side Sanity webhook picks up the document and dispatches the
48
+ * pipeline.
49
+ *
50
+ * ## Key differences from RunEvaluationAction
51
+ *
52
+ * - Scoped to a single task via `tasks: [taskId]`
53
+ * - No perspective/release — evaluates against the default doc source
54
+ * - Polls for reports matching the task's feature area
55
+ *
56
+ * @see packages/eval/src/webhook/eval-request-handler.ts
57
+ * @see .github/workflows/external-eval.yml
58
+ */
59
+
60
+ /**
61
+ * Document action that triggers a single-task evaluation.
62
+ *
63
+ * Registered on `ailf.task` documents in the plugin definition.
64
+ * Creates an `ailf.evalRequest` doc with `tasks: [taskId]` to
65
+ * run all test cases for the task.
66
+ */
67
+ declare const RunTaskEvaluationAction: DocumentActionComponent;
68
+
30
69
  declare function AssertionInput(props: ObjectInputProps): react_jsx_runtime.JSX.Element;
31
70
 
32
71
  declare function CanonicalDocInput(props: ObjectInputProps): react_jsx_runtime.JSX.Element;
@@ -309,6 +348,7 @@ declare const evalRequestSchema: {
309
348
  preview?: sanity.PreviewConfig<{
310
349
  perspective: string;
311
350
  status: string;
351
+ tasks: string;
312
352
  }, Record<string, unknown>> | undefined;
313
353
  };
314
354
 
@@ -731,11 +771,12 @@ interface TimelineDataPoint {
731
771
 
732
772
  /**
733
773
  * AILF Studio plugin — registers the report schema, dashboard tool,
734
- * and document actions (Graduate to Native for mirrored tasks).
774
+ * and document actions for `ailf.task` documents (Graduate to Native
775
+ * for mirrored tasks, Run Task Evaluation for single-task evals).
735
776
  *
736
777
  * This is the recommended way to install the plugin. It registers
737
778
  * schemas, the dashboard tool, and document-level actions in one call.
738
779
  */
739
780
  declare const ailfPlugin: sanity.Plugin<void>;
740
781
 
741
- export { AssertionInput, CanonicalDocInput, type ComparisonData, type ContentImpactItem, GLOSSARY, GraduateToNativeAction, MirrorBanner, type ProvenanceData, ReleasePicker, type ReportDetail, type ReportListItem, type RunEvaluationActionOptions, type ScoreItem, type SummaryData, SyncStatusBadge, type TimelineDataPoint, ailfPlugin, ailfTool, articleSearchQuery, comparisonPairQuery, contentImpactQuery, createRunEvaluationAction, distinctAreasQuery, distinctModesQuery, distinctPerspectivesQuery, distinctSourcesQuery, distinctTargetDocumentsQuery, evalRequestSchema, featureAreaSchema, latestReportsQuery, recentDocumentEvalsQuery, referenceSolutionSchema, reportDetailQuery, reportSchema, scoreTimelineQuery, taskSchema, webhookConfigSchema };
782
+ export { AssertionInput, CanonicalDocInput, type ComparisonData, type ContentImpactItem, GLOSSARY, GraduateToNativeAction, MirrorBanner, type ProvenanceData, ReleasePicker, type ReportDetail, type ReportListItem, type RunEvaluationActionOptions, RunTaskEvaluationAction, type ScoreItem, type SummaryData, SyncStatusBadge, type TimelineDataPoint, ailfPlugin, ailfTool, articleSearchQuery, comparisonPairQuery, contentImpactQuery, createRunEvaluationAction, distinctAreasQuery, distinctModesQuery, distinctPerspectivesQuery, distinctSourcesQuery, distinctTargetDocumentsQuery, evalRequestSchema, featureAreaSchema, latestReportsQuery, recentDocumentEvalsQuery, referenceSolutionSchema, reportDetailQuery, reportSchema, scoreTimelineQuery, taskSchema, webhookConfigSchema };