@sanity/ailf-studio 0.1.10 → 0.1.11
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +5 -4
- package/dist/index.d.ts +43 -2
- package/dist/index.js +504 -229
- package/package.json +1 -1
package/README.md
CHANGED
|
@@ -222,10 +222,11 @@ The plugin exports building blocks for custom views or extensions.
|
|
|
222
222
|
|
|
223
223
|
### Document Actions
|
|
224
224
|
|
|
225
|
-
| Export | Description
|
|
226
|
-
| --------------------------- |
|
|
227
|
-
| `GraduateToNativeAction` | Converts a mirrored (read-only) task to a native (editable) task by removing origin
|
|
228
|
-
| `
|
|
225
|
+
| Export | Description |
|
|
226
|
+
| --------------------------- | -------------------------------------------------------------------------------------------- |
|
|
227
|
+
| `GraduateToNativeAction` | Converts a mirrored (read-only) task to a native (editable) task by removing origin |
|
|
228
|
+
| `RunTaskEvaluationAction` | Triggers a pipeline evaluation scoped to a single task (registered on `ailf.task` documents) |
|
|
229
|
+
| `createRunEvaluationAction` | Factory for creating a Studio action that triggers release-scoped evaluations |
|
|
229
230
|
|
|
230
231
|
### Glossary
|
|
231
232
|
|
package/dist/index.d.ts
CHANGED
|
@@ -27,6 +27,45 @@ import { DocumentRef } from './document-ref.js';
|
|
|
27
27
|
|
|
28
28
|
declare const GraduateToNativeAction: DocumentActionComponent;
|
|
29
29
|
|
|
30
|
+
/**
|
|
31
|
+
* actions/RunTaskEvaluationAction.tsx
|
|
32
|
+
*
|
|
33
|
+
* Sanity Studio document action that triggers an AILF evaluation for a
|
|
34
|
+
* single task. Appears in the document action menu on `ailf.task` documents.
|
|
35
|
+
*
|
|
36
|
+
* ## Why this exists
|
|
37
|
+
*
|
|
38
|
+
* The release-level `RunEvaluationAction` answers "did my content changes
|
|
39
|
+
* help or hurt AI agents?". This task-level action answers "does this task
|
|
40
|
+
* definition actually work well?" — a tight authoring feedback loop for
|
|
41
|
+
* task authors iterating on prompts, rubrics, and canonical doc references.
|
|
42
|
+
*
|
|
43
|
+
* ## How it works
|
|
44
|
+
*
|
|
45
|
+
* Like `RunEvaluationAction`, this action does NOT hold any secrets. It
|
|
46
|
+
* creates an `ailf.evalRequest` document scoped to a single task. A
|
|
47
|
+
* server-side Sanity webhook picks up the document and dispatches the
|
|
48
|
+
* pipeline.
|
|
49
|
+
*
|
|
50
|
+
* ## Key differences from RunEvaluationAction
|
|
51
|
+
*
|
|
52
|
+
* - Scoped to a single task via `tasks: [taskId]`
|
|
53
|
+
* - No perspective/release — evaluates against the default doc source
|
|
54
|
+
* - Polls for reports matching the task's feature area
|
|
55
|
+
*
|
|
56
|
+
* @see packages/eval/src/webhook/eval-request-handler.ts
|
|
57
|
+
* @see .github/workflows/external-eval.yml
|
|
58
|
+
*/
|
|
59
|
+
|
|
60
|
+
/**
|
|
61
|
+
* Document action that triggers a single-task evaluation.
|
|
62
|
+
*
|
|
63
|
+
* Registered on `ailf.task` documents in the plugin definition.
|
|
64
|
+
* Creates an `ailf.evalRequest` doc with `tasks: [taskId]` to
|
|
65
|
+
* run all test cases for the task.
|
|
66
|
+
*/
|
|
67
|
+
declare const RunTaskEvaluationAction: DocumentActionComponent;
|
|
68
|
+
|
|
30
69
|
declare function AssertionInput(props: ObjectInputProps): react_jsx_runtime.JSX.Element;
|
|
31
70
|
|
|
32
71
|
declare function CanonicalDocInput(props: ObjectInputProps): react_jsx_runtime.JSX.Element;
|
|
@@ -309,6 +348,7 @@ declare const evalRequestSchema: {
|
|
|
309
348
|
preview?: sanity.PreviewConfig<{
|
|
310
349
|
perspective: string;
|
|
311
350
|
status: string;
|
|
351
|
+
tasks: string;
|
|
312
352
|
}, Record<string, unknown>> | undefined;
|
|
313
353
|
};
|
|
314
354
|
|
|
@@ -731,11 +771,12 @@ interface TimelineDataPoint {
|
|
|
731
771
|
|
|
732
772
|
/**
|
|
733
773
|
* AILF Studio plugin — registers the report schema, dashboard tool,
|
|
734
|
-
* and document actions (Graduate to Native
|
|
774
|
+
* and document actions for `ailf.task` documents (Graduate to Native
|
|
775
|
+
* for mirrored tasks, Run Task Evaluation for single-task evals).
|
|
735
776
|
*
|
|
736
777
|
* This is the recommended way to install the plugin. It registers
|
|
737
778
|
* schemas, the dashboard tool, and document-level actions in one call.
|
|
738
779
|
*/
|
|
739
780
|
declare const ailfPlugin: sanity.Plugin<void>;
|
|
740
781
|
|
|
741
|
-
export { AssertionInput, CanonicalDocInput, type ComparisonData, type ContentImpactItem, GLOSSARY, GraduateToNativeAction, MirrorBanner, type ProvenanceData, ReleasePicker, type ReportDetail, type ReportListItem, type RunEvaluationActionOptions, type ScoreItem, type SummaryData, SyncStatusBadge, type TimelineDataPoint, ailfPlugin, ailfTool, articleSearchQuery, comparisonPairQuery, contentImpactQuery, createRunEvaluationAction, distinctAreasQuery, distinctModesQuery, distinctPerspectivesQuery, distinctSourcesQuery, distinctTargetDocumentsQuery, evalRequestSchema, featureAreaSchema, latestReportsQuery, recentDocumentEvalsQuery, referenceSolutionSchema, reportDetailQuery, reportSchema, scoreTimelineQuery, taskSchema, webhookConfigSchema };
|
|
782
|
+
export { AssertionInput, CanonicalDocInput, type ComparisonData, type ContentImpactItem, GLOSSARY, GraduateToNativeAction, MirrorBanner, type ProvenanceData, ReleasePicker, type ReportDetail, type ReportListItem, type RunEvaluationActionOptions, RunTaskEvaluationAction, type ScoreItem, type SummaryData, SyncStatusBadge, type TimelineDataPoint, ailfPlugin, ailfTool, articleSearchQuery, comparisonPairQuery, contentImpactQuery, createRunEvaluationAction, distinctAreasQuery, distinctModesQuery, distinctPerspectivesQuery, distinctSourcesQuery, distinctTargetDocumentsQuery, evalRequestSchema, featureAreaSchema, latestReportsQuery, recentDocumentEvalsQuery, referenceSolutionSchema, reportDetailQuery, reportSchema, scoreTimelineQuery, taskSchema, webhookConfigSchema };
|