npm - @agentv/eval - Versions diffs - 3.4.0 → 3.6.0 - Mend

@agentv/eval 3.4.0 → 3.6.0

This diff shows the contents of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (8) hide show

package/dist/index.d.cts CHANGED Viewed

@@ -153,8 +153,6 @@ declare const MessageSchema: z.ZodObject<{
  * strings. Structured fields (`input`, `output`, `expectedOutput`) are always `Message[]`.
  */
 declare const CodeGraderInputSchema: z.ZodObject<{
-    /** @deprecated Use `inputText` instead. First user message content as string. */
-    question: z.ZodString;
     criteria: z.ZodString;
     expectedOutput: z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
@@ -224,10 +222,8 @@ declare const CodeGraderInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }>, "many">;
-    /** @deprecated Use `expectedOutputText` instead. Expected output content as string. */
-    referenceAnswer: z.ZodOptional<z.ZodString>;
-    /** @deprecated Use `outputText` instead. Last assistant message content as string. */
-    answer: z.ZodString;
+    /** Last assistant message content as string. */
+    outputText: z.ZodString;
     output: z.ZodOptional<z.ZodNullable<z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
         content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
@@ -410,11 +406,9 @@ declare const CodeGraderInputSchema: z.ZodObject<{
     fileChanges: z.ZodOptional<z.ZodNullable<z.ZodString>>;
     workspacePath: z.ZodOptional<z.ZodNullable<z.ZodString>>;
     config: z.ZodOptional<z.ZodNullable<z.ZodRecord<z.ZodString, z.ZodUnknown>>>;
-    /** First user message content as string. Replaces `question`. */
-    inputText: z.ZodOptional<z.ZodString>;
-    /** Last assistant message content as string. Replaces `answer`. */
-    outputText: z.ZodOptional<z.ZodString>;
-    /** Expected output content as string. Replaces `referenceAnswer`. */
+    /** First user message content as string. */
+    inputText: z.ZodString;
+    /** Expected output content as string. */
     expectedOutputText: z.ZodOptional<z.ZodString>;
 }, "strip", z.ZodTypeAny, {
     input: {
@@ -435,7 +429,6 @@ declare const CodeGraderInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    question: string;
     criteria: string;
     expectedOutput: {
         role: "tool" | "assistant" | "user" | "system";
@@ -455,9 +448,10 @@ declare const CodeGraderInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    answer: string;
+    outputText: string;
     guidelineFiles: string[];
     inputFiles: string[];
+    inputText: string;
     output?: {
         role: "tool" | "assistant" | "user" | "system";
         startTime?: string | undefined;
@@ -479,7 +473,6 @@ declare const CodeGraderInputSchema: z.ZodObject<{
     startTime?: string | null | undefined;
     endTime?: string | null | undefined;
     durationMs?: number | null | undefined;
-    referenceAnswer?: string | undefined;
     outputPath?: string | undefined;
     trace?: {
         eventCount: number;
@@ -498,8 +491,6 @@ declare const CodeGraderInputSchema: z.ZodObject<{
     fileChanges?: string | null | undefined;
     workspacePath?: string | null | undefined;
     config?: Record<string, unknown> | null | undefined;
-    inputText?: string | undefined;
-    outputText?: string | undefined;
     expectedOutputText?: string | undefined;
 }, {
     input: {
@@ -520,7 +511,6 @@ declare const CodeGraderInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    question: string;
     criteria: string;
     expectedOutput: {
         role: "tool" | "assistant" | "user" | "system";
@@ -540,9 +530,10 @@ declare const CodeGraderInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    answer: string;
+    outputText: string;
     guidelineFiles: string[];
     inputFiles: string[];
+    inputText: string;
     output?: {
         role: "tool" | "assistant" | "user" | "system";
         startTime?: string | undefined;
@@ -564,7 +555,6 @@ declare const CodeGraderInputSchema: z.ZodObject<{
     startTime?: string | null | undefined;
     endTime?: string | null | undefined;
     durationMs?: number | null | undefined;
-    referenceAnswer?: string | undefined;
     outputPath?: string | undefined;
     trace?: {
         eventCount: number;
@@ -583,8 +573,6 @@ declare const CodeGraderInputSchema: z.ZodObject<{
     fileChanges?: string | null | undefined;
     workspacePath?: string | null | undefined;
     config?: Record<string, unknown> | null | undefined;
-    inputText?: string | undefined;
-    outputText?: string | undefined;
     expectedOutputText?: string | undefined;
 }>;
 /**
@@ -592,22 +580,36 @@ declare const CodeGraderInputSchema: z.ZodObject<{
  */
 declare const CodeGraderResultSchema: z.ZodObject<{
     score: z.ZodNumber;
-    hits: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodString, "many">>>;
-    misses: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodString, "many">>>;
-    reasoning: z.ZodOptional<z.ZodString>;
+    assertions: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodObject<{
+        text: z.ZodString;
+        passed: z.ZodBoolean;
+        evidence: z.ZodOptional<z.ZodString>;
+    }, "strip", z.ZodTypeAny, {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }, {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }>, "many">>>;
     /** Optional structured details for domain-specific metrics (e.g., TP/TN/FP/FN counts, alignments). */
     details: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
 }, "strip", z.ZodTypeAny, {
     score: number;
-    hits: string[];
-    misses: string[];
-    reasoning?: string | undefined;
+    assertions: {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }[];
     details?: Record<string, unknown> | undefined;
 }, {
     score: number;
-    hits?: string[] | undefined;
-    misses?: string[] | undefined;
-    reasoning?: string | undefined;
+    assertions?: {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }[] | undefined;
     details?: Record<string, unknown> | undefined;
 }>;
 /**
@@ -618,19 +620,15 @@ type CodeGraderResult = z.infer<typeof CodeGraderResultSchema>;
 /**
  * CodeGraderInput after `enrichInput()` has run.
  *
- * The text convenience accessors (`inputText`, `outputText`, `expectedOutputText`)
+ * The text accessors (`inputText`, `outputText`, `expectedOutputText`)
  * are always populated by the runtime before the handler is called, so they are
  * guaranteed to be `string` (never `undefined`).
  *
  * Handler function signatures (`CodeGraderHandler`, `AssertionHandler`) use this
  * type so that user code can destructure `{ outputText }` without null-checks.
  */
-type EnrichedCodeGraderInput = Omit<CodeGraderInput, 'inputText' | 'outputText' | 'expectedOutputText'> & {
-    /** First user message content as string. Replaces `question`. */
-    readonly inputText: string;
-    /** Last assistant message content as string. Replaces `answer`. */
-    readonly outputText: string;
-    /** Expected output content as string. Replaces `referenceAnswer`. */
+type EnrichedCodeGraderInput = Omit<CodeGraderInput, 'expectedOutputText'> & {
+    /** Expected output content as string. */
     readonly expectedOutputText: string;
 };
 type TraceSummary = z.infer<typeof TraceSummarySchema>;
@@ -642,8 +640,6 @@ type TokenUsage = z.infer<typeof TokenUsageSchema>;
  * Uses the same schema as CodeGraderInput since the orchestrator sends identical payloads.
  */
 declare const PromptTemplateInputSchema: z.ZodObject<{
-    /** @deprecated Use `inputText` instead. First user message content as string. */
-    question: z.ZodString;
     criteria: z.ZodString;
     expectedOutput: z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
@@ -713,10 +709,8 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }>, "many">;
-    /** @deprecated Use `expectedOutputText` instead. Expected output content as string. */
-    referenceAnswer: z.ZodOptional<z.ZodString>;
-    /** @deprecated Use `outputText` instead. Last assistant message content as string. */
-    answer: z.ZodString;
+    /** Last assistant message content as string. */
+    outputText: z.ZodString;
     output: z.ZodOptional<z.ZodNullable<z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
         content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
@@ -899,11 +893,9 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
     fileChanges: z.ZodOptional<z.ZodNullable<z.ZodString>>;
     workspacePath: z.ZodOptional<z.ZodNullable<z.ZodString>>;
     config: z.ZodOptional<z.ZodNullable<z.ZodRecord<z.ZodString, z.ZodUnknown>>>;
-    /** First user message content as string. Replaces `question`. */
-    inputText: z.ZodOptional<z.ZodString>;
-    /** Last assistant message content as string. Replaces `answer`. */
-    outputText: z.ZodOptional<z.ZodString>;
-    /** Expected output content as string. Replaces `referenceAnswer`. */
+    /** First user message content as string. */
+    inputText: z.ZodString;
+    /** Expected output content as string. */
     expectedOutputText: z.ZodOptional<z.ZodString>;
 }, "strip", z.ZodTypeAny, {
     input: {
@@ -924,7 +916,6 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    question: string;
     criteria: string;
     expectedOutput: {
         role: "tool" | "assistant" | "user" | "system";
@@ -944,9 +935,10 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    answer: string;
+    outputText: string;
     guidelineFiles: string[];
     inputFiles: string[];
+    inputText: string;
     output?: {
         role: "tool" | "assistant" | "user" | "system";
         startTime?: string | undefined;
@@ -968,7 +960,6 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
     startTime?: string | null | undefined;
     endTime?: string | null | undefined;
     durationMs?: number | null | undefined;
-    referenceAnswer?: string | undefined;
     outputPath?: string | undefined;
     trace?: {
         eventCount: number;
@@ -987,8 +978,6 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
     fileChanges?: string | null | undefined;
     workspacePath?: string | null | undefined;
     config?: Record<string, unknown> | null | undefined;
-    inputText?: string | undefined;
-    outputText?: string | undefined;
     expectedOutputText?: string | undefined;
 }, {
     input: {
@@ -1009,7 +998,6 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    question: string;
     criteria: string;
     expectedOutput: {
         role: "tool" | "assistant" | "user" | "system";
@@ -1029,9 +1017,10 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    answer: string;
+    outputText: string;
     guidelineFiles: string[];
     inputFiles: string[];
+    inputText: string;
     output?: {
         role: "tool" | "assistant" | "user" | "system";
         startTime?: string | undefined;
@@ -1053,7 +1042,6 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
     startTime?: string | null | undefined;
     endTime?: string | null | undefined;
     durationMs?: number | null | undefined;
-    referenceAnswer?: string | undefined;
     outputPath?: string | undefined;
     trace?: {
         eventCount: number;
@@ -1072,15 +1060,11 @@ declare const PromptTemplateInputSchema: z.ZodObject<{
     fileChanges?: string | null | undefined;
     workspacePath?: string | null | undefined;
     config?: Record<string, unknown> | null | undefined;
-    inputText?: string | undefined;
-    outputText?: string | undefined;
     expectedOutputText?: string | undefined;
 }>;
 type PromptTemplateInput = CodeGraderInput;
 /** @deprecated Use CodeGraderInputSchema */
 declare const CodeJudgeInputSchema: z.ZodObject<{
-    /** @deprecated Use `inputText` instead. First user message content as string. */
-    question: z.ZodString;
     criteria: z.ZodString;
     expectedOutput: z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
@@ -1150,10 +1134,8 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }>, "many">;
-    /** @deprecated Use `expectedOutputText` instead. Expected output content as string. */
-    referenceAnswer: z.ZodOptional<z.ZodString>;
-    /** @deprecated Use `outputText` instead. Last assistant message content as string. */
-    answer: z.ZodString;
+    /** Last assistant message content as string. */
+    outputText: z.ZodString;
     output: z.ZodOptional<z.ZodNullable<z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
         content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
@@ -1336,11 +1318,9 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
     fileChanges: z.ZodOptional<z.ZodNullable<z.ZodString>>;
     workspacePath: z.ZodOptional<z.ZodNullable<z.ZodString>>;
     config: z.ZodOptional<z.ZodNullable<z.ZodRecord<z.ZodString, z.ZodUnknown>>>;
-    /** First user message content as string. Replaces `question`. */
-    inputText: z.ZodOptional<z.ZodString>;
-    /** Last assistant message content as string. Replaces `answer`. */
-    outputText: z.ZodOptional<z.ZodString>;
-    /** Expected output content as string. Replaces `referenceAnswer`. */
+    /** First user message content as string. */
+    inputText: z.ZodString;
+    /** Expected output content as string. */
     expectedOutputText: z.ZodOptional<z.ZodString>;
 }, "strip", z.ZodTypeAny, {
     input: {
@@ -1361,7 +1341,6 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    question: string;
     criteria: string;
     expectedOutput: {
         role: "tool" | "assistant" | "user" | "system";
@@ -1381,9 +1360,10 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    answer: string;
+    outputText: string;
     guidelineFiles: string[];
     inputFiles: string[];
+    inputText: string;
     output?: {
         role: "tool" | "assistant" | "user" | "system";
         startTime?: string | undefined;
@@ -1405,7 +1385,6 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
     startTime?: string | null | undefined;
     endTime?: string | null | undefined;
     durationMs?: number | null | undefined;
-    referenceAnswer?: string | undefined;
     outputPath?: string | undefined;
     trace?: {
         eventCount: number;
@@ -1424,8 +1403,6 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
     fileChanges?: string | null | undefined;
     workspacePath?: string | null | undefined;
     config?: Record<string, unknown> | null | undefined;
-    inputText?: string | undefined;
-    outputText?: string | undefined;
     expectedOutputText?: string | undefined;
 }, {
     input: {
@@ -1446,7 +1423,6 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    question: string;
     criteria: string;
     expectedOutput: {
         role: "tool" | "assistant" | "user" | "system";
@@ -1466,9 +1442,10 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
         name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[];
-    answer: string;
+    outputText: string;
     guidelineFiles: string[];
     inputFiles: string[];
+    inputText: string;
     output?: {
         role: "tool" | "assistant" | "user" | "system";
         startTime?: string | undefined;
@@ -1490,7 +1467,6 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
     startTime?: string | null | undefined;
     endTime?: string | null | undefined;
     durationMs?: number | null | undefined;
-    referenceAnswer?: string | undefined;
     outputPath?: string | undefined;
     trace?: {
         eventCount: number;
@@ -1509,29 +1485,41 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
     fileChanges?: string | null | undefined;
     workspacePath?: string | null | undefined;
     config?: Record<string, unknown> | null | undefined;
-    inputText?: string | undefined;
-    outputText?: string | undefined;
     expectedOutputText?: string | undefined;
 }>;
 /** @deprecated Use CodeGraderResultSchema */
 declare const CodeJudgeResultSchema: z.ZodObject<{
     score: z.ZodNumber;
-    hits: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodString, "many">>>;
-    misses: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodString, "many">>>;
-    reasoning: z.ZodOptional<z.ZodString>;
+    assertions: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodObject<{
+        text: z.ZodString;
+        passed: z.ZodBoolean;
+        evidence: z.ZodOptional<z.ZodString>;
+    }, "strip", z.ZodTypeAny, {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }, {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }>, "many">>>;
     /** Optional structured details for domain-specific metrics (e.g., TP/TN/FP/FN counts, alignments). */
     details: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
 }, "strip", z.ZodTypeAny, {
     score: number;
-    hits: string[];
-    misses: string[];
-    reasoning?: string | undefined;
+    assertions: {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }[];
     details?: Record<string, unknown> | undefined;
 }, {
     score: number;
-    hits?: string[] | undefined;
-    misses?: string[] | undefined;
-    reasoning?: string | undefined;
+    assertions?: {
+        text: string;
+        passed: boolean;
+        evidence?: string | undefined;
+    }[] | undefined;
     details?: Record<string, unknown> | undefined;
 }>;
 /** @deprecated Use CodeGraderInput */
@@ -1634,7 +1622,7 @@ declare class TargetInvocationError extends Error {
  *
  *   if (!target) {
  *     // Target not available - no target config on this evaluator
- *     return { score: 0.5, reasoning: 'Target not available' };
+ *     return { score: 0.5, assertions: [{ text: 'Target not available', passed: false }] };
  *   }
  *
  *   const response = await target.invoke({
@@ -1675,19 +1663,23 @@ type AssertionType = 'llm-grader' | 'code-grader' | 'rubrics' | 'composite' | 't
 /**
  * Result returned from an assertion handler.
  *
- * @example Pass with reasoning
+ * @example Pass with assertions
  * ```ts
- * { pass: true, reasoning: 'Output contains expected keywords' }
+ * { pass: true, assertions: [{ text: 'Output contains expected keywords', passed: true }] }
  * ```
  *
- * @example Fail with misses
+ * @example Fail with score
  * ```ts
- * { pass: false, misses: ['Missing required header'], score: 0.3 }
+ * { pass: false, score: 0.3, assertions: [{ text: 'Missing required header', passed: false }] }
  * ```
  *
  * @example Granular score (0-1)
  * ```ts
- * { score: 0.75, hits: ['Format correct', 'Content relevant'], misses: ['Missing citation'] }
+ * { score: 0.75, assertions: [
+ *   { text: 'Format correct', passed: true },
+ *   { text: 'Content relevant', passed: true },
+ *   { text: 'Missing citation', passed: false },
+ * ] }
  * ```
  */
 interface AssertionScore {
@@ -1695,12 +1687,12 @@ interface AssertionScore {
     readonly pass?: boolean;
     /** Numeric score between 0 and 1. Defaults to 1 if pass=true, 0 if pass=false. */
     readonly score?: number;
-    /** Aspects that passed. */
-    readonly hits?: readonly string[];
-    /** Aspects that failed. */
-    readonly misses?: readonly string[];
-    /** Human-readable explanation. */
-    readonly reasoning?: string;
+    /** Per-assertion verdicts with optional evidence. */
+    readonly assertions?: readonly {
+        readonly text: string;
+        readonly passed: boolean;
+        readonly evidence?: string;
+    }[];
     /** Optional structured details for domain-specific metrics. */
     readonly details?: Record<string, unknown>;
 }
@@ -1740,7 +1732,7 @@ type CodeJudgeHandler = CodeGraderHandler;
  *
  * export default defineAssertion(({ outputText }) => ({
  *   pass: outputText.includes('hello'),
- *   reasoning: 'Checks greeting',
+ *   assertions: [{ text: 'Checks greeting', passed: outputText.includes('hello') }],
  * }));
  * ```
  *
@@ -1751,8 +1743,7 @@ type CodeJudgeHandler = CodeGraderHandler;
  *
  * export default defineCodeGrader(({ trace, outputText }) => ({
  *   score: trace?.eventCount <= 5 ? 1.0 : 0.5,
- *   hits: ['Efficient tool usage'],
- *   misses: [],
+ *   assertions: [{ text: 'Efficient tool usage', passed: trace?.eventCount <= 5 }],
  * }));
  * ```
  *
@@ -1764,7 +1755,7 @@ type CodeJudgeHandler = CodeGraderHandler;
  * export default defineCodeGrader(async ({ inputText }) => {
  *   const target = createTargetClient();
  *   if (!target) {
- *     return { score: 0, misses: ['Target not available'] };
+ *     return { score: 0, assertions: [{ text: 'Target not available', passed: false }] };
  *   }
  *
  *   const response = await target.invoke({
@@ -1798,14 +1789,13 @@ type CodeJudgeHandler = CodeGraderHandler;
  *
  * export default defineCodeGrader(({ trace }) => {
  *   if (!trace) {
- *     return { score: 0.5, reasoning: 'No trace available' };
+ *     return { score: 0.5, assertions: [{ text: 'No trace available', passed: false }] };
  *   }
  *
  *   const efficient = trace.eventCount <= 10;
  *   return {
  *     score: efficient ? 1.0 : 0.5,
- *     hits: efficient ? ['Efficient execution'] : [],
- *     misses: efficient ? [] : ['Too many tool calls'],
+ *     assertions: [{ text: efficient ? 'Efficient execution' : 'Too many tool calls', passed: efficient }],
  *   };
  * });
  * ```
@@ -1889,7 +1879,7 @@ declare function definePromptTemplate(handler: PromptTemplateHandler): void;
  *
  * export default defineAssertion(({ outputText }) => ({
  *   pass: outputText.toLowerCase().includes('hello'),
- *   reasoning: 'Checks for greeting',
+ *   assertions: [{ text: 'Checks for greeting', passed: outputText.toLowerCase().includes('hello') }],
  * }));
  * ```
  *
@@ -1902,9 +1892,9 @@ declare function definePromptTemplate(handler: PromptTemplateHandler): void;
  *   const isEfficient = (trace?.eventCount ?? 0) <= 5 ? 0.5 : 0;
  *   return {
  *     score: hasContent + isEfficient,
- *     hits: [
- *       ...(hasContent ? ['Has content'] : []),
- *       ...(isEfficient ? ['Efficient'] : []),
+ *     assertions: [
+ *       { text: 'Has content', passed: !!hasContent },
+ *       { text: 'Efficient', passed: !!isEfficient },
  *     ],
  *   };
  * });