npm - @wix/evalforge-types - Versions diffs - 0.66.0 → 0.68.0 - Mend

@wix/evalforge-types 0.66.0 → 0.68.0

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (7)

package/build/index.js +18 -3
package/build/index.js.map +2 -2
package/build/index.mjs +18 -3
package/build/index.mjs.map +2 -2
package/build/types/evaluation/eval-result.d.ts +2 -0
package/build/types/evaluation/eval-run.d.ts +21 -0
package/package.json +2 -2

package/build/index.mjs (changed)

@@ -1159,7 +1159,17 @@ var EvalRunSchema = TenantEntitySchema.extend({
   /** Rule IDs to enable for this run (optional) */
   ruleIds: z28.array(z28.string()).optional(),
   /** Tags used to select scenarios for this run (for traceability) */
-  tags: z28.array(z28.string()).optional()
+  tags: z28.array(z28.string()).optional(),
+  /** How many times each scenario is executed within this eval run. Default: 1. Max: 20. */
+  runsPerScenario: z28.number().int().min(1).max(20).optional(),
+  /** Snapshot of agent configuration captured at run creation time */
+  agentSnapshot: z28.object({
+    name: z28.string().optional(),
+    agentType: AgentTypeSchema.optional(),
+    runCommand: AgentRunCommandSchema.optional(),
+    systemPrompt: z28.string().nullable().optional(),
+    modelConfig: ModelConfigSchema.optional()
+  }).optional()
 });
 var CreateEvalRunInputSchema = EvalRunSchema.omit({
   id: true,
@@ -1171,7 +1181,8 @@ var CreateEvalRunInputSchema = EvalRunSchema.omit({
   aggregateMetrics: true,
   startedAt: true,
   completedAt: true,
-  scenarioIds: true
+  scenarioIds: true,
+  agentSnapshot: true
 }).extend({
   /** Optional on input — backend resolves from tags when not provided */
   scenarioIds: z28.array(z28.string()).optional()
@@ -1283,6 +1294,8 @@ var EvalRunResultSchema = z30.object({
   skillVersion: z30.string().optional(),
   scenarioId: z30.string(),
   scenarioName: z30.string(),
+  /** Snapshot of the trigger prompt used during the run (prevents stale display after edits) */
+  triggerPrompt: z30.string().optional(),
   modelConfig: ModelConfigSchema.optional(),
   assertionResults: z30.array(AssertionResultSchema),
   metrics: EvalMetricsSchema.optional(),
@@ -1299,7 +1312,9 @@ var EvalRunResultSchema = z30.object({
   completedAt: z30.string().optional(),
   llmTrace: LLMTraceSchema.optional(),
   /** Full conversation messages (only present in transit; stripped before DB storage) */
-  conversation: z30.array(ConversationMessageSchema).optional()
+  conversation: z30.array(ConversationMessageSchema).optional(),
+  /** 0-based iteration index when a scenario is run multiple times within a single eval run */
+  iterationIndex: z30.number().int().min(0).optional()
 });
 var PromptResultSchema = z30.object({
   text: z30.string(),