@wix/evalforge-types 0.67.0 → 0.69.0
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
package/build/index.mjs
CHANGED
|
@@ -1161,7 +1161,19 @@ var EvalRunSchema = TenantEntitySchema.extend({
|
|
|
1161
1161
|
/** Tags used to select scenarios for this run (for traceability) */
|
|
1162
1162
|
tags: z28.array(z28.string()).optional(),
|
|
1163
1163
|
/** How many times each scenario is executed within this eval run. Default: 1. Max: 20. */
|
|
1164
|
-
runsPerScenario: z28.number().int().min(1).max(20).optional()
|
|
1164
|
+
runsPerScenario: z28.number().int().min(1).max(20).optional(),
|
|
1165
|
+
/** Snapshot of agent configuration captured at run creation time */
|
|
1166
|
+
agentSnapshot: z28.object({
|
|
1167
|
+
name: z28.string().optional(),
|
|
1168
|
+
agentType: AgentTypeSchema.optional(),
|
|
1169
|
+
runCommand: AgentRunCommandSchema.optional(),
|
|
1170
|
+
systemPrompt: z28.string().nullable().optional(),
|
|
1171
|
+
modelConfig: ModelConfigSchema.optional()
|
|
1172
|
+
}).optional(),
|
|
1173
|
+
/** UUID linking all runs in a comparison group */
|
|
1174
|
+
comparisonGroupId: z28.string().optional(),
|
|
1175
|
+
/** Human-readable label for this variant (e.g., "MCP: Wix Stores") */
|
|
1176
|
+
comparisonLabel: z28.string().optional()
|
|
1165
1177
|
});
|
|
1166
1178
|
var CreateEvalRunInputSchema = EvalRunSchema.omit({
|
|
1167
1179
|
id: true,
|
|
@@ -1173,7 +1185,8 @@ var CreateEvalRunInputSchema = EvalRunSchema.omit({
|
|
|
1173
1185
|
aggregateMetrics: true,
|
|
1174
1186
|
startedAt: true,
|
|
1175
1187
|
completedAt: true,
|
|
1176
|
-
scenarioIds: true
|
|
1188
|
+
scenarioIds: true,
|
|
1189
|
+
agentSnapshot: true
|
|
1177
1190
|
}).extend({
|
|
1178
1191
|
/** Optional on input — backend resolves from tags when not provided */
|
|
1179
1192
|
scenarioIds: z28.array(z28.string()).optional()
|
|
@@ -1285,6 +1298,8 @@ var EvalRunResultSchema = z30.object({
|
|
|
1285
1298
|
skillVersion: z30.string().optional(),
|
|
1286
1299
|
scenarioId: z30.string(),
|
|
1287
1300
|
scenarioName: z30.string(),
|
|
1301
|
+
/** Snapshot of the trigger prompt used during the run (prevents stale display after edits) */
|
|
1302
|
+
triggerPrompt: z30.string().optional(),
|
|
1288
1303
|
modelConfig: ModelConfigSchema.optional(),
|
|
1289
1304
|
assertionResults: z30.array(AssertionResultSchema),
|
|
1290
1305
|
metrics: EvalMetricsSchema.optional(),
|