@wix/evalforge-types 0.39.0 → 0.40.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
package/build/index.mjs CHANGED
@@ -1363,8 +1363,6 @@ var LlmJudgeAssertionSchema = z21.object({
1363
1363
  type: z21.literal("llm_judge"),
1364
1364
  /** Prompt template; placeholders: {{output}}, {{cwd}}, {{changedFiles}}, {{trace}} */
1365
1365
  prompt: z21.string(),
1366
- /** Optional system prompt for the judge (default asks for JSON with score) */
1367
- systemPrompt: z21.string().optional(),
1368
1366
  /** Minimum score to pass (0-100, default 70) */
1369
1367
  minScore: z21.number().int().min(0).max(100).optional(),
1370
1368
  /** Model for the judge (e.g. claude-3-5-haiku) */
@@ -1497,8 +1495,6 @@ var LlmJudgeConfigSchema = z23.object({
1497
1495
  * - Custom parameters defined in the parameters array
1498
1496
  */
1499
1497
  prompt: z23.string().min(1),
1500
- /** Optional system prompt for the judge */
1501
- systemPrompt: z23.string().optional(),
1502
1498
  /** Minimum score to pass (0-100, default 70) */
1503
1499
  minScore: z23.number().int().min(0).max(100).optional(),
1504
1500
  /** Model for the judge (e.g. claude-3-5-haiku-20241022) */
@@ -2178,19 +2174,6 @@ var SYSTEM_ASSERTIONS = {
2178
2174
  required: true,
2179
2175
  defaultValue: "Verify the output meets the acceptance criteria."
2180
2176
  },
2181
- {
2182
- name: "systemPrompt",
2183
- label: "System Prompt (optional)",
2184
- type: "string",
2185
- required: false,
2186
- defaultValue: `You are judging a scenario run. Use these values:
2187
- - {{output}}: the agent's final output
2188
- - {{cwd}}: working directory
2189
- - {{changedFiles}}: list of files changed (or "No files were changed")
2190
- - {{trace}}: step-by-step trace (tool calls, completions) to check e.g. which tools were called and how many times
2191
-
2192
- Judge how well the output meets the acceptance criteria stated in the user prompt.`
2193
- },
2194
2177
  {
2195
2178
  name: "minScore",
2196
2179
  label: "Minimum Score (0-100)",