@wix/evalforge-types 0.39.0 → 0.40.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +0 -17
- package/build/index.js.map +2 -2
- package/build/index.mjs +0 -17
- package/build/index.mjs.map +2 -2
- package/build/types/assertion/assertion.d.ts +0 -5
- package/build/types/scenario/assertions.d.ts +0 -2
- package/build/types/scenario/test-scenario.d.ts +0 -3
- package/package.json +2 -2
package/build/index.mjs
CHANGED
|
@@ -1363,8 +1363,6 @@ var LlmJudgeAssertionSchema = z21.object({
|
|
|
1363
1363
|
type: z21.literal("llm_judge"),
|
|
1364
1364
|
/** Prompt template; placeholders: {{output}}, {{cwd}}, {{changedFiles}}, {{trace}} */
|
|
1365
1365
|
prompt: z21.string(),
|
|
1366
|
-
/** Optional system prompt for the judge (default asks for JSON with score) */
|
|
1367
|
-
systemPrompt: z21.string().optional(),
|
|
1368
1366
|
/** Minimum score to pass (0-100, default 70) */
|
|
1369
1367
|
minScore: z21.number().int().min(0).max(100).optional(),
|
|
1370
1368
|
/** Model for the judge (e.g. claude-3-5-haiku) */
|
|
@@ -1497,8 +1495,6 @@ var LlmJudgeConfigSchema = z23.object({
|
|
|
1497
1495
|
* - Custom parameters defined in the parameters array
|
|
1498
1496
|
*/
|
|
1499
1497
|
prompt: z23.string().min(1),
|
|
1500
|
-
/** Optional system prompt for the judge */
|
|
1501
|
-
systemPrompt: z23.string().optional(),
|
|
1502
1498
|
/** Minimum score to pass (0-100, default 70) */
|
|
1503
1499
|
minScore: z23.number().int().min(0).max(100).optional(),
|
|
1504
1500
|
/** Model for the judge (e.g. claude-3-5-haiku-20241022) */
|
|
@@ -2178,19 +2174,6 @@ var SYSTEM_ASSERTIONS = {
|
|
|
2178
2174
|
required: true,
|
|
2179
2175
|
defaultValue: "Verify the output meets the acceptance criteria."
|
|
2180
2176
|
},
|
|
2181
|
-
{
|
|
2182
|
-
name: "systemPrompt",
|
|
2183
|
-
label: "System Prompt (optional)",
|
|
2184
|
-
type: "string",
|
|
2185
|
-
required: false,
|
|
2186
|
-
defaultValue: `You are judging a scenario run. Use these values:
|
|
2187
|
-
- {{output}}: the agent's final output
|
|
2188
|
-
- {{cwd}}: working directory
|
|
2189
|
-
- {{changedFiles}}: list of files changed (or "No files were changed")
|
|
2190
|
-
- {{trace}}: step-by-step trace (tool calls, completions) to check e.g. which tools were called and how many times
|
|
2191
|
-
|
|
2192
|
-
Judge how well the output meets the acceptance criteria stated in the user prompt.`
|
|
2193
|
-
},
|
|
2194
2177
|
{
|
|
2195
2178
|
name: "minScore",
|
|
2196
2179
|
label: "Minimum Score (0-100)",
|