@wix/evalforge-evaluator 0.93.0 → 0.95.0
This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- package/build/index.js +18 -10
- package/build/index.js.map +2 -2
- package/build/index.mjs +18 -10
- package/build/index.mjs.map +2 -2
- package/package.json +5 -5
package/build/index.js
CHANGED
|
@@ -223,23 +223,15 @@ function applyParamsToAssertion(assertion, params) {
|
|
|
223
223
|
}
|
|
224
224
|
if (assertion.type === "llm_judge") {
|
|
225
225
|
let prompt = assertion.prompt;
|
|
226
|
-
let systemPrompt = assertion.systemPrompt;
|
|
227
226
|
for (const [key, value] of Object.entries(params)) {
|
|
228
227
|
const placeholder = `{{${key}}}`;
|
|
229
228
|
const escapedPlaceholder = placeholder.replace(/[{}]/g, "\\$&");
|
|
230
229
|
const replacement = String(value ?? "");
|
|
231
230
|
prompt = prompt.replace(new RegExp(escapedPlaceholder, "g"), replacement);
|
|
232
|
-
if (systemPrompt) {
|
|
233
|
-
systemPrompt = systemPrompt.replace(
|
|
234
|
-
new RegExp(escapedPlaceholder, "g"),
|
|
235
|
-
replacement
|
|
236
|
-
);
|
|
237
|
-
}
|
|
238
231
|
}
|
|
239
232
|
return {
|
|
240
233
|
...assertion,
|
|
241
234
|
prompt,
|
|
242
|
-
systemPrompt,
|
|
243
235
|
...params.model !== void 0 && { model: params.model },
|
|
244
236
|
...params.maxTokens !== void 0 && {
|
|
245
237
|
maxTokens: params.maxTokens
|
|
@@ -264,6 +256,17 @@ function applyParamsToAssertion(assertion, params) {
|
|
|
264
256
|
skillNames: parseSkillNamesFromParams(params.skillNames)
|
|
265
257
|
};
|
|
266
258
|
}
|
|
259
|
+
if (assertion.type === "tool_called_with_param") {
|
|
260
|
+
return {
|
|
261
|
+
...assertion,
|
|
262
|
+
...params.toolName !== void 0 && {
|
|
263
|
+
toolName: params.toolName
|
|
264
|
+
},
|
|
265
|
+
...params.expectedParams !== void 0 && {
|
|
266
|
+
expectedParams: params.expectedParams
|
|
267
|
+
}
|
|
268
|
+
};
|
|
269
|
+
}
|
|
267
270
|
return { ...assertion, ...params };
|
|
268
271
|
}
|
|
269
272
|
function resolveSystemAssertion(assertionId, params) {
|
|
@@ -276,6 +279,13 @@ function resolveSystemAssertion(assertionId, params) {
|
|
|
276
279
|
skillNames: parseSkillNamesFromParams(params?.skillNames)
|
|
277
280
|
};
|
|
278
281
|
break;
|
|
282
|
+
case "tool_called_with_param":
|
|
283
|
+
baseAssertion = {
|
|
284
|
+
type: "tool_called_with_param",
|
|
285
|
+
toolName: params?.toolName ?? "",
|
|
286
|
+
expectedParams: params?.expectedParams ?? "{}"
|
|
287
|
+
};
|
|
288
|
+
break;
|
|
279
289
|
case "build_passed":
|
|
280
290
|
baseAssertion = {
|
|
281
291
|
type: "build_passed",
|
|
@@ -299,7 +309,6 @@ function resolveSystemAssertion(assertionId, params) {
|
|
|
299
309
|
baseAssertion = {
|
|
300
310
|
type: "llm_judge",
|
|
301
311
|
prompt: params?.prompt ?? "",
|
|
302
|
-
systemPrompt: params?.systemPrompt,
|
|
303
312
|
minScore: params?.minScore,
|
|
304
313
|
model: params?.model,
|
|
305
314
|
maxTokens: params?.maxTokens,
|
|
@@ -316,7 +325,6 @@ function customAssertionToAssertion(ca, params) {
|
|
|
316
325
|
const baseAssertion = {
|
|
317
326
|
type: "llm_judge",
|
|
318
327
|
prompt: config?.prompt ?? "",
|
|
319
|
-
systemPrompt: config?.systemPrompt,
|
|
320
328
|
minScore: config?.minScore,
|
|
321
329
|
model: config?.model,
|
|
322
330
|
maxTokens: config?.maxTokens,
|