@wix/evalforge-evaluator 0.93.0 → 0.95.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
package/build/index.js CHANGED
@@ -223,23 +223,15 @@ function applyParamsToAssertion(assertion, params) {
223
223
  }
224
224
  if (assertion.type === "llm_judge") {
225
225
  let prompt = assertion.prompt;
226
- let systemPrompt = assertion.systemPrompt;
227
226
  for (const [key, value] of Object.entries(params)) {
228
227
  const placeholder = `{{${key}}}`;
229
228
  const escapedPlaceholder = placeholder.replace(/[{}]/g, "\\$&");
230
229
  const replacement = String(value ?? "");
231
230
  prompt = prompt.replace(new RegExp(escapedPlaceholder, "g"), replacement);
232
- if (systemPrompt) {
233
- systemPrompt = systemPrompt.replace(
234
- new RegExp(escapedPlaceholder, "g"),
235
- replacement
236
- );
237
- }
238
231
  }
239
232
  return {
240
233
  ...assertion,
241
234
  prompt,
242
- systemPrompt,
243
235
  ...params.model !== void 0 && { model: params.model },
244
236
  ...params.maxTokens !== void 0 && {
245
237
  maxTokens: params.maxTokens
@@ -264,6 +256,17 @@ function applyParamsToAssertion(assertion, params) {
264
256
  skillNames: parseSkillNamesFromParams(params.skillNames)
265
257
  };
266
258
  }
259
+ if (assertion.type === "tool_called_with_param") {
260
+ return {
261
+ ...assertion,
262
+ ...params.toolName !== void 0 && {
263
+ toolName: params.toolName
264
+ },
265
+ ...params.expectedParams !== void 0 && {
266
+ expectedParams: params.expectedParams
267
+ }
268
+ };
269
+ }
267
270
  return { ...assertion, ...params };
268
271
  }
269
272
  function resolveSystemAssertion(assertionId, params) {
@@ -276,6 +279,13 @@ function resolveSystemAssertion(assertionId, params) {
276
279
  skillNames: parseSkillNamesFromParams(params?.skillNames)
277
280
  };
278
281
  break;
282
+ case "tool_called_with_param":
283
+ baseAssertion = {
284
+ type: "tool_called_with_param",
285
+ toolName: params?.toolName ?? "",
286
+ expectedParams: params?.expectedParams ?? "{}"
287
+ };
288
+ break;
279
289
  case "build_passed":
280
290
  baseAssertion = {
281
291
  type: "build_passed",
@@ -299,7 +309,6 @@ function resolveSystemAssertion(assertionId, params) {
299
309
  baseAssertion = {
300
310
  type: "llm_judge",
301
311
  prompt: params?.prompt ?? "",
302
- systemPrompt: params?.systemPrompt,
303
312
  minScore: params?.minScore,
304
313
  model: params?.model,
305
314
  maxTokens: params?.maxTokens,
@@ -316,7 +325,6 @@ function customAssertionToAssertion(ca, params) {
316
325
  const baseAssertion = {
317
326
  type: "llm_judge",
318
327
  prompt: config?.prompt ?? "",
319
- systemPrompt: config?.systemPrompt,
320
328
  minScore: config?.minScore,
321
329
  model: config?.model,
322
330
  maxTokens: config?.maxTokens,