@wix/evalforge-evaluator 0.86.0 → 0.88.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between those package versions as they appear in their respective public registries.
package/build/index.js CHANGED
@@ -233,7 +233,21 @@ function applyParamsToAssertion(assertion, params) {
233
233
  );
234
234
  }
235
235
  }
236
- return { ...assertion, prompt, systemPrompt };
236
+ return {
237
+ ...assertion,
238
+ prompt,
239
+ systemPrompt,
240
+ ...params.model !== void 0 && { model: params.model },
241
+ ...params.maxTokens !== void 0 && {
242
+ maxTokens: params.maxTokens
243
+ },
244
+ ...params.temperature !== void 0 && {
245
+ temperature: params.temperature
246
+ },
247
+ ...params.minScore !== void 0 && {
248
+ minScore: params.minScore
249
+ }
250
+ };
237
251
  }
238
252
  if (assertion.type === "skill_was_called" && params.skillNames !== void 0) {
239
253
  return {
@@ -265,7 +279,10 @@ function resolveSystemAssertion(assertionId, params) {
265
279
  type: "llm_judge",
266
280
  prompt: params?.prompt ?? "",
267
281
  systemPrompt: params?.systemPrompt,
268
- minScore: params?.minScore
282
+ minScore: params?.minScore,
283
+ model: params?.model,
284
+ maxTokens: params?.maxTokens,
285
+ temperature: params?.temperature
269
286
  };
270
287
  break;
271
288
  default:
@@ -2520,7 +2537,7 @@ async function runScenario(config, evalRunId2, scenario, evalData, template, res
2520
2537
  }))
2521
2538
  };
2522
2539
  const { "x-wix-ai-gateway-stream": _stream, ...judgeHeaders } = config.aiGatewayHeaders;
2523
- const defaultJudgeModel = import_evalforge_types4.AVAILABLE_MODEL_IDS[0];
2540
+ const defaultJudgeModel = import_evalforge_types4.DEFAULT_JUDGE_MODEL;
2524
2541
  const assertionContext = {
2525
2542
  workDir,
2526
2543
  defaultJudgeModel,