@wix/evalforge-evaluator 0.87.0 → 0.88.0
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/build/index.js +20 -3
- package/build/index.js.map +2 -2
- package/build/index.mjs +21 -4
- package/build/index.mjs.map +2 -2
- package/package.json +4 -4
package/build/index.js
CHANGED
|
@@ -233,7 +233,21 @@ function applyParamsToAssertion(assertion, params) {
|
|
|
233
233
|
);
|
|
234
234
|
}
|
|
235
235
|
}
|
|
236
|
-
return {
|
|
236
|
+
return {
|
|
237
|
+
...assertion,
|
|
238
|
+
prompt,
|
|
239
|
+
systemPrompt,
|
|
240
|
+
...params.model !== void 0 && { model: params.model },
|
|
241
|
+
...params.maxTokens !== void 0 && {
|
|
242
|
+
maxTokens: params.maxTokens
|
|
243
|
+
},
|
|
244
|
+
...params.temperature !== void 0 && {
|
|
245
|
+
temperature: params.temperature
|
|
246
|
+
},
|
|
247
|
+
...params.minScore !== void 0 && {
|
|
248
|
+
minScore: params.minScore
|
|
249
|
+
}
|
|
250
|
+
};
|
|
237
251
|
}
|
|
238
252
|
if (assertion.type === "skill_was_called" && params.skillNames !== void 0) {
|
|
239
253
|
return {
|
|
@@ -265,7 +279,10 @@ function resolveSystemAssertion(assertionId, params) {
|
|
|
265
279
|
type: "llm_judge",
|
|
266
280
|
prompt: params?.prompt ?? "",
|
|
267
281
|
systemPrompt: params?.systemPrompt,
|
|
268
|
-
minScore: params?.minScore
|
|
282
|
+
minScore: params?.minScore,
|
|
283
|
+
model: params?.model,
|
|
284
|
+
maxTokens: params?.maxTokens,
|
|
285
|
+
temperature: params?.temperature
|
|
269
286
|
};
|
|
270
287
|
break;
|
|
271
288
|
default:
|
|
@@ -2520,7 +2537,7 @@ async function runScenario(config, evalRunId2, scenario, evalData, template, res
|
|
|
2520
2537
|
}))
|
|
2521
2538
|
};
|
|
2522
2539
|
const { "x-wix-ai-gateway-stream": _stream, ...judgeHeaders } = config.aiGatewayHeaders;
|
|
2523
|
-
const defaultJudgeModel = import_evalforge_types4.
|
|
2540
|
+
const defaultJudgeModel = import_evalforge_types4.DEFAULT_JUDGE_MODEL;
|
|
2524
2541
|
const assertionContext = {
|
|
2525
2542
|
workDir,
|
|
2526
2543
|
defaultJudgeModel,
|