@wix/evalforge-evaluator 0.199.0 → 0.201.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/index.js +31 -15
- package/build/index.js.map +2 -2
- package/build/index.mjs +31 -15
- package/build/index.mjs.map +2 -2
- package/package.json +3 -3
package/build/index.js
CHANGED
|
@@ -7372,7 +7372,7 @@ var import_fs = require("fs");
|
|
|
7372
7372
|
var import_crypto = require("crypto");
|
|
7373
7373
|
var import_path2 = __toESM(require("path"));
|
|
7374
7374
|
var import_child_process = require("child_process");
|
|
7375
|
-
var INSTALL_TIMEOUT_MS =
|
|
7375
|
+
var INSTALL_TIMEOUT_MS = 12e4;
|
|
7376
7376
|
var HEARTBEAT_INTERVAL_MS = 5e3;
|
|
7377
7377
|
function reportRegistry(workDir, onProgress) {
|
|
7378
7378
|
try {
|
|
@@ -11021,22 +11021,38 @@ async function executeWithAiSdk(context) {
|
|
|
11021
11021
|
...topLevelExtras,
|
|
11022
11022
|
model,
|
|
11023
11023
|
abortSignal: abortController.signal,
|
|
11024
|
-
|
|
11025
|
-
|
|
11026
|
-
|
|
11024
|
+
// Anthropic prompt caching: the Vercel AI SDK can't attach cache_control
|
|
11025
|
+
// to the top-level `system` string, so the system prompt is sent as a
|
|
11026
|
+
// `system` message that, for Anthropic models only, carries an ephemeral cache breakpoint.
|
|
11027
|
+
// Anthropic renders tools -> system -> messages, so a breakpoint on the
|
|
11028
|
+
// system block caches the tool definitions too — high value for MCP
|
|
11029
|
+
// scenarios that share a large tool set + system prompt across runs.
|
|
11030
|
+
messages: [
|
|
11031
|
+
...systemPrompt ? [
|
|
11027
11032
|
{
|
|
11028
|
-
role: "
|
|
11029
|
-
content:
|
|
11030
|
-
|
|
11031
|
-
|
|
11032
|
-
|
|
11033
|
-
|
|
11034
|
-
|
|
11035
|
-
}
|
|
11036
|
-
|
|
11033
|
+
role: "system",
|
|
11034
|
+
content: systemPrompt,
|
|
11035
|
+
...isAnthropic ? {
|
|
11036
|
+
providerOptions: {
|
|
11037
|
+
anthropic: {
|
|
11038
|
+
cacheControl: { type: "ephemeral" }
|
|
11039
|
+
}
|
|
11040
|
+
}
|
|
11041
|
+
} : {}
|
|
11037
11042
|
}
|
|
11038
|
-
]
|
|
11039
|
-
|
|
11043
|
+
] : [],
|
|
11044
|
+
{
|
|
11045
|
+
role: "user",
|
|
11046
|
+
content: hasImages ? [
|
|
11047
|
+
{ type: "text", text: scenario.triggerPrompt },
|
|
11048
|
+
...triggerPromptImages.map((img) => ({
|
|
11049
|
+
type: "image",
|
|
11050
|
+
image: img.base64,
|
|
11051
|
+
mediaType: img.mediaType
|
|
11052
|
+
}))
|
|
11053
|
+
] : scenario.triggerPrompt
|
|
11054
|
+
}
|
|
11055
|
+
],
|
|
11040
11056
|
temperature: supportsThinking ? void 0 : cfg.temperature,
|
|
11041
11057
|
topP: supportsThinking ? void 0 : cfg.topP,
|
|
11042
11058
|
frequencyPenalty: cfg.frequencyPenalty,
|